Compare commits
No commits in common. "fe61b63a0b82261854f785761f5ef3a2d821e7f4" and "091e0b27e68b76aec57d0d7c66ac317f3efa95b8" have entirely different histories.
fe61b63a0b
...
091e0b27e6
|
@ -47,7 +47,7 @@ def answer(
|
||||||
results: tuple[list[str], list[str]] = internet.Google(
|
results: tuple[list[str], list[str]] = internet.Google(
|
||||||
query, GOOGLE_SEARCH_API_KEY, GOOGLE_SEARCH_ENGINE_ID
|
query, GOOGLE_SEARCH_API_KEY, GOOGLE_SEARCH_ENGINE_ID
|
||||||
).google()
|
).google()
|
||||||
context: str = str(" ".join([str(string) for string in results]))
|
context: str = str(" ".join([str(string) for string in results[0]]))
|
||||||
print(f"context: {context}")
|
print(f"context: {context}")
|
||||||
|
|
||||||
if model.startswith("openai-"):
|
if model.startswith("openai-"):
|
||||||
|
@ -90,6 +90,6 @@ def answer(
|
||||||
print(
|
print(
|
||||||
answer(
|
answer(
|
||||||
query="What is the newest pokemon game?",
|
query="What is the newest pokemon game?",
|
||||||
model="openai-chatgpt",
|
model="hf-deepset/xlm-roberta-large-squad2",
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -100,7 +100,9 @@ class Google:
|
||||||
soup = BeautifulSoup(html, "html.parser")
|
soup = BeautifulSoup(html, "html.parser")
|
||||||
text = soup.get_text()
|
text = soup.get_text()
|
||||||
normalized_text = normalizer(text)
|
normalized_text = normalizer(text)
|
||||||
return normalized_text
|
sentences: list[str] = sentencizer(normalized_text)
|
||||||
|
sentence: str = str(" ".join(sentences))
|
||||||
|
return sentence
|
||||||
except Exception:
|
except Exception:
|
||||||
error: str = ""
|
error: str = ""
|
||||||
return error
|
return error
|
||||||
|
@ -116,9 +118,8 @@ class Google:
|
||||||
def __get_urls_contents(self: "Google") -> None:
|
def __get_urls_contents(self: "Google") -> None:
|
||||||
loop = asyncio.new_event_loop()
|
loop = asyncio.new_event_loop()
|
||||||
asyncio.set_event_loop(loop)
|
asyncio.set_event_loop(loop)
|
||||||
contents = loop.run_until_complete(self.__fetch_urls(self.__urls))
|
self.__content = loop.run_until_complete(self.__fetch_urls(self.__urls))
|
||||||
loop.close()
|
loop.close()
|
||||||
self.__content = contents
|
|
||||||
|
|
||||||
def __filter_irrelevant_processing(self: "Google") -> None:
|
def __filter_irrelevant_processing(self: "Google") -> None:
|
||||||
with concurrent.futures.ThreadPoolExecutor(max_workers=500) as executor:
|
with concurrent.futures.ThreadPoolExecutor(max_workers=500) as executor:
|
||||||
|
@ -136,7 +137,7 @@ class Google:
|
||||||
self.__get_urls_contents()
|
self.__get_urls_contents()
|
||||||
if filter_irrelevant:
|
if filter_irrelevant:
|
||||||
self.__filter_irrelevant_processing()
|
self.__filter_irrelevant_processing()
|
||||||
results: tuple[list[str], list[str]] = (self.__content, self.__urls) # type: ignore
|
results: tuple[list[str], list[str]] = (self.__content[0], self.__urls) # type: ignore
|
||||||
return results
|
return results
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -5,7 +5,7 @@ build-backend = "poetry.core.masonry.api"
|
||||||
|
|
||||||
[tool.poetry]
|
[tool.poetry]
|
||||||
name = "internet-ml"
|
name = "internet-ml"
|
||||||
version = "3.0.0" # fresh start from 3.0.0
|
version = "0.1.0"
|
||||||
description = "Internet-ML: Allowing ML to connect to the internet"
|
description = "Internet-ML: Allowing ML to connect to the internet"
|
||||||
readme = "./.github/README.md"
|
readme = "./.github/README.md"
|
||||||
authors = ["Thamognya Kodi <contact@thamognya.com>"]
|
authors = ["Thamognya Kodi <contact@thamognya.com>"]
|
||||||
|
|
Loading…
Reference in New Issue