internet_ml/internet_ml/NLP/no_context/QA.py

# type: ignore
"""
model naming convention
# Open-AI models:
include prefix openai-*
# HuggingFace
include prefix hf-*
"""
from typing import Any, List, Tuple

import os
import sys
from pathlib import Path

# Make the sibling tool/utility directories importable: the plain
# `import config` / `import internet` / `from ChatGPT import ...` statements
# below are resolved through these sys.path entries.
_PACKAGE_ROOT = str(Path(__file__).parent.parent.parent)
for _subdir in ("/tools/NLP/data", "/tools/NLP", "/tools", "/utils"):
    sys.path.append(_PACKAGE_ROOT + _subdir)

import config
import dotenv
import internet
import openai
from ChatGPT import Chatbot
from transformers import pipeline

# Load variables from a .env file (python-dotenv) into the process environment
# so that the os.environ lookups in answer() can pick up keys defined there.
dotenv.load_dotenv()


def answer(
    query: str,
    model: str = "openai-chatgpt",
    GOOGLE_SEARCH_API_KEY: str = "",
    GOOGLE_SEARCH_ENGINE_ID: str = "",
    OPENAI_API_KEY: str = "",
    CHATGPT_SESSION_TOKEN: str = "",
) -> tuple[Any, list[str]]:
    """Answer ``query`` using Google search results as context.

    The query is sent to ``internet.Google(...).google()``; the first list it
    returns is joined into a context string that is handed, together with the
    question, to the selected model.

    Args:
        query: The question to answer.
        model: Model identifier. ``openai-chatgpt`` and
            ``openai-text-davinci-003`` are the supported OpenAI models;
            ``hf-<name>`` runs the HuggingFace question-answering pipeline
            with ``<name>``. A value with neither prefix falls back to
            ``openai-chatgpt``.
        GOOGLE_SEARCH_API_KEY: Passed through to ``internet.Google``.
        GOOGLE_SEARCH_ENGINE_ID: Passed through to ``internet.Google``.
        OPENAI_API_KEY: OpenAI key; when empty, the ``OPENAI_API_KEY``
            environment variable is used instead.
        CHATGPT_SESSION_TOKEN: ChatGPT session token; when empty, the
            ``CHATGPT_SESSION_TOKEN`` environment variable is used instead.

    Returns:
        A ``(answer, results[1])`` tuple, where ``results[1]`` is the second
        list returned by the search, passed back unchanged (presumably the
        source URLs -- confirm against ``internet.Google``).

    Raises:
        ValueError: If ``model`` has the ``openai-`` prefix but is not one of
            the supported OpenAI models.
    """
    if not model.startswith(("openai-", "hf-")):
        model = "openai-chatgpt"  # Default

    # Reject unsupported OpenAI models up front, before any network call,
    # instead of silently falling through and returning None.
    supported_openai_models = ("openai-chatgpt", "openai-text-davinci-003")
    if model.startswith("openai-") and model not in supported_openai_models:
        # TODO: add support for further OpenAI models later
        raise ValueError(
            f"Unsupported OpenAI model {model!r}; "
            f"expected one of {supported_openai_models}"
        )

    # Resolve credentials: explicit arguments win, the environment is the
    # fallback. A missing variable yields "" rather than the string "None".
    if not OPENAI_API_KEY:
        OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY", "")
    if OPENAI_API_KEY:
        # Applied for explicitly passed keys too, not only the env fallback.
        openai.api_key = OPENAI_API_KEY
    if not CHATGPT_SESSION_TOKEN:
        CHATGPT_SESSION_TOKEN = os.environ.get("CHATGPT_SESSION_TOKEN", "")

    results: tuple[list[str], list[str]] = internet.Google(
        query, GOOGLE_SEARCH_API_KEY, GOOGLE_SEARCH_ENGINE_ID
    ).google()
    context: str = " ".join(str(item) for item in results[0])
    print(f"context: {context}")

    if model == "openai-chatgpt":
        # ChatGPT: the context is truncated to 4000 characters in the prompt.
        prompt = f'Use the context: {context[:4000]} and answer the question: "{query}" with the context and prior knowledge. Also write at the very least long answers.'
        chatbot = Chatbot(
            {"session_token": CHATGPT_SESSION_TOKEN},
            conversation_id=None,
            parent_id=None,
        )
        response = chatbot.ask(
            prompt=prompt,
            conversation_id=None,
            parent_id=None,
        )
        return (response["message"], results[1])

    if model == "openai-text-davinci-003":
        # text-davinci-003: the context is truncated to 3000 characters.
        prompt = f'Use the context: {context[:3000]} and answer the question: "{query}" with the context and prior knowledge. Also write at the very least long answers.'
        response = openai.Completion.create(
            model="text-davinci-003",
            prompt=prompt,
            # NOTE(review): this is the character length of the *untruncated*
            # context, not a token budget; it may be 0 or exceed the model's
            # limit -- confirm the intended value.
            max_tokens=len(context),
            n=1,
            stop=None,
            temperature=0.5,
        )
        return (response.choices[0].text, results[1])

    # HuggingFace: everything after the "hf-" prefix is the model name.
    qa_model = pipeline("question-answering", model=model.removeprefix("hf-"))
    response = qa_model(question=query, context=context)
    return (response["answer"], results[1])


# Manual smoke test. Guarded so that importing this module does not trigger
# a search request and a model download as a side effect.
if __name__ == "__main__":
    print(
        answer(
            query="What is the newest pokemon game?",
            model="hf-deepset/xlm-roberta-large-squad2",
        )
    )
update: look at todo 2023-01-11 15:59:46 +00:00			`# type: ignore`
update: look at todo 2023-01-14 14:20:23 +00:00			`"""`
			`model naming convention`
			`# Open-AI models:`
			`include prefix openai-*`
			`# HuggingFace`
			`include prefix hf-*`
			`"""`
updates to code via mypy 2022-12-27 06:38:47 +00:00			`from typing import Any, List, Tuple`
update 2022-12-26 15:43:10 +00:00
update: look at todo 2022-12-30 05:28:26 +00:00			`import os`
update 2022-12-25 17:15:24 +00:00			`import sys`
			`from pathlib import Path`

			`sys.path.append(str(Path(__file__).parent.parent.parent) + "/tools/NLP/data")`
update: look at todo 2023-01-11 15:59:46 +00:00			`sys.path.append(str(Path(__file__).parent.parent.parent) + "/tools/NLP")`
update: look at todo 2023-01-12 05:50:18 +00:00			`sys.path.append(str(Path(__file__).parent.parent.parent) + "/tools")`
updates to code via mypy 2022-12-27 06:38:47 +00:00			`sys.path.append(str(Path(__file__).parent.parent.parent) + "/utils")`
update: look at todo 2023-01-12 05:50:18 +00:00
updates to code via mypy 2022-12-27 06:38:47 +00:00			`import config`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`import dotenv`
update 2022-12-25 17:15:24 +00:00			`import internet`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`import openai`
update: look at todo 2023-01-11 15:59:46 +00:00			`from ChatGPT import Chatbot`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`from transformers import pipeline`
update 2022-12-25 17:15:24 +00:00
update: look at todo 2023-01-10 12:50:43 +00:00			`dotenv.load_dotenv()`

update 2022-12-26 15:43:10 +00:00
update 2022-12-30 06:50:36 +00:00			`def answer(`
update: look at todo 2023-01-10 12:50:43 +00:00			`query: str,`
update: look at todo 2023-01-11 15:59:46 +00:00			`model: str = "openai-chatgpt",`
update: look at todo 2023-01-10 12:50:43 +00:00			`GOOGLE_SEARCH_API_KEY: str = "",`
			`GOOGLE_SEARCH_ENGINE_ID: str = "",`
			`OPENAI_API_KEY: str = "",`
			`CHATGPT_SESSION_TOKEN: str = "",`
update 2022-12-30 06:50:36 +00:00			`) -> tuple[Any, list[str]]:`
update: look at todo 2023-01-10 12:50:43 +00:00			`if OPENAI_API_KEY == "":`
			`OPENAI_API_KEY = str(os.environ.get("OPENAI_API_KEY"))`
			`openai.api_key = OPENAI_API_KEY`
			`if CHATGPT_SESSION_TOKEN == "":`
			`CHATGPT_SESSION_TOKEN = str(os.environ.get("CHATGPT_SESSION_TOKEN"))`
update: look at todo 2023-01-14 14:20:23 +00:00
update: look at todo 2023-01-11 15:59:46 +00:00			`if not (model.startswith("openai-") or model.startswith("hf-")):`
			`model = "openai-chatgpt" # Default`
update: look at todo 2023-01-14 14:20:23 +00:00
			`results: tuple[list[str], list[str]] = internet.Google(`
			`query, GOOGLE_SEARCH_API_KEY, GOOGLE_SEARCH_ENGINE_ID`
			`).google()`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`context: str = str(" ".join([str(string) for string in results[0]]))`
			`print(f"context: {context}")`
update: look at todo 2023-01-14 14:20:23 +00:00
update: look at todo 2023-01-11 15:59:46 +00:00			`if model.startswith("openai-"):`
			`if model == "openai-chatgpt":`
			`# ChatGPT`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`prompt = f'Use the context: {context[:4000]} and answer the question: "{query}" with the context and prior knowledge. Also write at the very least long answers.'`
update: look at todo 2023-01-11 15:59:46 +00:00			`chatbot = Chatbot(`
			`{"session_token": CHATGPT_SESSION_TOKEN},`
update: look at todo 2023-01-14 13:12:43 +00:00			`conversation_id=None,`
			`parent_id=None,`
update: look at todo 2023-01-11 15:59:46 +00:00			`)`
			`response = chatbot.ask(`
update: look at todo 2023-01-12 05:50:18 +00:00			`prompt=prompt,`
update: look at todo 2023-01-14 13:12:43 +00:00			`conversation_id=None,`
			`parent_id=None,`
update: look at todo 2023-01-11 15:59:46 +00:00			`)`
update: look at todo 2023-01-12 04:51:03 +00:00			`return (response["message"], results[1])`
update: look at todo 2023-01-11 15:59:46 +00:00			`else:`
			`if model == "openai-text-davinci-003":`
update: look at todo 2023-01-14 14:20:23 +00:00			`# text-davinci-003`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`prompt = f'Use the context: {context[:3000]} and answer the question: "{query}" with the context and prior knowledge. Also write at the very least long answers.'`
update: look at todo 2023-01-11 15:59:46 +00:00			`response = openai.Completion.create(`
			`model="text-davinci-003",`
update: look at todo 2023-01-14 14:20:23 +00:00			`prompt=prompt,`
update: look at todo 2023-01-11 15:59:46 +00:00			`max_tokens=len(context),`
			`n=1,`
			`stop=None,`
			`temperature=0.5,`
			`)`
			`return (response.choices[0].text, results[1])`
			`# TODO: add suport later`
update: look at todo 2023-01-10 12:50:43 +00:00			`else:`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`# HuggingFace`
update: look at todo 2023-01-10 12:50:43 +00:00			`model = model.replace("hf-", "", 1)`
update: look at todo 2023-01-11 15:59:46 +00:00			`qa_model = pipeline("question-answering", model=model)`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`response = qa_model(question=query, context=context)`
update: look at todo 2023-01-11 15:59:46 +00:00			`return (response["answer"], results[1])`
updates to code via mypy 2022-12-27 06:38:47 +00:00

update: look at todo 2023-01-12 10:41:31 +00:00			`print(`
			`answer(`
final fixes: huggingface works now 2023-01-18 14:38:51 +00:00			`query="What is the newest pokemon game?",`
			`model="hf-deepset/xlm-roberta-large-squad2",`
update: look at todo 2023-01-12 10:41:31 +00:00			`)`
			`)`