wip
parent 671bd13cd8
commit 28749f0526
.env.example (new file, 1 line added)
@@ -0,0 +1 @@
OPENAI_KEY = sk...
.vscode/launch.json (vendored, new file, 17 lines added)
@@ -0,0 +1,17 @@
{
    // Use IntelliSense to learn about possible attributes.
    // Hover to view descriptions of existing attributes.
    // For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
    "version": "0.2.0",
    "configurations": [
        {
            "name": "Python: Current File",
            "type": "python",
            "request": "launch",
            "program": "${file}",
            "console": "integratedTerminal",
            "cwd": "${workspaceFolder}",
            "justMyCode": false
        }
    ]
}
.vscode/settings.json (vendored, new file, 4 lines added)
@@ -0,0 +1,4 @@
{
    "python.analysis.autoImportCompletions": true,
    "python.analysis.typeCheckingMode": "basic"
}
README.md
@@ -1,3 +1,3 @@
-# copeai-ai-backend
+# ai
 
-CopeAI Backend AI
+[Showdown76py](https://github.com/showdown76py)'s "AI lib"
copeai_backend/__init__.py (new file, 3 lines added)
@@ -0,0 +1,3 @@
from .conversation import Conversation, ConversationResponse, Role
from .generate import process_text_streaming, simple_process_text
from .models import Model, Service, GPT_3, GPT_4
copeai_backend/conversation.py (new file, 101 lines added)
@@ -0,0 +1,101 @@
from dataclasses import dataclass
import typing
from openai import AsyncStream
from openai.types.chat import ChatCompletionChunk, ChatCompletion
import tiktoken
from enum import Enum

from copeai_backend.exception import ConversationLockedException

from . import models

encoding = tiktoken.get_encoding("cl100k_base")

BASE_PROMPT = ""


def text_to_tokens(string_or_messages: str | list[str | dict | list]) -> int:
    """Returns the number of tokens in a text string or a list of chat messages."""
    num_tokens = 0

    messages = []
    if isinstance(string_or_messages, str):
        messages = [{"role": "user", "content": string_or_messages}]
    else:
        messages = string_or_messages

    for message in messages:
        # every message follows <im_start>{role/name}\n{content}<im_end>\n
        num_tokens += 4

        if isinstance(message, dict):
            for key, value in message.items():
                num_tokens += len(encoding.encode(str(value)))
                if key == "name":  # if there's a name, the role is omitted
                    num_tokens += -1  # role is always required and always 1 token
        elif isinstance(message, list):
            for item in message:
                if item["type"] == "text":
                    num_tokens += len(encoding.encode(item["text"]))
        elif isinstance(message, str):
            num_tokens += len(encoding.encode(message))

    num_tokens += 2  # every reply is primed with <im_start>assistant

    return num_tokens


class Role(Enum):
    SYSTEM = "system"
    USER = "user"
    ASSISTANT = "assistant"


@dataclass
class GeneratingResponseChunk:
    """A chunk of a response from the model. You receive these while the **generation is still going on**, when streaming."""

    text: str
    raw: ChatCompletionChunk


class Conversation:
    def __init__(self, add_base_prompt: bool = True, storage: dict | None = None) -> None:
        self.messages = []
        self.last_used_model: models.Model | None = None
        self.locked = False
        self.interrupted = False
        self.store = storage if storage is not None else {}

        if add_base_prompt and BASE_PROMPT:
            self.messages.append({"role": Role.SYSTEM.value, "content": BASE_PROMPT})

    def add_message(self, role: Role, message, username: str | None = None):
        if not self.locked:
            d = {"role": role.value, "content": message}
            if username:
                d["name"] = username
            self.messages.append(d)
        else:
            raise ConversationLockedException()

    def interrupt(self):
        """Interrupts any generation going on for this conversation."""
        self.interrupted = True

    def get_tokens(self):
        return text_to_tokens(self.messages)

    def last_role(self):
        return Role(self.messages[-1]["role"])

    def last_message(self):
        return self.messages[-1]["content"]


@dataclass
class ConversationResponse:
    """A response from the generation. You receive this when the **generation is done**, or for non-streamed requests."""

    conversation: Conversation
    response: str | list[str]
    raw_response: list[ChatCompletion] | list[ChatCompletionChunk]
copeai_backend/exception/LockedConversationException.py (new file, 7 lines added)
@@ -0,0 +1,7 @@
class ConversationLockedException(Exception):
    """Raised when there is already an ongoing conversation."""

    def __init__(self):
        super().__init__(
            "There is already an ongoing conversation. Please wait until it is finished."
        )
copeai_backend/exception/__init__.py (new file, 1 line added)
@@ -0,0 +1 @@
from .LockedConversationException import ConversationLockedException
copeai_backend/generate.py (new file, 93 lines added)
@@ -0,0 +1,93 @@
import json
import traceback
import requests
import openai

import asyncio
from dotenv import load_dotenv
import os

from .conversation import (
    Conversation,
    Role,
    ConversationResponse,
    GeneratingResponseChunk,
)
from .models import Model
from .exception import ConversationLockedException

load_dotenv()

oclient = openai.AsyncOpenAI(api_key=os.environ.get("OPENAI_KEY"))


async def simple_process_text(
    conversation: Conversation,
    model: Model,
    new_message: str,
    additional_args: dict = {},
) -> ConversationResponse:
    conversation.add_message(Role.USER, new_message)
    conversation.last_used_model = model
    r = await oclient.chat.completions.create(
        model=model.id, messages=conversation.messages, **additional_args
    )
    conversation.add_message(Role.ASSISTANT, r.choices[0].message.content)
    return ConversationResponse(conversation, r.choices[0].message.content, r)


async def process_text_streaming(
    conversation: Conversation,
    model: Model,
    new_message: str,
    additional_args: dict = {},
):
    if conversation.locked:
        raise ConversationLockedException()

    try:
        text_parts = []
        resp_parts = []

        conversation.add_message(
            Role.USER,
            new_message,
            (additional_args["userid"] if "userid" in additional_args else "unknown"),
        )
        conversation.last_used_model = model
        conversation.locked = True

        if model.service == "openai":
            response = await oclient.chat.completions.create(
                model=model.id,
                messages=conversation.messages,
                temperature=0.9,
                top_p=1.0,
                presence_penalty=0.6,
                frequency_penalty=0.0,
                max_tokens=4096,
                stream=True,
            )

            async for chunk in response:
                partition = chunk.choices[0].delta
                if (
                    "content"
                    in json.loads(chunk.model_dump_json())["choices"][0]["delta"].keys()
                ):
                    if partition.content is not None:
                        text_parts.append(partition.content)
                        resp_parts.append(chunk)
                        yield GeneratingResponseChunk(partition.content, chunk)

                if conversation.interrupted:
                    # Interrupted: unlock, store the partial reply and stop generating.
                    conversation.locked = False
                    conversation.interrupted = False
                    conversation.add_message(Role.ASSISTANT, "".join(text_parts))
                    yield ConversationResponse(conversation, text_parts, resp_parts)
                    return

            # Generation finished normally: unlock before storing the full reply.
            conversation.locked = False
            conversation.add_message(Role.ASSISTANT, "".join(text_parts))
            yield ConversationResponse(conversation, text_parts, resp_parts)

    except Exception as e:
        conversation.locked = False
        raise e
copeai_backend/models.py (new file, 17 lines added)
@@ -0,0 +1,17 @@
from dataclasses import dataclass
from typing import Literal


Service = Literal["openai", "bard"]


@dataclass
class Model:
    id: str
    usage_name: str
    service: Service


GPT_3 = Model(id="gpt-3.5-turbo-16k-0613", usage_name="GPT-3", service="openai")

GPT_4 = Model(id="gpt-4-16k-0613", usage_name="GPT-4", service="openai")
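The example files below mention adding your own models; a new entry is just another Model instance alongside GPT_3 and GPT_4. A minimal sketch (the variable name and model ID here are illustrative, not part of this commit):

# Hypothetical extra model entry; use whatever model ID your account has access to.
GPT_4_TURBO = Model(id="gpt-4-turbo", usage_name="GPT-4 Turbo", service="openai")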
examples/basic-generation.py (new file, 42 lines added)
@@ -0,0 +1,42 @@
# fmt: off

from copeai_backend import generate, models, conversation
import asyncio


async def main():
    # Add a base prompt, if you wish to.
    conversation.BASE_PROMPT = "You are CopeAI. You are kind, and useful. Answer to questions properly and make sure that it is really useful."

    # Create a conversation object that stores the message history.
    conv = generate.Conversation(
        add_base_prompt=True,  # Add the base prompt to the conversation. Defaults to True;
                               # the base prompt is empty by default, so you must set it yourself.
        storage={},            # If you need to store some data alongside the conversation.
    )

    # Generate a response. This is a non-streamed request, so it returns a single
    # ConversationResponse object once generation has finished.
    response: generate.ConversationResponse = await generate.simple_process_text(
        conversation=conv,                  # The conversation object.
        model=models.GPT_3,                 # The model to use. Add your own models in copeai_backend/models.py.
        new_message="Hello, how are you?",  # The message to send.
        # additional_args={}                # Additional arguments to send to the API. These differ per API.
    )

    # Print the response.
    print(response.response)

    # The assistant's reply is automatically added to the conversation object.
    # Add a new user message.
    conv.add_message(
        role=generate.Role.USER,      # The role of the message: generate.Role.USER, generate.Role.ASSISTANT, or generate.Role.SYSTEM.
        message="I am fine, thanks!"  # The message.
    )

    # Generate a response. Note that simple_process_text appends new_message as another user message.
    response: generate.ConversationResponse = await generate.simple_process_text(
        conversation=conv,
        model=models.GPT_3,
        new_message="...",
    )


asyncio.run(main())
examples/streamed-generation.py (new file, 42 lines added)
@@ -0,0 +1,42 @@
# fmt: off

from copeai_backend import generate, models, conversation
import asyncio


async def main():
    # Add a base prompt, if you wish to.
    conversation.BASE_PROMPT = "You are CopeAI. You are kind, and useful. Answer to questions properly and make sure that it is really useful."

    # Create a conversation object that stores the message history.
    conv = generate.Conversation(
        add_base_prompt=True,  # Add the base prompt to the conversation. Defaults to True;
                               # the base prompt is empty by default, so you must set it yourself.
        storage={},            # If you need to store some data alongside the conversation.
    )

    # Generate a response. This is a non-streamed request, so it returns a single
    # ConversationResponse object once generation has finished.
    response: generate.ConversationResponse = await generate.simple_process_text(
        conversation=conv,                  # The conversation object.
        model=models.GPT_3,                 # The model to use. Add your own models in copeai_backend/models.py.
        new_message="Hello, how are you?",  # The message to send.
        # additional_args={}                # Additional arguments to send to the API. These differ per API.
    )

    # Print the response.
    print(response.response)

    # The assistant's reply is automatically added to the conversation object.
    # Add a new user message.
    conv.add_message(
        role=generate.Role.USER,      # The role of the message: generate.Role.USER, generate.Role.ASSISTANT, or generate.Role.SYSTEM.
        message="I am fine, thanks!"  # The message.
    )

    # Generate a response. Note that simple_process_text appends new_message as another user message.
    response: generate.ConversationResponse = await generate.simple_process_text(
        conversation=conv,
        model=models.GPT_3,
        new_message="...",
    )


asyncio.run(main())
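As committed, examples/streamed-generation.py mirrors the basic example and does not yet consume the stream. A minimal sketch of how process_text_streaming could be consumed, using only the API defined above (the stream_demo function name and printing logic are illustrative):

import asyncio

from copeai_backend import generate, models


async def stream_demo():
    conv = generate.Conversation(add_base_prompt=False)
    # process_text_streaming is an async generator: it yields GeneratingResponseChunk
    # objects while tokens arrive, then a final ConversationResponse.
    async for part in generate.process_text_streaming(
        conversation=conv,
        model=models.GPT_3,
        new_message="Hello, how are you?",
    ):
        if isinstance(part, generate.GeneratingResponseChunk):
            print(part.text, end="", flush=True)  # partial text as it streams
        else:  # final generate.ConversationResponse
            print()
            print("Full reply:", "".join(part.response))


asyncio.run(stream_demo())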
requirements.txt (new file, 4 lines added)
@@ -0,0 +1,4 @@
openai
tiktoken
python-dotenv
discord