wip
This commit is contained in:
parent
671bd13cd8
commit
28749f0526
1
.env.example
Normal file
1
.env.example
Normal file
@ -0,0 +1 @@
|
|||||||
|
OPENAI_KEY = sk...
|
17
.vscode/launch.json
vendored
Normal file
17
.vscode/launch.json
vendored
Normal file
@ -0,0 +1,17 @@
|
|||||||
|
{
|
||||||
|
// Use IntelliSense to learn about possible attributes.
|
||||||
|
// Hover to view descriptions of existing attributes.
|
||||||
|
// For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
|
||||||
|
"version": "0.2.0",
|
||||||
|
"configurations": [
|
||||||
|
{
|
||||||
|
"name": "Python: Current File",
|
||||||
|
"type": "python",
|
||||||
|
"request": "launch",
|
||||||
|
"program": "${file}",
|
||||||
|
"console": "integratedTerminal",
|
||||||
|
"cwd": "${workspaceFolder}",
|
||||||
|
"justMyCode": false
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
4
.vscode/settings.json
vendored
Normal file
4
.vscode/settings.json
vendored
Normal file
@ -0,0 +1,4 @@
|
|||||||
|
{
|
||||||
|
"python.analysis.autoImportCompletions": true,
|
||||||
|
"python.analysis.typeCheckingMode": "basic"
|
||||||
|
}
|
@ -1,3 +1,3 @@
|
|||||||
# copeai-ai-backend
|
# ai
|
||||||
|
|
||||||
CopeAI Backend AI
|
[Showdown76py](https://github.com/showdown76py)'s "AI lib"
|
||||||
|
3
copeai_backend/__init__.py
Normal file
3
copeai_backend/__init__.py
Normal file
@ -0,0 +1,3 @@
|
|||||||
|
from .conversation import Conversation, ConversationResponse, Role
|
||||||
|
from .generate import process_text_streaming, simple_process_text
|
||||||
|
from .models import Model, Service, GPT_3, GPT_4
|
101
copeai_backend/conversation.py
Normal file
101
copeai_backend/conversation.py
Normal file
@ -0,0 +1,101 @@
|
|||||||
|
from dataclasses import dataclass
|
||||||
|
import typing
|
||||||
|
from openai import AsyncStream
|
||||||
|
from openai.types.chat import ChatCompletionChunk, ChatCompletion
|
||||||
|
import tiktoken
|
||||||
|
from enum import Enum
|
||||||
|
|
||||||
|
from copeai_backend.exception import ConversationLockedException
|
||||||
|
|
||||||
|
from . import models
|
||||||
|
|
||||||
|
encoding = tiktoken.get_encoding("cl100k_base")
|
||||||
|
|
||||||
|
BASE_PROMPT = ""
|
||||||
|
|
||||||
|
|
||||||
|
def text_to_tokens(string_or_messages: str | list[str | dict | list]) -> int:
|
||||||
|
"""Returns the number of tokens in a text string."""
|
||||||
|
num_tokens = 0
|
||||||
|
|
||||||
|
messages = []
|
||||||
|
if isinstance(string_or_messages, str):
|
||||||
|
messages = [{"role": "user", "content": string_or_messages}]
|
||||||
|
else:
|
||||||
|
messages = string_or_messages
|
||||||
|
|
||||||
|
for message in messages:
|
||||||
|
# every message follows <im_start>{role/name}\n{content}<im_end>\n
|
||||||
|
num_tokens += 4
|
||||||
|
|
||||||
|
if isinstance(message, dict):
|
||||||
|
for key, value in message.items():
|
||||||
|
num_tokens += len(encoding.encode(str(value)))
|
||||||
|
if key == "name": # if there's a name, the role is omitted
|
||||||
|
num_tokens += -1 # role is always required and always 1 token
|
||||||
|
elif isinstance(message, list):
|
||||||
|
for item in message:
|
||||||
|
if item["type"] == "text":
|
||||||
|
num_tokens += len(encoding.encode(item["text"]))
|
||||||
|
elif isinstance(message, str):
|
||||||
|
num_tokens += len(encoding.encode(message))
|
||||||
|
num_tokens += 2 # every reply is primed with <im_start>assistant
|
||||||
|
|
||||||
|
return num_tokens
|
||||||
|
|
||||||
|
|
||||||
|
class Role(Enum):
|
||||||
|
SYSTEM = "system"
|
||||||
|
USER = "user"
|
||||||
|
ASSISTANT = "assistant"
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class GeneratingResponseChunk:
|
||||||
|
"""A chunk of a response from the model. You receive this when the **generation is still going on**, and streamed."""
|
||||||
|
|
||||||
|
text: str
|
||||||
|
raw: ChatCompletionChunk
|
||||||
|
|
||||||
|
|
||||||
|
class Conversation:
|
||||||
|
def __init__(self, add_base_prompt: bool = True, storage: dict = {}) -> None:
|
||||||
|
self.messages = []
|
||||||
|
self.last_used_model: models.Model | None = None
|
||||||
|
self.locked = False
|
||||||
|
self.interruput = False
|
||||||
|
self.store = storage
|
||||||
|
|
||||||
|
if add_base_prompt and BASE_PROMPT:
|
||||||
|
self.messages.append({"role": Role.SYSTEM, "content": BASE_PROMPT})
|
||||||
|
|
||||||
|
def add_message(self, role: Role, message, username: str | None = None):
|
||||||
|
if not self.locked:
|
||||||
|
d = {"role": role.value, "content": message}
|
||||||
|
if username:
|
||||||
|
d["name"] = username
|
||||||
|
self.messages.append(d)
|
||||||
|
else:
|
||||||
|
raise ConversationLockedException()
|
||||||
|
|
||||||
|
def interrupt(self):
|
||||||
|
"""Interrupts any conversations going on."""
|
||||||
|
self.interruput = True
|
||||||
|
|
||||||
|
def get_tokens(self):
|
||||||
|
return text_to_tokens(self.messages)
|
||||||
|
|
||||||
|
def last_role(self):
|
||||||
|
return Role(self.messages[-1]["role"])
|
||||||
|
|
||||||
|
def last_message(self):
|
||||||
|
return self.messages[-1]["content"]
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ConversationResponse:
|
||||||
|
"""A response from the generation. You receive this when the **generation is done**, or non-streamed requests."""
|
||||||
|
|
||||||
|
conversation: Conversation
|
||||||
|
response: str | list[str]
|
||||||
|
raw_response: list[ChatCompletion] | list[ChatCompletionChunk]
|
7
copeai_backend/exception/LockedConversationException.py
Normal file
7
copeai_backend/exception/LockedConversationException.py
Normal file
@ -0,0 +1,7 @@
|
|||||||
|
class ConversationLockedException(Exception):
|
||||||
|
"""Raised when there is already an ongoing conversation."""
|
||||||
|
|
||||||
|
def __init__(self):
|
||||||
|
super().__init__(
|
||||||
|
"There is already an ongoing conversation. Please wait until it is finished."
|
||||||
|
)
|
1
copeai_backend/exception/__init__.py
Normal file
1
copeai_backend/exception/__init__.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
from .LockedConversationException import ConversationLockedException
|
93
copeai_backend/generate.py
Normal file
93
copeai_backend/generate.py
Normal file
@ -0,0 +1,93 @@
|
|||||||
|
import json
|
||||||
|
import traceback
|
||||||
|
import requests
|
||||||
|
import openai
|
||||||
|
|
||||||
|
import asyncio
|
||||||
|
from dotenv import load_dotenv
|
||||||
|
import os
|
||||||
|
from .conversation import (
|
||||||
|
Conversation,
|
||||||
|
Role,
|
||||||
|
ConversationResponse,
|
||||||
|
GeneratingResponseChunk,
|
||||||
|
)
|
||||||
|
from .models import Model
|
||||||
|
from .exception import ConversationLockedException
|
||||||
|
|
||||||
|
load_dotenv()
|
||||||
|
|
||||||
|
oclient = openai.AsyncOpenAI(api_key=os.environ.get("OPENAI_KEY"))
|
||||||
|
|
||||||
|
|
||||||
|
async def simple_process_text(
|
||||||
|
conversation: Conversation,
|
||||||
|
model: Model,
|
||||||
|
new_message: str,
|
||||||
|
additional_args: dict = {},
|
||||||
|
) -> ConversationResponse:
|
||||||
|
conversation.add_message(Role.USER, new_message)
|
||||||
|
conversation.last_used_model = model
|
||||||
|
r = await oclient.chat.completions.create(
|
||||||
|
model=model.id, messages=conversation.messages, **additional_args
|
||||||
|
)
|
||||||
|
conversation.add_message(Role.ASSISTANT, r.choices[0].message.content)
|
||||||
|
return ConversationResponse(conversation, r.choices[0].message.content, r)
|
||||||
|
|
||||||
|
|
||||||
|
async def process_text_streaming(
|
||||||
|
conversation: Conversation,
|
||||||
|
model: Model,
|
||||||
|
new_message: str,
|
||||||
|
additional_args: dict = {},
|
||||||
|
):
|
||||||
|
if conversation.locked:
|
||||||
|
raise ConversationLockedException()
|
||||||
|
|
||||||
|
try:
|
||||||
|
text_parts = []
|
||||||
|
resp_parts = []
|
||||||
|
|
||||||
|
conversation.add_message(
|
||||||
|
Role.USER,
|
||||||
|
new_message,
|
||||||
|
(additional_args["userid"] if "userid" in additional_args else "unknown"),
|
||||||
|
)
|
||||||
|
conversation.last_used_model = model
|
||||||
|
conversation.locked = True
|
||||||
|
if model.service == "openai":
|
||||||
|
response = await oclient.chat.completions.create(
|
||||||
|
model=model.id,
|
||||||
|
messages=conversation.messages,
|
||||||
|
temperature=0.9,
|
||||||
|
top_p=1.0,
|
||||||
|
presence_penalty=0.6,
|
||||||
|
frequency_penalty=0.0,
|
||||||
|
max_tokens=4096,
|
||||||
|
stream=True,
|
||||||
|
)
|
||||||
|
|
||||||
|
async for chunk in response:
|
||||||
|
partition = chunk.choices[0].delta
|
||||||
|
if (
|
||||||
|
"content"
|
||||||
|
in json.loads(chunk.model_dump_json())["choices"][0]["delta"].keys()
|
||||||
|
):
|
||||||
|
if partition.content is not None:
|
||||||
|
text_parts.append(partition.content)
|
||||||
|
resp_parts.append(chunk)
|
||||||
|
yield GeneratingResponseChunk(partition.content, chunk)
|
||||||
|
|
||||||
|
if conversation.interruput:
|
||||||
|
conversation.add_message(Role.ASSISTANT, text_parts)
|
||||||
|
yield ConversationResponse(conversation, text_parts, resp_parts)
|
||||||
|
|
||||||
|
conversation.locked = False
|
||||||
|
conversation.add_message(Role.ASSISTANT, text_parts)
|
||||||
|
yield ConversationResponse(conversation, text_parts, resp_parts)
|
||||||
|
|
||||||
|
conversation.locked = False
|
||||||
|
|
||||||
|
except Exception as e:
|
||||||
|
conversation.locked = False
|
||||||
|
raise e
|
17
copeai_backend/models.py
Normal file
17
copeai_backend/models.py
Normal file
@ -0,0 +1,17 @@
|
|||||||
|
from dataclasses import dataclass
|
||||||
|
from typing import Literal
|
||||||
|
|
||||||
|
|
||||||
|
Service = Literal["openai", "bard"]
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class Model:
|
||||||
|
id: str
|
||||||
|
usage_name: str
|
||||||
|
service: Service
|
||||||
|
|
||||||
|
|
||||||
|
GPT_3 = Model(id="gpt-3.5-turbo-16k-0613", usage_name="GPT-3", service="openai")
|
||||||
|
|
||||||
|
GPT_4 = Model(id="gpt-4-16k-0613", usage_name="GPT-4", service="openai")
|
42
examples/basic-generation.py
Normal file
42
examples/basic-generation.py
Normal file
@ -0,0 +1,42 @@
|
|||||||
|
# fmt: off
|
||||||
|
|
||||||
|
from copeai_backend import generate, models, conversation
|
||||||
|
import asyncio
|
||||||
|
|
||||||
|
async def main():
|
||||||
|
# Add a base prompt, if you wish to.
|
||||||
|
conversation.BASE_PROMPT = "You are CopeAI. You are kind, and useful. Answer to questions properly and make sure that it is really useful."
|
||||||
|
|
||||||
|
# Create a conversation object, that will store the history of the messages.
|
||||||
|
conv = generate.Conversation(
|
||||||
|
add_base_prompt=True, # Add the base prompt to the conversation. By default, it is True.
|
||||||
|
# However, the base prompt is empty by default. You must set it yourself.
|
||||||
|
storage={} # If you need to store some data.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Generate a response. This is a non-streamed request, so it will return a ConversationResponse object. This is a blocking call.
|
||||||
|
response: generate.ConversationResponse = await generate.simple_process_text(
|
||||||
|
conversation=conv, # The conversation object.
|
||||||
|
model=models.GPT_3, # The model to use. Add your own models to the MODELS dict in models.py.
|
||||||
|
new_message="Hello, how are you?", # The message to send.
|
||||||
|
# additional_args={} # Additional arguments to send to the API. These are different for each API.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Print the response.
|
||||||
|
print(response.response)
|
||||||
|
|
||||||
|
# The assistant's message is automatically implemented into the conversation object.
|
||||||
|
# Add a new user message.
|
||||||
|
conv.add_message(
|
||||||
|
role=generate.Role.USER, # The role of the message. This is an enum, so you can use generate.Role.USER, generate.Role.ASSISTANT, or generate.Role.SYSTEM.
|
||||||
|
message="I am fine, thanks!" # The message.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Generate a response.
|
||||||
|
response: generate.ConversationResponse = await generate.simple_process_text(
|
||||||
|
conversation=conv,
|
||||||
|
model=models.GPT_3,
|
||||||
|
new_message="...",
|
||||||
|
)
|
||||||
|
|
||||||
|
asyncio.run(main())
|
42
examples/streamed-generation.py
Normal file
42
examples/streamed-generation.py
Normal file
@ -0,0 +1,42 @@
|
|||||||
|
# fmt: off
|
||||||
|
|
||||||
|
from copeai_backend import generate, models, conversation
|
||||||
|
import asyncio
|
||||||
|
|
||||||
|
async def main():
|
||||||
|
# Add a base prompt, if you wish to.
|
||||||
|
conversation.BASE_PROMPT = "You are CopeAI. You are kind, and useful. Answer to questions properly and make sure that it is really useful."
|
||||||
|
|
||||||
|
# Create a conversation object, that will store the history of the messages.
|
||||||
|
conv = generate.Conversation(
|
||||||
|
add_base_prompt=True, # Add the base prompt to the conversation. By default, it is True.
|
||||||
|
# However, the base prompt is empty by default. You must set it yourself.
|
||||||
|
storage={} # If you need to store some data.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Generate a response. This is a non-streamed request, so it will return a ConversationResponse object. This is a blocking call.
|
||||||
|
response: generate.ConversationResponse = await generate.simple_process_text(
|
||||||
|
conversation=conv, # The conversation object.
|
||||||
|
model=models.GPT_3, # The model to use. Add your own models to the MODELS dict in models.py.
|
||||||
|
new_message="Hello, how are you?", # The message to send.
|
||||||
|
# additional_args={} # Additional arguments to send to the API. These are different for each API.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Print the response.
|
||||||
|
print(response.response)
|
||||||
|
|
||||||
|
# The assistant's message is automatically implemented into the conversation object.
|
||||||
|
# Add a new user message.
|
||||||
|
conv.add_message(
|
||||||
|
role=generate.Role.USER, # The role of the message. This is an enum, so you can use generate.Role.USER, generate.Role.ASSISTANT, or generate.Role.SYSTEM.
|
||||||
|
message="I am fine, thanks!" # The message.
|
||||||
|
)
|
||||||
|
|
||||||
|
# Generate a response.
|
||||||
|
response: generate.ConversationResponse = await generate.simple_process_text(
|
||||||
|
conversation=conv,
|
||||||
|
model=models.GPT_3,
|
||||||
|
new_message="...",
|
||||||
|
)
|
||||||
|
|
||||||
|
asyncio.run(main())
|
4
requirements.txt
Normal file
4
requirements.txt
Normal file
@ -0,0 +1,4 @@
|
|||||||
|
openai
|
||||||
|
tiktoken
|
||||||
|
python-dotenv
|
||||||
|
discord
|
Loading…
Reference in New Issue
Block a user