# copeai-ai-backend/examples/streamed-generation.py

# fmt: off
import asyncio
from typing import AsyncGenerator

from copeai_backend import conversation, generate, models


async def main():
    # Add a base prompt, if you wish to.
    conversation.BASE_PROMPT = (
        "You are CopeAI. You are kind and useful. Answer questions properly "
        "and make sure your answers are genuinely helpful."
    )

    # Create a conversation object that stores the message history.
    conv = generate.Conversation(
        add_base_prompt=True,  # Add the base prompt to the conversation. Defaults to True;
                               # however, the base prompt is empty by default, so you must set it yourself.
        storage={},            # A dict for any data you want to keep alongside the conversation.
    )

    # Generate a response. This is a streamed request: it yields
    # GeneratingResponseChunk objects while generating, then a final
    # ConversationResponse once generation ends. The call is non-blocking.
    response = generate.process_text_streaming(
        conversation=conv,                  # The conversation object.
        model=models.GPT_3,                 # The model to use. Add your own models to the
                                            # MODELS dict in models.py (see the note after this call).
        new_message="Hello, how are you?",  # The message to send.
        # additional_args={},               # Extra arguments forwarded to the API; these differ per API.
    )  # type: ignore
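
    # Hedged note: models.py is said to hold a MODELS dict, so registering a
    # custom model might look like the placeholder below. The expected value
    # type is not shown in this example, so treat this as purely illustrative:
    # models.MODELS["my-model"] = ...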

    async for chunk in response:
        if isinstance(chunk, conversation.GeneratingResponseChunk):
            print(chunk.text, end="")
        else:
            # The last item yielded is the ConversationResponse; use it to
            # retrieve the full response text.
            print("\nConversation ended!")
            _response = chunk.text

    # The assistant's reply is automatically appended to the conversation object.
    # Add a new user message.
    conv.add_message(
        role=generate.Role.USER,  # The role of the message. This is an enum: generate.Role.USER,
                                  # generate.Role.ASSISTANT, or generate.Role.SYSTEM.
        message="I am fine, thanks!",  # The message text.
    )
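
    # The same call can steer the model mid-conversation, e.g. with a system
    # message (same API as above, just a different role):
    # conv.add_message(role=generate.Role.SYSTEM, message="Keep answers short.")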

    # Generate another response. Note the annotation: the streamed call returns
    # an async generator, not a ConversationResponse directly.
    response: AsyncGenerator = generate.process_text_streaming(
        conversation=conv,
        model=models.GPT_3,
        new_message="...",
    )

    async for chunk in response:
        if isinstance(chunk, conversation.GeneratingResponseChunk):
            print(chunk.text, end="")
        else:
            print("\nConversation ended!")
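

# Convenience sketch (not part of copeai_backend): wrap the streamed call so a
# caller gets the final ConversationResponse back directly. This relies only on
# the chunk-then-response pattern demonstrated above.
async def ask(conv: generate.Conversation, model, text: str):
    final = None
    async for chunk in generate.process_text_streaming(
        conversation=conv,
        model=model,
        new_message=text,
    ):  # type: ignore
        if isinstance(chunk, conversation.GeneratingResponseChunk):
            print(chunk.text, end="")
        else:
            final = chunk  # the ConversationResponse from the last iteration
    return final

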
asyncio.run(main())