[FEAT][GenerationOutputMetadata]

pull/449/head
Kye 9 months ago
parent 5728bff63a
commit cad23b9471

@ -12,6 +12,7 @@ class Schema(BaseModel):
..., title="List of courses the person is taking"
)
# Convert the schema to a JSON string
tool_schema = Schema(
name="Tool Name",
@ -42,9 +43,9 @@ agent = Agent(
output_type=tool_schema, # or dict, or str
metadata_output_type="json",
# List of schemas that the agent can handle
list_tool_schemas = [tool_schema],
function_calling_format_type = "OpenAI",
function_calling_type = "json" # or soon yaml
list_tool_schemas=[tool_schema],
function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml
)
# Run the agent to generate the person's information

@ -5,7 +5,7 @@ build-backend = "poetry.core.masonry.api"
[tool.poetry]
name = "swarms"
version = "4.8.6"
version = "4.8.7"
description = "Swarms - Pytorch"
license = "MIT"
authors = ["Kye Gomez <kye@apac.ai>"]

@ -7,10 +7,11 @@ from langchain_community.chat_models.openai import (
from langchain.llms.anthropic import Anthropic
from langchain.llms.cohere import Cohere
from langchain.llms.mosaicml import MosaicML
from langchain.llms.openai import OpenAI #, OpenAIChat, AzureOpenAI
from langchain.llms.openai import OpenAI # , OpenAIChat, AzureOpenAI
from langchain_community.llms.octoai_endpoint import OctoAIEndpoint
from langchain.llms.replicate import Replicate
class AnthropicChat(Anthropic):
def __call__(self, *args, **kwargs):
return self.invoke(*args, **kwargs)

@ -323,10 +323,7 @@ class Agent:
# If the stopping function is provided then set the stopping condition to the stopping function
self.short_memory = Conversation(
system_prompt=system_prompt,
time_enabled=True,
*args,
**kwargs
system_prompt=system_prompt, time_enabled=True, *args, **kwargs
)
# If the docs exist then ingest the docs
@ -467,6 +464,48 @@ class Agent:
except Exception as error:
print(colored(f"Error adding task to memory: {error}", "red"))
# ############## TOKENIZER FUNCTIONS ##############
def count_tokens(self, text: str) -> int:
"""Count the number of tokens in the text."""
return self.tokenizer.len(text)
def tokens_per_second(self, text: str) -> float:
"""
Calculates the number of tokens processed per second.
Args:
text (str): The input text to count tokens from.
Returns:
float: The number of tokens processed per second.
"""
import time
start_time = time.time()
tokens = self.count_tokens(text)
end_time = time.time()
elapsed_time = end_time - start_time
return tokens / elapsed_time
def time_to_generate(self, text: str) -> float:
"""
Calculates the time taken to generate the output.
Args:
text (str): The input text to generate output from.
Returns:
float: The time taken to generate the output.
"""
import time
start_time = time.time()
self.llm(text)
end_time = time.time()
return end_time - start_time
# ############## TOKENIZER FUNCTIONS ##############
def add_message_to_memory(self, message: str):
"""Add the message to the memory"""
try:

@ -81,7 +81,6 @@ class BaseStructure:
self.save_metadata_path = save_metadata_path
self.save_error_path = save_error_path
def run(self, *args, **kwargs):
"""Run the structure."""

@ -164,3 +164,91 @@ class ManySteps(BaseModel):
[],
description="A list of task steps.",
)
class GenerationOutputMetadata(BaseModel):
num_of_tokens: int = Field(
...,
description="The number of tokens generated.",
examples=[7894],
)
estimated_cost: str = Field(
...,
description="The estimated cost of the generation.",
examples=["0,24$"],
)
time_to_generate: str = Field(
...,
description="The time taken to generate the output.",
examples=["1.2s"],
)
tokens_per_second: int = Field(
...,
description="The number of tokens generated per second.",
examples=[657],
)
model_name: str = Field(
...,
description="The model used to generate the output.",
examples=["gpt-3.5-turbo"],
)
max_tokens: int = Field(
...,
description="The maximum number of tokens allowed to generate.",
examples=[2048],
)
temperature: float = Field(
...,
description="The temperature used for generation.",
examples=[0.7],
)
top_p: float = Field(
...,
description="The top p value used for generation.",
examples=[0.9],
)
frequency_penalty: float = Field(
...,
description="The frequency penalty used for generation.",
examples=[0.0],
)
presence_penalty: float = Field(
...,
description="The presence penalty used for generation.",
examples=[0.0],
)
stop_sequence: str | None = Field(
None,
description="The sequence used to stop the generation.",
examples=["<stop_sequence>"],
)
model_type: str = Field(
...,
description="The type of model used for generation.",
examples=["text"],
)
model_version: str = Field(
...,
description="The version of the model used for generation.",
examples=["1.0.0"],
)
model_description: str = Field(
...,
description="The description of the model used for generation.",
examples=["A model that generates text."],
)
model_author: str = Field(
...,
description="The author of the model used for generation.",
examples=["John Doe"],
)
n: int = Field(
...,
description="The number of outputs generated.",
examples=[1],
)
n_best: int = Field(
...,
description="The number of best outputs generated.",
examples=[1],
)

@ -1,4 +1,4 @@
from typing import Any, Optional, List
from typing import Any, List
from docstring_parser import parse
from pydantic import BaseModel
@ -72,7 +72,7 @@ def pydantic_to_functions(
def multi_pydantic_to_functions(
pydantic_types: List[BaseModel] = None
pydantic_types: List[BaseModel] = None,
) -> dict[str, Any]:
"""
Converts multiple Pydantic types to a dictionary of functions.

Loading…
Cancel
Save