You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
swarms/swarms/utils/llm.py

75 lines
2.8 KiB

from typing import Optional
import os
import logging
from langchain import PromptTemplate, HuggingFaceHub, ChatOpenAI, LLMChain
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
class LLM:
def __init__(self,
openai_api_key: Optional[str] = None,
hf_repo_id: Optional[str] = None,
hf_api_token: Optional[str] = None,
temperature: Optional[float] = 0.5,
max_length: Optional[int] = 64):
# Check if keys are in the environment variables
openai_api_key = openai_api_key or os.getenv('OPENAI_API_KEY')
hf_api_token = hf_api_token or os.getenv('HUGGINGFACEHUB_API_TOKEN')
self.openai_api_key = openai_api_key
self.hf_repo_id = hf_repo_id
self.hf_api_token = hf_api_token
self.temperature = temperature
self.max_length = max_length
# If the HuggingFace API token is provided, set it in environment variables
if self.hf_api_token:
os.environ["HUGGINGFACEHUB_API_TOKEN"] = self.hf_api_token
# Initialize the LLM object
self.initialize_llm()
def initialize_llm(self):
model_kwargs = {"temperature": self.temperature, "max_length": self.max_length}
try:
if self.hf_repo_id and self.hf_api_token:
self.llm = HuggingFaceHub(repo_id=self.hf_repo_id, model_kwargs=model_kwargs)
elif self.openai_api_key:
self.llm = ChatOpenAI(api_key=self.openai_api_key, model_kwargs=model_kwargs)
else:
raise ValueError("Please provide either OpenAI API key or both HuggingFace repository ID and API token.")
except Exception as e:
logger.error("Failed to initialize LLM: %s", e)
raise
def run(self, prompt: str) -> str:
template = """Question: {question}
Answer: Let's think step by step."""
try:
prompt_template = PromptTemplate(template=template, input_variables=["question"])
llm_chain = LLMChain(prompt=prompt_template, llm=self.llm)
return llm_chain.run({"question": prompt})
except Exception as e:
logger.error("Failed to generate response: %s", e)
raise
# # example
# from swarms.utils.llm import LLM
# llm_instance = LLM(openai_api_key="your_openai_key")
# result = llm_instance.run("Who won the FIFA World Cup in 1998?")
# print(result)
# # using HuggingFaceHub
# llm_instance = LLM(hf_repo_id="google/flan-t5-xl", hf_api_token="your_hf_api_token")
# result = llm_instance.run("Who won the FIFA World Cup in 1998?")
# print(result)
# make super easy to chaneg parameters, in class, use cpu and
#add qlora, 8bit inference
# look into adding deepspeed