fuyu + zephyr fixes

pull/109/head
Kye 1 year ago
parent 6b4c2d45d3
commit 9aa40842a6

@@ -1,43 +1,36 @@
 # !pip install --upgrade swarms==2.0.6
-from swarms.models import OpenAIChat
+from swarms.models import BioGPT
 from swarms.models.nougat import Nougat
 from swarms.structs import Flow
-from swarms.structs.sequential_workflow import SequentialWorkflow
 
 # # URL of the image of the financial document
 IMAGE_OF_FINANCIAL_DOC_URL = "bank_statement_2.jpg"
 
 # Example usage
-api_key = (
-    "sk-..."  # Your actual API key here
-)
+api_key = ""  # Your actual API key here
 
-# Initialize the OCR model
-def ocr_model(img: str):
-    ocr = Nougat()
-    analyze_finance_docs = ocr(img)
-    return str(analyze_finance_docs)
 
 # Initialize the language flow
-llm = OpenAIChat(
-    openai_api_key=api_key,
-    temperature=0.5,
-)
+llm = BioGPT()
 
 # Create a prompt for the language model
 def summary_agent_prompt(analyzed_doc: str):
-    analyzed_doc = ocr_model(img=analyzed_doc)
+    model = Nougat(
+        max_new_tokens=5000,
+    )
+    out = model(analyzed_doc)
 
     return f"""
     Generate an actionable summary of this financial document, provide bulletpoints:
 
     Here is the Analyzed Document:
     ---
-    {analyzed_doc}
+    {out}
     """
@@ -47,21 +40,11 @@ flow1 = Flow(llm=llm, max_loops=1, dashboard=False)
 # Create another Flow for a different task
 flow2 = Flow(llm=llm, max_loops=1, dashboard=False)
 
-# Create the workflow
-workflow = SequentialWorkflow(max_loops=1)
-
 # Add tasks to the workflow
-workflow.add(summary_agent_prompt(IMAGE_OF_FINANCIAL_DOC_URL), flow1)
+summary_agent = flow1.run(summary_agent_prompt(IMAGE_OF_FINANCIAL_DOC_URL))
 
 # Suppose the next task takes the output of the first task as input
-workflow.add(
-    "Provide an actionable step by step plan on how to cut costs from the analyzed financial document.",
-    flow2,
-)
-
-# Run the workflow
-workflow.run()
-
-# Output the results
-for task in workflow.tasks:
-    print(f"Task: {task.description}, Result: {task.result}")
+out = flow2.run(
+    f"Provide an actionable step by step plan on how to cut costs from the analyzed financial document. {summary_agent}"
+)

@@ -4,6 +4,6 @@ from swarms.models.anthropic import Anthropic
 
 model = Anthropic(anthropic_api_key="")
 
-task = "Say hello to"
+task = "What is quantum field theory? What are 3 books on the field?"
 
 print(model(task))

@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
 
 [tool.poetry]
 name = "swarms"
-version = "2.0.8"
+version = "2.1.0"
 description = "Swarms - Pytorch"
 license = "MIT"
 authors = ["Kye Gomez <kye@apac.ai>"]

@@ -43,8 +43,9 @@ class FastViT:
     To use, create a json file called: fast_vit_classes.json
     """
 
     def __init__(self):
         self.model = timm.create_model(
             "hf_hub:timm/fastvit_s12.apple_in1k", pretrained=True

@@ -1,8 +1,8 @@
 """Fuyu model by Kye"""
 from transformers import (
-    FuyuProcessor,
     FuyuForCausalLM,
     AutoTokenizer,
+    FuyuProcessor,
     FuyuImageProcessor,
 )
 from PIL import Image
@@ -50,9 +50,9 @@ class Fuyu:
         pretrained_path, device_map=device_map
     )
 
-    def __call__(self, text: str, img_path: str):
+    def __call__(self, text: str, img: str):
         """Call the model with text and img paths"""
-        image_pil = Image.open(img_path)
+        image_pil = Image.open(img)
         model_inputs = self.processor(
             text=text, images=[image_pil], device=self.device_map
         )
@@ -62,3 +62,4 @@ class Fuyu:
         output = self.model.generate(**model_inputs, max_new_tokens=self.max_new_tokens)
         text = self.processor.batch_decode(output[:, -7:], skip_special_tokens=True)
+        return str(text)
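
For reference, a usage sketch of the renamed kwarg (the import path and image filename are assumptions; the default checkpoint downloads on first use):

from swarms.models.fuyu import Fuyu  # path assumed from this repo's layout

fuyu = Fuyu()
fuyu("Summarize the contents of this image", img="receipt.png")  # img replaces the old img_path
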

@@ -0,0 +1,67 @@
+from typing import List
+
+import timm
+import torch
+from pydantic import BaseModel
+
+
+class TimmModelInfo(BaseModel):
+    model_name: str
+    pretrained: bool
+    in_chans: int
+
+    class Config:
+        # Use strict typing for all fields
+        strict = True
+
+
+class TimmModel:
+    """
+    # Usage
+    model_handler = TimmModel()
+    model_info = TimmModelInfo(model_name='resnet34', pretrained=True, in_chans=1)
+    input_tensor = torch.randn(1, 1, 224, 224)
+    output_shape = model_handler(model_info=model_info, input_tensor=input_tensor)
+    print(output_shape)
+    """
+
+    def __init__(self):
+        self.models = self._get_supported_models()
+
+    def _get_supported_models(self) -> List[str]:
+        """Retrieve the list of supported models from timm."""
+        return timm.list_models()
+
+    def _create_model(self, model_info: TimmModelInfo) -> torch.nn.Module:
+        """
+        Create a model instance from timm with specified parameters.
+
+        Args:
+            model_info: An instance of TimmModelInfo containing model specifications.
+
+        Returns:
+            An instance of a pytorch model.
+        """
+        return timm.create_model(
+            model_info.model_name,
+            pretrained=model_info.pretrained,
+            in_chans=model_info.in_chans,
+        )
+
+    def __call__(
+        self, model_info: TimmModelInfo, input_tensor: torch.Tensor
+    ) -> torch.Size:
+        """
+        Create and run a model specified by `model_info` on `input_tensor`.
+
+        Args:
+            model_info: An instance of TimmModelInfo containing model specifications.
+            input_tensor: A torch tensor representing the input data.
+
+        Returns:
+            The shape of the output from the model.
+        """
+        model = self._create_model(model_info)
+        return model(input_tensor).shape
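
A short usage sketch for the new handler, mirroring the class docstring (pretrained=False avoids a weight download; the output shape shown is what resnet34 would produce):

handler = TimmModel()
info = TimmModelInfo(model_name="resnet34", pretrained=False, in_chans=3)
x = torch.randn(1, 3, 224, 224)
print(handler(model_info=info, input_tensor=x))  # torch.Size([1, 1000])
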

@@ -25,12 +25,22 @@ class Zephyr:
     def __init__(
         self,
+        model_name: str = "HuggingFaceH4/zephyr-7b-alpha",
+        tokenize: bool = False,
+        add_generation_prompt: bool = True,
+        system_prompt: str = "You are a friendly chatbot who always responds in the style of a pirate",
         max_new_tokens: int = 300,
         temperature: float = 0.5,
         top_k: float = 50,
         top_p: float = 0.95,
+        *args,
+        **kwargs,
     ):
         super().__init__()
+        self.model_name = model_name
+        self.tokenize = tokenize
+        self.add_generation_prompt = add_generation_prompt
+        self.system_prompt = system_prompt
         self.max_new_tokens = max_new_tokens
         self.temperature = temperature
         self.top_k = top_k
@@ -38,14 +48,14 @@ class Zephyr:
         self.pipe = pipeline(
             "text-generation",
-            model="HuggingFaceH4/zephyr-7b-alpha",
+            model=self.model_name,
             torch_dtype=torch.bfloat16,
             device_map="auto",
         )
         self.messages = [
             {
                 "role": "system",
-                "content": "You are a friendly chatbot who always responds in the style of a pirate",
+                "content": f"{self.system_prompt}\n\nUser:",
             },
             {
                 "role": "user",
@@ -53,10 +63,43 @@ class Zephyr:
             },
         ]
 
-    def __call__(self, text: str):
+    def __call__(self, task: str):
         """Call the model"""
         prompt = self.pipe.tokenizer.apply_chat_template(
-            self.messages, tokenize=False, add_generation_prompt=True
+            self.messages,
+            tokenize=self.tokenize,
+            add_generation_prompt=self.add_generation_prompt,
         )
-        outputs = self.pipe(prompt, max_new_token=self.max_new_tokens)
+        outputs = self.pipe(prompt, max_new_tokens=self.max_new_tokens)
         print(outputs[0]["generated_text"])
+
+    def chat(self, message: str):
+        """
+        Adds a user message to the conversation and generates a chatbot response.
+        """
+        # Add the user message to the conversation
+        self.messages.append({"role": "user", "content": message})
+
+        # Apply the chat template to format the messages
+        prompt = self.pipe.tokenizer.apply_chat_template(
+            self.messages, tokenize=False, add_generation_prompt=True
+        )
+
+        # Generate a response
+        outputs = self.pipe(
+            prompt,
+            max_new_tokens=self.max_new_tokens,
+            do_sample=True,
+            temperature=self.temperature,
+            top_k=self.top_k,
+            top_p=self.top_p,
+        )
+
+        # Extract the generated text
+        generated_text = outputs[0]["generated_text"]
+
+        # Optionally, append the chatbot's reply back to the conversation;
+        # adjust this first so it appends only the newly generated response:
+        # self.messages.append({"role": "bot", "content": generated_text})
+        return generated_text
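
A minimal usage sketch for the new chat method (assumes hardware that can hold the 7B checkpoint; the message text is illustrative):

model = Zephyr(max_new_tokens=300)
reply = model.chat("Ahoy! What be the best way to learn Python?")
print(reply)  # includes the templated prompt, per the comment in chat()
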
