[OMNIMODALAGENT Fix]

pull/286/head
Kye 1 year ago
parent 03d6f689ef
commit ff7bcec999

@ -39,9 +39,26 @@ For streaming mode, this function yields the response token by token, ensuring a
## Examples & Use Cases ## Examples & Use Cases
Initialize the `OmniModalAgent` and communicate with it: Initialize the `OmniModalAgent` and communicate with it:
```python ```python
from swarms import OmniModalAgent, OpenAIChat from swarms.agents.omni_modal_agent import OmniModalAgent, OpenAIChat
llm_instance = OpenAIChat() from swarms.models import OpenAIChat
agent = OmniModalAgent(llm_instance) from dotenv import load_dotenv
import os
# Load the environment variables
load_dotenv()
# Get the API key from the environment
api_key = os.environ.get("OPENAI_API_KEY")
# Initialize the language model
llm = OpenAIChat(
temperature=0.5,
model_name="gpt-4",
openai_api_key=api_key,
)
agent = OmniModalAgent(llm)
response = agent.run("Translate 'Hello' to French.") response = agent.run("Translate 'Hello' to French.")
print(response) print(response)
``` ```

@ -311,4 +311,3 @@ class BaseMultiModalModel:
def set_max_length(self, max_length): def set_max_length(self, max_length):
"""Set max_length""" """Set max_length"""
self.max_length = max_length self.max_length = max_length

@ -1,4 +1,3 @@
from PIL import Image from PIL import Image
from termcolor import colored from termcolor import colored
from transformers import ( from transformers import (
@ -15,7 +14,7 @@ class Fuyu(BaseMultiModalModel):
""" """
Fuyu model by Adept Fuyu model by Adept
Args: Args:
BaseMultiModalModel (BaseMultiModalModel): [description] BaseMultiModalModel (BaseMultiModalModel): [description]
model_name (str, optional): [description]. Defaults to "adept/fuyu-8b". model_name (str, optional): [description]. Defaults to "adept/fuyu-8b".
@ -23,9 +22,9 @@ class Fuyu(BaseMultiModalModel):
max_new_tokens (int, optional): [description]. Defaults to 500. max_new_tokens (int, optional): [description]. Defaults to 500.
*args: [description] *args: [description]
**kwargs: [description] **kwargs: [description]
Examples: Examples:
>>> from swarms.models import Fuyu >>> from swarms.models import Fuyu
>>> model = Fuyu() >>> model = Fuyu()
@ -45,9 +44,7 @@ class Fuyu(BaseMultiModalModel):
self.device_map = device_map self.device_map = device_map
self.max_new_tokens = max_new_tokens self.max_new_tokens = max_new_tokens
self.tokenizer = AutoTokenizer.from_pretrained( self.tokenizer = AutoTokenizer.from_pretrained(model_name)
model_name
)
self.image_processor = FuyuImageProcessor() self.image_processor = FuyuImageProcessor()
self.processor = FuyuProcessor( self.processor = FuyuProcessor(
image_processor=self.image_processor, image_processor=self.image_processor,
@ -111,4 +108,4 @@ class Fuyu(BaseMultiModalModel):
), ),
"red", "red",
) )
) )

@ -1,4 +1,3 @@
from unittest.mock import patch from unittest.mock import patch
import pytest import pytest
@ -127,7 +126,6 @@ def test_processor_initialization(fuyu_instance):
assert isinstance(fuyu_instance.processor, FuyuProcessor) assert isinstance(fuyu_instance.processor, FuyuProcessor)
# Test `get_img` method with a valid image path # Test `get_img` method with a valid image path
def test_get_img_valid_path(fuyu_instance): def test_get_img_valid_path(fuyu_instance):
with patch("PIL.Image.open") as mock_open: with patch("PIL.Image.open") as mock_open:
@ -135,6 +133,7 @@ def test_get_img_valid_path(fuyu_instance):
result = fuyu_instance.get_img("valid/path/to/image.png") result = fuyu_instance.get_img("valid/path/to/image.png")
assert result == "Test image" assert result == "Test image"
# Test `get_img` method with an invalid image path # Test `get_img` method with an invalid image path
def test_get_img_invalid_path(fuyu_instance): def test_get_img_invalid_path(fuyu_instance):
with patch("PIL.Image.open") as mock_open: with patch("PIL.Image.open") as mock_open:
@ -142,39 +141,55 @@ def test_get_img_invalid_path(fuyu_instance):
with pytest.raises(FileNotFoundError): with pytest.raises(FileNotFoundError):
fuyu_instance.get_img("invalid/path/to/image.png") fuyu_instance.get_img("invalid/path/to/image.png")
# Test `run` method with valid inputs # Test `run` method with valid inputs
def test_run_valid_inputs(fuyu_instance): def test_run_valid_inputs(fuyu_instance):
with patch.object(fuyu_instance, "get_img") as mock_get_img, \ with patch.object(
patch.object(fuyu_instance, "processor") as mock_processor, \ fuyu_instance, "get_img"
patch.object(fuyu_instance, "model") as mock_model: ) as mock_get_img, patch.object(
fuyu_instance, "processor"
) as mock_processor, patch.object(
fuyu_instance, "model"
) as mock_model:
mock_get_img.return_value = "Test image" mock_get_img.return_value = "Test image"
mock_processor.return_value = {"input_ids": torch.tensor([1, 2, 3])} mock_processor.return_value = {
"input_ids": torch.tensor([1, 2, 3])
}
mock_model.generate.return_value = torch.tensor([1, 2, 3]) mock_model.generate.return_value = torch.tensor([1, 2, 3])
mock_processor.batch_decode.return_value = ["Test text"] mock_processor.batch_decode.return_value = ["Test text"]
result = fuyu_instance.run("Hello, world!", "valid/path/to/image.png") result = fuyu_instance.run(
"Hello, world!", "valid/path/to/image.png"
)
assert result == ["Test text"] assert result == ["Test text"]
# Test `run` method with invalid text input # Test `run` method with invalid text input
def test_run_invalid_text_input(fuyu_instance): def test_run_invalid_text_input(fuyu_instance):
with pytest.raises(Exception): with pytest.raises(Exception):
fuyu_instance.run(None, "valid/path/to/image.png") fuyu_instance.run(None, "valid/path/to/image.png")
# Test `run` method with empty text input # Test `run` method with empty text input
def test_run_empty_text_input(fuyu_instance): def test_run_empty_text_input(fuyu_instance):
with pytest.raises(Exception): with pytest.raises(Exception):
fuyu_instance.run("", "valid/path/to/image.png") fuyu_instance.run("", "valid/path/to/image.png")
# Test `run` method with very long text input # Test `run` method with very long text input
def test_run_very_long_text_input(fuyu_instance): def test_run_very_long_text_input(fuyu_instance):
with pytest.raises(Exception): with pytest.raises(Exception):
fuyu_instance.run("A" * 10000, "valid/path/to/image.png") fuyu_instance.run("A" * 10000, "valid/path/to/image.png")
# Test `run` method with invalid image path # Test `run` method with invalid image path
def test_run_invalid_image_path(fuyu_instance): def test_run_invalid_image_path(fuyu_instance):
with patch.object(fuyu_instance, "get_img") as mock_get_img: with patch.object(fuyu_instance, "get_img") as mock_get_img:
mock_get_img.side_effect = FileNotFoundError mock_get_img.side_effect = FileNotFoundError
with pytest.raises(FileNotFoundError): with pytest.raises(FileNotFoundError):
fuyu_instance.run("Hello, world!", "invalid/path/to/image.png") fuyu_instance.run(
"Hello, world!", "invalid/path/to/image.png"
)
# Test `__init__` method with default parameters # Test `__init__` method with default parameters
def test_init_default_parameters(): def test_init_default_parameters():
@ -183,10 +198,10 @@ def test_init_default_parameters():
assert fuyu_instance.device_map == "auto" assert fuyu_instance.device_map == "auto"
assert fuyu_instance.max_new_tokens == 500 assert fuyu_instance.max_new_tokens == 500
# Test `__init__` method with custom parameters # Test `__init__` method with custom parameters
def test_init_custom_parameters(): def test_init_custom_parameters():
fuyu_instance = Fuyu("custom/path", "cpu", 1000) fuyu_instance = Fuyu("custom/path", "cpu", 1000)
assert fuyu_instance.pretrained_path == "custom/path" assert fuyu_instance.pretrained_path == "custom/path"
assert fuyu_instance.device_map == "cpu" assert fuyu_instance.device_map == "cpu"
assert fuyu_instance.max_new_tokens == 1000 assert fuyu_instance.max_new_tokens == 1000

@ -157,16 +157,18 @@ def test_run_batched_mode_false(idefics_instance):
assert result == ["Test"] assert result == ["Test"]
# Test `run` method with an exception # Test `run` method with an exception
def test_run_with_exception(idefics_instance): def test_run_with_exception(idefics_instance):
task = "User: Test" task = "User: Test"
with patch.object( with patch.object(
idefics_instance, "processor" idefics_instance, "processor"
) as mock_processor: ) as mock_processor:
mock_processor.side_effect = Exception('Test exception') mock_processor.side_effect = Exception("Test exception")
with pytest.raises(Exception): with pytest.raises(Exception):
idefics_instance.run(task) idefics_instance.run(task)
# Test `set_model_name` method # Test `set_model_name` method
def test_set_model_name(idefics_instance): def test_set_model_name(idefics_instance):
new_model_name = "new_model_name" new_model_name = "new_model_name"
@ -182,6 +184,7 @@ def test_set_model_name(idefics_instance):
new_model_name, torch_dtype=torch.bfloat16 new_model_name, torch_dtype=torch.bfloat16
) )
# Test `__init__` method with device set to None # Test `__init__` method with device set to None
def test_init_device_none(): def test_init_device_none():
with patch( with patch(
@ -191,6 +194,7 @@ def test_init_device_none():
instance = Idefics(device=None) instance = Idefics(device=None)
assert instance.device == "cpu" assert instance.device == "cpu"
# Test `__init__` method with device set to "cuda" # Test `__init__` method with device set to "cuda"
def test_init_device_cuda(): def test_init_device_cuda():
with patch( with patch(
@ -198,4 +202,4 @@ def test_init_device_cuda():
return_value=True, return_value=True,
): ):
instance = Idefics(device="cuda") instance = Idefics(device="cuda")
assert instance.device == "cuda" assert instance.device == "cuda"

Loading…
Cancel
Save