swarms/examples/demos/multi_modal_chain_of_thought/vcot_example.py

import os

from dotenv import load_dotenv

from swarm_models.gpt4_vision_api import GPT4VisionAPI
from swarms.prompts.visual_cot import VISUAL_CHAIN_OF_THOUGHT
from swarms.structs import Agent

# Load the environment variables
load_dotenv()

# Get the API key from the environment
api_key = os.environ.get("OPENAI_API_KEY")

# Initialize the language model
llm = GPT4VisionAPI(
    openai_api_key=api_key,
    max_tokens=500,
)

# Initialize the task
task = "This is an eye test. What do you see?"
img = "examples/demos/multi_modal_chain_of_thought/eyetest.jpg"

## Initialize the workflow
agent = Agent(
    llm=llm,
    max_loops=2,
    autosave=True,
    sop=VISUAL_CHAIN_OF_THOUGHT,
)

# Run the workflow on a task
out = agent.run(task=task, img=img)
print(out)
[5.4.8] 5 months ago			`import os`

			`from dotenv import load_dotenv`

[CLEANUP] 4 months ago			`from swarm_models.gpt4_vision_api import GPT4VisionAPI`
[5.4.8] 5 months ago			`from swarms.prompts.visual_cot import VISUAL_CHAIN_OF_THOUGHT`
			`from swarms.structs import Agent`

			`# Load the environment variables`
			`load_dotenv()`

			`# Get the API key from the environment`
			`api_key = os.environ.get("OPENAI_API_KEY")`

			`# Initialize the language model`
			`llm = GPT4VisionAPI(`
			`openai_api_key=api_key,`
			`max_tokens=500,`
			`)`

			`# Initialize the task`
			`task = "This is an eye test. What do you see?"`
[FEAT][SpreadSheetSwarm] [FEAT][TaskQueueSwarm] 5 months ago			`img = "examples/demos/multi_modal_chain_of_thought/eyetest.jpg"`
[5.4.8] 5 months ago
			`## Initialize the workflow`
			`agent = Agent(`
			`llm=llm,`
			`max_loops=2,`
			`autosave=True,`
			`sop=VISUAL_CHAIN_OF_THOUGHT,`
			`)`

			`# Run the workflow on a task`
			`out = agent.run(task=task, img=img)`
			`print(out)`