You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							36 lines
						
					
					
						
							732 B
						
					
					
				
			
		
		
	
	
							36 lines
						
					
					
						
							732 B
						
					
					
				| # Description: This is an example of how to use the Agent class to run a multi-modal workflow
 | |
| import os
 | |
| 
 | |
| from dotenv import load_dotenv
 | |
| 
 | |
| from swarms import Agent, GPT4VisionAPI
 | |
| 
 | |
| # Load the environment variables
 | |
| load_dotenv()
 | |
| 
 | |
| # Get the API key from the environment
 | |
| api_key = os.environ.get("OPENAI_API_KEY")
 | |
| 
 | |
| # Initialize the language model
 | |
| llm = GPT4VisionAPI(
 | |
|     openai_api_key=api_key,
 | |
|     max_tokens=500,
 | |
| )
 | |
| 
 | |
| # Initialize the language model
 | |
| task = "What is the color of the object?"
 | |
| img = "images/swarms.jpeg"
 | |
| 
 | |
| ## Initialize the workflow
 | |
| agent = Agent(
 | |
|     llm=llm,
 | |
|     max_loops="auto",
 | |
|     autosave=True,
 | |
|     dashboard=True,
 | |
|     multi_modal=True,
 | |
| )
 | |
| 
 | |
| # Run the workflow on a task
 | |
| out = agent.run(task=task, img=img)
 | |
| print(out)
 |