You cannot select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							22 lines
						
					
					
						
							733 B
						
					
					
				
			
		
		
	
	
							22 lines
						
					
					
						
							733 B
						
					
					
				| from swarms import AgentJudge
 | |
| 
 | |
# Example: score a single piece of technical agent output with AgentJudge.

# Per-criterion values handed to the judge; they sum to 1.0.
# NOTE(review): presumably these act as relative weights -- confirm against
# the AgentJudge documentation.
criteria_weights = {
    "accuracy": 0.4,
    "completeness": 0.3,
    "clarity": 0.2,
    "logic": 0.1,
}

# Build the judge: a named agent backed by the "gpt-4" model, with
# max_loops set to 1.
judge = AgentJudge(
    agent_name="technical-judge",
    model_name="gpt-4",
    max_loops=1,
    evaluation_criteria=criteria_weights,
)

# Sample technical answer to be judged. Adjacent string literals are joined
# at compile time, so this is one single-line string at runtime.
technical_output = (
    "To solve the quadratic equation x² + 5x + 6 = 0, we can use the "
    "quadratic formula: x = (-b ± √(b² - 4ac)) / 2a. "
    "Here, a=1, b=5, c=6. "
    "Substituting: x = (-5 ± √(25 - 24)) / 2 = (-5 ± √1) / 2 = (-5 ± 1) / 2. "
    "So x = -2 or x = -3."
)

# Hand the sample to the judge as its task and print whatever it returns.
evaluations = judge.run(task=technical_output)
print(evaluations)