You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
swarms/benchmark_results/benchmark_results_20250418_...

467 lines
10 KiB

{
"metadata": {
"timestamp": "2025-04-18T13:30:51.812685",
"num_iterations": 3,
"agent_config": {
"model_name": "gpt-4o-mini",
"max_loops": 1
}
},
"results": {
"Conduct an analysis of the best real undervalued ETFs": {
"execution_times": [
8.791961,
15.974623,
10.00903
],
"system_metrics": [
{
"cpu_percent": 3.9,
"memory_mb": 73.96875
},
{
"cpu_percent": 4.6,
"memory_mb": 71.171875
},
{
"cpu_percent": 21.5,
"memory_mb": 76.015625
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 8.792,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 0.0,
"memory_mb": 133.765625
},
"post": {
"cpu_percent": 3.9,
"memory_mb": 73.96875
}
}
},
{
"iteration": 2,
"execution_time": 15.975,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 96.7,
"memory_mb": 133.8125
},
"post": {
"cpu_percent": 4.6,
"memory_mb": 71.171875
}
}
},
{
"iteration": 3,
"execution_time": 10.009,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 76.2,
"memory_mb": 137.15625
},
"post": {
"cpu_percent": 21.5,
"memory_mb": 76.015625
}
}
}
],
"statistics": {
"execution_time": {
"mean": 11.592,
"median": 10.009,
"min": 8.792,
"max": 15.975,
"std_dev": 3.139
},
"memory_usage": {
"mean": 73.719,
"median": 73.969,
"min": 71.172,
"max": 76.016,
"std_dev": 1.985
},
"cpu_usage": {
"mean": 10.0,
"median": 4.6,
"min": 3.9,
"max": 21.5,
"std_dev": 8.137
}
}
},
"What are the top performing tech stocks this quarter?": {
"execution_times": [
10.980763,
11.800057,
18.108609
],
"system_metrics": [
{
"cpu_percent": 2.8,
"memory_mb": 76.203125
},
{
"cpu_percent": 2.4,
"memory_mb": 76.65625
},
{
"cpu_percent": 0.4,
"memory_mb": 69.515625
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 10.981,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 40.8,
"memory_mb": 137.40625
},
"post": {
"cpu_percent": 2.8,
"memory_mb": 76.203125
}
}
},
{
"iteration": 2,
"execution_time": 11.8,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 87.4,
"memory_mb": 137.4375
},
"post": {
"cpu_percent": 2.4,
"memory_mb": 76.65625
}
}
},
{
"iteration": 3,
"execution_time": 18.109,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 180.9,
"memory_mb": 137.640625
},
"post": {
"cpu_percent": 0.4,
"memory_mb": 69.515625
}
}
}
],
"statistics": {
"execution_time": {
"mean": 13.63,
"median": 11.8,
"min": 10.981,
"max": 18.109,
"std_dev": 3.185
},
"memory_usage": {
"mean": 74.125,
"median": 76.203,
"min": 69.516,
"max": 76.656,
"std_dev": 3.265
},
"cpu_usage": {
"mean": 1.867,
"median": 2.4,
"min": 0.4,
"max": 2.8,
"std_dev": 1.05
}
}
},
"Analyze current market trends in renewable energy sector": {
"execution_times": [
15.015125,
9.916293,
6.958686
],
"system_metrics": [
{
"cpu_percent": 1.3,
"memory_mb": 69.953125
},
{
"cpu_percent": 14.6,
"memory_mb": 74.765625
},
{
"cpu_percent": 5.0,
"memory_mb": 72.90625
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 15.015,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 169.6,
"memory_mb": 137.9375
},
"post": {
"cpu_percent": 1.3,
"memory_mb": 69.953125
}
}
},
{
"iteration": 2,
"execution_time": 9.916,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 212.3,
"memory_mb": 138.171875
},
"post": {
"cpu_percent": 14.6,
"memory_mb": 74.765625
}
}
},
{
"iteration": 3,
"execution_time": 6.959,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 149.0,
"memory_mb": 138.4375
},
"post": {
"cpu_percent": 5.0,
"memory_mb": 72.90625
}
}
}
],
"statistics": {
"execution_time": {
"mean": 10.63,
"median": 9.916,
"min": 6.959,
"max": 15.015,
"std_dev": 3.328
},
"memory_usage": {
"mean": 72.542,
"median": 72.906,
"min": 69.953,
"max": 74.766,
"std_dev": 1.982
},
"cpu_usage": {
"mean": 6.967,
"median": 5.0,
"min": 1.3,
"max": 14.6,
"std_dev": 5.605
}
}
},
"Compare Bitcoin and Ethereum investment potential": {
"execution_times": [
15.44115,
13.797926,
8.355462
],
"system_metrics": [
{
"cpu_percent": 2.4,
"memory_mb": 70.59375
},
{
"cpu_percent": 1.0,
"memory_mb": 69.875
},
{
"cpu_percent": 1.1,
"memory_mb": 73.5
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 15.441,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 218.0,
"memory_mb": 138.515625
},
"post": {
"cpu_percent": 2.4,
"memory_mb": 70.59375
}
}
},
{
"iteration": 2,
"execution_time": 13.798,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 298.8,
"memory_mb": 138.59375
},
"post": {
"cpu_percent": 1.0,
"memory_mb": 69.875
}
}
},
{
"iteration": 3,
"execution_time": 8.355,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 226.1,
"memory_mb": 139.984375
},
"post": {
"cpu_percent": 1.1,
"memory_mb": 73.5
}
}
}
],
"statistics": {
"execution_time": {
"mean": 12.532,
"median": 13.798,
"min": 8.355,
"max": 15.441,
"std_dev": 3.028
},
"memory_usage": {
"mean": 71.323,
"median": 70.594,
"min": 69.875,
"max": 73.5,
"std_dev": 1.567
},
"cpu_usage": {
"mean": 1.5,
"median": 1.1,
"min": 1.0,
"max": 2.4,
"std_dev": 0.638
}
}
},
"Evaluate the risk factors in emerging markets": {
"execution_times": [
6.380516,
9.943111,
9.821866
],
"system_metrics": [
{
"cpu_percent": 126.4,
"memory_mb": 118.28125
},
{
"cpu_percent": 18.0,
"memory_mb": 75.28125
},
{
"cpu_percent": 1.8,
"memory_mb": 74.1875
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 6.381,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 83.4,
"memory_mb": 140.046875
},
"post": {
"cpu_percent": 126.4,
"memory_mb": 118.28125
}
}
},
{
"iteration": 2,
"execution_time": 9.943,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 197.8,
"memory_mb": 140.109375
},
"post": {
"cpu_percent": 18.0,
"memory_mb": 75.28125
}
}
},
{
"iteration": 3,
"execution_time": 9.822,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 181.7,
"memory_mb": 140.171875
},
"post": {
"cpu_percent": 1.8,
"memory_mb": 74.1875
}
}
}
],
"statistics": {
"execution_time": {
"mean": 8.715,
"median": 9.822,
"min": 6.381,
"max": 9.943,
"std_dev": 1.652
},
"memory_usage": {
"mean": 89.25,
"median": 75.281,
"min": 74.188,
"max": 118.281,
"std_dev": 20.533
},
"cpu_usage": {
"mean": 48.733,
"median": 18.0,
"min": 1.8,
"max": 126.4,
"std_dev": 55.315
}
}
}
}
}