You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
swarms/benchmark_results/benchmark_results_20250418_...

467 lines
10 KiB

{
"metadata": {
"timestamp": "2025-04-18T13:30:16.543562",
"num_iterations": 3,
"agent_config": {
"model_name": "gpt-4o-mini",
"max_loops": 1
}
},
"results": {
"Conduct an analysis of the best real undervalued ETFs": {
"execution_times": [
14.789254,
13.413338,
13.084335
],
"system_metrics": [
{
"cpu_percent": 5.1,
"memory_mb": 67.765625
},
{
"cpu_percent": 3.7,
"memory_mb": 199.875
},
{
"cpu_percent": 16.2,
"memory_mb": 203.453125
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 14.789,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 0.0,
"memory_mb": 243.046875
},
"post": {
"cpu_percent": 5.1,
"memory_mb": 67.765625
}
}
},
{
"iteration": 2,
"execution_time": 13.413,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 202.0,
"memory_mb": 243.109375
},
"post": {
"cpu_percent": 3.7,
"memory_mb": 199.875
}
}
},
{
"iteration": 3,
"execution_time": 13.084,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 107.1,
"memory_mb": 243.21875
},
"post": {
"cpu_percent": 16.2,
"memory_mb": 203.453125
}
}
}
],
"statistics": {
"execution_time": {
"mean": 13.762,
"median": 13.413,
"min": 13.084,
"max": 14.789,
"std_dev": 0.738
},
"memory_usage": {
"mean": 157.031,
"median": 199.875,
"min": 67.766,
"max": 203.453,
"std_dev": 63.137
},
"cpu_usage": {
"mean": 8.333,
"median": 5.1,
"min": 3.7,
"max": 16.2,
"std_dev": 5.592
}
}
},
"What are the top performing tech stocks this quarter?": {
"execution_times": [
14.40021,
7.619928,
9.870042
],
"system_metrics": [
{
"cpu_percent": 2.5,
"memory_mb": 69.734375
},
{
"cpu_percent": 0.5,
"memory_mb": 204.46875
},
{
"cpu_percent": 0.8,
"memory_mb": 204.640625
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 14.4,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 109.3,
"memory_mb": 243.1875
},
"post": {
"cpu_percent": 2.5,
"memory_mb": 69.734375
}
}
},
{
"iteration": 2,
"execution_time": 7.62,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 194.6,
"memory_mb": 243.328125
},
"post": {
"cpu_percent": 0.5,
"memory_mb": 204.46875
}
}
},
{
"iteration": 3,
"execution_time": 9.87,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 187.1,
"memory_mb": 243.734375
},
"post": {
"cpu_percent": 0.8,
"memory_mb": 204.640625
}
}
}
],
"statistics": {
"execution_time": {
"mean": 10.63,
"median": 9.87,
"min": 7.62,
"max": 14.4,
"std_dev": 2.82
},
"memory_usage": {
"mean": 159.615,
"median": 204.469,
"min": 69.734,
"max": 204.641,
"std_dev": 63.555
},
"cpu_usage": {
"mean": 1.267,
"median": 0.8,
"min": 0.5,
"max": 2.5,
"std_dev": 0.881
}
}
},
"Analyze current market trends in renewable energy sector": {
"execution_times": [
3.193721,
11.01429,
13.543417
],
"system_metrics": [
{
"cpu_percent": 5.7,
"memory_mb": 223.109375
},
{
"cpu_percent": 1.4,
"memory_mb": 203.46875
},
{
"cpu_percent": 9.9,
"memory_mb": 199.1875
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 3.194,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 223.0,
"memory_mb": 243.8125
},
"post": {
"cpu_percent": 5.7,
"memory_mb": 223.109375
}
}
},
{
"iteration": 2,
"execution_time": 11.014,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 270.1,
"memory_mb": 243.953125
},
"post": {
"cpu_percent": 1.4,
"memory_mb": 203.46875
}
}
},
{
"iteration": 3,
"execution_time": 13.543,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 340.8,
"memory_mb": 244.0625
},
"post": {
"cpu_percent": 9.9,
"memory_mb": 199.1875
}
}
}
],
"statistics": {
"execution_time": {
"mean": 9.25,
"median": 11.014,
"min": 3.194,
"max": 13.543,
"std_dev": 4.405
},
"memory_usage": {
"mean": 208.589,
"median": 203.469,
"min": 199.188,
"max": 223.109,
"std_dev": 10.415
},
"cpu_usage": {
"mean": 5.667,
"median": 5.7,
"min": 1.4,
"max": 9.9,
"std_dev": 3.47
}
}
},
"Compare Bitcoin and Ethereum investment potential": {
"execution_times": [
3.424122,
12.162575,
9.831582
],
"system_metrics": [
{
"cpu_percent": 1.9,
"memory_mb": 217.640625
},
{
"cpu_percent": 2.9,
"memory_mb": 203.171875
},
{
"cpu_percent": 31.2,
"memory_mb": 204.765625
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 3.424,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 364.2,
"memory_mb": 245.671875
},
"post": {
"cpu_percent": 1.9,
"memory_mb": 217.640625
}
}
},
{
"iteration": 2,
"execution_time": 12.163,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 659.7,
"memory_mb": 245.734375
},
"post": {
"cpu_percent": 2.9,
"memory_mb": 203.171875
}
}
},
{
"iteration": 3,
"execution_time": 9.832,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 612.4,
"memory_mb": 245.953125
},
"post": {
"cpu_percent": 31.2,
"memory_mb": 204.765625
}
}
}
],
"statistics": {
"execution_time": {
"mean": 8.473,
"median": 9.832,
"min": 3.424,
"max": 12.163,
"std_dev": 3.695
},
"memory_usage": {
"mean": 208.526,
"median": 204.766,
"min": 203.172,
"max": 217.641,
"std_dev": 6.478
},
"cpu_usage": {
"mean": 12.0,
"median": 2.9,
"min": 1.9,
"max": 31.2,
"std_dev": 13.583
}
}
},
"Evaluate the risk factors in emerging markets": {
"execution_times": [
2.948636,
12.942413,
11.361344
],
"system_metrics": [
{
"cpu_percent": 402.2,
"memory_mb": 246.078125
},
{
"cpu_percent": 2.2,
"memory_mb": 203.34375
},
{
"cpu_percent": 4.5,
"memory_mb": 203.59375
}
],
"iterations": [
{
"iteration": 1,
"execution_time": 2.949,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 1494.6,
"memory_mb": 246.140625
},
"post": {
"cpu_percent": 402.2,
"memory_mb": 246.078125
}
}
},
{
"iteration": 2,
"execution_time": 12.942,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 529.1,
"memory_mb": 246.265625
},
"post": {
"cpu_percent": 2.2,
"memory_mb": 203.34375
}
}
},
{
"iteration": 3,
"execution_time": 11.361,
"success": true,
"system_metrics": {
"pre": {
"cpu_percent": 578.8,
"memory_mb": 246.65625
},
"post": {
"cpu_percent": 4.5,
"memory_mb": 203.59375
}
}
}
],
"statistics": {
"execution_time": {
"mean": 9.084,
"median": 11.361,
"min": 2.949,
"max": 12.942,
"std_dev": 4.386
},
"memory_usage": {
"mean": 217.672,
"median": 203.594,
"min": 203.344,
"max": 246.078,
"std_dev": 20.087
},
"cpu_usage": {
"mean": 136.3,
"median": 4.5,
"min": 2.2,
"max": 402.2,
"std_dev": 188.022
}
}
}
}
}