|
{ |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"benchmark_kind": "Rate", |
|
"warmup_duration_secs": 30, |
|
"rates": [ |
|
0.8, |
|
2.4, |
|
4.0, |
|
5.6, |
|
7.2, |
|
8.8, |
|
10.4, |
|
12.0, |
|
13.6, |
|
15.2, |
|
16.8, |
|
18.4, |
|
20.0, |
|
21.6, |
|
23.2, |
|
24.0 |
|
], |
|
"num_rates": 10, |
|
"prompt_options": null, |
|
"decode_options": { |
|
"num_tokens": 200, |
|
"min_tokens": 200, |
|
"max_tokens": 200, |
|
"variance": 100 |
|
}, |
|
"tokenizer": "meta-llama/Llama-3.1-8B-Instruct", |
|
"model_name": "meta-llama/Llama-3.1-8B-Instruct", |
|
"profile": null, |
|
"meta": { |
|
"version": "4d28897b4e345f4dfdd93d3434e50ac8afcdf9e1", |
|
"engine": "TGI", |
|
"tp": "1" |
|
}, |
|
"run_id": "TGI-3.2.1" |
|
}, |
|
"results": [ |
|
{ |
|
"id": "warmup", |
|
"executor_type": "ConstantVUs", |
|
"config": { |
|
"max_vus": 1, |
|
"duration_secs": 30, |
|
"rate": null |
|
}, |
|
"total_requests": 22, |
|
"total_tokens": 3726, |
|
"token_throughput_secs": 121.61045252166194, |
|
"duration_ms": 30638, |
|
"time_to_first_token_ms": { |
|
"p50": 46.607, |
|
"p60": 46.786, |
|
"p70": 46.957, |
|
"p80": 47.13, |
|
"p90": 48.231, |
|
"p95": 78.293, |
|
"p99": 80.85, |
|
"avg": 48.554 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 7.973, |
|
"p60": 7.982, |
|
"p70": 7.99, |
|
"p80": 8.0, |
|
"p90": 8.043, |
|
"p95": 8.083, |
|
"p99": 8.125, |
|
"avg": 7.927 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 22, |
|
"request_rate": 0.7180434663114769, |
|
"total_tokens_sent": 1613, |
|
"e2e_latency_ms": { |
|
"p50": 1632.456, |
|
"p60": 1633.79, |
|
"p70": 1636.485, |
|
"p80": 1638.246, |
|
"p90": 1647.577, |
|
"p95": 1688.143, |
|
"p99": 1697.2, |
|
"avg": 1392.459 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 0.8 |
|
}, |
|
"total_requests": 94, |
|
"total_tokens": 14823, |
|
"token_throughput_secs": 125.70685354915, |
|
"duration_ms": 117917, |
|
"time_to_first_token_ms": { |
|
"p50": 26.689, |
|
"p60": 28.276, |
|
"p70": 29.925, |
|
"p80": 31.171, |
|
"p90": 31.927, |
|
"p95": 32.252, |
|
"p99": 33.737, |
|
"avg": 27.559 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 8.297, |
|
"p60": 8.308, |
|
"p70": 8.327, |
|
"p80": 8.348, |
|
"p90": 8.372, |
|
"p95": 8.387, |
|
"p99": 8.48, |
|
"avg": 8.274 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 94, |
|
"request_rate": 0.7971695495932065, |
|
"total_tokens_sent": 13915, |
|
"e2e_latency_ms": { |
|
"p50": 1675.47, |
|
"p60": 1680.097, |
|
"p70": 1683.628, |
|
"p80": 1686.037, |
|
"p90": 1689.112, |
|
"p95": 1692.598, |
|
"p99": 1711.849, |
|
"avg": 1329.915 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 2.4 |
|
}, |
|
"total_requests": 283, |
|
"total_tokens": 49472, |
|
"token_throughput_secs": 417.57128544344323, |
|
"duration_ms": 118475, |
|
"time_to_first_token_ms": { |
|
"p50": 29.056, |
|
"p60": 29.943, |
|
"p70": 30.586, |
|
"p80": 31.684, |
|
"p90": 32.58, |
|
"p95": 33.297, |
|
"p99": 42.848, |
|
"avg": 29.12 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 8.925, |
|
"p60": 8.931, |
|
"p70": 8.939, |
|
"p80": 8.947, |
|
"p90": 8.954, |
|
"p95": 8.965, |
|
"p99": 8.982, |
|
"avg": 8.669 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 283, |
|
"request_rate": 2.3886779143858026, |
|
"total_tokens_sent": 44403, |
|
"e2e_latency_ms": { |
|
"p50": 1804.541, |
|
"p60": 1805.909, |
|
"p70": 1807.748, |
|
"p80": 1809.553, |
|
"p90": 1812.308, |
|
"p95": 1814.507, |
|
"p99": 1817.862, |
|
"avg": 1579.6 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 4.0 |
|
}, |
|
"total_requests": 474, |
|
"total_tokens": 85697, |
|
"token_throughput_secs": 720.8187174458998, |
|
"duration_ms": 118888, |
|
"time_to_first_token_ms": { |
|
"p50": 28.261, |
|
"p60": 29.236, |
|
"p70": 30.047, |
|
"p80": 31.071, |
|
"p90": 32.258, |
|
"p95": 32.956, |
|
"p99": 44.447, |
|
"avg": 28.686 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 9.365, |
|
"p60": 9.383, |
|
"p70": 9.396, |
|
"p80": 9.415, |
|
"p90": 9.433, |
|
"p95": 9.446, |
|
"p99": 9.457, |
|
"avg": 9.313 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 474, |
|
"request_rate": 3.9869315386694577, |
|
"total_tokens_sent": 56591, |
|
"e2e_latency_ms": { |
|
"p50": 1890.864, |
|
"p60": 1894.873, |
|
"p70": 1898.381, |
|
"p80": 1902.406, |
|
"p90": 1906.151, |
|
"p95": 1909.095, |
|
"p99": 1912.544, |
|
"avg": 1712.674 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 5.6 |
|
}, |
|
"total_requests": 660, |
|
"total_tokens": 115159, |
|
"token_throughput_secs": 966.2563530237055, |
|
"duration_ms": 119180, |
|
"time_to_first_token_ms": { |
|
"p50": 29.312, |
|
"p60": 30.64, |
|
"p70": 31.75, |
|
"p80": 32.952, |
|
"p90": 44.096, |
|
"p95": 46.404, |
|
"p99": 48.15, |
|
"avg": 30.915 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 9.98, |
|
"p60": 9.996, |
|
"p70": 10.004, |
|
"p80": 10.013, |
|
"p90": 10.022, |
|
"p95": 10.028, |
|
"p99": 10.062, |
|
"avg": 9.803 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 660, |
|
"request_rate": 5.537814612801827, |
|
"total_tokens_sent": 113449, |
|
"e2e_latency_ms": { |
|
"p50": 2013.741, |
|
"p60": 2017.376, |
|
"p70": 2019.935, |
|
"p80": 2021.638, |
|
"p90": 2024.968, |
|
"p95": 2026.227, |
|
"p99": 2032.895, |
|
"avg": 1754.082 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 7.2 |
|
}, |
|
"total_requests": 849, |
|
"total_tokens": 151779, |
|
"token_throughput_secs": 1267.369912316427, |
|
"duration_ms": 119759, |
|
"time_to_first_token_ms": { |
|
"p50": 30.493, |
|
"p60": 31.719, |
|
"p70": 33.123, |
|
"p80": 36.078, |
|
"p90": 46.155, |
|
"p95": 46.769, |
|
"p99": 48.162, |
|
"avg": 32.604 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 10.423, |
|
"p60": 10.475, |
|
"p70": 10.5, |
|
"p80": 10.524, |
|
"p90": 10.555, |
|
"p95": 10.575, |
|
"p99": 10.597, |
|
"avg": 10.321 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 849, |
|
"request_rate": 7.089235372196724, |
|
"total_tokens_sent": 145128, |
|
"e2e_latency_ms": { |
|
"p50": 2100.596, |
|
"p60": 2114.214, |
|
"p70": 2119.354, |
|
"p80": 2124.055, |
|
"p90": 2130.161, |
|
"p95": 2134.421, |
|
"p99": 2140.161, |
|
"avg": 1884.625 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 8.8 |
|
}, |
|
"total_requests": 1041, |
|
"total_tokens": 181439, |
|
"token_throughput_secs": 1528.9336762174746, |
|
"duration_ms": 118670, |
|
"time_to_first_token_ms": { |
|
"p50": 33.409, |
|
"p60": 41.426, |
|
"p70": 45.116, |
|
"p80": 45.65, |
|
"p90": 47.216, |
|
"p95": 47.524, |
|
"p99": 47.814, |
|
"avg": 36.264 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 11.019, |
|
"p60": 11.044, |
|
"p70": 11.072, |
|
"p80": 11.102, |
|
"p90": 11.136, |
|
"p95": 11.159, |
|
"p99": 11.222, |
|
"avg": 10.862 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1041, |
|
"request_rate": 8.77220419503189, |
|
"total_tokens_sent": 191937, |
|
"e2e_latency_ms": { |
|
"p50": 2223.571, |
|
"p60": 2232.271, |
|
"p70": 2241.046, |
|
"p80": 2246.104, |
|
"p90": 2253.422, |
|
"p95": 2259.594, |
|
"p99": 2267.867, |
|
"avg": 1944.18 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 10.4 |
|
}, |
|
"total_requests": 1225, |
|
"total_tokens": 208853, |
|
"token_throughput_secs": 1750.44303623107, |
|
"duration_ms": 119314, |
|
"time_to_first_token_ms": { |
|
"p50": 34.056, |
|
"p60": 40.904, |
|
"p70": 44.889, |
|
"p80": 45.567, |
|
"p90": 47.156, |
|
"p95": 47.537, |
|
"p99": 47.805, |
|
"avg": 36.461 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 11.655, |
|
"p60": 11.693, |
|
"p70": 11.73, |
|
"p80": 11.772, |
|
"p90": 11.827, |
|
"p95": 11.861, |
|
"p99": 11.909, |
|
"avg": 11.475 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1225, |
|
"request_rate": 10.266995060559632, |
|
"total_tokens_sent": 219623, |
|
"e2e_latency_ms": { |
|
"p50": 2351.289, |
|
"p60": 2360.059, |
|
"p70": 2368.244, |
|
"p80": 2378.908, |
|
"p90": 2388.768, |
|
"p95": 2395.775, |
|
"p99": 2405.872, |
|
"avg": 2012.23 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 12.0 |
|
}, |
|
"total_requests": 1411, |
|
"total_tokens": 255188, |
|
"token_throughput_secs": 2159.7525641398156, |
|
"duration_ms": 118156, |
|
"time_to_first_token_ms": { |
|
"p50": 40.727, |
|
"p60": 44.09, |
|
"p70": 44.798, |
|
"p80": 46.295, |
|
"p90": 46.858, |
|
"p95": 48.094, |
|
"p99": 48.34, |
|
"avg": 38.454 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 12.566, |
|
"p60": 12.629, |
|
"p70": 12.67, |
|
"p80": 12.718, |
|
"p90": 12.802, |
|
"p95": 12.951, |
|
"p99": 13.08, |
|
"avg": 12.404 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1411, |
|
"request_rate": 11.941826684645358, |
|
"total_tokens_sent": 272561, |
|
"e2e_latency_ms": { |
|
"p50": 2532.282, |
|
"p60": 2547.776, |
|
"p70": 2560.142, |
|
"p80": 2570.947, |
|
"p90": 2585.7, |
|
"p95": 2612.572, |
|
"p99": 2635.79, |
|
"avg": 2297.575 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 13.6 |
|
}, |
|
"total_requests": 1564, |
|
"total_tokens": 272803, |
|
"token_throughput_secs": 2293.5215462094866, |
|
"duration_ms": 118945, |
|
"time_to_first_token_ms": { |
|
"p50": 44.852, |
|
"p60": 46.319, |
|
"p70": 46.872, |
|
"p80": 48.169, |
|
"p90": 49.674, |
|
"p95": 51.154, |
|
"p99": 53.485, |
|
"avg": 42.864 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 25.88, |
|
"p60": 26.011, |
|
"p70": 26.149, |
|
"p80": 26.243, |
|
"p90": 26.308, |
|
"p95": 26.354, |
|
"p99": 26.436, |
|
"avg": 24.547 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1564, |
|
"request_rate": 13.148930540615892, |
|
"total_tokens_sent": 255933, |
|
"e2e_latency_ms": { |
|
"p50": 5177.262, |
|
"p60": 5201.64, |
|
"p70": 5238.214, |
|
"p80": 5261.34, |
|
"p90": 5275.17, |
|
"p95": 5286.208, |
|
"p99": 5302.579, |
|
"avg": 4359.271 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 15.2 |
|
}, |
|
"total_requests": 1759, |
|
"total_tokens": 309348, |
|
"token_throughput_secs": 2580.5086165701296, |
|
"duration_ms": 119878, |
|
"time_to_first_token_ms": { |
|
"p50": 45.707, |
|
"p60": 47.05, |
|
"p70": 47.656, |
|
"p80": 48.721, |
|
"p90": 51.476, |
|
"p95": 53.138, |
|
"p99": 55.565, |
|
"avg": 44.101 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 26.733, |
|
"p60": 26.968, |
|
"p70": 27.102, |
|
"p80": 27.19, |
|
"p90": 27.265, |
|
"p95": 27.368, |
|
"p99": 27.441, |
|
"avg": 26.359 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1759, |
|
"request_rate": 14.673166325778274, |
|
"total_tokens_sent": 270134, |
|
"e2e_latency_ms": { |
|
"p50": 5326.968, |
|
"p60": 5382.346, |
|
"p70": 5428.823, |
|
"p80": 5452.294, |
|
"p90": 5469.218, |
|
"p95": 5483.97, |
|
"p99": 5502.975, |
|
"avg": 4685.437 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 16.8 |
|
}, |
|
"total_requests": 1928, |
|
"total_tokens": 330549, |
|
"token_throughput_secs": 2759.3148813615194, |
|
"duration_ms": 119793, |
|
"time_to_first_token_ms": { |
|
"p50": 46.472, |
|
"p60": 46.857, |
|
"p70": 48.168, |
|
"p80": 50.368, |
|
"p90": 53.407, |
|
"p95": 55.802, |
|
"p99": 72.801, |
|
"avg": 45.931 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 27.881, |
|
"p60": 28.021, |
|
"p70": 28.093, |
|
"p80": 28.16, |
|
"p90": 28.336, |
|
"p95": 28.602, |
|
"p99": 29.638, |
|
"avg": 27.078 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 1928, |
|
"request_rate": 16.094313070876055, |
|
"total_tokens_sent": 320581, |
|
"e2e_latency_ms": { |
|
"p50": 5553.009, |
|
"p60": 5600.423, |
|
"p70": 5629.869, |
|
"p80": 5644.616, |
|
"p90": 5671.609, |
|
"p95": 5710.139, |
|
"p99": 5944.138, |
|
"avg": 4721.266 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 18.4 |
|
}, |
|
"total_requests": 2118, |
|
"total_tokens": 357373, |
|
"token_throughput_secs": 2982.4464814578682, |
|
"duration_ms": 119825, |
|
"time_to_first_token_ms": { |
|
"p50": 59.209, |
|
"p60": 64.399, |
|
"p70": 69.696, |
|
"p80": 75.067, |
|
"p90": 80.705, |
|
"p95": 84.049, |
|
"p99": 88.502, |
|
"avg": 59.862 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 28.563, |
|
"p60": 28.749, |
|
"p70": 28.916, |
|
"p80": 29.057, |
|
"p90": 29.191, |
|
"p95": 29.317, |
|
"p99": 30.202, |
|
"avg": 28.34 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 2118, |
|
"request_rate": 17.67571038586509, |
|
"total_tokens_sent": 398184, |
|
"e2e_latency_ms": { |
|
"p50": 5708.277, |
|
"p60": 5743.555, |
|
"p70": 5787.666, |
|
"p80": 5828.147, |
|
"p90": 5862.892, |
|
"p95": 5894.271, |
|
"p99": 6066.881, |
|
"avg": 4844.433 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 20.0 |
|
}, |
|
"total_requests": 2290, |
|
"total_tokens": 386940, |
|
"token_throughput_secs": 3227.511698507537, |
|
"duration_ms": 119888, |
|
"time_to_first_token_ms": { |
|
"p50": 58.122, |
|
"p60": 63.978, |
|
"p70": 70.049, |
|
"p80": 76.219, |
|
"p90": 82.824, |
|
"p95": 86.111, |
|
"p99": 90.923, |
|
"avg": 59.703 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 29.32, |
|
"p60": 29.492, |
|
"p70": 29.895, |
|
"p80": 30.4, |
|
"p90": 30.546, |
|
"p95": 31.209, |
|
"p99": 31.92, |
|
"avg": 28.595 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 2290, |
|
"request_rate": 19.10115725844384, |
|
"total_tokens_sent": 346259, |
|
"e2e_latency_ms": { |
|
"p50": 5821.093, |
|
"p60": 5905.813, |
|
"p70": 5981.542, |
|
"p80": 6088.576, |
|
"p90": 6138.484, |
|
"p95": 6172.066, |
|
"p99": 6421.6, |
|
"avg": 4983.079 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 21.6 |
|
}, |
|
"total_requests": 2445, |
|
"total_tokens": 438323, |
|
"token_throughput_secs": 3667.2404231554137, |
|
"duration_ms": 119523, |
|
"time_to_first_token_ms": { |
|
"p50": 60.891, |
|
"p60": 67.221, |
|
"p70": 73.352, |
|
"p80": 80.009, |
|
"p90": 86.246, |
|
"p95": 89.966, |
|
"p99": 95.937, |
|
"avg": 62.545 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 31.059, |
|
"p60": 31.174, |
|
"p70": 31.267, |
|
"p80": 31.363, |
|
"p90": 31.564, |
|
"p95": 31.98, |
|
"p99": 32.368, |
|
"avg": 30.585 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 2445, |
|
"request_rate": 20.456154102374246, |
|
"total_tokens_sent": 375764, |
|
"e2e_latency_ms": { |
|
"p50": 6210.518, |
|
"p60": 6251.837, |
|
"p70": 6276.884, |
|
"p80": 6301.657, |
|
"p90": 6339.383, |
|
"p95": 6390.942, |
|
"p99": 6504.767, |
|
"avg": 5545.311 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 23.2 |
|
}, |
|
"total_requests": 2557, |
|
"total_tokens": 451146, |
|
"token_throughput_secs": 3774.5098883710634, |
|
"duration_ms": 119524, |
|
"time_to_first_token_ms": { |
|
"p50": 61.047, |
|
"p60": 67.493, |
|
"p70": 74.009, |
|
"p80": 80.579, |
|
"p90": 87.143, |
|
"p95": 90.788, |
|
"p99": 95.729, |
|
"avg": 63.122 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 31.013, |
|
"p60": 31.094, |
|
"p70": 31.187, |
|
"p80": 31.29, |
|
"p90": 31.621, |
|
"p95": 32.321, |
|
"p99": 32.547, |
|
"avg": 30.814 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 2557, |
|
"request_rate": 21.393122812935964, |
|
"total_tokens_sent": 397220, |
|
"e2e_latency_ms": { |
|
"p50": 6207.811, |
|
"p60": 6232.278, |
|
"p70": 6255.491, |
|
"p80": 6280.109, |
|
"p90": 6327.14, |
|
"p95": 6467.71, |
|
"p99": 6530.251, |
|
"avg": 5488.01 |
|
} |
|
}, |
|
{ |
|
"id": "[email protected]/s", |
|
"executor_type": "ConstantArrivalRate", |
|
"config": { |
|
"max_vus": 128, |
|
"duration_secs": 120, |
|
"rate": 24.0 |
|
}, |
|
"total_requests": 2540, |
|
"total_tokens": 454462, |
|
"token_throughput_secs": 3793.8392202012997, |
|
"duration_ms": 119789, |
|
"time_to_first_token_ms": { |
|
"p50": 61.504, |
|
"p60": 67.687, |
|
"p70": 74.328, |
|
"p80": 81.247, |
|
"p90": 87.806, |
|
"p95": 91.29, |
|
"p99": 96.912, |
|
"avg": 63.516 |
|
}, |
|
"inter_token_latency_ms": { |
|
"p50": 31.192, |
|
"p60": 31.251, |
|
"p70": 31.333, |
|
"p80": 31.475, |
|
"p90": 31.907, |
|
"p95": 32.12, |
|
"p99": 32.242, |
|
"avg": 30.921 |
|
}, |
|
"failed_requests": 0, |
|
"successful_requests": 2540, |
|
"request_rate": 21.203866592391226, |
|
"total_tokens_sent": 455432, |
|
"e2e_latency_ms": { |
|
"p50": 6257.817, |
|
"p60": 6275.79, |
|
"p70": 6293.476, |
|
"p80": 6317.243, |
|
"p90": 6372.71, |
|
"p95": 6449.819, |
|
"p99": 6483.148, |
|
"avg": 5596.165 |
|
} |
|
} |
|
], |
|
"start_time": "2025-04-02T07:17:06.471305459+00:00", |
|
"end_time": "2025-04-02T07:50:23.157564514+00:00", |
|
"system": { |
|
"cpu": [ |
|
"AMD EPYC 7R13 Processor cpu0@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu1@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu2@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu3@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu4@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu5@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu6@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu7@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu8@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu9@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu10@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu11@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu12@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu13@2881MHz", |
|
"AMD EPYC 7R13 Processor cpu14@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu15@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu16@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu17@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu18@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu19@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu20@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu21@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu22@3083MHz", |
|
"AMD EPYC 7R13 Processor cpu23@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu24@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu25@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu26@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu27@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu28@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu29@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu30@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu31@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu32@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu33@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu34@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu35@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu36@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu37@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu38@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu39@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu40@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu41@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu42@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu43@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu44@2881MHz", |
|
"AMD EPYC 7R13 Processor cpu45@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu46@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu47@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu48@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu49@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu50@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu51@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu52@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu53@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu54@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu55@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu56@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu57@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu58@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu59@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu60@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu61@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu62@3007MHz", |
|
"AMD EPYC 7R13 Processor cpu63@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu64@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu65@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu66@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu67@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu68@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu69@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu70@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu71@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu72@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu73@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu74@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu75@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu76@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu77@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu78@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu79@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu80@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu81@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu82@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu83@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu84@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu85@2516MHz", |
|
"AMD EPYC 7R13 Processor cpu86@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu87@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu88@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu89@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu90@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu91@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu92@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu93@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu94@2649MHz", |
|
"AMD EPYC 7R13 Processor cpu95@2649MHz" |
|
], |
|
"memory": "1999.99 GB", |
|
"os_name": "Debian GNU/Linux", |
|
"os_version": "11", |
|
"kernel": "5.15.0-1048-aws", |
|
"hostname": "ip-26-0-161-153" |
|
} |
|
} |