Skip to content

Commit

Permalink
Browse files Browse the repository at this point in the history
  • Loading branch information
dartpain committed Aug 14, 2024
2 parents 1af0ae0 + e93d0e7 commit 8c7d596
Show file tree
Hide file tree
Showing 2 changed files with 30 additions and 2 deletions.
5 changes: 3 additions & 2 deletions gpu-benchmarks.csv
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
"backend","best_of","completed","cost_per_hour","date","duration","gpu","input_throughput","model_id","num_prompts","output_throughput","provider","request_rate","request_throughput","tokenizer_id","total_input_tokens","total_output_tokens","use_beam_search"
"vllm",1,1000,0.84,"20240813-143958",385.30312793600024,"NVIDIA L4",558.5109084184351,"meta-llama/Meta-Llama-3.1-8B-Instruct",1000,513.2037236740132,"scaleway","inf",2.5953591536015312,"meta-llama/Meta-Llama-3.1-8B-Instruct",215196,197739,false
"backend","benchmark_duration","best_of","completed","cost_per_hour","date","duration","gpu","input_throughput","input_token_throughput","mean_e2e_latency","mean_itl","mean_tpot","mean_ttft","median_e2e_latency","median_itl","median_tpot","median_ttft","model_id","num_prompts","output_throughput","output_token_throughput","p99_itl","p99_tpot","p99_ttft","provider","request_rate","request_throughput","successful_requests","tokenizer_id","total_generated_tokens","total_generated_tokens_ret","total_input_tokens","total_output_tokens","traffic_request_rate","use_beam_search"
"sglang",35.45,,,3.02,"20240814-155812",,"NVIDIA H100",,6070.48,14328.17,71.79,145.31,773.1,13759.53,49.35,81.55,193.72,,,,5595.07,291.88,915.34,4118.65,"scaleway",,28.21,1000,,198343,197967,215196,,200,
"vllm",,1,1000,0.84,"20240813-143958",385.30312793600024,"NVIDIA L4",558.5109084184351,,,,,,,,,,"meta-llama/Meta-Llama-3.1-8B-Instruct",1000,513.2037236740132,,,,,"scaleway","inf",2.5953591536015312,,"meta-llama/Meta-Llama-3.1-8B-Instruct",,,215196,197739,,false
27 changes: 27 additions & 0 deletions gpu-benchmarks.json
Original file line number Diff line number Diff line change
@@ -1,4 +1,31 @@
[
{
"date": "20240814-155812",
"provider": "scaleway",
"gpu": "NVIDIA H100",
"cost_per_hour": 3.02,
"backend": "sglang",
"traffic_request_rate": 200,
"successful_requests": 1000,
"benchmark_duration": 35.45,
"total_input_tokens": 215196,
"total_generated_tokens": 198343,
"total_generated_tokens_ret": 197967,
"request_throughput": 28.21,
"input_token_throughput": 6070.48,
"output_token_throughput": 5595.07,
"mean_e2e_latency": 14328.17,
"median_e2e_latency": 13759.53,
"mean_ttft": 773.1,
"median_ttft": 193.72,
"p99_ttft": 4118.65,
"mean_tpot": 145.31,
"median_tpot": 81.55,
"p99_tpot": 915.34,
"mean_itl": 71.79,
"median_itl": 49.35,
"p99_itl": 291.88
},
{
"date": "20240813-143958",
"provider": "scaleway",
Expand Down

0 comments on commit 8c7d596

Please sign in to comment.