Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -37,6 +37,7 @@ def json_to_row(path: str, metrics: dict) -> dict:
|
|
| 37 |
e2e_s = metrics.get("e2e_s", None)
|
| 38 |
batch_size = metrics.get("batch_size", None)
|
| 39 |
gpu_type = metrics.get("gpu_type", "")
|
|
|
|
| 40 |
|
| 41 |
em = metrics.get("exact_match")
|
| 42 |
correct = metrics.get("correct")
|
|
@@ -65,6 +66,7 @@ def json_to_row(path: str, metrics: dict) -> dict:
|
|
| 65 |
"Batch size": batch_size,
|
| 66 |
"GPU": gpu_type,
|
| 67 |
"Accuracy(%)": pct(acc),
|
|
|
|
| 68 |
"Decoding T/s": f2(metrics.get("decoding_throughput")),
|
| 69 |
"Prefill T/s": f2(metrics.get("prefill_tp")),
|
| 70 |
"Prefill<br>S-MBU(%)": pct(metrics.get("prefill_smbu")),
|
|
@@ -301,6 +303,7 @@ def build_app() -> gr.Blocks:
|
|
| 301 |
"- Batch Size \n"
|
| 302 |
"- GPU Type \n"
|
| 303 |
"- Accuracy (%) \n"
|
|
|
|
| 304 |
"- Decoding Throughput (tokens/s) \n"
|
| 305 |
"- Prefill Throughput (tokens/s) \n"
|
| 306 |
"- Prefill S-MBU (%) \n"
|
|
@@ -384,7 +387,7 @@ def build_app() -> gr.Blocks:
|
|
| 384 |
outputs=[leaderboard_output],
|
| 385 |
)
|
| 386 |
|
| 387 |
-
timer = gr.Timer(
|
| 388 |
timer.tick(
|
| 389 |
fn=auto_refresh_from_dir,
|
| 390 |
inputs=[dir_path, task_filter, framework_filter, model_type_filter, precision_filter],
|
|
|
|
| 37 |
e2e_s = metrics.get("e2e_s", None)
|
| 38 |
batch_size = metrics.get("batch_size", None)
|
| 39 |
gpu_type = metrics.get("gpu_type", "")
|
| 40 |
+
cost = metrics.get("cost", None)
|
| 41 |
|
| 42 |
em = metrics.get("exact_match")
|
| 43 |
correct = metrics.get("correct")
|
|
|
|
| 66 |
"Batch size": batch_size,
|
| 67 |
"GPU": gpu_type,
|
| 68 |
"Accuracy(%)": pct(acc),
|
| 69 |
+
"Cost($)": cost,
|
| 70 |
"Decoding T/s": f2(metrics.get("decoding_throughput")),
|
| 71 |
"Prefill T/s": f2(metrics.get("prefill_tp")),
|
| 72 |
"Prefill<br>S-MBU(%)": pct(metrics.get("prefill_smbu")),
|
|
|
|
| 303 |
"- Batch Size \n"
|
| 304 |
"- GPU Type \n"
|
| 305 |
"- Accuracy (%) \n"
|
| 306 |
+
"- Cost ($) \n"
|
| 307 |
"- Decoding Throughput (tokens/s) \n"
|
| 308 |
"- Prefill Throughput (tokens/s) \n"
|
| 309 |
"- Prefill S-MBU (%) \n"
|
|
|
|
| 387 |
outputs=[leaderboard_output],
|
| 388 |
)
|
| 389 |
|
| 390 |
+
timer = gr.Timer(60.0)
|
| 391 |
timer.tick(
|
| 392 |
fn=auto_refresh_from_dir,
|
| 393 |
inputs=[dir_path, task_filter, framework_filter, model_type_filter, precision_filter],
|