Commit
·
32636cd
1
Parent(s):
d5645ee
update to new file ref
Browse files
app.py
CHANGED
|
@@ -283,7 +283,7 @@ with demo:
|
|
| 283 |
)
|
| 284 |
gr.Markdown("### Visualization")
|
| 285 |
gr.Markdown("This figure presents a fine-grained heatmap illustrating task-level completion across different agents. Each row corresponds to a specific agent, and each column represents a task (identified by its task ID). Blue bars indicate successful completions, while white spaces denote failures. Any agent: A task is considered successful if at least one agent is able to complete it. (This style of visualization is inspired by [HAL](https://hal.cs.princeton.edu/).)")
|
| 286 |
-
fig = plot_heatmap_with_performance_bar("./
|
| 287 |
gr.Plot(fig)
|
| 288 |
gr.Markdown(EVALUATION_DETAILS)
|
| 289 |
|
|
|
|
| 283 |
)
|
| 284 |
gr.Markdown("### Visualization")
|
| 285 |
gr.Markdown("This figure presents a fine-grained heatmap illustrating task-level completion across different agents. Each row corresponds to a specific agent, and each column represents a task (identified by its task ID). Blue bars indicate successful completions, while white spaces denote failures. Any agent: A task is considered successful if at least one agent is able to complete it. (This style of visualization is inspired by [HAL](https://hal.cs.princeton.edu/).)")
|
| 286 |
+
fig = plot_heatmap_with_performance_bar("./human_label_082325.json")
|
| 287 |
gr.Plot(fig)
|
| 288 |
gr.Markdown(EVALUATION_DETAILS)
|
| 289 |
|