{#
  Benchmark detail page.

  Extends "ui/base_ui.html" and overrides two blocks:
    - title:   the benchmark name followed by " - ATP Platform"
    - content: the benchmark description, then three tables (tests, runs,
               per-agent ranking), each followed by an empty-state message.

  NOTE(review): as this file stands, each of the four `endif` tags below has
  no visible opening `if`, and the row variables `test`, `run`, `entry` and
  `loop.index` are used without a visible enclosing `for`. The opening tags
  (and any matching `else` / `endfor`) look like they were lost together with
  the HTML markup; restore them from the original template before use.

  Comments in this file close with a leading minus so the newline that
  follows them is stripped and the rendered output is unchanged.
-#}
{% extends "ui/base_ui.html" %} {% block title %}{{ benchmark.name }} - ATP Platform{% endblock %} {% block content %}
{# Benchmark description. NOTE(review): the `endif` on the next line suggests this was wrapped in a conditional; the condition is not visible here. -#}
{{ benchmark.description }}
{% endif %}| ID | Name | Description | Assertions |
|---|---|---|---|
{# Test row: the task description is cut to its first 80 characters, with "..." appended only when the full text is longer than 80; the last cell is the number of assertions. NOTE(review): `test` is presumably a loop variable; the loop is not visible. -#}
| {{ test.id }} | {{ test.name }} | {{ test.task.description[:80] }}{% if test.task.description|length > 80 %}...{% endif %} | {{ test.assertions|length }} |
{# Empty-state text for the tests table. NOTE(review): presumably the alternative branch of a missing conditional. -#}
No tests defined.
{% endif %}| Run | Agent | Status | Score | Date |
|---|---|---|---|---|
{# Run row: a falsy agent name renders as an em dash; the score is shown with one decimal unless `total_score` is none; the start time is formatted as "YYYY-MM-DD HH:MM" when `started_at` is truthy. NOTE(review): `run` is presumably a loop variable; the loop is not visible. -#}
| #{{ run.id }} | {{ run.agent_name or "—" }} | {{ run.status }} | {% if run.total_score is not none %}{{ "%.1f"|format(run.total_score) }}{% else %}—{% endif %} | {% if run.started_at %}{{ run.started_at.strftime("%Y-%m-%d %H:%M") }}{% else %}—{% endif %} |
{# Empty-state text for the runs table. NOTE(review): presumably the alternative branch of a missing conditional. -#}
No runs yet.
{% endif %}| # | Agent | Best Score | Runs |
|---|---|---|---|
{# Ranking row: `loop.index` is Jinja's 1-based loop counter, so this line only works inside a `for` loop (not visible here). Because of `or 0`, a none or otherwise falsy `best_score` is displayed as 0.0. -#}
| {{ loop.index }} | {{ entry.agent_name }} | {{ "%.1f"|format(entry.best_score or 0) }} | {{ entry.run_count }} |
{# Empty-state text for the ranking table. NOTE(review): presumably the alternative branch of a missing conditional. -#}
No completed runs yet.
{% endif %} {% endblock %}