{# Cost section: each include below renders the shared _metric_static.html partial, passing a display label plus the value, target and delta read from run_breakdown. #}
Cost
{% include "eval/components/_metric_static.html" with metric_label="Total Cost" metric_value=run_breakdown.cost metric_target=run_breakdown.target_cost metric_delta=run_breakdown.delta_cost %}
{% include "eval/components/_metric_static.html" with metric_label="Input Token Cost" metric_value=run_breakdown.cost_input metric_target=run_breakdown.target_cost_input metric_delta=run_breakdown.delta_cost_input %}
{% include "eval/components/_metric_static.html" with metric_label="Output Token Cost" metric_value=run_breakdown.cost_output metric_target=run_breakdown.target_cost_output metric_delta=run_breakdown.delta_cost_output %}
{# Token section: input, output and total token counts, each rendered through the shared _metric_static.html partial with its value, target and delta from run_breakdown. #}
Tokens
{# NOTE(review): the target below reads run_breakdown.target_tokens, while the sibling rows use target_output_tokens / target_total_tokens. Possibly meant target_input_tokens; confirm against the view that builds run_breakdown. #}
{% include "eval/components/_metric_static.html" with metric_label="Input Tokens" metric_value=run_breakdown.input_tokens metric_target=run_breakdown.target_tokens metric_delta=run_breakdown.delta_input_tok %}
{% include "eval/components/_metric_static.html" with metric_label="Output Tokens" metric_value=run_breakdown.output_tokens metric_target=run_breakdown.target_output_tokens metric_delta=run_breakdown.delta_output_tok %}
{% include "eval/components/_metric_static.html" with metric_label="Total Tokens" metric_value=run_breakdown.total_tokens metric_target=run_breakdown.target_total_tokens metric_delta=run_breakdown.delta_total_tok %}
{# Latency section: total, agent and tool latency, each rendered through the shared _metric_static.html partial with its value, target and delta from run_breakdown. #}
Latency
{% include "eval/components/_metric_static.html" with metric_label="Total Latency" metric_value=run_breakdown.latency metric_target=run_breakdown.target_latency metric_delta=run_breakdown.delta_latency %}
{% include "eval/components/_metric_static.html" with metric_label="Agent Latency" metric_value=run_breakdown.agent_latency metric_target=run_breakdown.target_agent_latency metric_delta=run_breakdown.delta_agent_latency %}
{% include "eval/components/_metric_static.html" with metric_label="Tool Latency" metric_value=run_breakdown.tool_latency metric_target=run_breakdown.target_tool_latency metric_delta=run_breakdown.delta_tool_latency %}
{# Threshold summary: rendered only when run_breakdown.threshold_total is truthy, so it is omitted when the value is 0 or absent. #}
{% if run_breakdown.threshold_total %}
{# Either a single all-pass message, or the failing count followed by "metric"/"metrics" (pluralize adds the "s" unless the count is 1). #}
{% if run_breakdown.threshold_all_pass %}All metrics within threshold ✓{% else %}{{ run_breakdown.threshold_failing }} metric{{ run_breakdown.threshold_failing|pluralize }} exceeding threshold ✗{% endif %}
{# Passing count shown as a fraction of the total. #}
{{ run_breakdown.threshold_passing }}/{{ run_breakdown.threshold_total }} passing
{% endif %}