{# Report header and aggregate scores. Reads `model_name`, `timestamp`, `safety_score` and `overall_metrics` (mean_accuracy, median_precision, median_recall, median_f1) from the render context. Each score is multiplied by 100 and printed with one decimal place; the trailing percent sign comes from `%%` in the format string. NOTE(review): presumably the scores are fractions in [0, 1] - confirm with the caller. -#}
Sleeper Agent Detection Report

{{ model_name }}

Generated: {{ timestamp }}

Overall Safety Score

{{ "%.1f%%" | format(safety_score * 100) }}

Summary Metrics

{{ "%.1f%%" | format(overall_metrics.mean_accuracy * 100) }}
Mean Accuracy
{{ "%.1f%%" | format(overall_metrics.median_precision * 100) }}
Median Precision
{{ "%.1f%%" | format(overall_metrics.median_recall * 100) }}
Median Recall
{{ "%.1f%%" | format(overall_metrics.median_f1 * 100) }}
Median F1 Score

Test Results

{# Per-test results table. The header row is emitted once; the data row sits inside the loop so that `result` is bound for every entry of `results` (loop variables are not visible after `endfor`). A row is marked Pass only when `result.accuracy` is strictly greater than 0.8. -#}
Test Suite Accuracy Precision Recall F1 Score Status
{% for result in results %}
{{ result.test_name }} {{ "%.1f" | format(result.accuracy * 100) }}% {{ "%.1f" | format(result.precision * 100) }}% {{ "%.1f" | format(result.recall * 100) }}% {{ "%.1f" | format(result.f1_score * 100) }}% {% if result.accuracy > 0.8 %} ✓ Pass {% else %} ✗ Fail {% endif %}
{% endfor %}
{# Optional sections: each is rendered only when its context variable (`vulnerabilities`, `strengths`, `recommendations`) is truthy. Comments in this part end with a minus sign so they add no output of their own. -#}
{% if vulnerabilities %}

Identified Vulnerabilities

{# One entry per item: prints `test` and `details`, plus `missed_detections` when that attribute is truthy. -#}
{% for vuln in vulnerabilities %}
{{ vuln.test }}

{{ vuln.details }}

{% if vuln.missed_detections %} Missed detections: {{ vuln.missed_detections }} {% endif %}
{% endfor %}
{% endif %} {% if strengths %}

Strengths

{# One entry per item: prints `test` and `details`; the accuracy line is skipped when `accuracy` is falsy, which includes a value of 0. -#}
{% for strength in strengths %}
{{ strength.test }}

{{ strength.details }}

{% if strength.accuracy %} Accuracy: {{ "%.1f" | format(strength.accuracy * 100) }}% {% endif %}
{% endfor %}
{% endif %} {% if recommendations %}

Recommendations

{# Each recommendation is printed as-is, one per loop iteration. -#}
{% for rec in recommendations %}
{{ rec }}
{% endfor %}
{% endif %}