diff --git a/competitors.example.yaml b/competitors.example.yaml index ab624ed..ffb26f0 100644 --- a/competitors.example.yaml +++ b/competitors.example.yaml @@ -305,6 +305,15 @@ size_class: large knowledge_cutoff: 2025-06 +- name: raw-api-loop/gpt-5.5-pro + model: openai/gpt-5.5-pro + runtime: raw-api-loop + tool_profile: read-grep + auth_profile: openrouter-api-key + cost_model: '{"base_url": "https://openrouter.ai/api/v1", "input_usd_per_mtok": 30.0, "output_usd_per_mtok": 180.0}' + size_class: large + knowledge_cutoff: 2025-06 + - name: raw-api-loop/glm-5.1 model: z-ai/glm-5.1 runtime: raw-api-loop diff --git a/nelson/html_report.py b/nelson/html_report.py index d6ae1aa..c44d71a 100644 --- a/nelson/html_report.py +++ b/nelson/html_report.py @@ -997,17 +997,27 @@ def generate_leaderboard_report( '
* Partial coverage: this competitor completed fewer ' + f"than the full {full_n} cases (see the Cases column). Its detection " + "rate is therefore based on fewer audited cases and is not directly " + "rank-comparable with full-corpus competitors — read it alongside the " + "Cases count, not the rank.
" + ) # Pareto scatter plots. parts.append("