OpenHands · simonrosenberg · Dec 2, 2025 · Nov 25, 2025 · Nov 25, 2025 · Nov 25, 2025
diff --git a/.github/run-eval/allowed-model-stubs.json b/.github/run-eval/allowed-model-stubs.json
diff --git a/.github/run-eval/authorized-labelers.txt b/.github/run-eval/authorized-labelers.txt
diff --git a/.github/run-eval/resolve_model_config.py b/.github/run-eval/resolve_model_config.py
@@ -0,0 +1,112 @@
+#!/usr/bin/env python3
+"""
+Resolve model IDs to full model configurations.
+
+Reads:
+- MODEL_IDS: comma-separated model IDs
+
+Outputs to GITHUB_OUTPUT:
+- models_json: JSON array of full model configs with display names
+"""
+
+import json
+import os
+import sys
+
+
+# Model configurations dictionary
+MODELS = {
+    "claude-sonnet-4-5-20250929": {
+        "id": "claude-sonnet-4-5-20250929",
+        "display_name": "Claude Sonnet 4.5",
+        "llm_config": {
+            "model": "litellm_proxy/claude-sonnet-4-5-20250929",
+            "temperature": 0.0,
+        },
+    },
+    "claude-haiku-4-5-20251001": {
+        "id": "claude-haiku-4-5-20251001",
+        "display_name": "Claude Haiku 4.5",
+        "llm_config": {
+            "model": "litellm_proxy/claude-haiku-4-5-20251001",
+            "temperature": 0.0,
+        },
+    },
+    "gpt-5-mini-2025-08-07": {
+        "id": "gpt-5-mini-2025-08-07",
+        "display_name": "GPT-5 Mini",
+        "llm_config": {
+            "model": "litellm_proxy/gpt-5-mini-2025-08-07",
+            "temperature": 1.0,
+        },
+    },
+    "deepseek-chat": {
+        "id": "deepseek-chat",
+        "display_name": "DeepSeek Chat",
+        "llm_config": {"model": "litellm_proxy/deepseek/deepseek-chat"},
+    },
+    "kimi-k2-thinking": {
+        "id": "kimi-k2-thinking",
+        "display_name": "Kimi K2 Thinking",
+        "llm_config": {"model": "litellm_proxy/moonshot/kimi-k2-thinking"},
+    },
+}
+
+
+def error_exit(msg: str, exit_code: int = 1) -> None:
+    """Print error message and exit."""
+    print(f"ERROR: {msg}", file=sys.stderr)
+    sys.exit(exit_code)
+
+
+def get_required_env(key: str) -> str:
+    """Get required environment variable or exit with error."""
+    value = os.environ.get(key)
+    if not value:
+        error_exit(f"{key} not set")
+    return value
+
+
+def find_models_by_id(model_ids: list[str]) -> list[dict]:
+    """Find models by ID. Fails fast on missing ID.
+
+    Args:
+        model_ids: List of model IDs to find
+
+    Returns:
+        List of model dictionaries matching the IDs
+
+    Raises:
+        SystemExit: If any model ID is not found
+    """
+    resolved = []
+    for model_id in model_ids:
+        if model_id not in MODELS:
+            available = ", ".join(sorted(MODELS.keys()))
+            error_exit(
+                f"Model ID '{model_id}' not found. Available models: {available}"
+            )
+        resolved.append(MODELS[model_id])
+    return resolved
+
+
+def main() -> None:
+    model_ids_str = get_required_env("MODEL_IDS")
+    github_output = get_required_env("GITHUB_OUTPUT")
+
+    # Parse requested model IDs
+    model_ids = [mid.strip() for mid in model_ids_str.split(",") if mid.strip()]
+
+    # Resolve model configs
+    resolved = find_models_by_id(model_ids)
+
+    # Output as JSON
+    models_json = json.dumps(resolved, separators=(",", ":"))
+    with open(github_output, "a", encoding="utf-8") as f:
+        f.write(f"models_json={models_json}\n")
+
+    print(f"Resolved {len(resolved)} model(s): {', '.join(model_ids)}")
+
+
+if __name__ == "__main__":
+    main()