diff --git a/.github/workflows/integration-runner.yml b/.github/workflows/integration-runner.yml index 63cb881303..f2d2e45561 100644 --- a/.github/workflows/integration-runner.yml +++ b/.github/workflows/integration-runner.yml @@ -22,7 +22,7 @@ on: model_ids: description: >- Comma-separated model IDs to test (from resolve_model_config.py). - Example: claude-sonnet-4-5-20250929,glm-4.7. Defaults to a standard set. + Example: claude-sonnet-4-6,glm-4.7. Defaults to a standard set. required: false default: '' type: string @@ -50,7 +50,7 @@ on: env: N_PROCESSES: 4 # Global configuration for number of parallel processes for evaluation # Default models for scheduled/label-triggered runs (subset of models from resolve_model_config.py) - DEFAULT_MODEL_IDS: claude-sonnet-4-5-20250929,deepseek-v3.2-reasoner,kimi-k2-thinking,gemini-3-pro + DEFAULT_MODEL_IDS: claude-sonnet-4-6,deepseek-v3.2-reasoner,kimi-k2-thinking,gemini-3-pro jobs: setup-matrix: @@ -215,7 +215,7 @@ jobs: (github.event_name == 'schedule' && github.repository == 'OpenHands/software-agent-sdk') ) && needs.setup-matrix.result == 'success' needs: [setup-matrix, post-label-comment, post-dispatch-comment] - runs-on: ubuntu-22.04 + runs-on: blacksmith-4vcpu-ubuntu-2204 permissions: contents: read id-token: write @@ -367,7 +367,7 @@ jobs: github.event_name == 'workflow_dispatch' || (github.event_name == 'schedule' && github.repository == 'OpenHands/software-agent-sdk') ) - runs-on: ubuntu-24.04 + runs-on: blacksmith-2vcpu-ubuntu-2404 permissions: contents: read pull-requests: write diff --git a/openhands-sdk/openhands/sdk/llm/utils/model_features.py b/openhands-sdk/openhands/sdk/llm/utils/model_features.py index d454f5aa88..3f16b9c8ab 100644 --- a/openhands-sdk/openhands/sdk/llm/utils/model_features.py +++ b/openhands-sdk/openhands/sdk/llm/utils/model_features.py @@ -71,6 +71,7 @@ class ModelFeatures: # Anthropic Opus 4.5 and 4.6 "claude-opus-4-5", "claude-opus-4-6", + "claude-sonnet-4-6", # Nova 2 Lite "nova-2-lite", ] @@ -96,6 +97,7 @@ class ModelFeatures: "claude-haiku-4-5", "claude-opus-4-5", "claude-opus-4-6", + "claude-sonnet-4-6", ] # Models that support a top-level prompt_cache_retention parameter