Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
59 changes: 59 additions & 0 deletions .github/workflows/run-bot-aib-tournament.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,65 @@ jobs:

# NOTE: don't remove any of the open-source models, since they are the best option for a long-term baseline (other models get deprecated)

#################################### June 2026 new bots ####################################

# Job for the METAC_CLAUDE_FABLE_5_HIGH bot.
# Waits for precache_asknews, then calls the reusable launcher workflow.
bot_claude_fable_5_high:
  needs: precache_asknews
  uses: ./.github/workflows/run-bot-launcher.yaml
  with:
    bot_name: "METAC_CLAUDE_FABLE_5_HIGH"
    metac_name: "metac-claude-fable-5-high+asknews"
    # Cache key embeds the id of the current workflow run.
    cache_key: asknews-cache-${{ github.run_id }}
  # Repository secrets forwarded to the launcher; this job passes the
  # Anthropic key in addition to the OpenRouter and AskNews credentials.
  secrets:
    INPUT_METACULUS_TOKENS: ${{ secrets.METACULUS_TOKENS }}
    INPUT_METACULUS_API_BASE_URL: ${{ secrets.METACULUS_API_BASE_URL }}
    INPUT_ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
    INPUT_ASKNEWS_CLIENT_ID: ${{ secrets.ASKNEWS_CLIENT_ID }}
    INPUT_ASKNEWS_SECRET: ${{ secrets.ASKNEWS_SECRET }}
    INPUT_OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}

# Job for the METAC_NEMOTRON_3_ULTRA bot.
# Waits for precache_asknews, then calls the reusable launcher workflow.
bot_nemotron_3_ultra:
  needs: precache_asknews
  uses: ./.github/workflows/run-bot-launcher.yaml
  with:
    bot_name: "METAC_NEMOTRON_3_ULTRA"
    metac_name: "metac-nemotron-3-ultra+asknews"
    # Cache key embeds the id of the current workflow run.
    cache_key: asknews-cache-${{ github.run_id }}
  # Repository secrets forwarded to the launcher (Metaculus, OpenRouter, AskNews).
  secrets:
    INPUT_METACULUS_TOKENS: ${{ secrets.METACULUS_TOKENS }}
    INPUT_METACULUS_API_BASE_URL: ${{ secrets.METACULUS_API_BASE_URL }}
    INPUT_OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
    INPUT_ASKNEWS_CLIENT_ID: ${{ secrets.ASKNEWS_CLIENT_ID }}
    INPUT_ASKNEWS_SECRET: ${{ secrets.ASKNEWS_SECRET }}

# Job for the METAC_QWEN_3_7_PLUS bot.
# Waits for precache_asknews, then calls the reusable launcher workflow.
bot_qwen_3_7_plus:
  needs: precache_asknews
  uses: ./.github/workflows/run-bot-launcher.yaml
  with:
    bot_name: "METAC_QWEN_3_7_PLUS"
    metac_name: "metac-qwen-3-7-plus+asknews"
    # Cache key embeds the id of the current workflow run.
    cache_key: asknews-cache-${{ github.run_id }}
  # Repository secrets forwarded to the launcher (Metaculus, OpenRouter, AskNews).
  secrets:
    INPUT_METACULUS_TOKENS: ${{ secrets.METACULUS_TOKENS }}
    INPUT_METACULUS_API_BASE_URL: ${{ secrets.METACULUS_API_BASE_URL }}
    INPUT_OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
    INPUT_ASKNEWS_CLIENT_ID: ${{ secrets.ASKNEWS_CLIENT_ID }}
    INPUT_ASKNEWS_SECRET: ${{ secrets.ASKNEWS_SECRET }}

# Job for the METAC_MINIMAX_M3 bot.
# Waits for precache_asknews, then calls the reusable launcher workflow.
bot_minimax_m3:
  needs: precache_asknews
  uses: ./.github/workflows/run-bot-launcher.yaml
  with:
    bot_name: "METAC_MINIMAX_M3"
    metac_name: "metac-minimax-m3+asknews"
    # Cache key embeds the id of the current workflow run.
    cache_key: asknews-cache-${{ github.run_id }}
  # Repository secrets forwarded to the launcher (Metaculus, OpenRouter, AskNews).
  secrets:
    INPUT_METACULUS_TOKENS: ${{ secrets.METACULUS_TOKENS }}
    INPUT_METACULUS_API_BASE_URL: ${{ secrets.METACULUS_API_BASE_URL }}
    INPUT_OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
    INPUT_ASKNEWS_CLIENT_ID: ${{ secrets.ASKNEWS_CLIENT_ID }}
    INPUT_ASKNEWS_SECRET: ${{ secrets.ASKNEWS_SECRET }}

#################################### May 2026 new bots ####################################

bot_gemini_3_5_flash:
Expand Down
42 changes: 42 additions & 0 deletions run_bots.py
Original file line number Diff line number Diff line change
Expand Up @@ -579,6 +579,48 @@ def get_default_bot_dict() -> dict[str, RunBotConfig]: # NOSONAR
}

mode_base_bot_mapping = {
############################ Bots started in June 2026 ############################
"METAC_CLAUDE_FABLE_5_HIGH": {
"estimated_cost_per_question": roughly_opus_4_5_cost * 2,
"bot": create_bot(
llm=GeneralLlm(
model="anthropic/claude-fable-5",
**claude_adaptive_thinking_settings_high,
),
),
"tournaments": TournConfig.aib_and_site + [AllowedTourn.METACULUS_CUP],
},
"METAC_NEMOTRON_3_ULTRA": {
"estimated_cost_per_question": roughly_deepseek_r1_cost,
"bot": create_bot(
llm=GeneralLlm(
model="openrouter/nvidia/nemotron-3-ultra-550b-a55b",
temperature=default_temperature,
timeout=kimi_k2_timeout,
),
),
"tournaments": TournConfig.aib_and_site,
},
"METAC_QWEN_3_7_PLUS": {
"estimated_cost_per_question": roughly_deepseek_r1_cost,
"bot": create_bot(
GeneralLlm(
model="openrouter/qwen/qwen3.7-plus",
temperature=default_temperature,
),
),
"tournaments": TournConfig.aib_and_site,
},
"METAC_MINIMAX_M3": {
"estimated_cost_per_question": roughly_deepseek_r1_cost,
"bot": create_bot(
GeneralLlm(
model="openrouter/minimax/minimax-m3",
temperature=default_temperature,
),
),
"tournaments": TournConfig.aib_and_site,
},
############################ Bots started in May 2026 ############################
"METAC_GEMINI_3_5_FLASH": {
"estimated_cost_per_question": roughly_opus_4_5_cost / 2,
Expand Down
Loading