Skip to content

Commit b224716

Browse files
chore: upgrade claude model to opus 4.6
1 parent d44c1f2 commit b224716

4 files changed

Lines changed: 6 additions & 6 deletions

File tree

README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@ FinBench is a professional LLM benchmarking tool for evaluating the capabilities
1919
| DeepSeek | deepseek-chat | api.deepseek.com |
2020
| Qwen | qwen3-max | dashscope.aliyuncs.com |
2121
| OpenAI | gpt-5.2 | api.openai.com |
22-
| Claude | claude-opus-4-5-20251101 | api.anthropic.com |
22+
| Claude | claude-opus-4-6 | api.anthropic.com |
2323
| Gemini | gemini-3-pro-preview | generativelanguage.googleapis.com |
2424
| Grok | grok-3-latest | api.x.ai |
2525
| Kimi | moonshot-v1-auto | api.moonshot.ai |

benchmark/models.go

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@ const (
2727
DefaultDeepSeekModel = "deepseek-chat" // nofx/mcp/deepseek_client.go:10
2828
DefaultQwenModel = "qwen3-max" // nofx/mcp/qwen_client.go:10
2929
DefaultOpenAIModel = "gpt-5.2" // nofx/mcp/openai_client.go:10
30-
DefaultClaudeModel = "claude-opus-4-5-20251101" // nofx/mcp/claude_client.go:12
30+
DefaultClaudeModel = "claude-opus-4-6" // nofx/mcp/claude_client.go:12
3131
DefaultGeminiModel = "gemini-3-pro-preview" // nofx/mcp/gemini_client.go:10
3232
DefaultGrokModel = "grok-3-latest" // nofx/mcp/grok_client.go:10
3333
DefaultKimiModel = "moonshot-v1-auto" // nofx/mcp/kimi_client.go:10
@@ -71,7 +71,7 @@ func GetDefaultModels() []ModelInfo {
7171
{
7272
Provider: ProviderClaude,
7373
Model: DefaultClaudeModel,
74-
DisplayName: "Claude-Opus-4.5",
74+
DisplayName: "Claude-Opus-4.6",
7575
BaseURL: DefaultClaudeBaseURL,
7676
},
7777
{

config.template.json

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -19,9 +19,9 @@
1919
"api_key": "YOUR_OPENAI_API_KEY"
2020
},
2121
{
22-
"name": "Claude-Opus-4.5",
22+
"name": "Claude-Opus-4.6",
2323
"provider": "claude",
24-
"model": "claude-opus-4-5-20251101",
24+
"model": "claude-opus-4-6",
2525
"api_key": "YOUR_CLAUDE_API_KEY"
2626
},
2727
{

docs/plans/2025-01-22-finbench-design.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -38,7 +38,7 @@ FinBench supports 7 major LLM providers, aligned with the nofx trading system.
3838
| DeepSeek | deepseek-chat | nofx/mcp/deepseek_client.go:10 |
3939
| Qwen | qwen3-max | nofx/mcp/qwen_client.go:10 |
4040
| OpenAI | gpt-5.2 | nofx/mcp/openai_client.go:10 |
41-
| Claude | claude-opus-4-5-20251101 | nofx/mcp/claude_client.go:12 |
41+
| Claude | claude-opus-4-6 | nofx/mcp/claude_client.go:12 |
4242
| Gemini | gemini-3-pro-preview | nofx/mcp/gemini_client.go:10 |
4343
| Grok | grok-3-latest | nofx/mcp/grok_client.go:10 |
4444
| Kimi | moonshot-v1-auto | nofx/mcp/kimi_client.go:10 |

0 commit comments

Comments
 (0)