From edd28066e1f2916094f93ecd1b84bdf8e7b4ce67 Mon Sep 17 00:00:00 2001 From: Hunter B Date: Mon, 8 Jun 2026 06:47:21 -0700 Subject: [PATCH] =?UTF-8?q?chore(release):=20v0.8.54=20=E2=80=94=20benchma?= =?UTF-8?q?rk=20harness=20runners,=20MiMo=20routing?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- CHANGELOG.md | 15 ++++++++++++++- Cargo.lock | 30 +++++++++++++++--------------- Cargo.toml | 2 +- crates/agent/Cargo.toml | 2 +- crates/app-server/Cargo.toml | 18 +++++++++--------- crates/cli/Cargo.toml | 16 ++++++++-------- crates/config/Cargo.toml | 4 ++-- crates/core/Cargo.toml | 16 ++++++++-------- crates/execpolicy/Cargo.toml | 2 +- crates/hooks/Cargo.toml | 2 +- crates/tools/Cargo.toml | 2 +- crates/tui/CHANGELOG.md | 15 ++++++++++++++- crates/tui/Cargo.toml | 10 +++++----- npm/codewhale/package.json | 4 ++-- 14 files changed, 82 insertions(+), 56 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index dec9b971..3e53b09a 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -7,6 +7,18 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ## [Unreleased] +## [0.8.54] - 2026-06-08 + +### Added + +- **Benchmark harness runners.** Added CodeWhale-native benchmark entry points for SWE-bench, Terminal-Bench, and PinchBench, plus a local PinchBench runner that can grade tool-use traces with an LLM judge. +- **Direct MiMo benchmark routing.** The benchmark runner now defaults to direct Xiaomi MiMo v2.5 Pro routing when configured, while keeping provider/model selection explicit. + +### Fixed + +- **Benchmark workspace copying.** Fixed benchmark workspace file copying so local benchmark tasks can preserve their intended file layout during agent runs. +- **MiMo default tests.** Guarded Xiaomi MiMo default-model tests against ambient CI provider environment variables. + ## [0.8.53] - 2026-06-03 ### Added @@ -5411,7 +5423,8 @@ Welcome — and thank you. - Hooks system and config profiles - Example skills and launch assets -[Unreleased]: https://github.com/Hmbown/CodeWhale/compare/v0.8.53...HEAD +[Unreleased]: https://github.com/Hmbown/CodeWhale/compare/v0.8.54...HEAD +[0.8.54]: https://github.com/Hmbown/CodeWhale/compare/v0.8.53...v0.8.54 [0.8.53]: https://github.com/Hmbown/CodeWhale/compare/v0.8.52...v0.8.53 [0.8.52]: https://github.com/Hmbown/CodeWhale/compare/v0.8.51...v0.8.52 [0.8.51]: https://github.com/Hmbown/CodeWhale/compare/v0.8.50...v0.8.51 diff --git a/Cargo.lock b/Cargo.lock index 139ac2a7..a10841c7 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -803,7 +803,7 @@ checksum = "e9b18233253483ce2f65329a24072ec414db782531bdbb7d0bbc4bd2ce6b7e21" [[package]] name = "codewhale-agent" -version = "0.8.53" +version = "0.8.54" dependencies = [ "codewhale-config", "serde", @@ -811,7 +811,7 @@ dependencies = [ [[package]] name = "codewhale-app-server" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "axum", @@ -836,7 +836,7 @@ dependencies = [ [[package]] name = "codewhale-cli" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "chrono", @@ -863,7 +863,7 @@ dependencies = [ [[package]] name = "codewhale-config" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "codewhale-execpolicy", @@ -877,7 +877,7 @@ dependencies = [ [[package]] name = "codewhale-core" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "chrono", @@ -895,7 +895,7 @@ dependencies = [ [[package]] name = "codewhale-execpolicy" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "codewhale-protocol", @@ -904,7 +904,7 @@ dependencies = [ [[package]] name = "codewhale-hooks" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "async-trait", @@ -918,7 +918,7 @@ dependencies = [ [[package]] name = "codewhale-mcp" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "serde", @@ -927,7 +927,7 @@ dependencies = [ [[package]] name = "codewhale-protocol" -version = "0.8.53" +version = "0.8.54" dependencies = [ "serde", "serde_json", @@ -935,7 +935,7 @@ dependencies = [ [[package]] name = "codewhale-release" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "reqwest", @@ -946,7 +946,7 @@ dependencies = [ [[package]] name = "codewhale-secrets" -version = "0.8.53" +version = "0.8.54" dependencies = [ "dirs", "keyring", @@ -959,7 +959,7 @@ dependencies = [ [[package]] name = "codewhale-state" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "chrono", @@ -971,7 +971,7 @@ dependencies = [ [[package]] name = "codewhale-tools" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "async-trait", @@ -985,7 +985,7 @@ dependencies = [ [[package]] name = "codewhale-tui" -version = "0.8.53" +version = "0.8.54" dependencies = [ "anyhow", "arboard", @@ -1054,7 +1054,7 @@ dependencies = [ [[package]] name = "codewhale-tui-core" -version = "0.8.53" +version = "0.8.54" [[package]] name = "colorchoice" diff --git a/Cargo.toml b/Cargo.toml index 32f94939..73a4dd53 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -20,7 +20,7 @@ default-members = ["crates/cli", "crates/app-server", "crates/tui"] resolver = "2" [workspace.package] -version = "0.8.53" +version = "0.8.54" edition = "2024" # Rust 1.88 stabilized `let_chains` in `if`/`while` conditions, which the # codebase relies on extensively. Cargo enforces this so users on older diff --git a/crates/agent/Cargo.toml b/crates/agent/Cargo.toml index 5e563534..ba9c851a 100644 --- a/crates/agent/Cargo.toml +++ b/crates/agent/Cargo.toml @@ -7,5 +7,5 @@ repository.workspace = true description = "Model/provider registry and fallback strategy for DeepSeek workspace architecture" [dependencies] -codewhale-config = { path = "../config", version = "0.8.53" } +codewhale-config = { path = "../config", version = "0.8.54" } serde.workspace = true diff --git a/crates/app-server/Cargo.toml b/crates/app-server/Cargo.toml index aa5a1cf3..941221c2 100644 --- a/crates/app-server/Cargo.toml +++ b/crates/app-server/Cargo.toml @@ -10,15 +10,15 @@ description = "Codex-style app-server transport for DeepSeek workspace architect anyhow.workspace = true axum.workspace = true clap.workspace = true -codewhale-agent = { path = "../agent", version = "0.8.53" } -codewhale-config = { path = "../config", version = "0.8.53" } -codewhale-core = { path = "../core", version = "0.8.53" } -codewhale-execpolicy = { path = "../execpolicy", version = "0.8.53" } -codewhale-hooks = { path = "../hooks", version = "0.8.53" } -codewhale-mcp = { path = "../mcp", version = "0.8.53" } -codewhale-protocol = { path = "../protocol", version = "0.8.53" } -codewhale-state = { path = "../state", version = "0.8.53" } -codewhale-tools = { path = "../tools", version = "0.8.53" } +codewhale-agent = { path = "../agent", version = "0.8.54" } +codewhale-config = { path = "../config", version = "0.8.54" } +codewhale-core = { path = "../core", version = "0.8.54" } +codewhale-execpolicy = { path = "../execpolicy", version = "0.8.54" } +codewhale-hooks = { path = "../hooks", version = "0.8.54" } +codewhale-mcp = { path = "../mcp", version = "0.8.54" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } +codewhale-state = { path = "../state", version = "0.8.54" } +codewhale-tools = { path = "../tools", version = "0.8.54" } serde.workspace = true serde_json.workspace = true tokio.workspace = true diff --git a/crates/cli/Cargo.toml b/crates/cli/Cargo.toml index 8c23f204..729b4056 100644 --- a/crates/cli/Cargo.toml +++ b/crates/cli/Cargo.toml @@ -25,14 +25,14 @@ path = "src/bin/deepseek_legacy_shim.rs" anyhow.workspace = true clap.workspace = true clap_complete.workspace = true -codewhale-agent = { path = "../agent", version = "0.8.53" } -codewhale-app-server = { path = "../app-server", version = "0.8.53" } -codewhale-config = { path = "../config", version = "0.8.53" } -codewhale-execpolicy = { path = "../execpolicy", version = "0.8.53" } -codewhale-mcp = { path = "../mcp", version = "0.8.53" } -codewhale-release = { path = "../release", version = "0.8.53" } -codewhale-secrets = { path = "../secrets", version = "0.8.53" } -codewhale-state = { path = "../state", version = "0.8.53" } +codewhale-agent = { path = "../agent", version = "0.8.54" } +codewhale-app-server = { path = "../app-server", version = "0.8.54" } +codewhale-config = { path = "../config", version = "0.8.54" } +codewhale-execpolicy = { path = "../execpolicy", version = "0.8.54" } +codewhale-mcp = { path = "../mcp", version = "0.8.54" } +codewhale-release = { path = "../release", version = "0.8.54" } +codewhale-secrets = { path = "../secrets", version = "0.8.54" } +codewhale-state = { path = "../state", version = "0.8.54" } chrono.workspace = true dirs.workspace = true serde.workspace = true diff --git a/crates/config/Cargo.toml b/crates/config/Cargo.toml index 034f988f..8f6dc5f8 100644 --- a/crates/config/Cargo.toml +++ b/crates/config/Cargo.toml @@ -8,8 +8,8 @@ description = "Config schema and precedence model for DeepSeek workspace archite [dependencies] anyhow.workspace = true -codewhale-execpolicy = { path = "../execpolicy", version = "0.8.53" } -codewhale-secrets = { path = "../secrets", version = "0.8.53" } +codewhale-execpolicy = { path = "../execpolicy", version = "0.8.54" } +codewhale-secrets = { path = "../secrets", version = "0.8.54" } dirs.workspace = true serde.workspace = true serde_json.workspace = true diff --git a/crates/core/Cargo.toml b/crates/core/Cargo.toml index b8a5cb56..dd4ddfad 100644 --- a/crates/core/Cargo.toml +++ b/crates/core/Cargo.toml @@ -9,13 +9,13 @@ description = "Core runtime boundaries for DeepSeek workspace architecture" [dependencies] anyhow.workspace = true chrono.workspace = true -codewhale-agent = { path = "../agent", version = "0.8.53" } -codewhale-config = { path = "../config", version = "0.8.53" } -codewhale-execpolicy = { path = "../execpolicy", version = "0.8.53" } -codewhale-hooks = { path = "../hooks", version = "0.8.53" } -codewhale-mcp = { path = "../mcp", version = "0.8.53" } -codewhale-protocol = { path = "../protocol", version = "0.8.53" } -codewhale-state = { path = "../state", version = "0.8.53" } -codewhale-tools = { path = "../tools", version = "0.8.53" } +codewhale-agent = { path = "../agent", version = "0.8.54" } +codewhale-config = { path = "../config", version = "0.8.54" } +codewhale-execpolicy = { path = "../execpolicy", version = "0.8.54" } +codewhale-hooks = { path = "../hooks", version = "0.8.54" } +codewhale-mcp = { path = "../mcp", version = "0.8.54" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } +codewhale-state = { path = "../state", version = "0.8.54" } +codewhale-tools = { path = "../tools", version = "0.8.54" } serde_json.workspace = true uuid.workspace = true diff --git a/crates/execpolicy/Cargo.toml b/crates/execpolicy/Cargo.toml index dfe0d1bb..670a7d75 100644 --- a/crates/execpolicy/Cargo.toml +++ b/crates/execpolicy/Cargo.toml @@ -8,5 +8,5 @@ description = "Execution policy and approval model parity for DeepSeek workspace [dependencies] anyhow.workspace = true -codewhale-protocol = { path = "../protocol", version = "0.8.53" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } serde.workspace = true diff --git a/crates/hooks/Cargo.toml b/crates/hooks/Cargo.toml index 3083a3b3..3f37af18 100644 --- a/crates/hooks/Cargo.toml +++ b/crates/hooks/Cargo.toml @@ -10,7 +10,7 @@ description = "Hook dispatch and notifications parity for DeepSeek workspace arc anyhow.workspace = true async-trait.workspace = true chrono.workspace = true -codewhale-protocol = { path = "../protocol", version = "0.8.53" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } reqwest.workspace = true serde.workspace = true serde_json.workspace = true diff --git a/crates/tools/Cargo.toml b/crates/tools/Cargo.toml index fc65af8d..91c5c449 100644 --- a/crates/tools/Cargo.toml +++ b/crates/tools/Cargo.toml @@ -9,7 +9,7 @@ description = "Tool invocation lifecycle, schema validation, and scheduler paral [dependencies] anyhow.workspace = true async-trait.workspace = true -codewhale-protocol = { path = "../protocol", version = "0.8.53" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } serde.workspace = true serde_json.workspace = true thiserror.workspace = true diff --git a/crates/tui/CHANGELOG.md b/crates/tui/CHANGELOG.md index dec9b971..3e53b09a 100644 --- a/crates/tui/CHANGELOG.md +++ b/crates/tui/CHANGELOG.md @@ -7,6 +7,18 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ## [Unreleased] +## [0.8.54] - 2026-06-08 + +### Added + +- **Benchmark harness runners.** Added CodeWhale-native benchmark entry points for SWE-bench, Terminal-Bench, and PinchBench, plus a local PinchBench runner that can grade tool-use traces with an LLM judge. +- **Direct MiMo benchmark routing.** The benchmark runner now defaults to direct Xiaomi MiMo v2.5 Pro routing when configured, while keeping provider/model selection explicit. + +### Fixed + +- **Benchmark workspace copying.** Fixed benchmark workspace file copying so local benchmark tasks can preserve their intended file layout during agent runs. +- **MiMo default tests.** Guarded Xiaomi MiMo default-model tests against ambient CI provider environment variables. + ## [0.8.53] - 2026-06-03 ### Added @@ -5411,7 +5423,8 @@ Welcome — and thank you. - Hooks system and config profiles - Example skills and launch assets -[Unreleased]: https://github.com/Hmbown/CodeWhale/compare/v0.8.53...HEAD +[Unreleased]: https://github.com/Hmbown/CodeWhale/compare/v0.8.54...HEAD +[0.8.54]: https://github.com/Hmbown/CodeWhale/compare/v0.8.53...v0.8.54 [0.8.53]: https://github.com/Hmbown/CodeWhale/compare/v0.8.52...v0.8.53 [0.8.52]: https://github.com/Hmbown/CodeWhale/compare/v0.8.51...v0.8.52 [0.8.51]: https://github.com/Hmbown/CodeWhale/compare/v0.8.50...v0.8.51 diff --git a/crates/tui/Cargo.toml b/crates/tui/Cargo.toml index 6a577538..0539dad5 100644 --- a/crates/tui/Cargo.toml +++ b/crates/tui/Cargo.toml @@ -27,11 +27,11 @@ path = "src/bin/deepseek_tui_legacy_shim.rs" [dependencies] anyhow = "1.0.100" arboard = "3.4" -codewhale-config = { path = "../config", version = "0.8.53" } -codewhale-protocol = { path = "../protocol", version = "0.8.53" } -codewhale-release = { path = "../release", version = "0.8.53" } -codewhale-secrets = { path = "../secrets", version = "0.8.53" } -codewhale-tools = { path = "../tools", version = "0.8.53" } +codewhale-config = { path = "../config", version = "0.8.54" } +codewhale-protocol = { path = "../protocol", version = "0.8.54" } +codewhale-release = { path = "../release", version = "0.8.54" } +codewhale-secrets = { path = "../secrets", version = "0.8.54" } +codewhale-tools = { path = "../tools", version = "0.8.54" } schemaui = { version = "0.12.0", default-features = false, optional = true } async-stream = "0.3.6" async-trait = "0.1" diff --git a/npm/codewhale/package.json b/npm/codewhale/package.json index 7209b6dc..e8b0af37 100644 --- a/npm/codewhale/package.json +++ b/npm/codewhale/package.json @@ -1,7 +1,7 @@ { "name": "codewhale", - "version": "0.8.53", - "codewhaleBinaryVersion": "0.8.53", + "version": "0.8.54", + "codewhaleBinaryVersion": "0.8.54", "description": "Install and run CodeWhale, the agentic terminal for open-source and open-weight coding models, from GitHub release artifacts.", "author": "Hmbown", "license": "MIT",