chore(release): prep v0.8.51 — Arcee provider, cycle removal, UI fixes

Release-preparation checkpoint for v0.8.51 (workspace + npm bumped to 0.8.51).

Added:
- Arcee AI direct provider: [providers.arcee], ARCEE_API_KEY/BASE_URL/MODEL, CLI auth, provider + model picker, registry. Default direct-API model is trinity-large-thinking (reasoning, 262K ctx/out); preview + mini selectable. Cloudflare-WAF-safe opening turn (benign read-only tool surface, system-prompt payload splitting) and reasoning_content replay on tool-call turns.
- Expanded model catalog (qwen3.6 flash/plus/max-preview, Xiaomi MiMo v2.5 chat/ASR/TTS); provider-aware model picker with per-provider saved models.

Changed:
- Auto-compaction is percentage- and model-aware (compaction_threshold_for_model_at_percent; default 80%; auto-enable for <=256K windows, opt-in for 1M models).
- Provider/gateway HTTP errors sanitized (HTML/WAF interstitials collapsed, 401/403 split into authentication vs authorization).

Removed:
- The session cycle / checkpoint-restart system: /cycles, /cycle, /recall, recall_archive tool, cycle_manager, cycle-handoff prompt, sidebar cycle lines, EngineConfig.cycle / Event::CycleAdvanced / seam cycle thresholds.

Fixed:
- Orphaned assistant 'blue dot' role glyph on whitespace-only turns.
- Sidebar mouse-wheel scroll leaking into the transcript.
- Sidebar hover tooltip overlap + warning-orange styling.
- README Constitution description corrected to match prompts/base.md.
- Repaired release-blocking unit/integration tests after the refactors.

Preflight: cargo fmt clean, workspace builds, 3903 tui tests pass (1 known flaky MCP SSE test under parallel load, passes in isolation).
2026-06-02 17:36:18 -07:00
parent 8eca757633
commit 06612495fc
67 changed files with 2965 additions and 3201 deletions
@@ -45,13 +45,14 @@ base_url = "https://api.deepseek.com/beta"
 #   deepseek-ai/deepseek-v4-flash   — default AtlasCloud model ID
 #   deepseek-reasoner               — default Wanjie Ark model ID
 #   mimo-v2.5-pro                   — default Xiaomi MiMo model ID
-#   mimo-v2.5-tts                   ? Xiaomi MiMo speech/TTS model ID
-#   mimo-v2.5-tts-voicedesign       ? Xiaomi MiMo voice-design TTS model ID
-#   mimo-v2.5-tts-voiceclone        ? Xiaomi MiMo voice-clone TTS model ID
+#   mimo-v2.5                       — Xiaomi MiMo V2.5 Omni model ID
+#   mimo-v2.5-tts                   — Xiaomi MiMo speech/TTS model ID
+#   mimo-v2.5-tts-voicedesign       — Xiaomi MiMo voice-design TTS model ID
+#   mimo-v2.5-tts-voiceclone        — Xiaomi MiMo voice-clone TTS model ID
 #   accounts/fireworks/models/deepseek-v4-pro — Fireworks AI Pro model ID
 #   deepseek-ai/DeepSeek-V4-Pro      — SiliconFlow hosted Pro model ID
 #   deepseek-ai/DeepSeek-V4-Flash    — SiliconFlow hosted Flash model ID
-#   trinity-mini                     — default direct Arcee AI API model ID
+#   trinity-large-thinking           — default direct Arcee AI API model ID
 #   trinity-large-preview            — direct Arcee AI API model ID
 #   deepseek-ai/DeepSeek-V4-Pro      — SGLang self-hosted Pro model ID
 #   deepseek-ai/DeepSeek-V4-Flash    — SGLang self-hosted Flash model ID
@@ -304,7 +305,8 @@ max_subagents = 10 # optional (1-20)
 # base_url = "https://openrouter.ai/api/v1"
 # model = "deepseek/deepseek-v4-pro"
 # Recent large model IDs also accepted here include arcee-ai/trinity-large-thinking,
-# xiaomi/mimo-v2.5-pro, qwen/qwen3.6-35b-a3b,
+# xiaomi/mimo-v2.5-pro, qwen/qwen3.6-flash, qwen/qwen3.6-35b-a3b,
+# qwen/qwen3.6-max-preview, qwen/qwen3.6-27b, qwen/qwen3.6-plus,
 # google/gemma-4-31b-it, z-ai/glm-5.1, moonshotai/kimi-k2.6, and
 # nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free.

@@ -313,6 +315,7 @@ max_subagents = 10 # optional (1-20)
 # api_key = "YOUR_XIAOMI_KEY"
 # base_url = "https://api.xiaomimimo.com/v1"
 # model = "mimo-v2.5-pro"              # chat/reasoning
+# Chat model IDs: mimo-v2.5-pro, mimo-v2.5
 # TTS aliases are also accepted by `codewhale speech`: tts, voice-design, voice-clone
 # TTS model IDs: mimo-v2.5-tts, mimo-v2.5-tts-voicedesign, mimo-v2.5-tts-voiceclone, mimo-v2-tts

@@ -338,7 +341,7 @@ max_subagents = 10 # optional (1-20)
 [providers.arcee]
 # api_key = "YOUR_ARCEE_API_KEY"
 # base_url = "https://api.arcee.ai/api/v1"
-# model = "trinity-mini"                    # or trinity-large-preview
+# model = "trinity-large-thinking"          # or trinity-large-preview, trinity-mini

 # Moonshot/Kimi OpenAI-compatible endpoint (https://platform.moonshot.ai)
 [providers.moonshot]
@@ -510,7 +513,7 @@ exponential_base = 2.0
 # ─────────────────────────────────────────────────────────────────────────────────
 # Auto-compaction is a saved UI setting edited with `/config` (`auto_compact`).
 # The optional saved threshold setting is `auto_compact_threshold_percent`
-# (default 70, still gated by the 500K-token floor). There is no config-file
+# (default 80; auto-enabled for <=256K context windows, opt-in for 1M models). There is no config-file
 # `[compaction]` table yet; runtime compaction budgets are chosen by the TUI
 # from the active model/context window.

@@ -524,9 +527,6 @@ verbatim_window_turns = 16
 l1_threshold = 192000
 l2_threshold = 384000
 l3_threshold = 576000
-# Hard cycle reserves the normal 262144-token internal turn budget plus 1024
-# safety tokens, separate from V4's official 384000 max-output metadata.
-cycle_threshold = 768000
 seam_model = "deepseek-v4-flash"

 # ─────────────────────────────────────────────────────────────────────────────────