chore(release): prep v0.8.51 — Arcee provider, cycle removal, UI fixes

Release-preparation checkpoint for v0.8.51 (workspace + npm bumped to 0.8.51).

Added:
- Arcee AI direct provider: [providers.arcee], ARCEE_API_KEY/BASE_URL/MODEL,
  CLI auth, provider + model picker, registry. Default direct-API model is
  trinity-large-thinking (reasoning, 262K ctx/out); preview + mini selectable.
  Cloudflare-WAF-safe opening turn (benign read-only tool surface, system-prompt
  payload splitting) and reasoning_content replay on tool-call turns.
- Expanded model catalog (qwen3.6 flash/plus/max-preview, Xiaomi MiMo v2.5
  chat/ASR/TTS); provider-aware model picker with per-provider saved models.

Changed:
- Auto-compaction is percentage- and model-aware
  (compaction_threshold_for_model_at_percent; default 80%; auto-enable for
  <=256K windows, opt-in for 1M models).
- Provider/gateway HTTP errors sanitized (HTML/WAF interstitials collapsed,
  401/403 split into authentication vs authorization).

Removed:
- The session cycle / checkpoint-restart system: /cycles, /cycle, /recall,
  recall_archive tool, cycle_manager, cycle-handoff prompt, sidebar cycle lines,
  EngineConfig.cycle / Event::CycleAdvanced / seam cycle thresholds.

Fixed:
- Orphaned assistant 'blue dot' role glyph on whitespace-only turns.
- Sidebar mouse-wheel scroll leaking into the transcript.
- Sidebar hover tooltip overlap + warning-orange styling.
- README Constitution description corrected to match prompts/base.md.
- Repaired release-blocking unit/integration tests after the refactors.

Preflight: cargo fmt clean, workspace builds, 3903 TUI tests pass (one known
flaky MCP SSE test can fail under parallel load but passes in isolation).
This commit is contained in:
Hunter Bown
2026-06-02 17:36:18 -07:00
parent 8eca757633
commit 06612495fc
67 changed files with 2965 additions and 3201 deletions
+10 -10
View File
@@ -45,13 +45,14 @@ base_url = "https://api.deepseek.com/beta"
# deepseek-ai/deepseek-v4-flash — default AtlasCloud model ID
# deepseek-reasoner — default Wanjie Ark model ID
# mimo-v2.5-pro — default Xiaomi MiMo model ID
# mimo-v2.5-tts ? Xiaomi MiMo speech/TTS model ID
# mimo-v2.5-tts-voicedesign ? Xiaomi MiMo voice-design TTS model ID
# mimo-v2.5-tts-voiceclone ? Xiaomi MiMo voice-clone TTS model ID
# mimo-v2.5 — Xiaomi MiMo V2.5 Omni model ID
# mimo-v2.5-tts — Xiaomi MiMo speech/TTS model ID
# mimo-v2.5-tts-voicedesign — Xiaomi MiMo voice-design TTS model ID
# mimo-v2.5-tts-voiceclone — Xiaomi MiMo voice-clone TTS model ID
# accounts/fireworks/models/deepseek-v4-pro — Fireworks AI Pro model ID
# deepseek-ai/DeepSeek-V4-Pro — SiliconFlow hosted Pro model ID
# deepseek-ai/DeepSeek-V4-Flash — SiliconFlow hosted Flash model ID
# trinity-mini — default direct Arcee AI API model ID
# trinity-large-thinking — default direct Arcee AI API model ID
# trinity-large-preview — direct Arcee AI API model ID
# deepseek-ai/DeepSeek-V4-Pro — SGLang self-hosted Pro model ID
# deepseek-ai/DeepSeek-V4-Flash — SGLang self-hosted Flash model ID
@@ -304,7 +305,8 @@ max_subagents = 10 # optional (1-20)
# base_url = "https://openrouter.ai/api/v1"
# model = "deepseek/deepseek-v4-pro"
# Recent large model IDs also accepted here include arcee-ai/trinity-large-thinking,
# xiaomi/mimo-v2.5-pro, qwen/qwen3.6-35b-a3b,
# xiaomi/mimo-v2.5-pro, qwen/qwen3.6-flash, qwen/qwen3.6-35b-a3b,
# qwen/qwen3.6-max-preview, qwen/qwen3.6-27b, qwen/qwen3.6-plus,
# google/gemma-4-31b-it, z-ai/glm-5.1, moonshotai/kimi-k2.6, and
# nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free.
@@ -313,6 +315,7 @@ max_subagents = 10 # optional (1-20)
# api_key = "YOUR_XIAOMI_KEY"
# base_url = "https://api.xiaomimimo.com/v1"
# model = "mimo-v2.5-pro" # chat/reasoning
# Chat model IDs: mimo-v2.5-pro, mimo-v2.5
# TTS aliases are also accepted by `codewhale speech`: tts, voice-design, voice-clone
# TTS model IDs: mimo-v2.5-tts, mimo-v2.5-tts-voicedesign, mimo-v2.5-tts-voiceclone, mimo-v2-tts
@@ -338,7 +341,7 @@ max_subagents = 10 # optional (1-20)
[providers.arcee]
# api_key = "YOUR_ARCEE_API_KEY"
# base_url = "https://api.arcee.ai/api/v1"
# model = "trinity-mini" # or trinity-large-preview
# model = "trinity-large-thinking" # or trinity-large-preview
# Moonshot/Kimi OpenAI-compatible endpoint (https://platform.moonshot.ai)
[providers.moonshot]
@@ -510,7 +513,7 @@ exponential_base = 2.0
# ─────────────────────────────────────────────────────────────────────────────────
# Auto-compaction is a saved UI setting edited with `/config` (`auto_compact`).
# The optional saved threshold setting is `auto_compact_threshold_percent`
# (default 70, still gated by the 500K-token floor). There is no config-file
# (default 80). There is no config-file
# `[compaction]` table yet; runtime compaction budgets are chosen by the TUI
# from the active model/context window.
@@ -524,9 +527,6 @@ verbatim_window_turns = 16
l1_threshold = 192000
l2_threshold = 384000
l3_threshold = 576000
# Hard cycle reserves the normal 262144-token internal turn budget plus 1024
# safety tokens, separate from V4's official 384000 max-output metadata.
cycle_threshold = 768000
seam_model = "deepseek-v4-flash"
# ─────────────────────────────────────────────────────────────────────────────────