Add new TTS/STT Logic

This commit is contained in:
2026-05-16 19:55:51 +02:00
parent a13af83655
commit 5df8f6cf1e
2 changed files with 17 additions and 8 deletions

View File

@@ -199,10 +199,12 @@ export function OnboardingWizard({
 agentName: "Assistant",
 soulMd: FALLBACK_SOUL.replace("{company}", displayOrgName),
 agentsMd: FALLBACK_AGENTS,
-// CORE defaults: heartbeat + cron pre-selected so the assistant
-// can be proactive and run scheduled tasks out of the box.
-// Customers can untoggle either before submitting. core-voice
-// stays unselected — its toggle is disabled until Phase B.
+// CORE defaults: heartbeat + cron + active-memory pre-selected so
+// the assistant can be proactive, run scheduled tasks, and recall
+// stable context out of the box. Customers can untoggle any of
+// them before submitting. core-voice is fully wired (Phase B)
+// but stays unselected — opt-in keeps audio spend predictable
+// for tenants who don't intend to use voice channels.
 packages: [...DEFAULT_PACKAGE_IDS] as string[],
 billingAddress: {
 // For personal accounts, leave the company field empty — it'll

View File

@@ -13,8 +13,10 @@
 * Category model (Phase A rework):
 * - core — platform-behaviour toggles (heartbeat, cron,
 * active-memory, voice). Mostly no secrets. core-voice is
-* a catalog stub in Phase A — toggling stores customer
-* intent only; the OCI config_patch lands in Phase B.
+* fully wired (Phase B): toggling installs the STT / TTS /
+* Talk surface via the operator's config_patch, routed
+* through LiteLLM (pieced-stt, pieced-tts-inbound,
+* pieced-tts-talk).
 * - channel — messaging integration.
 * - skill — ClawHub skill install.
 */
@@ -271,8 +273,13 @@ export const CHANNEL_PACKAGE_IDS: string[] = PACKAGE_CATALOG
 *
 * Each adds some token cost — active-memory the most (one extra
 * sub-agent turn per inbound message) — so customers can untoggle any
-* of them before submitting. core-voice is deliberately excluded from
-* defaults until its config_patch lands in Phase B.
+* of them before submitting.
+*
+* core-voice is intentionally NOT a default. It is fully wired (Phase B)
+* and customers can enable it from the wizard, but it incurs separate
+* audio spend on every inbound voice note (Whisper STT) and every
+* outbound reply (kani-tts / kokoro-fastapi via LiteLLM). Opt-in keeps
+* cost predictable for tenants who don't intend to use voice channels.
 */
 export const DEFAULT_PACKAGE_IDS: string[] = [
 "core-heartbeat",