@warmdrift/kgauto-compiler 2.0.0-alpha.14 → 2.0.0-alpha.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -614,6 +614,420 @@ var PROFILES_RAW = [
614
614
  hunt: 4
615
615
  // sequential tools — same as V4-Flash
616
616
  }
617
+ },
618
+ // ── OpenAI ──
619
+ // alpha.16 (2026-05-17): close the half-supported provider gap. env.ts
620
+ // already registered OPENAI_API_KEY; executeOpenAI + normalizeOpenAILike
621
+ // + lowerOpenAI all existed; profile entries were missing, so the
622
+ // alpha.10 auto-filter would mark openai-keyed models reachable but
623
+ // there were no profiles to filter IN. Half-supported is now fully
624
+ // supported. PB request `openai-provider-profiles` (2026-05-16).
625
+ //
626
+ // Profile data verified against developers.openai.com/api/docs/pricing
627
+ // + per-model pages 2026-05-17. L-049/L-081 step-zero: no AI-trained
628
+ // numbers — fetched live from OpenAI's docs. As of 2026-05, OpenAI's
629
+ // current flagship is gpt-5.5 (2025-12 cutoff); gpt-5.4-{base,mini,nano}
630
+ // are the workhorse family. gpt-4.1 + gpt-4o are legacy.
631
+ //
632
+ // Both 5.5 and 5.4 carry a 272K input-token pricing cliff (2x input,
633
+ // 1.5x output beyond that). Modeled as a `downgrade_quality_warning`
634
+ // cliff because it ranks the model down at large-context shapes — the
635
+ // semantics of "this model is now 2x more expensive" map onto the
636
+ // existing penalty mechanism. Cost-watcher will catch high-context
637
+ // spikes empirically; the cliff prevents naive routing into the doubled
638
+ // pricing zone.
639
+ {
640
+ id: "gpt-5.5",
641
+ verifiedAgainstDocs: "2026-05-17",
642
+ provider: "openai",
643
+ status: "current",
644
+ maxContextTokens: 105e4,
645
+ maxOutputTokens: 128e3,
646
+ maxTools: 64,
647
+ parallelToolCalls: true,
648
+ structuredOutput: "native",
649
+ systemPromptMode: "inline",
650
+ streaming: true,
651
+ cliffs: [
652
+ {
653
+ metric: "input_tokens",
654
+ threshold: 272e3,
655
+ action: "downgrade_quality_warning",
656
+ reason: "OpenAI pricing tier shift: >272K input tokens billed at 2x input + 1.5x output rates"
657
+ }
658
+ ],
659
+ costInputPer1m: 5,
660
+ costOutputPer1m: 30,
661
+ lowering: {
662
+ system: { mode: "inline" },
663
+ // OpenAI caching is implicit (auto-applied to repeated prefixes
664
+ // ≥1024 tokens for prompt_tokens_details.cached_tokens). No
665
+ // wire-format marker. Discount: 10x for cached input ($0.50/$5.00).
666
+ cache: { strategy: "unsupported", minTokens: 1024, discount: 0.1 },
667
+ tools: { format: "openai" }
668
+ },
669
+ recovery: [
670
+ { signal: "rate_limit", action: "escalate", reason: "429 \u2014 escalate to fallback chain" },
671
+ { signal: "model_not_found", action: "escalate", reason: "Model deprecated/renamed \u2014 escalate (L-061)" }
672
+ ],
673
+ strengths: ["reasoning", "agentic_coding", "long_context", "structured_output", "reliable_tool_use", "reasoning_effort_knob"],
674
+ weaknesses: ["cost", "pricing_cliff_at_272k"],
675
+ notes: "OpenAI frontier (2026-05). 1M context (1.05M total), 128K max output, 2025-12 cutoff. Reasoning effort knob (none/low/medium/high/xhigh). Pricing cliff at 272K input.",
676
+ // Frontier-tier perf hypothesis. Anchored to Opus 4.7 row (similar
677
+ // price/positioning). Brain evidence will refine; no telemetry yet.
678
+ archetypePerf: {
679
+ critique: 9,
680
+ plan: 9,
681
+ generate: 9,
682
+ ask: 9,
683
+ extract: 9,
684
+ transform: 9,
685
+ hunt: 8,
686
+ // parallel tool support good but cliff at 272K hurts deep multi-step
687
+ summarize: 7,
688
+ // overkill for tolerant archetype
689
+ classify: 7
690
+ // overkill; cheaper models cover this
691
+ }
692
+ },
693
+ {
694
+ id: "gpt-5.4",
695
+ verifiedAgainstDocs: "2026-05-17",
696
+ provider: "openai",
697
+ status: "current",
698
+ maxContextTokens: 105e4,
699
+ maxOutputTokens: 128e3,
700
+ maxTools: 64,
701
+ parallelToolCalls: true,
702
+ structuredOutput: "native",
703
+ systemPromptMode: "inline",
704
+ streaming: true,
705
+ cliffs: [
706
+ {
707
+ metric: "input_tokens",
708
+ threshold: 272e3,
709
+ action: "downgrade_quality_warning",
710
+ reason: "OpenAI pricing tier shift: >272K input tokens billed at 2x input + 1.5x output rates"
711
+ }
712
+ ],
713
+ costInputPer1m: 2.5,
714
+ costOutputPer1m: 15,
715
+ lowering: {
716
+ system: { mode: "inline" },
717
+ cache: { strategy: "unsupported", minTokens: 1024, discount: 0.1 },
718
+ tools: { format: "openai" }
719
+ },
720
+ recovery: [
721
+ { signal: "rate_limit", action: "escalate", reason: "429 \u2014 escalate to fallback chain" },
722
+ { signal: "model_not_found", action: "escalate", reason: "Model deprecated/renamed \u2014 escalate (L-061)" }
723
+ ],
724
+ strengths: ["reasoning", "long_context", "structured_output", "reliable_tool_use"],
725
+ weaknesses: ["pricing_cliff_at_272k"],
726
+ notes: "OpenAI workhorse (2026-05). 1M context (1.05M total), 128K max output, 2025-08 cutoff. Pricing cliff at 272K input. Pairs cleanly with Sonnet 4.6 on cost ($2.50/$15.00 vs $3.00/$15.00).",
727
+ // Anchored to Sonnet 4.6 row (similar price/positioning). Slight
728
+ // Anthropic-side edge on agentic coding per master plan vibe.
729
+ archetypePerf: {
730
+ critique: 8,
731
+ plan: 8,
732
+ generate: 8,
733
+ ask: 8,
734
+ extract: 8,
735
+ transform: 8,
736
+ hunt: 7,
737
+ summarize: 7,
738
+ classify: 7
739
+ }
740
+ },
741
+ {
742
+ id: "gpt-5.4-mini",
743
+ verifiedAgainstDocs: "2026-05-17",
744
+ provider: "openai",
745
+ status: "current",
746
+ maxContextTokens: 4e5,
747
+ maxOutputTokens: 128e3,
748
+ maxTools: 64,
749
+ parallelToolCalls: true,
750
+ structuredOutput: "native",
751
+ systemPromptMode: "inline",
752
+ streaming: true,
753
+ cliffs: [],
754
+ costInputPer1m: 0.75,
755
+ costOutputPer1m: 4.5,
756
+ lowering: {
757
+ system: { mode: "inline" },
758
+ cache: { strategy: "unsupported", minTokens: 1024, discount: 0.1 },
759
+ tools: { format: "openai" }
760
+ },
761
+ recovery: [
762
+ { signal: "rate_limit", action: "escalate", reason: "429 \u2014 escalate to fallback chain" },
763
+ { signal: "model_not_found", action: "escalate", reason: "Model deprecated/renamed \u2014 escalate (L-061)" }
764
+ ],
765
+ strengths: ["cost", "speed", "agentic_coding", "structured_output", "reliable_tool_use"],
766
+ weaknesses: ["reasoning_depth"],
767
+ notes: "OpenAI mini-tier (2026-05). 400K context, 128K max output, 2025-08 cutoff. OpenAI describes as 'strongest mini model for coding, computer use, subagents.' Cache discount 10x ($0.075 input).",
768
+ // Mini-tier hypothesis. Anchored to Haiku 4.5 + Flash row pricing.
769
+ // Cost is slightly higher than Haiku ($0.75 vs $0.50 input) but
770
+ // OpenAI claims strong coding/subagent perf.
771
+ archetypePerf: {
772
+ ask: 7,
773
+ generate: 7,
774
+ extract: 7,
775
+ transform: 7,
776
+ classify: 7,
777
+ summarize: 7,
778
+ hunt: 7,
779
+ plan: 6,
780
+ critique: 5
781
+ // reasoning depth gap — frontier models handle this
782
+ }
783
+ },
784
+ {
785
+ id: "gpt-5.4-nano",
786
+ verifiedAgainstDocs: "2026-05-17",
787
+ provider: "openai",
788
+ status: "current",
789
+ maxContextTokens: 4e5,
790
+ maxOutputTokens: 128e3,
791
+ maxTools: 64,
792
+ parallelToolCalls: true,
793
+ structuredOutput: "native",
794
+ systemPromptMode: "inline",
795
+ streaming: true,
796
+ cliffs: [],
797
+ costInputPer1m: 0.2,
798
+ costOutputPer1m: 1.25,
799
+ lowering: {
800
+ system: { mode: "inline" },
801
+ cache: { strategy: "unsupported", minTokens: 1024, discount: 0.1 },
802
+ tools: { format: "openai" }
803
+ },
804
+ recovery: [
805
+ { signal: "rate_limit", action: "escalate", reason: "429 \u2014 escalate to fallback chain" },
806
+ { signal: "model_not_found", action: "escalate", reason: "Model deprecated/renamed \u2014 escalate (L-061)" }
807
+ ],
808
+ strengths: ["cost", "speed", "volume", "structured_output"],
809
+ weaknesses: ["reasoning_depth", "no_computer_use"],
810
+ notes: "OpenAI nano-tier (2026-05). 400K context, 128K max output, 2025-08 cutoff. 'Cheapest GPT-5.4-class for simple high-volume tasks.' No fine-tuning, no computer-use tools. Cache discount 10x.",
811
+ // Nano-tier. Anchored to Flash-Lite row ($0.10/$0.40 vs nano's
812
+ // $0.20/$1.25). Slightly more expensive than Flash-Lite but with
813
+ // OpenAI brand reliability. Good fit for classify/summarize floor.
814
+ archetypePerf: {
815
+ classify: 7,
816
+ summarize: 6,
817
+ ask: 6,
818
+ transform: 6,
819
+ extract: 6,
820
+ generate: 5,
821
+ hunt: 5,
822
+ plan: 4,
823
+ critique: 3
824
+ // not for reasoning archetypes
825
+ }
826
+ },
827
+ // ── Auto-onboarded (UNVERIFIED) ──
828
+ // Cloned by scripts/auto-onboard-models.mjs from a same-family template.
829
+ // Each entry's pricing/context/cliffs/lowering reflects the template, NOT
830
+ // provider docs. Verify before promoting status to 'current' (L-049/L-081).
831
+ {
832
+ id: "gemini-3-flash-preview",
833
+ verifiedAgainstDocs: "UNVERIFIED-AUTO-ONBOARD",
834
+ provider: "google",
835
+ status: "preview",
836
+ maxContextTokens: 1048576,
837
+ maxOutputTokens: 65535,
838
+ maxTools: 128,
839
+ parallelToolCalls: true,
840
+ structuredOutput: "native",
841
+ systemPromptMode: "separate",
842
+ streaming: true,
843
+ cliffs: [
844
+ {
845
+ metric: "input_tokens",
846
+ threshold: 8e3,
847
+ action: "downgrade_quality_warning",
848
+ reason: "Quality degrades significantly above ~8K context tokens"
849
+ },
850
+ {
851
+ metric: "tool_count",
852
+ threshold: 20,
853
+ action: "drop_to_top_relevant",
854
+ reason: "Tool reliability drops above ~20 tools (despite 128 hard limit)"
855
+ },
856
+ {
857
+ metric: "thinking_with_short_output",
858
+ threshold: 1,
859
+ action: "force_thinking_budget_zero",
860
+ reason: "Thinking tokens consume maxOutputTokens \u2014 empty response if drained"
861
+ },
862
+ {
863
+ // s11 trust artifact (2026-05-02): brain showed 5/5 empty rate on
864
+ // tt-intelligence/summarize/gemini-2.5-flash with tools offered.
865
+ // v1's disable_thinking_for_short_output already fired and didn't
866
+ // help — disabling thinking is necessary but not sufficient. Tools
867
+ // present + summarize intent confuses Flash into a no-output state
868
+ // (likely tool-decision purgatory). Strip tools entirely for this
869
+ // archetype on this model.
870
+ metric: "tool_count",
871
+ threshold: 1,
872
+ whenIntent: "summarize",
873
+ action: "strip_tools",
874
+ reason: "Gemini Flash returns empty when summarize intent has tools offered (5/5 empty rate observed in v1 prod 2026-04-19, replayed into v2 brain 2026-04-29)"
875
+ }
876
+ ],
877
+ costInputPer1m: 0.3,
878
+ costOutputPer1m: 2.5,
879
+ lowering: {
880
+ ...GOOGLE_LOWERING_BASE,
881
+ thinking: { field: "generationConfig.thinkingConfig.thinkingBudget", default: "auto" }
882
+ },
883
+ recovery: [
884
+ {
885
+ signal: "empty_response_after_tool",
886
+ action: "retry_with_params",
887
+ retryParams: { "generationConfig.thinkingConfig.thinkingBudget": 0 },
888
+ maxRetries: 1,
889
+ reason: "Known: empty after tool result \u2014 retry with thinking off"
890
+ },
891
+ {
892
+ signal: "empty_response",
893
+ action: "retry_with_params",
894
+ retryParams: { "generationConfig.thinkingConfig.thinkingBudget": 0 },
895
+ maxRetries: 1,
896
+ reason: "Empty response \u2014 try with thinking off"
897
+ },
898
+ {
899
+ signal: "malformed_function_call",
900
+ action: "escalate",
901
+ reason: "MALFORMED_FUNCTION_CALL maps to stop \u2014 escalate to next target"
902
+ }
903
+ ],
904
+ strengths: ["speed", "volume", "classification", "1m_context", "cost"],
905
+ weaknesses: ["complex_schemas", "large_tool_sets", "high_context_quality"],
906
+ notes: "AUTO-ONBOARDED 2026-05-16 from `gemini-2.5-flash`. Pricing, context, cliffs are template-cloned and UNVERIFIED \u2014 confirm against provider docs before promoting status to 'current'.",
907
+ // Master plan §6.2 anchor. Tier 0 for hunt (parallel tool throughput
908
+ // 15-75 calls/step beats Sonnet — L-040), summarize, classify.
909
+ archetypePerf: {
910
+ hunt: 9,
911
+ // L-040: parallel tool throughput 15-75/step
912
+ classify: 7,
913
+ // brain-validated, 218 rows
914
+ summarize: 7,
915
+ // brain-validated; cliff strips tools when present
916
+ transform: 7,
917
+ ask: 7,
918
+ generate: 6,
919
+ plan: 5,
920
+ extract: 6,
921
+ // alpha.8 MAX_TOKENS history on structured output
922
+ critique: 4
923
+ // reasoning shallower than Sonnet/Opus
924
+ }
925
+ },
926
+ {
927
+ // ── Gemini 3.1 Flash-Lite (auto-onboarded; commentary inherited from the Gemini 2.5 Flash-Lite template) ──
928
+ // Onboarded 2026-05-13 (s22) after the model-release watcher surfaced
929
+ // it as an UNREGISTERED + NEW candidate. Released by Google July 2025,
930
+ // stable. Positioned BELOW Flash on the cost/perf frontier:
931
+ // input $0.10/M (Flash $0.30/M) — 3× cheaper
932
+ // output $0.40/M (Flash $2.50/M) — 6× cheaper
933
+ // cache $0.01/M — 1/10 of input (vs Flash 0.25 discount)
934
+ // Cliffs are HYPOTHESIZED from Flash's known failure modes — Flash-Lite
935
+ // is a smaller sibling, so we inherit Flash's cliffs at equal-or-tighter
936
+ // thresholds. The brain will validate/relax these as evidence accumulates
937
+ // per (archetype, model) tuple. Currently ZERO brain rows for this model.
938
+ id: "gemini-3.1-flash-lite",
939
+ verifiedAgainstDocs: "UNVERIFIED-AUTO-ONBOARD",
940
+ provider: "google",
941
+ status: "preview",
942
+ maxContextTokens: 1048576,
943
+ maxOutputTokens: 65536,
944
+ maxTools: 128,
945
+ parallelToolCalls: true,
946
+ structuredOutput: "native",
947
+ systemPromptMode: "separate",
948
+ streaming: true,
949
+ cliffs: [
950
+ {
951
+ metric: "input_tokens",
952
+ threshold: 8e3,
953
+ action: "downgrade_quality_warning",
954
+ reason: "Inherited from Flash: quality degrades above ~8K. Smaller model \u2014 likely degrades faster. Re-tune from brain after n\u226520."
955
+ },
956
+ {
957
+ metric: "tool_count",
958
+ threshold: 10,
959
+ action: "drop_to_top_relevant",
960
+ reason: "Conservative: Flash drops at 20, Flash-Lite is smaller \u2014 assume tighter ceiling until brain proves otherwise."
961
+ },
962
+ {
963
+ metric: "thinking_with_short_output",
964
+ threshold: 1,
965
+ action: "force_thinking_budget_zero",
966
+ reason: "Thinking enabled per Google API (thinking: true). Same drain risk as Flash \u2014 thinking tokens consume maxOutputTokens."
967
+ },
968
+ {
969
+ // Strong prior: Flash hit 5/5 empty rate on summarize+tools (s11
970
+ // trust artifact, kgauto commit 3872832). Flash-Lite shares the
971
+ // same architectural family — almost certainly inherits this cliff.
972
+ // Ship the guard preemptively; brain telemetry confirms or relaxes.
973
+ metric: "tool_count",
974
+ threshold: 1,
975
+ whenIntent: "summarize",
976
+ action: "strip_tools",
977
+ reason: "Inherited from Flash s11 cliff: summarize+tools \u2192 empty response. Preemptive guard until brain evidence on Flash-Lite specifically."
978
+ }
979
+ ],
980
+ costInputPer1m: 0.1,
981
+ costOutputPer1m: 0.4,
982
+ lowering: {
983
+ ...GOOGLE_LOWERING_BASE,
984
+ // Cache discount 10× (vs Flash 4×) — Google's spec is $0.01/M cache vs
985
+ // $0.10/M input. Material for repeat-prompt workloads (classify shape).
986
+ cache: { ...GOOGLE_LOWERING_BASE.cache, discount: 0.1 },
987
+ thinking: { field: "generationConfig.thinkingConfig.thinkingBudget", default: "auto" }
988
+ },
989
+ recovery: [
990
+ {
991
+ signal: "empty_response_after_tool",
992
+ action: "retry_with_params",
993
+ retryParams: { "generationConfig.thinkingConfig.thinkingBudget": 0 },
994
+ maxRetries: 1,
995
+ reason: "Known on Flash family: empty after tool result \u2014 retry with thinking off."
996
+ },
997
+ {
998
+ signal: "empty_response",
999
+ action: "retry_with_params",
1000
+ retryParams: { "generationConfig.thinkingConfig.thinkingBudget": 0 },
1001
+ maxRetries: 1,
1002
+ reason: "Empty response \u2014 try with thinking off."
1003
+ },
1004
+ {
1005
+ signal: "malformed_function_call",
1006
+ action: "escalate",
1007
+ reason: "MALFORMED_FUNCTION_CALL maps to stop \u2014 escalate to next target."
1008
+ }
1009
+ ],
1010
+ strengths: ["lowest_cost", "speed", "volume", "classification", "summarize", "1m_context", "cache_friendly"],
1011
+ weaknesses: ["complex_reasoning", "large_tool_sets", "complex_schemas", "structured_output_unproven", "long_context_quality"],
1012
+ notes: "AUTO-ONBOARDED 2026-05-16 from `gemini-2.5-flash-lite`. Pricing, context, cliffs are template-cloned and UNVERIFIED \u2014 confirm against provider docs before promoting status to 'current'.",
1013
+ // Tier 3 emergency floor for summarize/classify chains. ZERO brain
1014
+ // rows — all values are starter hypotheses anchored to "smaller
1015
+ // sibling of Flash, at-or-below Flash perf on every archetype." The
1016
+ // first 50 brain rows per archetype will validate or relax these.
1017
+ archetypePerf: {
1018
+ classify: 6,
1019
+ // starter hypothesis — verify (Flash is 7, lite likely ≤)
1020
+ summarize: 6,
1021
+ // starter hypothesis — verify; cliff strips tools
1022
+ transform: 6,
1023
+ // starter hypothesis — verify
1024
+ ask: 5,
1025
+ hunt: 5,
1026
+ generate: 4,
1027
+ extract: 4,
1028
+ plan: 3,
1029
+ critique: 3
1030
+ }
617
1031
  }
618
1032
  ];
619
1033
  var ALIASES = {
package/dist/index.d.mts CHANGED
@@ -1,5 +1,5 @@
1
- import { M as ModelProfile, C as CompilePolicy, N as NormalizedResponse, A as ApiKeys, P as ProviderOverrides, a as CompiledRequest, b as PromptIR, c as CallOptions, d as CallResult, R as RecordInput, O as OracleScore, e as CompileResult, B as BestPracticeAdvisory, f as Provider } from './profiles-DTnIzGsA.mjs';
2
- export { g as ALIASES, h as CacheStrategy, i as CallAttempt, j as CallError, k as CliffRule, l as Constraints, F as FallbackReason, H as HistoryCachePolicy, I as IntentDeclaration, L as LoweringSpec, m as Message, n as MutationApplied, o as NormalizedTokens, p as PromptSection, q as RecoveryRule, S as StructuredOutputCapability, r as SystemPromptMode, T as ToolCall, s as ToolDefinition, t as allProfiles, u as getProfile, v as profilesByProvider, w as tryGetProfile } from './profiles-DTnIzGsA.mjs';
1
+ import { M as ModelProfile, C as CompilePolicy, N as NormalizedResponse, A as ApiKeys, P as ProviderOverrides, a as CompiledRequest, b as PromptIR, c as CallOptions, d as CallResult, R as RecordInput, O as OracleScore, e as CompileResult, B as BestPracticeAdvisory, f as Provider } from './profiles-BoLYdl7F.mjs';
2
+ export { g as ALIASES, h as CacheStrategy, i as CallAttempt, j as CallError, k as CliffRule, l as Constraints, F as FallbackReason, H as HistoryCachePolicy, I as IntentDeclaration, L as LoweringSpec, m as Message, n as MutationApplied, o as NormalizedTokens, p as PromptSection, q as RecoveryRule, S as StructuredOutputCapability, r as SystemPromptMode, T as ToolCall, s as ToolDefinition, t as allProfiles, u as getProfile, v as profilesByProvider, w as tryGetProfile } from './profiles-BoLYdl7F.mjs';
3
3
  import { IntentArchetypeName } from './dialect.mjs';
4
4
  export { ALL_ARCHETYPES, ContextBucket, DIALECT_VERSION, HistoryDepth, INTENT_ARCHETYPES, OutputMode, ShapeSignature, ToolCountBucket, bucketContext, bucketHistory, bucketToolCount, hashShape, isArchetype, learningKey } from './dialect.mjs';
5
5
 
package/dist/index.d.ts CHANGED
@@ -1,5 +1,5 @@
1
- import { M as ModelProfile, C as CompilePolicy, N as NormalizedResponse, A as ApiKeys, P as ProviderOverrides, a as CompiledRequest, b as PromptIR, c as CallOptions, d as CallResult, R as RecordInput, O as OracleScore, e as CompileResult, B as BestPracticeAdvisory, f as Provider } from './profiles-D0y6aLk0.js';
2
- export { g as ALIASES, h as CacheStrategy, i as CallAttempt, j as CallError, k as CliffRule, l as Constraints, F as FallbackReason, H as HistoryCachePolicy, I as IntentDeclaration, L as LoweringSpec, m as Message, n as MutationApplied, o as NormalizedTokens, p as PromptSection, q as RecoveryRule, S as StructuredOutputCapability, r as SystemPromptMode, T as ToolCall, s as ToolDefinition, t as allProfiles, u as getProfile, v as profilesByProvider, w as tryGetProfile } from './profiles-D0y6aLk0.js';
1
+ import { M as ModelProfile, C as CompilePolicy, N as NormalizedResponse, A as ApiKeys, P as ProviderOverrides, a as CompiledRequest, b as PromptIR, c as CallOptions, d as CallResult, R as RecordInput, O as OracleScore, e as CompileResult, B as BestPracticeAdvisory, f as Provider } from './profiles-CVB2_5C8.js';
2
+ export { g as ALIASES, h as CacheStrategy, i as CallAttempt, j as CallError, k as CliffRule, l as Constraints, F as FallbackReason, H as HistoryCachePolicy, I as IntentDeclaration, L as LoweringSpec, m as Message, n as MutationApplied, o as NormalizedTokens, p as PromptSection, q as RecoveryRule, S as StructuredOutputCapability, r as SystemPromptMode, T as ToolCall, s as ToolDefinition, t as allProfiles, u as getProfile, v as profilesByProvider, w as tryGetProfile } from './profiles-CVB2_5C8.js';
3
3
  import { IntentArchetypeName } from './dialect.js';
4
4
  export { ALL_ARCHETYPES, ContextBucket, DIALECT_VERSION, HistoryDepth, INTENT_ARCHETYPES, OutputMode, ShapeSignature, ToolCountBucket, bucketContext, bucketHistory, bucketToolCount, hashShape, isArchetype, learningKey } from './dialect.js';
5
5