@fugood/bricks-project 2.22.0-beta.16 → 2.22.0-beta.17

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -630,6 +630,7 @@ export const templateActionNameMap = {
  samplesOverlap: 'GENERATOR_VAD_INFERENCE_SAMPLES_OVERLAP',
  },
  },
+
  GENERATOR_LLM: {
  GENERATOR_LLM_TOKENIZE: {
  mode: 'GENERATOR_LLM_MODE',
package/package.json CHANGED
@@ -1,12 +1,12 @@
  {
  "name": "@fugood/bricks-project",
- "version": "2.22.0-beta.16",
+ "version": "2.22.0-beta.17",
  "main": "index.ts",
  "scripts": {
  "build": "node scripts/build.js"
  },
  "dependencies": {
- "@modelcontextprotocol/sdk": "^1.11.1",
+ "@modelcontextprotocol/sdk": "^1.15.0",
  "@types/escodegen": "^0.0.10",
  "@types/lodash": "^4.17.12",
  "acorn": "^8.13.0",
@@ -14,5 +14,5 @@
  "lodash": "^4.17.4",
  "uuid": "^8.3.1"
  },
- "gitHead": "d8231fa6787b8d95bc2bec94a86ceba596cf57f0"
+ "gitHead": "5e8893af505fa5a7b1a902e11764c1f9ebb36a4f"
  }
package/types/common.ts CHANGED
@@ -39,7 +39,7 @@ export type SubpsaceAction = string
  export type Action = {
  __actionName: string
  parent: 'Brick' | 'Generator' | 'Subspace' | 'System'
- name: string
+ name?: string
  }

  // Find correct key in bricks-project/utils/event-props for EventAction
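
With `name` now optional on `Action`, an action object only needs `__actionName` and `parent`. A minimal sketch (the import path and literal values are illustrative assumptions, not taken from the diff):

    // Assumes Action is importable from the package's types/common module.
    import type { Action } from '@fugood/bricks-project/types/common'

    // Omitting `name` now type-checks against the updated Action type.
    const stopAction: Action = {
      __actionName: 'GENERATOR_REALTIME_TRANSCRIPTION_STOP',
      parent: 'Generator',
    }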
@@ -4868,39 +4868,9 @@ Default property:
  init?: boolean | DataLink
  /* TTS model
  The mms-tts models are licensed under CC-BY-NC-4.0 */
- model?:
- | 'Custom'
- | 'BricksDisplay/vits-eng'
- | 'BricksDisplay/vits-cmn'
- | 'BricksDisplay/ellie-Bert-VITS2'
- | 'onnx-community/Kokoro-82M-v1.0-ONNX'
- | 'onnx-community/Kokoro-82M-v1.1-zh-ONNX'
- | 'onnx-community/OuteTTS-1.0-0.6B-ONNX'
- | 'mms-tts-ara (NC)'
- | 'mms-tts-deu (NC)'
- | 'mms-tts-eng (NC)'
- | 'mms-tts-fra (NC)'
- | 'mms-tts-hin (NC)'
- | 'mms-tts-kor (NC)'
- | 'mms-tts-por (NC)'
- | 'mms-tts-ron (NC)'
- | 'mms-tts-rus (NC)'
- | 'mms-tts-spa (NC)'
- | 'mms-tts-vie (NC)'
- | 'mms-tts-yor (NC)'
- | 'speecht5_tts'
- | DataLink
+ model?: string | DataLink
  /* Model type */
- modelType?:
- | 'auto'
- | 'vits'
- | 'bert_vits2'
- | 'style_text_to_speech_2'
- | 'speecht5'
- | 'outetts-1.0'
- | DataLink
- /* Load quantized model (deprecated, use `quantizeType` instead) */
- quantized?: boolean | DataLink
+ modelType?: string | DataLink
  /* Quantize type */
  quantizeType?:
  | 'auto'
@@ -4913,9 +4883,6 @@ Default property:
  | 'bnb4'
  | 'q4f16'
  | DataLink
- /* Custom model name
- Choose model from https://huggingface.co/models?pipeline_tag=text-to-audio&library=transformers.js */
- customModel?: string | DataLink
  /* Vocoder model for SpeechT5 */
  vocoderModel?: 'Custom' | 'speecht5_hifigan' | DataLink
  /* Custom vocoder model
@@ -4923,8 +4890,10 @@ Default property:
  customVocoderModel?: string | DataLink
  /* Speaker embedding, for SpeechT5 or StyleTTS (Kokoro) */
  speakerEmbedUrl?: string | DataLink
- /* MD5 checksum of `speakerEmbedUrl` */
- speakerEmbedMd5?: string | DataLink
+ /* Hash of `speakerEmbedUrl` */
+ speakerEmbedHash?: string | DataLink
+ /* Hash type of `speakerEmbedUrl` */
+ speakerEmbedHashType?: 'md5' | 'sha256' | 'sha1' | DataLink
  /* Speaker config, for OuteTTS model */
  speakerConfig?: {} | DataLink
  /* Audio token generation max length */
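
Net effect for the TTS generator def: `model` and `modelType` accept any string (the `Custom`/`customModel` pair and the deprecated `quantized` flag are gone), and the MD5-only checksum field is generalized to `speakerEmbedHash` plus `speakerEmbedHashType`. A hedged sketch of a property block under the new shape (field names come from the diff; the values are illustrative):

    // Hypothetical TTS property block after 2.22.0-beta.17.
    const ttsProperty = {
      model: 'onnx-community/Kokoro-82M-v1.0-ONNX', // any model id string, no 'Custom' + customModel split
      modelType: 'style_text_to_speech_2',          // free-form string instead of a literal union
      quantizeType: 'q4f16',
      speakerEmbedUrl: 'https://example.com/voices/af.bin',   // illustrative URL
      speakerEmbedHash: 'd41d8cd98f00b204e9800998ecf8427e',   // placeholder; replaces speakerEmbedMd5
      speakerEmbedHashType: 'md5',                            // or 'sha256' / 'sha1'
    }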
@@ -5054,7 +5023,6 @@ interface GeneratorOnnxLLMDef {
  /*
  Default property:
  {
- "model": "BricksDisplay/phi-1_5-q4",
  "modelType": "auto",
  "toolCallParser": "llama3_json",
  "toolChoice": "auto",
@@ -5073,70 +5041,9 @@ Default property:
  /* Initialize the TTS context on generator initialization */
  init?: boolean | DataLink
  /* LLM model */
- model?:
- | 'Custom'
- | 'onnx-community/gemma-3-1b-it-ONNX'
- | 'BricksDisplay/phi-1_5'
- | 'BricksDisplay/phi-1_5-q4'
- | 'onnx-community/Phi-3.5-vision-instruct'
- | 'onnx-community/Phi-3-vision-128k-instruct'
- | 'onnx-community/Phi-4-mini-instruct-ONNX-MHA'
- | 'onnx-community/Qwen2.5-0.5B'
- | 'onnx-community/Qwen2.5-0.5B-Instruct'
- | 'onnx-community/Qwen2.5-1.5B'
- | 'onnx-community/Qwen2.5-1.5B-Instruct'
- | 'onnx-community/Qwen2-VL-2B-Instruct'
- | 'stablelm-2-1_6b'
- | 'BricksDisplay/stablelm-2-1_6b-q4'
- | 'stablelm-2-zephyr-1_6b'
- | 'BricksDisplay/stablelm-2-zephyr-1_6b-q4'
- | 'BricksDisplay/Llama-2-7b-chat-q4'
- | 'TinyLLama-v0'
- | 'TinyLlama-1.1B-Chat-v1.0'
- | 'BricksDisplay/TinyLlama-1.1B-Chat-v1.0-q4'
- | 'llama-160m'
- | 'llama-68m'
- | 'BricksDisplay/Yi-6B-q4'
- | 'BricksDisplay/Yi-6B-Chat-q4'
- | 'BricksDisplay/Mistral-7B-v0.1-q4'
- | 'BricksDisplay/Mistral-7B-Instruct-v0.2-q4'
- | 'BricksDisplay/Breeze-7B-Base-v1_0-q4'
- | 'BricksDisplay/Breeze-7B-Instruct-v1_0-q4'
- | 'gpt2'
- | 'distilgpt2'
- | 'gpt-neo-125M'
- | 'opt-125m'
- | 'opt-350m'
- | 'bloom-560m'
- | 'bloomz-560m'
- | 't5-small'
- | 't5-base'
- | 'flan-t5-small'
- | 'flan-t5-base'
- | 'mt5-small'
- | 'mt5-base'
- | 'long-t5-lobal-base'
- | 'long-t5-tglobal-base'
- | DataLink
+ model?: string | DataLink
  /* Model type */
- modelType?:
- | 'auto'
- | 'text-generation'
- | 'qwen2-vl'
- | 'paligemma'
- | 'llava'
- | 'llava_onevision'
- | 'moondream1'
- | 'florence2'
- | 'idefics3'
- | 'smolvlm'
- | 'phi3_v'
- | 't5'
- | 'mt5'
- | 'longt5'
- | DataLink
- /* Load quantized model (deprecated, use `quantizeType` instead) */
- quantized?: boolean | DataLink
+ modelType?: string | DataLink
  /* Quantize type */
  quantizeType?:
  | 'auto'
@@ -5149,10 +5056,6 @@ Default property:
  | 'bnb4'
  | 'q4f16'
  | DataLink
- /* Custom model name
- Choose model from https://huggingface.co/models?pipeline_tag=text2text-generation&library=transformers.js
- or https://huggingface.co/models?pipeline_tag=text-generation&library=transformers.js&sort=trending */
- customModel?: string | DataLink
  /* Prompt to inference */
  prompt?: string | DataLink
  /* Messages to inference */
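
The ONNX LLM def gets the same treatment as the TTS def above: the large `model` and `modelType` literal unions collapse to `string | DataLink`, and the `customModel` field, the deprecated `quantized` flag, and the hard-coded default model are removed. A hedged before/after sketch, assuming custom models previously went through `model: 'Custom'` with `customModel` (values are illustrative):

    // Before (2.22.0-beta.16), presumably:
    // const llmProperty = { model: 'Custom', customModel: 'onnx-community/Qwen2.5-0.5B-Instruct' }

    // After (2.22.0-beta.17): the model id goes directly into `model`.
    const llmProperty = {
      model: 'onnx-community/Qwen2.5-0.5B-Instruct',
      modelType: 'auto',
      quantizeType: 'q4f16',
    }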
@@ -5282,27 +5185,9 @@ Default property:
  /* Initialize the TTS context on generator initialization */
  init?: boolean | DataLink
  /* STT model */
- model?:
- | 'Custom'
- | 'whisper-tiny'
- | 'whisper-tiny.en'
- | 'whisper-small'
- | 'whisper-small.en'
- | 'whisper-base'
- | 'whisper-base.en'
- | 'whisper-medium'
- | 'whisper-medium.en'
- | 'whisper-large'
- | 'whisper-large-v2'
- | 'whisper-large-v3'
- | 'mms-1b-all'
- | 'mms-1b-fl102'
- | 'mms-1b-l1107'
- | DataLink
+ model?: string | DataLink
  /* Model type */
- modelType?: 'auto' | 'whisper' | 'hubert' | 'wav2vec2' | 'wav2vec2-bert' | DataLink
- /* Load quantized model (deprecated, use `quantizeType` instead) */
- quantized?: boolean | DataLink
+ modelType?: string | DataLink
  /* Quantize type */
  quantizeType?:
  | 'auto'
@@ -5315,9 +5200,6 @@ Default property:
  | 'bnb4'
  | 'q4f16'
  | DataLink
- /* Custom model name
- Choose model from https://huggingface.co/models?pipeline_tag=automatic-speech-recognition&library=transformers.js */
- customModel?: string | DataLink
  /* Return timestamps */
  returnTimestamps?: 'none' | 'enable' | 'word' | DataLink
  /* Transcription language
@@ -5550,7 +5432,7 @@ export type GeneratorSpeechInferenceActionTranscribeData = ActionWithParams & {
  >
  }

- /* Transcribe microphone audio source */
+ /* [Deprecated] Transcribe microphone audio source */
  export type GeneratorSpeechInferenceActionTranscribeRealtime = ActionWithParams & {
  __actionName: 'GENERATOR_SPEECH_INFERENCE_TRANSCRIBE_REALTIME'
  params?: Array<
@@ -5617,7 +5499,7 @@ export type GeneratorSpeechInferenceActionTranscribeRealtime = ActionWithParams
  >
  }

- /* Stop transcribing microphone audio source */
+ /* [Deprecated] Stop transcribing microphone audio source */
  export type GeneratorSpeechInferenceActionTranscribeRealtimeStop = Action & {
  __actionName: 'GENERATOR_SPEECH_INFERENCE_TRANSCRIBE_REALTIME_STOP'
  }
@@ -5865,7 +5747,7 @@ Default property:
  inferRealtimeVadFreqThold?: number | DataLink
  }
  events?: {
- /* Event triggered when load is done */
+ /* Event triggered when context state changes */
  onContextStateChange?: Array<EventAction>
  /* Event triggered when error occurs */
  onError?: Array<EventAction>
@@ -6074,7 +5956,7 @@ Default property:
  detectFileMd5?: string | DataLink
  }
  events?: {
- /* Event triggered when load is done */
+ /* Event triggered when context state changes */
  onContextStateChange?: Array<EventAction>
  /* Event triggered when error occurs */
  onError?: Array<EventAction>
@@ -6122,6 +6004,168 @@ export type GeneratorVadInference = Generator &
  >
  }

+ /* Start realtime transcription */
+ export type GeneratorRealtimeTranscriptionActionStart = Action & {
+ __actionName: 'GENERATOR_REALTIME_TRANSCRIPTION_START'
+ }
+
+ /* Stop realtime transcription */
+ export type GeneratorRealtimeTranscriptionActionStop = Action & {
+ __actionName: 'GENERATOR_REALTIME_TRANSCRIPTION_STOP'
+ }
+
+ /* Force move to next slice */
+ export type GeneratorRealtimeTranscriptionActionNextSlice = Action & {
+ __actionName: 'GENERATOR_REALTIME_TRANSCRIPTION_NEXT_SLICE'
+ }
+
+ /* Reset transcriber state */
+ export type GeneratorRealtimeTranscriptionActionReset = Action & {
+ __actionName: 'GENERATOR_REALTIME_TRANSCRIPTION_RESET'
+ }
+
+ interface GeneratorRealtimeTranscriptionDef {
+ /*
+ Default property:
+ {
+ "sttLivePolicy": "only-in-use",
+ "vadInferenceLivePolicy": "only-in-use",
+ "vadEnabled": true,
+ "audioSliceSec": 30,
+ "audioMinSec": 1,
+ "maxSlicesInMemory": 5,
+ "vadStrategy": "use-preset",
+ "vadPreset": "default",
+ "autoSliceOnSpeechEnd": true,
+ "autoSliceThreshold": 2,
+ "initialPrompt": "",
+ "promptPreviousSlices": false,
+ "saveAudio": true,
+ "testMode": false,
+ "testPlaybackSpeed": 1,
+ "testChunkDurationMs": 100,
+ "testLoop": false
+ }
+ */
+ property?: {
+ /* STT Generator for Whisper context */
+ sttGeneratorId?: string | DataLink
+ /* STT Live Policy. If the policy is `only-in-use`, the STT context will be released when not in use. */
+ sttLivePolicy?: 'only-in-use' | 'manual' | DataLink
+ /* VAD Inference Generator for voice activity detection */
+ vadInferenceGeneratorId?: string | DataLink
+ /* VAD Inference Live Policy. If the policy is `only-in-use`, the VAD Inference context will be released when not in use. */
+ vadInferenceLivePolicy?: 'only-in-use' | 'manual' | DataLink
+ /* Enable VAD (Voice Activity Detection) */
+ vadEnabled?: boolean | DataLink
+ /* Audio slice duration in seconds */
+ audioSliceSec?: number | DataLink
+ /* Minimum audio duration to start transcription in seconds */
+ audioMinSec?: number | DataLink
+ /* Maximum number of slices to keep in memory */
+ maxSlicesInMemory?: number | DataLink
+ /* VAD Strategy */
+ vadStrategy?: 'use-preset' | 'use-generator-options' | DataLink
+ /* VAD preset configuration */
+ vadPreset?:
+ | 'default'
+ | 'sensitive'
+ | 'very-sensitive'
+ | 'conservative'
+ | 'very-conservative'
+ | 'continuous-speech'
+ | 'meeting'
+ | 'noisy-environment'
+ | DataLink
+ /* Auto slice on speech end */
+ autoSliceOnSpeechEnd?: boolean | DataLink
+ /* Auto slice threshold in seconds */
+ autoSliceThreshold?: number | DataLink
+ /* Initial prompt for transcription */
+ initialPrompt?: string | DataLink
+ /* Include previous slices in prompt */
+ promptPreviousSlices?: boolean | DataLink
+ /* Enable audio output saving (auto-generates file path) */
+ saveAudio?: boolean | DataLink
+ /* Use test mode with file simulation */
+ testMode?: boolean | DataLink
+ /* Test audio file path for simulation */
+ testFilePath?: string | DataLink
+ /* Test audio file hash */
+ testFileHash?: string | DataLink
+ /* Test audio file hash type */
+ testFileHashType?: string | DataLink
+ /* Test playback speed */
+ testPlaybackSpeed?: number | DataLink
+ /* Test chunk duration in milliseconds */
+ testChunkDurationMs?: number | DataLink
+ /* Loop test audio file */
+ testLoop?: boolean | DataLink
+ }
+ events?: {
+ /* Event triggered when transcription starts, processes, or ends */
+ onTranscribe?: Array<EventAction>
+ /* Event triggered on VAD (Voice Activity Detection) events */
+ onVad?: Array<EventAction>
+ /* Event triggered when error occurs */
+ onError?: Array<EventAction>
+ /* Event triggered when status changes */
+ onStatusChange?: Array<EventAction>
+ /* Event triggered when statistics update */
+ onStatsUpdate?: Array<EventAction>
+ /* Event triggered when transcription ends */
+ onEnd?: Array<EventAction>
+ }
+ outlets?: {
+ /* Is realtime transcription currently active */
+ isActive?: () => Data
+ /* Is currently transcribing audio */
+ isTranscribing?: () => Data
+ /* Current transcription results */
+ results?: () => Data
+ /* Current transcription result text */
+ resultText?: () => Data
+ /* Current statistics */
+ statistics?: () => Data
+ /* Latest transcribe event */
+ lastTranscribeEvent?: () => Data
+ /* Latest VAD event */
+ lastVadEvent?: () => Data
+ /* Audio output file path (auto-generated when saving audio) */
+ audioOutputPath?: () => Data
+ }
+ }
+
+ /* Realtime speech-to-text transcription using Whisper and VAD with live audio streaming */
+ export type GeneratorRealtimeTranscription = Generator &
+ GeneratorRealtimeTranscriptionDef & {
+ templateKey: 'GENERATOR_REALTIME_TRANSCRIPTION'
+ switches: Array<
+ SwitchDef &
+ GeneratorRealtimeTranscriptionDef & {
+ conds?: Array<{
+ method: '==' | '!=' | '>' | '<' | '>=' | '<='
+ cond:
+ | SwitchCondInnerStateCurrentCanvas
+ | SwitchCondData
+ | {
+ __typename: 'SwitchCondInnerStateOutlet'
+ outlet:
+ | 'isActive'
+ | 'isTranscribing'
+ | 'results'
+ | 'resultText'
+ | 'statistics'
+ | 'lastTranscribeEvent'
+ | 'lastVadEvent'
+ | 'audioOutputPath'
+ value: any
+ }
+ }>
+ }
+ >
+ }
+
  /* Load the model */
  export type GeneratorLLMActionLoadModel = Action & {
  __actionName: 'GENERATOR_LLM_LOAD_MODEL'
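
The new `GENERATOR_REALTIME_TRANSCRIPTION` template composes an existing STT generator and a VAD Inference generator into a slice-based realtime transcriber. A hedged sketch of a node using only fields from the added def (the ids, values, and event-handler placeholders are illustrative assumptions):

    // Hypothetical GeneratorRealtimeTranscription configuration.
    const realtimeTranscription = {
      templateKey: 'GENERATOR_REALTIME_TRANSCRIPTION',
      property: {
        sttGeneratorId: 'whisper-generator',      // id of an existing STT generator (assumed)
        sttLivePolicy: 'only-in-use',             // release the STT context when idle
        vadInferenceGeneratorId: 'vad-generator', // id of an existing VAD Inference generator (assumed)
        vadEnabled: true,
        audioSliceSec: 30,                        // matches the documented default
        autoSliceOnSpeechEnd: true,
        saveAudio: true,                          // exposes audioOutputPath via the outlets
      },
      events: {
        onTranscribe: [ /* EventAction list reading the transcribe event */ ],
        onError: [ /* EventAction list for error handling */ ],
      },
    }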
@@ -6705,7 +6749,7 @@ Default property:
  completionIgnoreEOS?: boolean | DataLink
  }
  events?: {
- /* Event triggered when load is done */
+ /* Event triggered when context state changes */
  onContextStateChange?: Array<EventAction>
  /* Event triggered when error occurs */
  onError?: Array<EventAction>
@@ -7214,7 +7258,7 @@ Default property:
  greedy?: boolean | DataLink
  }
  events?: {
- /* Event triggered when load is done */
+ /* Event triggered when context state changes */
  onContextStateChange?: Array<EventAction>
  /* Event triggered when generate is done */
  onGenerate?: Array<EventAction>
@@ -774,6 +774,33 @@ export const templateEventPropsMap = {
  'GENERATOR_VAD_INFERENCE_DETECTION_TIME', // type: number
  ],
  },
+ GENERATOR_REALTIME_TRANSCRIPTION: {
+ onTranscribe: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_TRANSCRIBE_EVENT', // type: object
+ ],
+ onVad: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_VAD_EVENT', // type: object
+ 'GENERATOR_REALTIME_TRANSCRIPTION_VAD_EVENT_TYPE', // type: string
+ 'GENERATOR_REALTIME_TRANSCRIPTION_VAD_EVENT_CONFIDENCE', // type: number
+ 'GENERATOR_REALTIME_TRANSCRIPTION_VAD_EVENT_DURATION', // type: number
+ 'GENERATOR_REALTIME_TRANSCRIPTION_VAD_EVENT_SLICE_INDEX', // type: number
+ ],
+ onError: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_ERROR', // type: string
+ ],
+ onStatusChange: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_IS_ACTIVE', // type: bool
+ ],
+ onStatsUpdate: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_STATS_TYPE', // type: string
+ 'GENERATOR_REALTIME_TRANSCRIPTION_STATS_TIMESTAMP', // type: number
+ 'GENERATOR_REALTIME_TRANSCRIPTION_STATS', // type: object
+ ],
+ onEnd: [
+ 'GENERATOR_REALTIME_TRANSCRIPTION_END_RESULTS', // type: array
+ 'GENERATOR_REALTIME_TRANSCRIPTION_END_AUDIO_OUTPUT_PATH', // type: string
+ ],
+ },
  GENERATOR_LLM: {
  onContextStateChange: [
  'GENERATOR_LLM_CONTEXT_STATE', // type: string
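
The matching `templateEventPropsMap` entry lists the keys an EventAction can read from each of the new generator's events (see the "Find correct key in bricks-project/utils/event-props" note in types/common.ts). A hedged lookup sketch, assuming the map is importable from the package's utils/event-props module:

    import { templateEventPropsMap } from '@fugood/bricks-project/utils/event-props' // assumed path

    // Keys delivered with onTranscribe / onVad for GENERATOR_REALTIME_TRANSCRIPTION,
    // exactly as listed in the diff above.
    const transcribeKeys = templateEventPropsMap.GENERATOR_REALTIME_TRANSCRIPTION.onTranscribe
    const vadKeys = templateEventPropsMap.GENERATOR_REALTIME_TRANSCRIPTION.onVad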