@fugood/bricks-project 2.21.10 → 2.21.12

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries and as they appear in their respective public registries. It is provided for informational purposes only.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@fugood/bricks-project",
3
- "version": "2.21.10",
3
+ "version": "2.21.12",
4
4
  "main": "index.ts",
5
5
  "scripts": {
6
6
  "build": "node scripts/build.js"
@@ -6622,6 +6622,8 @@ Default property:
6622
6622
  useMmap?: boolean | DataLink
6623
6623
  /* Use Flash Attention for inference (Recommended with GPU enabled) */
6624
6624
  useFlashAttn?: boolean | DataLink
6625
+ /* Use full-size SWA cache. May improve performance for multiple sequences but uses more memory. */
6626
+ useSwaFull?: boolean | DataLink
6625
6627
  /* KV cache data type for the K (Default: f16) */
6626
6628
  cacheKType?: 'f16' | 'f32' | 'q8_0' | 'q4_0' | 'q4_1' | 'iq4_nl' | 'q5_0' | 'q5_1' | DataLink
6627
6629
  /* KV cache data type for the V (Default: f16) */
@@ -6858,6 +6860,7 @@ Default property:
6858
6860
  "vocoderUrl": "https://huggingface.co/ggml-org/WavTokenizer/resolve/main/WavTokenizer-Large-75-F16.gguf",
6859
6861
  "vocoderHashType": "sha256",
6860
6862
  "vocoderHash": "2356baa8631cc2995ea3465196a017a2733600d849a91180c0f97fa7fb375bbe",
6863
+ "vocoderBatchSize": 4096,
6861
6864
  "outputType": "play",
6862
6865
  "cacheGenerated": true,
6863
6866
  "autoInferEnable": false,
@@ -6868,10 +6871,11 @@ Default property:
6868
6871
  "completionTopK": 40,
6869
6872
  "completionTopP": 0.9,
6870
6873
  "completionMinP": 0.05,
6871
- "useGuideToken": false,
6872
- "contextSize": 4096,
6873
- "batchSize": 512,
6874
- "maxThreads": 1,
6874
+ "useGuideToken": true,
6875
+ "contextSize": 8192,
6876
+ "batchSize": 8192,
6877
+ "microBatchSize": 512,
6878
+ "maxThreads": 2,
6875
6879
  "accelVariant": "default",
6876
6880
  "mainGpu": 0,
6877
6881
  "gpuLayers": 0,
@@ -6896,6 +6900,8 @@ Default property:
6896
6900
  vocoderHashType?: 'md5' | 'sha256' | 'sha1' | DataLink
6897
6901
  /* Hash of vocoder model */
6898
6902
  vocoderHash?: string | DataLink
6903
+ /* Batch size of vocoder model */
6904
+ vocoderBatchSize?: number | DataLink
6899
6905
  /* Output mode */
6900
6906
  outputType?: 'play' | 'file' | DataLink
6901
6907
  /* Enable cache for generated audio */
@@ -6922,12 +6928,16 @@ Default property:
6922
6928
  completionMinP?: number | DataLink
6923
6929
  /* Set the random number generator (RNG) seed (default: -1, -1 = random seed) */
6924
6930
  completionSeed?: number | DataLink
6931
+ /* Number of tokens to predict */
6932
+ completionPredict?: number | DataLink
6925
6933
  /* Enable guide token to help prevent hallucinations by forcing the TTS to use the correct words. */
6926
6934
  useGuideToken?: boolean | DataLink
6927
6935
  /* Context size; for OuteTTS the recommended range is 4096 ~ 8192 (defaults to 8192, per the default property above) */
6928
6936
  contextSize?: number | DataLink
6929
6937
  /* Logical batch size for prompt processing */
6930
6938
  batchSize?: number | DataLink
6939
+ /* Physical batch size for prompt processing */
6940
+ microBatchSize?: number | DataLink
6931
6941
  /* Number of threads */
6932
6942
  maxThreads?: number | DataLink
6933
6943
  /* Accelerator variant (Only for desktop)
@@ -841,6 +841,7 @@ export const templateEventPropsMap = {
841
841
  ],
842
842
  onCompletionFunctionCall: [
843
843
  'GENERATOR_LLM_COMPLETION_SESSION_KEY', // type: string
844
+ 'GENERATOR_LLM_COMPLETION_FUNCTION_CALL_ID', // type: string
844
845
  'GENERATOR_LLM_COMPLETION_FUNCTION_CALL_NAME', // type: string
845
846
  'GENERATOR_LLM_COMPLETION_FUNCTION_ARGUMENTS', // type: object
846
847
  'GENERATOR_LLM_COMPLETION_FUNCTION_DETAILS', // type: object