@fugood/bricks-project 2.21.11 → 2.21.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@fugood/bricks-project",
3
- "version": "2.21.11",
3
+ "version": "2.21.12",
4
4
  "main": "index.ts",
5
5
  "scripts": {
6
6
  "build": "node scripts/build.js"
@@ -6622,6 +6622,8 @@ Default property:
6622
6622
  useMmap?: boolean | DataLink
6623
6623
  /* Use Flash Attention for inference (Recommended with GPU enabled) */
6624
6624
  useFlashAttn?: boolean | DataLink
6625
+ /* Use full-size SWA cache. May improve performance for multiple sequences but uses more memory. */
6626
+ useSwaFull?: boolean | DataLink
6625
6627
  /* KV cache data type for the K (Default: f16) */
6626
6628
  cacheKType?: 'f16' | 'f32' | 'q8_0' | 'q4_0' | 'q4_1' | 'iq4_nl' | 'q5_0' | 'q5_1' | DataLink
6627
6629
  /* KV cache data type for the V (Default: f16) */
@@ -6869,7 +6871,7 @@ Default property:
6869
6871
  "completionTopK": 40,
6870
6872
  "completionTopP": 0.9,
6871
6873
  "completionMinP": 0.05,
6872
- "useGuideToken": false,
6874
+ "useGuideToken": true,
6873
6875
  "contextSize": 8192,
6874
6876
  "batchSize": 8192,
6875
6877
  "microBatchSize": 512,