@shenghuabi/knowledge 1.0.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (112)
  1. package/embedding/embedding.service.d.ts +4 -0
  2. package/embedding/index.d.ts +2 -0
  3. package/embedding/type.d.ts +12 -0
  4. package/embedding.mjs +61 -0
  5. package/embedding.mjs.map +7 -0
  6. package/file-parser/const.d.ts +20 -0
  7. package/file-parser/dict/dict-format/dsl/dsl-parse.service.d.ts +6 -0
  8. package/file-parser/dict/dict-format/dsl/dsl.format.d.ts +1 -0
  9. package/file-parser/dict/dict-format/mdict-parse.service.d.ts +20 -0
  10. package/file-parser/dict/dict-format/stardict-parse.service.d.ts +12 -0
  11. package/file-parser/dict/dict-format/yaml-parse.service.d.ts +25 -0
  12. package/file-parser/dict/dict.service.d.ts +10 -0
  13. package/file-parser/dict/index.d.ts +2 -0
  14. package/file-parser/dict/type.d.ts +24 -0
  15. package/file-parser/document-file-parser.service.d.ts +15 -0
  16. package/file-parser/document-loader/pdf-img.loader.d.ts +8 -0
  17. package/file-parser/document-loader/xlsx.loader.d.ts +6 -0
  18. package/file-parser/file-parser.service.d.ts +13 -0
  19. package/file-parser/index.d.ts +6 -0
  20. package/file-parser/text-analyse.d.ts +1 -0
  21. package/file-parser/text-parser.d.ts +3 -0
  22. package/file-parser/vl-parser/markdown.parser.d.ts +8 -0
  23. package/file-parser.mjs +850 -0
  24. package/file-parser.mjs.map +7 -0
  25. package/image/convert.d.ts +25 -0
  26. package/image/extract.d.ts +2 -0
  27. package/image/image-metadata.d.ts +2 -0
  28. package/image/index.d.ts +3 -0
  29. package/image.mjs +134 -0
  30. package/image.mjs.map +7 -0
  31. package/knowledge/article/article.knowledge.service.d.ts +53 -0
  32. package/knowledge/article/define/config.d.ts +60 -0
  33. package/knowledge/article/define/index.d.ts +2 -0
  34. package/knowledge/article/define/payload.d.ts +16 -0
  35. package/knowledge/article/index.d.ts +2 -0
  36. package/knowledge/common/common.knowledge.service.d.ts +240 -0
  37. package/knowledge/common/define/base.d.ts +7 -0
  38. package/knowledge/common/define/chunk.d.ts +14 -0
  39. package/knowledge/common/define/embedding.d.ts +5 -0
  40. package/knowledge/common/define/index.d.ts +3 -0
  41. package/knowledge/common/index.d.ts +1 -0
  42. package/knowledge/common/query.d.ts +7 -0
  43. package/knowledge/const.d.ts +95 -0
  44. package/knowledge/define/index.d.ts +245 -0
  45. package/knowledge/dict/define/config.d.ts +68 -0
  46. package/knowledge/dict/define/index.d.ts +1 -0
  47. package/knowledge/dict/dict.knowledge.service.d.ts +67 -0
  48. package/knowledge/graph/const.d.ts +20 -0
  49. package/knowledge/graph/define/config.d.ts +169 -0
  50. package/knowledge/graph/define/define.d.ts +402 -0
  51. package/knowledge/graph/define/index.d.ts +2 -0
  52. package/knowledge/graph/define/query.d.ts +14 -0
  53. package/knowledge/graph/graph.handle.service.d.ts +28 -0
  54. package/knowledge/graph/graph.knowledge.service.d.ts +40 -0
  55. package/knowledge/graph/graph.local.service.d.ts +85 -0
  56. package/knowledge/graph/graph.query.service.d.ts +160 -0
  57. package/knowledge/graph/graph.service.d.ts +24 -0
  58. package/knowledge/graph/graph.util.service.d.ts +31 -0
  59. package/knowledge/graph/type.d.ts +11 -0
  60. package/knowledge/graph/util/format-attr.d.ts +48 -0
  61. package/knowledge/graph/util/graph-util.d.ts +5 -0
  62. package/knowledge/graph/util.d.ts +1 -0
  63. package/knowledge/graph/vecotr-format.d.ts +11 -0
  64. package/knowledge/index.d.ts +17 -0
  65. package/knowledge/knowledge.manager.service.d.ts +42 -0
  66. package/knowledge/knowledge.util.service.d.ts +21 -0
  67. package/knowledge/normal/define/config.d.ts +60 -0
  68. package/knowledge/normal/define/index.d.ts +1 -0
  69. package/knowledge/normal/normal.knowledge.service.d.ts +49 -0
  70. package/knowledge/template.format.d.ts +6 -0
  71. package/knowledge/type.d.ts +28 -0
  72. package/knowledge.mjs +2856 -0
  73. package/knowledge.mjs.map +7 -0
  74. package/ocr/FileUtils.d.ts +4 -0
  75. package/ocr/ImageRaw.d.ts +11 -0
  76. package/ocr/index.d.ts +2 -0
  77. package/ocr/model-config.d.ts +8 -0
  78. package/ocr/ocr.d.ts +29 -0
  79. package/ocr.mjs +351 -0
  80. package/ocr.mjs.map +7 -0
  81. package/package.json +105 -0
  82. package/qdrant/index.d.ts +3 -0
  83. package/qdrant/qdrant-client.service.d.ts +396 -0
  84. package/qdrant/qdrant-server.service.d.ts +21 -0
  85. package/qdrant/type.d.ts +18 -0
  86. package/qdrant/util.d.ts +1 -0
  87. package/qdrant.mjs +274 -0
  88. package/qdrant.mjs.map +7 -0
  89. package/util/batch-queue.d.ts +6 -0
  90. package/util/cache-queue.d.ts +10 -0
  91. package/util/clone.d.ts +1 -0
  92. package/util/embedding-queue.d.ts +3 -0
  93. package/util/get-hash.d.ts +2 -0
  94. package/util/html-to-text/index.d.ts +5 -0
  95. package/util/index.d.ts +10 -0
  96. package/util/is-truthy.d.ts +1 -0
  97. package/util/log.service.d.ts +6 -0
  98. package/util/promise.d.ts +5 -0
  99. package/util/type.d.ts +1 -0
  100. package/util/uniq-object-key.d.ts +1 -0
  101. package/util.mjs +219 -0
  102. package/util.mjs.map +7 -0
  103. package/worker/custom-cache.d.ts +28 -0
  104. package/worker/ocr/index.d.ts +17 -0
  105. package/worker/ocr.mjs +75 -0
  106. package/worker/ocr.mjs.map +7 -0
  107. package/worker/reranker.mjs +180 -0
  108. package/worker/reranker.mjs.map +7 -0
  109. package/worker/set-transformers-config.d.ts +19 -0
  110. package/worker/text2vec/index.d.ts +9 -0
  111. package/worker/text2vec.mjs +194 -0
  112. package/worker/text2vec.mjs.map +7 -0
@@ -0,0 +1,68 @@
1
+ import * as v from 'valibot';
2
+ export declare const DictCollectionDefine: v.ObjectSchema<{
3
+ readonly collectionName: v.StringSchema<undefined>;
4
+ readonly embeddingTemplate: v.OptionalSchema<v.ObjectSchema<{
5
+ readonly entry: v.OptionalSchema<v.ObjectSchema<{
6
+ readonly enable: v.BooleanSchema<undefined>;
7
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
8
+ }, undefined>, undefined>;
9
+ }, undefined>, undefined>;
10
+ readonly size: v.NumberSchema<undefined>;
11
+ }, undefined>;
12
+ export declare const DictKnowledgeConfigDefine: v.SchemaWithPipe<readonly [v.ObjectSchema<{
13
+ readonly type: v.OptionalSchema<v.LiteralSchema<"dict", undefined>, "dict">;
14
+ readonly collectionList: v.ArraySchema<v.ObjectSchema<{
15
+ readonly collectionName: v.StringSchema<undefined>;
16
+ readonly embeddingTemplate: v.OptionalSchema<v.ObjectSchema<{
17
+ readonly entry: v.OptionalSchema<v.ObjectSchema<{
18
+ readonly enable: v.BooleanSchema<undefined>;
19
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
20
+ }, undefined>, undefined>;
21
+ }, undefined>, undefined>;
22
+ readonly size: v.NumberSchema<undefined>;
23
+ }, undefined>, undefined>;
24
+ /** Dictionary entry (headword) extraction */
25
+ readonly extractorWord: v.OptionalSchema<v.BooleanSchema<undefined>, undefined>;
26
+ /** Image recognition */
27
+ readonly useOcr: v.OptionalSchema<v.BooleanSchema<undefined>, undefined>;
28
+ readonly name: v.StringSchema<undefined>;
29
+ readonly activateCollection: v.StringSchema<undefined>;
30
+ }, undefined>, v.TransformAction<{
31
+ type: "dict";
32
+ collectionList: {
33
+ collectionName: string;
34
+ embeddingTemplate?: {
35
+ entry?: {
36
+ enable: boolean;
37
+ value?: string | undefined;
38
+ } | undefined;
39
+ } | undefined;
40
+ size: number;
41
+ }[];
42
+ extractorWord?: boolean | undefined;
43
+ useOcr?: boolean | undefined;
44
+ name: string;
45
+ activateCollection: string;
46
+ }, {
47
+ /** The activated normal knowledge base (file chunks) */
48
+ activateName: string;
49
+ type: "dict";
50
+ collectionList: {
51
+ collectionName: string;
52
+ embeddingTemplate?: {
53
+ entry?: {
54
+ enable: boolean;
55
+ value?: string | undefined;
56
+ } | undefined;
57
+ } | undefined;
58
+ size: number;
59
+ }[];
60
+ extractorWord?: boolean | undefined;
61
+ useOcr?: boolean | undefined;
62
+ name: string;
63
+ activateCollection: string;
64
+ }>]>;
65
+ export type DictKnowledgeConfig = v.InferInput<typeof DictKnowledgeConfigDefine>;
66
+ export type DictKnowledgeConfigInline = v.InferOutput<typeof DictKnowledgeConfigDefine>;
67
+ export type DictCollectionInput = v.InferInput<typeof DictCollectionDefine>;
68
+ export type DictCollectionInlineType = v.InferOutput<typeof DictCollectionDefine>;
@@ -0,0 +1 @@
1
+ export * from './config';
@@ -0,0 +1,67 @@
1
+ import { DictInput } from '@shenghuabi/knowledge/file-parser';
2
+ import { DictCollectionInlineType } from './define/config';
3
+ import { CommonKnowledgeService } from '../common/common.knowledge.service';
4
+ import { QueryOptions } from '../common/query';
5
+ export declare class DictKnowledgeService extends CommonKnowledgeService {
6
+ #private;
7
+ formatCollection(input: any): {
8
+ collectionName: string;
9
+ embeddingTemplate?: {
10
+ entry?: {
11
+ enable: boolean;
12
+ value?: string | undefined;
13
+ } | undefined;
14
+ } | undefined;
15
+ size: number;
16
+ };
17
+ /** Created only this one time; everything afterwards is an insert or an update */
18
+ create(collection: DictCollectionInlineType): Promise<void>;
19
+ importDict(input: DictInput): Promise<number>;
20
+ addCollection(collection: DictCollectionInlineType): Promise<void>;
21
+ deleteCollection(collectionName: string): Promise<boolean>;
22
+ changeActivateCollection(collectionName: string): Promise<void>;
23
+ export(): Promise<{
24
+ collection: string;
25
+ name?: string | undefined;
26
+ creation_time?: string | null | undefined;
27
+ size?: number | undefined;
28
+ checksum?: string | null | undefined;
29
+ }[]>;
30
+ destroy(): Promise<void>;
31
+ searchWord(text: string, options: QueryOptions): Promise<{
32
+ id: string | number;
33
+ version: number;
34
+ score: number;
35
+ payload?: Record<string, unknown> | {
36
+ [key: string]: unknown;
37
+ } | null | undefined;
38
+ vector?: Record<string, unknown> | number[] | number[][] | {
39
+ [key: string]: number[] | number[][] | {
40
+ indices: number[];
41
+ values: number[];
42
+ } | undefined;
43
+ } | null | undefined;
44
+ shard_key?: string | number | Record<string, unknown> | null | undefined;
45
+ order_value?: number | Record<string, unknown> | null | undefined;
46
+ }[]>;
47
+ /** Used as an ordinary database */
48
+ matchWord(text: string, options: {
49
+ limit: number;
50
+ }): Promise<{
51
+ points: {
52
+ id: string | number;
53
+ payload?: Record<string, unknown> | {
54
+ [key: string]: unknown;
55
+ } | null | undefined;
56
+ vector?: Record<string, unknown> | number[] | number[][] | {
57
+ [key: string]: number[] | number[][] | {
58
+ indices: number[];
59
+ values: number[];
60
+ } | undefined;
61
+ } | null | undefined;
62
+ shard_key?: string | number | Record<string, unknown> | null | undefined;
63
+ order_value?: number | Record<string, unknown> | null | undefined;
64
+ }[];
65
+ next_page_offset?: string | number | Record<string, unknown> | null | undefined;
66
+ }>;
67
+ }
@@ -0,0 +1,20 @@
1
+ import { InjectionToken } from 'static-injector';
2
+ import { EntityExtractType } from './define/define';
3
+ import { FileChunkPayload } from '../common/define/chunk';
4
+ export type ContentParserFn = {
5
+ parse: (item: FileChunkPayload, signal?: AbortSignal) => Promise<EntityExtractType>;
6
+ };
7
+ export declare const ContentParserToken: InjectionToken<ContentParserFn>;
8
+ export interface QueryParams {
9
+ lengthLimit: {
10
+ chunk: number;
11
+ node: number;
12
+ nodeDescription: number;
13
+ edge: number;
14
+ };
15
+ topK: number;
16
+ }
17
+ export declare const QueryParamsToken: InjectionToken<QueryParams>;
18
+ export type RagChatFn = (data: Record<string, any>) => Promise<string>;
19
+ export declare const RagChatToken: InjectionToken<RagChatFn>;
20
+ export declare const CHAT_INPUT = "$$INPUT$$";
@@ -0,0 +1,169 @@
1
+ import * as v from 'valibot';
2
+ export declare const GraphCollectionDefine: v.SchemaWithPipe<readonly [v.ObjectSchema<{
3
+ readonly collectionName: v.StringSchema<undefined>;
4
+ readonly size: v.NumberSchema<undefined>;
5
+ readonly embeddingTemplate: v.OptionalSchema<v.ObjectSchema<{
6
+ readonly entry: v.OptionalSchema<v.ObjectSchema<{
7
+ readonly enable: v.BooleanSchema<undefined>;
8
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
9
+ }, undefined>, undefined>;
10
+ readonly node: v.OptionalSchema<v.ObjectSchema<{
11
+ readonly enable: v.BooleanSchema<undefined>;
12
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
13
+ }, undefined>, undefined>;
14
+ readonly edge: v.OptionalSchema<v.ObjectSchema<{
15
+ readonly enable: v.BooleanSchema<undefined>;
16
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
17
+ }, undefined>, undefined>;
18
+ }, undefined>, undefined>;
19
+ }, undefined>, v.TransformAction<{
20
+ collectionName: string;
21
+ size: number;
22
+ embeddingTemplate?: {
23
+ entry?: {
24
+ enable: boolean;
25
+ value?: string | undefined;
26
+ } | undefined;
27
+ node?: {
28
+ enable: boolean;
29
+ value?: string | undefined;
30
+ } | undefined;
31
+ edge?: {
32
+ enable: boolean;
33
+ value?: string | undefined;
34
+ } | undefined;
35
+ } | undefined;
36
+ }, {
37
+ graphCollectionName: string;
38
+ collectionName: string;
39
+ size: number;
40
+ embeddingTemplate?: {
41
+ entry?: {
42
+ enable: boolean;
43
+ value?: string | undefined;
44
+ } | undefined;
45
+ node?: {
46
+ enable: boolean;
47
+ value?: string | undefined;
48
+ } | undefined;
49
+ edge?: {
50
+ enable: boolean;
51
+ value?: string | undefined;
52
+ } | undefined;
53
+ } | undefined;
54
+ }>]>;
55
+ export declare const GraphKnowledgeConfigDefine: v.SchemaWithPipe<readonly [v.ObjectSchema<{
56
+ readonly type: v.OptionalSchema<v.LiteralSchema<"normal-graph", undefined>, "normal-graph">;
57
+ readonly maxChunkAsync: v.NumberSchema<undefined>;
58
+ readonly collectionList: v.ArraySchema<v.SchemaWithPipe<readonly [v.ObjectSchema<{
59
+ readonly collectionName: v.StringSchema<undefined>;
60
+ readonly size: v.NumberSchema<undefined>;
61
+ readonly embeddingTemplate: v.OptionalSchema<v.ObjectSchema<{
62
+ readonly entry: v.OptionalSchema<v.ObjectSchema<{
63
+ readonly enable: v.BooleanSchema<undefined>;
64
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
65
+ }, undefined>, undefined>;
66
+ readonly node: v.OptionalSchema<v.ObjectSchema<{
67
+ readonly enable: v.BooleanSchema<undefined>;
68
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
69
+ }, undefined>, undefined>;
70
+ readonly edge: v.OptionalSchema<v.ObjectSchema<{
71
+ readonly enable: v.BooleanSchema<undefined>;
72
+ readonly value: v.OptionalSchema<v.StringSchema<undefined>, undefined>;
73
+ }, undefined>, undefined>;
74
+ }, undefined>, undefined>;
75
+ }, undefined>, v.TransformAction<{
76
+ collectionName: string;
77
+ size: number;
78
+ embeddingTemplate?: {
79
+ entry?: {
80
+ enable: boolean;
81
+ value?: string | undefined;
82
+ } | undefined;
83
+ node?: {
84
+ enable: boolean;
85
+ value?: string | undefined;
86
+ } | undefined;
87
+ edge?: {
88
+ enable: boolean;
89
+ value?: string | undefined;
90
+ } | undefined;
91
+ } | undefined;
92
+ }, {
93
+ graphCollectionName: string;
94
+ collectionName: string;
95
+ size: number;
96
+ embeddingTemplate?: {
97
+ entry?: {
98
+ enable: boolean;
99
+ value?: string | undefined;
100
+ } | undefined;
101
+ node?: {
102
+ enable: boolean;
103
+ value?: string | undefined;
104
+ } | undefined;
105
+ edge?: {
106
+ enable: boolean;
107
+ value?: string | undefined;
108
+ } | undefined;
109
+ } | undefined;
110
+ }>]>, undefined>;
111
+ readonly name: v.StringSchema<undefined>;
112
+ readonly activateCollection: v.StringSchema<undefined>;
113
+ }, undefined>, v.TransformAction<{
114
+ type: "normal-graph";
115
+ maxChunkAsync: number;
116
+ collectionList: {
117
+ graphCollectionName: string;
118
+ collectionName: string;
119
+ size: number;
120
+ embeddingTemplate?: {
121
+ entry?: {
122
+ enable: boolean;
123
+ value?: string | undefined;
124
+ } | undefined;
125
+ node?: {
126
+ enable: boolean;
127
+ value?: string | undefined;
128
+ } | undefined;
129
+ edge?: {
130
+ enable: boolean;
131
+ value?: string | undefined;
132
+ } | undefined;
133
+ } | undefined;
134
+ }[];
135
+ name: string;
136
+ activateCollection: string;
137
+ }, {
138
+ /** The activated normal knowledge base (file chunks) */
139
+ activateName: string;
140
+ /** The activated graph database */
141
+ activateGraphName: string;
142
+ type: "normal-graph";
143
+ maxChunkAsync: number;
144
+ collectionList: {
145
+ graphCollectionName: string;
146
+ collectionName: string;
147
+ size: number;
148
+ embeddingTemplate?: {
149
+ entry?: {
150
+ enable: boolean;
151
+ value?: string | undefined;
152
+ } | undefined;
153
+ node?: {
154
+ enable: boolean;
155
+ value?: string | undefined;
156
+ } | undefined;
157
+ edge?: {
158
+ enable: boolean;
159
+ value?: string | undefined;
160
+ } | undefined;
161
+ } | undefined;
162
+ }[];
163
+ name: string;
164
+ activateCollection: string;
165
+ }>]>;
166
+ export type GraphKnowledgeConfig = v.InferInput<typeof GraphKnowledgeConfigDefine>;
167
+ export type GraphKnowledgeConfigInline = v.InferOutput<typeof GraphKnowledgeConfigDefine>;
168
+ export type GraphCollectionInput = v.InferInput<typeof GraphCollectionDefine>;
169
+ export type GraphCollectionInlineType = v.InferOutput<typeof GraphCollectionDefine>;