@databio/gtars 0.5.2 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/gtars_js.d.ts CHANGED
@@ -1,146 +1,377 @@
1
1
  /* tslint:disable */
2
2
  /* eslint-disable */
3
- export function greet(name: string): void;
3
+
4
+ export class BedClassificationOutput {
5
+ private constructor();
6
+ free(): void;
7
+ [Symbol.dispose](): void;
8
+ readonly bed_compliance: string;
9
+ readonly compliant_columns: number;
10
+ readonly data_format: string;
11
+ readonly non_compliant_columns: number;
12
+ }
13
+
4
14
  export class ChromosomeStatistics {
5
- private constructor();
6
- free(): void;
7
- [Symbol.dispose](): void;
8
- readonly chromosome: string;
9
- readonly start_nucleotide_position: number;
10
- readonly end_nucleotide_position: number;
11
- readonly number_of_regions: number;
12
- readonly minimum_region_length: number;
13
- readonly maximum_region_length: number;
14
- readonly mean_region_length: number;
15
- readonly median_region_length: number;
15
+ private constructor();
16
+ free(): void;
17
+ [Symbol.dispose](): void;
18
+ readonly chromosome: string;
19
+ readonly end_nucleotide_position: number;
20
+ readonly maximum_region_length: number;
21
+ readonly mean_region_length: number;
22
+ readonly median_region_length: number;
23
+ readonly minimum_region_length: number;
24
+ readonly number_of_regions: number;
25
+ readonly start_nucleotide_position: number;
16
26
  }
27
+
17
28
  export class Overlapper {
18
- free(): void;
19
- [Symbol.dispose](): void;
20
- constructor(universe: any, backend: string);
21
- get_backend(): string;
22
- find(regions: any): any;
29
+ free(): void;
30
+ [Symbol.dispose](): void;
31
+ find(regions: any): any;
32
+ get_backend(): string;
33
+ constructor(universe: any, backend: string);
23
34
  }
35
+
24
36
  export class RegionDistribution {
25
- private constructor();
26
- free(): void;
27
- [Symbol.dispose](): void;
37
+ private constructor();
38
+ free(): void;
39
+ [Symbol.dispose](): void;
28
40
  }
41
+
29
42
  export class RegionSet {
30
- free(): void;
31
- [Symbol.dispose](): void;
32
- constructor(regions: any);
33
- chromosomeStatistics(): any;
34
- regionDistribution(n_bins: number): any;
35
- readonly numberOfRegions: number;
36
- readonly meanRegionWidth: number;
37
- readonly nucleotidesLength: number;
38
- readonly identifier: string;
43
+ free(): void;
44
+ [Symbol.dispose](): void;
45
+ chromosomeStatistics(): any;
46
+ constructor(regions: any);
47
+ regionDistribution(n_bins: number): any;
48
+ readonly classify: BedClassificationOutput;
49
+ readonly firstRegion: string;
50
+ readonly identifier: string;
51
+ readonly meanRegionWidth: number;
52
+ readonly nucleotidesLength: number;
53
+ readonly numberOfRegions: number;
39
54
  }
55
+
40
56
  export class Tokenizer {
41
- free(): void;
42
- [Symbol.dispose](): void;
43
- constructor(universe: any, backend: string);
44
- tokenize(regions: any): any;
45
- encode(tokens: any): any;
46
- decode(ids: any): any;
47
- specialTokensMap(): any;
48
- getVocab(): any;
49
- readonly unkToken: string;
50
- readonly padToken: string;
51
- readonly maskToken: string;
52
- readonly clsToken: string;
53
- readonly bosToken: string;
54
- readonly eosToken: string;
55
- readonly sepToken: string;
56
- readonly padTokenId: number;
57
- readonly maskTokenId: number;
58
- readonly clsTokenId: number;
59
- readonly bosTokenId: number;
60
- readonly eosTokenId: number;
61
- readonly sepTokenId: number;
62
- readonly unkTokenId: number;
63
- readonly vocabSize: number;
64
- readonly length: number;
57
+ free(): void;
58
+ [Symbol.dispose](): void;
59
+ decode(ids: any): any;
60
+ encode(tokens: any): any;
61
+ getVocab(): any;
62
+ constructor(universe: any, backend: string);
63
+ specialTokensMap(): any;
64
+ tokenize(regions: any): any;
65
+ readonly bosToken: string;
66
+ readonly bosTokenId: number;
67
+ readonly clsToken: string;
68
+ readonly clsTokenId: number;
69
+ readonly eosToken: string;
70
+ readonly eosTokenId: number;
71
+ readonly length: number;
72
+ readonly maskToken: string;
73
+ readonly maskTokenId: number;
74
+ readonly padToken: string;
75
+ readonly padTokenId: number;
76
+ readonly sepToken: string;
77
+ readonly sepTokenId: number;
78
+ readonly unkToken: string;
79
+ readonly unkTokenId: number;
80
+ readonly vocabSize: number;
65
81
  }
66
82
 
83
+ /**
84
+ * Canonicalize a JSON string according to RFC-8785.
85
+ *
86
+ * This is useful for computing digests of JSON objects in a deterministic way.
87
+ *
88
+ * # Arguments
89
+ * * `json_str` - A JSON string
90
+ *
91
+ * # Returns
92
+ * The canonicalized JSON string
93
+ */
94
+ export function canonicalizeJsonString(json_str: string): string;
95
+
96
+ /**
97
+ * Compute the MD5 digest of a string.
98
+ *
99
+ * Low-level function that does NOT uppercase the input.
100
+ *
101
+ * # Arguments
102
+ * * `input` - The input string
103
+ *
104
+ * # Returns
105
+ * The MD5 digest as a hex string
106
+ */
107
+ export function computeMd5(input: string): string;
108
+
109
+ /**
110
+ * Compute the sha512t24u digest of a string.
111
+ *
112
+ * This is a low-level function that computes the GA4GH standard digest
113
+ * of arbitrary input. Unlike `sequence_digest`, this does NOT uppercase
114
+ * the input.
115
+ *
116
+ * # Arguments
117
+ * * `input` - The input string
118
+ *
119
+ * # Returns
120
+ * The sha512t24u digest string (base64url encoded)
121
+ */
122
+ export function computeSha512t24u(input: string): string;
123
+
124
+ /**
125
+ * Compute a seqcol (sequence collection) digest from FASTA content.
126
+ *
127
+ * This function takes FASTA file content as bytes and returns a JSON object
128
+ * containing the sequence collection digest and metadata. Automatically handles
129
+ * gzip-compressed FASTA files.
130
+ *
131
+ * # Arguments
132
+ * * `fasta_content` - The FASTA file content as a Uint8Array (supports gzip)
133
+ *
134
+ * # Returns
135
+ * A JavaScript object containing:
136
+ * - `digest`: The top-level seqcol digest
137
+ * - `names_digest`: Level 1 digest of sequence names
138
+ * - `sequences_digest`: Level 1 digest of sequence digests
139
+ * - `lengths_digest`: Level 1 digest of sequence lengths
140
+ * - `n_sequences`: Number of sequences
141
+ * - `sequences`: Array of sequence metadata objects
142
+ *
143
+ * # Example (JavaScript)
144
+ * ```javascript
145
+ * const fastaContent = new TextEncoder().encode(">chr1\nACGT\n");
146
+ * const result = digestSeqcol(fastaContent);
147
+ * console.log(result.digest); // Top-level seqcol digest
148
+ * ```
149
+ */
150
+ export function digestSeqcol(fasta_content: Uint8Array): any;
151
+
152
+ /**
153
+ * Finalize the hasher and return the results.
154
+ *
155
+ * This consumes the hasher and frees its resources.
156
+ * After calling this, the handle is no longer valid.
157
+ *
158
+ * # Arguments
159
+ * * `handle` - The hasher handle from `fastaHasherNew()`
160
+ *
161
+ * # Returns
162
+ * A JavaScript object with the sequence collection result,
163
+ * or an error if the handle is invalid.
164
+ *
165
+ * # Example (JavaScript)
166
+ * ```javascript
167
+ * const handle = fastaHasherNew();
168
+ * fastaHasherUpdate(handle, fastaData);
169
+ * const result = fastaHasherFinish(handle);
170
+ * console.log(result.digest);
171
+ * ```
172
+ */
173
+ export function fastaHasherFinish(handle: number): any;
174
+
175
+ /**
176
+ * Free a hasher without getting results.
177
+ *
178
+ * Use this if you need to cancel processing early.
179
+ * After calling this, the handle is no longer valid.
180
+ *
181
+ * # Arguments
182
+ * * `handle` - The hasher handle from `fastaHasherNew()`
183
+ *
184
+ * # Returns
185
+ * `true` if the handle was valid and freed, `false` otherwise.
186
+ */
187
+ export function fastaHasherFree(handle: number): boolean;
188
+
189
+ /**
190
+ * Create a new streaming FASTA hasher.
191
+ *
192
+ * Returns a handle (u32) that must be used in subsequent calls.
193
+ * The handle must be freed with `fastaHasherFinish()` or `fastaHasherFree()`.
194
+ *
195
+ * # Returns
196
+ * A handle ID (always > 0).
197
+ *
198
+ * # Example (JavaScript)
199
+ * ```javascript
200
+ * const handle = fastaHasherNew();
201
+ * // ... use handle with fastaHasherUpdate ...
202
+ * const result = fastaHasherFinish(handle);
203
+ * ```
204
+ */
205
+ export function fastaHasherNew(): number;
206
+
207
+ /**
208
+ * Get the current progress of a streaming hasher.
209
+ *
210
+ * # Arguments
211
+ * * `handle` - The hasher handle from `fastaHasherNew()`
212
+ *
213
+ * # Returns
214
+ * A JavaScript object with progress information, or null if handle is invalid.
215
+ * The object contains:
216
+ * - `completed_sequences`: Number of fully processed sequences
217
+ * - `current_sequence_name`: Name of sequence being processed (if any)
218
+ * - `current_sequence_length`: Length of sequence being processed
219
+ */
220
+ export function fastaHasherProgress(handle: number): any;
221
+
222
+ /**
223
+ * Process a chunk of FASTA data.
224
+ *
225
+ * This can be called multiple times with successive chunks.
226
+ * Handles both plain text and gzip-compressed FASTA.
227
+ *
228
+ * # Arguments
229
+ * * `handle` - The hasher handle from `fastaHasherNew()`
230
+ * * `chunk` - A chunk of FASTA data as Uint8Array
231
+ *
232
+ * # Returns
233
+ * Ok on success, or an error with details about what went wrong.
234
+ *
235
+ * # Example (JavaScript)
236
+ * ```javascript
237
+ * const handle = fastaHasherNew();
238
+ * fastaHasherUpdate(handle, new TextEncoder().encode(">chr1\nACGT"));
239
+ * fastaHasherUpdate(handle, new TextEncoder().encode("\n>chr2\nTGCA\n"));
240
+ * ```
241
+ */
242
+ export function fastaHasherUpdate(handle: number, chunk: Uint8Array): void;
243
+
244
+ export function greet(name: string): void;
245
+
246
+ /**
247
+ * Compute a sequence digest (sha512t24u) from raw sequence data.
248
+ *
249
+ * This is the GA4GH standard digest for sequences. The sequence is uppercased
250
+ * before computing the digest.
251
+ *
252
+ * # Arguments
253
+ * * `sequence` - The sequence string (A, C, G, T, etc.)
254
+ *
255
+ * # Returns
256
+ * The sha512t24u digest string (base64url encoded)
257
+ *
258
+ * # Example (JavaScript)
259
+ * ```javascript
260
+ * const digest = sequenceDigest("ACGT");
261
+ * console.log(digest); // "aKF498dAxcJAqme6QYQ7EZ07-fiw8Kw2"
262
+ * ```
263
+ */
264
+ export function sequenceDigest(sequence: string): string;
265
+
266
+ /**
267
+ * Compute an MD5 digest from raw sequence data.
268
+ *
269
+ * The sequence is uppercased before computing the digest.
270
+ *
271
+ * # Arguments
272
+ * * `sequence` - The sequence string
273
+ *
274
+ * # Returns
275
+ * The MD5 digest as a hex string
276
+ */
277
+ export function sequenceMd5(sequence: string): string;
278
+
67
279
  export type InitInput = RequestInfo | URL | Response | BufferSource | WebAssembly.Module;
68
280
 
69
281
  export interface InitOutput {
70
- readonly memory: WebAssembly.Memory;
71
- readonly __wbg_tokenizer_free: (a: number, b: number) => void;
72
- readonly tokenizer_new: (a: any, b: number, c: number) => [number, number, number];
73
- readonly tokenizer_tokenize: (a: number, b: any) => [number, number, number];
74
- readonly tokenizer_encode: (a: number, b: any) => [number, number, number];
75
- readonly tokenizer_decode: (a: number, b: any) => [number, number, number];
76
- readonly tokenizer_unkToken: (a: number) => [number, number];
77
- readonly tokenizer_padToken: (a: number) => [number, number];
78
- readonly tokenizer_maskToken: (a: number) => [number, number];
79
- readonly tokenizer_clsToken: (a: number) => [number, number];
80
- readonly tokenizer_bosToken: (a: number) => [number, number];
81
- readonly tokenizer_eosToken: (a: number) => [number, number];
82
- readonly tokenizer_sepToken: (a: number) => [number, number];
83
- readonly tokenizer_padTokenId: (a: number) => number;
84
- readonly tokenizer_maskTokenId: (a: number) => number;
85
- readonly tokenizer_clsTokenId: (a: number) => number;
86
- readonly tokenizer_bosTokenId: (a: number) => number;
87
- readonly tokenizer_eosTokenId: (a: number) => number;
88
- readonly tokenizer_sepTokenId: (a: number) => number;
89
- readonly tokenizer_unkTokenId: (a: number) => number;
90
- readonly tokenizer_specialTokensMap: (a: number) => [number, number, number];
91
- readonly tokenizer_getVocab: (a: number) => [number, number, number];
92
- readonly tokenizer_length: (a: number) => number;
93
- readonly tokenizer_vocabSize: (a: number) => number;
94
- readonly __wbg_chromosomestatistics_free: (a: number, b: number) => void;
95
- readonly chromosomestatistics_chromosome: (a: number) => [number, number];
96
- readonly chromosomestatistics_start_nucleotide_position: (a: number) => number;
97
- readonly chromosomestatistics_end_nucleotide_position: (a: number) => number;
98
- readonly chromosomestatistics_number_of_regions: (a: number) => number;
99
- readonly chromosomestatistics_minimum_region_length: (a: number) => number;
100
- readonly chromosomestatistics_maximum_region_length: (a: number) => number;
101
- readonly chromosomestatistics_mean_region_length: (a: number) => number;
102
- readonly chromosomestatistics_median_region_length: (a: number) => number;
103
- readonly __wbg_regiondistribution_free: (a: number, b: number) => void;
104
- readonly __wbg_regionset_free: (a: number, b: number) => void;
105
- readonly regionset_new: (a: any) => [number, number, number];
106
- readonly regionset_numberOfRegions: (a: number) => number;
107
- readonly regionset_meanRegionWidth: (a: number) => number;
108
- readonly regionset_nucleotidesLength: (a: number) => number;
109
- readonly regionset_identifier: (a: number) => [number, number];
110
- readonly regionset_chromosomeStatistics: (a: number) => [number, number, number];
111
- readonly regionset_regionDistribution: (a: number, b: number) => [number, number, number];
112
- readonly __wbg_overlapper_free: (a: number, b: number) => void;
113
- readonly overlapper_new: (a: any, b: number, c: number) => [number, number, number];
114
- readonly overlapper_get_backend: (a: number) => [number, number];
115
- readonly overlapper_find: (a: number, b: any) => [number, number, number];
116
- readonly greet: (a: number, b: number) => void;
117
- readonly __wbindgen_malloc: (a: number, b: number) => number;
118
- readonly __wbindgen_realloc: (a: number, b: number, c: number, d: number) => number;
119
- readonly __wbindgen_exn_store: (a: number) => void;
120
- readonly __externref_table_alloc: () => number;
121
- readonly __wbindgen_externrefs: WebAssembly.Table;
122
- readonly __externref_table_dealloc: (a: number) => void;
123
- readonly __wbindgen_free: (a: number, b: number, c: number) => void;
124
- readonly __wbindgen_start: () => void;
282
+ readonly memory: WebAssembly.Memory;
283
+ readonly greet: (a: number, b: number) => void;
284
+ readonly canonicalizeJsonString: (a: number, b: number) => [number, number, number, number];
285
+ readonly computeMd5: (a: number, b: number) => [number, number];
286
+ readonly computeSha512t24u: (a: number, b: number) => [number, number];
287
+ readonly digestSeqcol: (a: number, b: number) => [number, number, number];
288
+ readonly fastaHasherFinish: (a: number) => [number, number, number];
289
+ readonly fastaHasherFree: (a: number) => number;
290
+ readonly fastaHasherNew: () => number;
291
+ readonly fastaHasherProgress: (a: number) => [number, number, number];
292
+ readonly fastaHasherUpdate: (a: number, b: number, c: number) => [number, number];
293
+ readonly sequenceDigest: (a: number, b: number) => [number, number];
294
+ readonly sequenceMd5: (a: number, b: number) => [number, number];
295
+ readonly __wbg_bedclassificationoutput_free: (a: number, b: number) => void;
296
+ readonly __wbg_chromosomestatistics_free: (a: number, b: number) => void;
297
+ readonly __wbg_regiondistribution_free: (a: number, b: number) => void;
298
+ readonly __wbg_regionset_free: (a: number, b: number) => void;
299
+ readonly bedclassificationoutput_bed_compliance: (a: number) => [number, number];
300
+ readonly bedclassificationoutput_compliant_columns: (a: number) => number;
301
+ readonly bedclassificationoutput_data_format: (a: number) => [number, number];
302
+ readonly bedclassificationoutput_non_compliant_columns: (a: number) => number;
303
+ readonly chromosomestatistics_chromosome: (a: number) => [number, number];
304
+ readonly chromosomestatistics_end_nucleotide_position: (a: number) => number;
305
+ readonly chromosomestatistics_maximum_region_length: (a: number) => number;
306
+ readonly chromosomestatistics_mean_region_length: (a: number) => number;
307
+ readonly chromosomestatistics_median_region_length: (a: number) => number;
308
+ readonly chromosomestatistics_number_of_regions: (a: number) => number;
309
+ readonly chromosomestatistics_start_nucleotide_position: (a: number) => number;
310
+ readonly regionset_chromosomeStatistics: (a: number) => [number, number, number];
311
+ readonly regionset_classify: (a: number) => number;
312
+ readonly regionset_firstRegion: (a: number) => [number, number];
313
+ readonly regionset_identifier: (a: number) => [number, number];
314
+ readonly regionset_meanRegionWidth: (a: number) => number;
315
+ readonly regionset_new: (a: any) => [number, number, number];
316
+ readonly regionset_nucleotidesLength: (a: number) => number;
317
+ readonly regionset_numberOfRegions: (a: number) => number;
318
+ readonly regionset_regionDistribution: (a: number, b: number) => [number, number, number];
319
+ readonly chromosomestatistics_minimum_region_length: (a: number) => number;
320
+ readonly __wbg_tokenizer_free: (a: number, b: number) => void;
321
+ readonly tokenizer_bosToken: (a: number) => [number, number];
322
+ readonly tokenizer_bosTokenId: (a: number) => number;
323
+ readonly tokenizer_clsToken: (a: number) => [number, number];
324
+ readonly tokenizer_clsTokenId: (a: number) => number;
325
+ readonly tokenizer_decode: (a: number, b: any) => [number, number, number];
326
+ readonly tokenizer_encode: (a: number, b: any) => [number, number, number];
327
+ readonly tokenizer_eosToken: (a: number) => [number, number];
328
+ readonly tokenizer_eosTokenId: (a: number) => number;
329
+ readonly tokenizer_getVocab: (a: number) => [number, number, number];
330
+ readonly tokenizer_length: (a: number) => number;
331
+ readonly tokenizer_maskToken: (a: number) => [number, number];
332
+ readonly tokenizer_maskTokenId: (a: number) => number;
333
+ readonly tokenizer_new: (a: any, b: number, c: number) => [number, number, number];
334
+ readonly tokenizer_padToken: (a: number) => [number, number];
335
+ readonly tokenizer_padTokenId: (a: number) => number;
336
+ readonly tokenizer_sepToken: (a: number) => [number, number];
337
+ readonly tokenizer_sepTokenId: (a: number) => number;
338
+ readonly tokenizer_specialTokensMap: (a: number) => [number, number, number];
339
+ readonly tokenizer_tokenize: (a: number, b: any) => [number, number, number];
340
+ readonly tokenizer_unkToken: (a: number) => [number, number];
341
+ readonly tokenizer_unkTokenId: (a: number) => number;
342
+ readonly tokenizer_vocabSize: (a: number) => number;
343
+ readonly __wbg_overlapper_free: (a: number, b: number) => void;
344
+ readonly overlapper_find: (a: number, b: any) => [number, number, number];
345
+ readonly overlapper_get_backend: (a: number) => [number, number];
346
+ readonly overlapper_new: (a: any, b: number, c: number) => [number, number, number];
347
+ readonly __wbindgen_malloc: (a: number, b: number) => number;
348
+ readonly __wbindgen_realloc: (a: number, b: number, c: number, d: number) => number;
349
+ readonly __wbindgen_exn_store: (a: number) => void;
350
+ readonly __externref_table_alloc: () => number;
351
+ readonly __wbindgen_externrefs: WebAssembly.Table;
352
+ readonly __wbindgen_free: (a: number, b: number, c: number) => void;
353
+ readonly __externref_table_dealloc: (a: number) => void;
354
+ readonly __wbindgen_start: () => void;
125
355
  }
126
356
 
127
357
  export type SyncInitInput = BufferSource | WebAssembly.Module;
358
+
128
359
  /**
129
- * Instantiates the given `module`, which can either be bytes or
130
- * a precompiled `WebAssembly.Module`.
131
- *
132
- * @param {{ module: SyncInitInput }} module - Passing `SyncInitInput` directly is deprecated.
133
- *
134
- * @returns {InitOutput}
135
- */
360
+ * Instantiates the given `module`, which can either be bytes or
361
+ * a precompiled `WebAssembly.Module`.
362
+ *
363
+ * @param {{ module: SyncInitInput }} module - Passing `SyncInitInput` directly is deprecated.
364
+ *
365
+ * @returns {InitOutput}
366
+ */
136
367
  export function initSync(module: { module: SyncInitInput } | SyncInitInput): InitOutput;
137
368
 
138
369
  /**
139
- * If `module_or_path` is {RequestInfo} or {URL}, makes a request and
140
- * for everything else, calls `WebAssembly.instantiate` directly.
141
- *
142
- * @param {{ module_or_path: InitInput | Promise<InitInput> }} module_or_path - Passing `InitInput` directly is deprecated.
143
- *
144
- * @returns {Promise<InitOutput>}
145
- */
370
+ * If `module_or_path` is {RequestInfo} or {URL}, makes a request and
371
+ * for everything else, calls `WebAssembly.instantiate` directly.
372
+ *
373
+ * @param {{ module_or_path: InitInput | Promise<InitInput> }} module_or_path - Passing `InitInput` directly is deprecated.
374
+ *
375
+ * @returns {Promise<InitOutput>}
376
+ */
146
377
  export default function __wbg_init (module_or_path?: { module_or_path: InitInput | Promise<InitInput> } | InitInput | Promise<InitInput>): Promise<InitOutput>;