@datagrok-libraries/bio 0.0.4 → 0.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,38 @@
1
+ export class SeqPaletteBase {
2
+ static makePalette(dt, simplified = false) {
3
+ const palette = {};
4
+ dt.forEach((cp) => {
5
+ const objList = cp[0];
6
+ const colour = cp[1];
7
+ objList.forEach((obj, ind) => {
8
+ palette[obj] = this.colourPalette[colour][simplified ? 0 : ind];
9
+ });
10
+ });
11
+ return palette;
12
+ }
13
+ }
14
+ /** Palette with shades of primary colors
15
+ */
16
+ SeqPaletteBase.colourPalette = {
17
+ 'orange': ['rgb(255,187,120)', 'rgb(245,167,100)', 'rgb(235,137,70)', 'rgb(205, 111, 71)'],
18
+ 'all_green': ['rgb(44,160,44)', 'rgb(74,160,74)', 'rgb(23,103,57)', 'rgb(30,110,96)', 'rgb(60,131,95)',
19
+ 'rgb(24,110,79)', 'rgb(152,223,138)', 'rgb(182, 223, 138)', 'rgb(152, 193, 138)'],
20
+ 'all_blue': ['rgb(31,119,180)', 'rgb(23,190,207)', 'rgb(122, 102, 189)', 'rgb(158,218,229)', 'rgb(141, 124, 217)',
21
+ 'rgb(31, 120, 150)'],
22
+ 'magenta': ['rgb(162,106,192)', 'rgb(197,165,224)', 'rgb(208,113,218)'],
23
+ 'red': ['rgb(214,39,40)', 'rgb(255,152,150)'],
24
+ 'st_blue': ['rgb(23,190,207)', 'rgb(158,218,229)', 'rgb(31,119,180)'],
25
+ 'dark_blue': ['rgb(31,119,180)', 'rgb(31, 120, 150)'],
26
+ 'light_blue': ['rgb(23,190,207)', 'rgb(158,218,229)', 'rgb(108, 218, 229)', 'rgb(23,190,227)'],
27
+ 'lilac_blue': ['rgb(124,102,211)', 'rgb(149,134,217)', 'rgb(97, 81, 150)'],
28
+ 'dark_green': ['rgb(23,103,57)', 'rgb(30,110,96)', 'rgb(60,131,95)', 'rgb(24,110,79)'],
29
+ 'green': ['rgb(44,160,44)', 'rgb(74,160,74)'],
30
+ 'light_green': ['rgb(152,223,138)', 'rgb(182, 223, 138)', 'rgb(152, 193, 138)'],
31
+ 'st_green': ['rgb(44,160,44)', 'rgb(152,223,138)', 'rgb(39, 174, 96)', 'rgb(74,160,74)'],
32
+ 'pink': ['rgb(247,182,210)'],
33
+ 'brown': ['rgb(140,86,75)', 'rgb(102, 62, 54)'],
34
+ 'gray': ['rgb(127,127,127)', 'rgb(199,199,199)', 'rgb(196,156,148)', 'rgb(222, 222, 180)'],
35
+ 'yellow': ['rgb(188,189,34)'],
36
+ 'white': ['rgb(230,230,230)'],
37
+ };
38
+ //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoic2VxLXBhbGV0dGVzLmpzIiwic291cmNlUm9vdCI6IiIsInNvdXJjZXMiOlsic2VxLXBhbGV0dGVzLnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiJBQVlBLE1BQU0sT0FBTyxjQUFjO0lBMEJmLE1BQU0sQ0FBQyxXQUFXLENBQUMsRUFBd0IsRUFBRSxVQUFVLEdBQUcsS0FBSztRQUN2RSxNQUFNLE9BQU8sR0FBOEIsRUFBRSxDQUFDO1FBQzlDLEVBQUUsQ0FBQyxPQUFPLENBQUMsQ0FBQyxFQUFFLEVBQUUsRUFBRTtZQUNoQixNQUFNLE9BQU8sR0FBRyxFQUFFLENBQUMsQ0FBQyxDQUFDLENBQUM7WUFDdEIsTUFBTSxNQUFNLEdBQUcsRUFBRSxDQUFDLENBQUMsQ0FBQyxDQUFDO1lBQ3JCLE9BQU8sQ0FBQyxPQUFPLENBQUMsQ0FBQyxHQUFHLEVBQUUsR0FBRyxFQUFFLEVBQUU7Z0JBQzNCLE9BQU8sQ0FBQyxHQUFHLENBQUMsR0FBRyxJQUFJLENBQUMsYUFBYSxDQUFDLE1BQU0sQ0FBQyxDQUFDLFVBQVUsQ0FBQyxDQUFDLENBQUMsQ0FBQyxDQUFDLENBQUMsQ0FBQyxHQUFHLENBQUMsQ0FBQztZQUNsRSxDQUFDLENBQUMsQ0FBQztRQUNMLENBQUMsQ0FBQyxDQUFDO1FBQ0gsT0FBTyxPQUFPLENBQUM7SUFDakIsQ0FBQzs7QUFuQ0Q7R0FDRztBQUNZLDRCQUFhLEdBQWdDO0lBQzFELFFBQVEsRUFBRSxDQUFDLGtCQUFrQixFQUFFLGtCQUFrQixFQUFFLGlCQUFpQixFQUFFLG1CQUFtQixDQUFDO0lBQzFGLFdBQVcsRUFBRSxDQUFDLGdCQUFnQixFQUFFLGdCQUFnQixFQUFFLGdCQUFnQixFQUFFLGdCQUFnQixFQUFFLGdCQUFnQjtRQUNwRyxnQkFBZ0IsRUFBRSxrQkFBa0IsRUFBRSxvQkFBb0IsRUFBRSxvQkFBb0IsQ0FBQztJQUNuRixVQUFVLEVBQUUsQ0FBQyxpQkFBaUIsRUFBRSxpQkFBaUIsRUFBRSxvQkFBb0IsRUFBRSxrQkFBa0IsRUFBRSxvQkFBb0I7UUFDL0csbUJBQW1CLENBQUM7SUFDdEIsU0FBUyxFQUFFLENBQUMsa0JBQWtCLEVBQUUsa0JBQWtCLEVBQUUsa0JBQWtCLENBQUM7SUFDdkUsS0FBSyxFQUFFLENBQUMsZ0JBQWdCLEVBQUUsa0JBQWtCLENBQUM7SUFDN0MsU0FBUyxFQUFFLENBQUMsaUJBQWlCLEVBQUUsa0JBQWtCLEVBQUUsaUJBQWlCLENBQUM7SUFDckUsV0FBVyxFQUFFLENBQUMsaUJBQWlCLEVBQUUsbUJBQW1CLENBQUM7SUFDckQsWUFBWSxFQUFFLENBQUMsaUJBQWlCLEVBQUUsa0JBQWtCLEVBQUUsb0JBQW9CLEVBQUUsaUJBQWlCLENBQUM7SUFDOUYsWUFBWSxFQUFFLENBQUMsa0JBQWtCLEVBQUUsa0JBQWtCLEVBQUUsa0JBQWtCLENBQUM7SUFDMUUsWUFBWSxFQUFFLENBQUMsZ0JBQWdCLEVBQUUsZ0JBQWdCLEVBQUUsZ0JBQWdCLEVBQUUsZ0JBQWdCLENBQUM7SUFDdEYsT0FBTyxFQUFFLENBQUMsZ0JBQWdCLEVBQUUsZ0JBQWdCLENBQUM7SUFDN0MsYUFBYSxFQUFFLENBQUMsa0JBQWtCLEVBQUUsb0JBQW9CLEVBQUUsb0JBQW9CLENBQUM7SUFDL0UsVUFBVSxFQUFFLENBQUMsZ0JBQWdCLEVBQUUsa0JBQWtCLEVBQUUsa0JBQWtCLEVBQUUsZ0JBQWdCLENBQUM7SUFDeEYsTUFBTSxFQUFFLENBQUMsa0JBQWtCLENBQUM7SUFDNUIsT0FBTyxFQUFFLENBQUMsZ0JBQWdCLEVBQUUsa0JBQWtCLENBQUM7SUFDL0MsTUFBTSxFQUFFLENBQUMsa0JBQWtCLEVBQUUsa0JBQWtCLEVBQUUsa0JBQWtCLEVBQUUsb0JBQW9CLENBQUM7SUFDMUYsUUFBUSxFQUFFLENBQUMsaUJBQWlCLENBQUM7SUFDN0IsT0FBTyxFQUFFLENBQUMsa0JBQWtCLENBQUM7Q0FDOUIsQ0FBQyIsInNvdXJjZXNDb250ZW50IjpbImltcG9ydCAqIGFzIGdyb2sgZnJvbSAnZGF0YWdyb2stYXBpL2dyb2snO1xuaW1wb3J0ICogYXMgdWkgZnJvbSAnZGF0YWdyb2stYXBpL3VpJztcbmltcG9ydCAqIGFzIERHIGZyb20gJ2RhdGFncm9rLWFwaS9kZyc7XG5cbmV4cG9ydCBpbnRlcmZhY2UgU2VxUGFsZXR0ZSB7XG4gIC8qKlxuICAgKiBAcGFyYW0ge3N0cmluZ30gbSBNb25vbWVyIGNoYXJhY3RlclxuICAgKiBAcmV0dXJuIHtzdHJpbmd9IENvbG9yXG4gICAqL1xuICBbbTogc3RyaW5nXTogc3RyaW5nO1xufVxuXG5leHBvcnQgY2xhc3MgU2VxUGFsZXR0ZUJhc2Uge1xuICAvKiogUGFsZXR0ZSB3aXRoIHNoYWRlcyBvZiBwcmltYXJ5IGNvbG9yc1xuICAgKi9cbiAgcHJpdmF0ZSBzdGF0aWMgY29sb3VyUGFsZXR0ZTogeyBba2V5OiBzdHJpbmddOiBzdHJpbmdbXSB9ID0ge1xuICAgICdvcmFuZ2UnOiBbJ3JnYigyNTUsMTg3LDEyMCknLCAncmdiKDI0NSwxNjcsMTAwKScsICdyZ2IoMjM1LDEzNyw3MCknLCAncmdiKDIwNSwgMTExLCA3MSknXSxcbiAgICAnYWxsX2dyZWVuJzogWydyZ2IoNDQsMTYwLDQ0KScsICdyZ2IoNzQsMTYwLDc0KScsICdyZ2IoMjMsMTAzLDU3KScsICdyZ2IoMzAsMTEwLDk2KScsICdyZ2IoNjAsMTMxLDk1KScsXG4gICAgICAncmdiKDI0LDExMCw3OSknLCAncmdiKDE1MiwyMjMsMTM4KScsICdyZ2IoMTgyLCAyMjMsIDEzOCknLCAncmdiKDE1MiwgMTkzLCAxMzgpJ10sXG4gICAgJ2FsbF9ibHVlJzogWydyZ2IoMzEsMTE5LDE4MCknLCAncmdiKDIzLDE5MCwyMDcpJywgJ3JnYigxMjIsIDEwMiwgMTg5KScsICdyZ2IoMTU4LDIxOCwyMjkpJywgJ3JnYigxNDEsIDEyNCwgMjE3KScsXG4gICAgICAncmdiKDMxLCAxMjAsIDE1MCknXSxcbiAgICAnbWFnZW50YSc6IFsncmdiKDE2MiwxMDYsMTkyKScsICdyZ2IoMTk3LDE2NSwyMjQpJywgJ3JnYigyMDgsMTEzLDIxOCknXSxcbiAgICAncmVkJzogWydyZ2IoMjE0LDM5LDQwKScsICdyZ2IoMjU1LDE1MiwxNTApJ10sXG4gICAgJ3N0X2JsdWUnOiBbJ3JnYigyMywxOTAsMjA3KScsICdyZ2IoMTU4LDIxOCwyMjkpJywgJ3JnYigzMSwxMTksMTgwKSddLFxuICAgICdkYXJrX2JsdWUnOiBbJ3JnYigzMSwxMTksMTgwKScsICdyZ2IoMzEsIDEyMCwgMTUwKSddLFxuICAgICdsaWdodF9ibHVlJzogWydyZ2IoMjMsMTkwLDIwNyknLCAncmdiKDE1OCwyMTgsMjI5KScsICdyZ2IoMTA4LCAyMTgsIDIyOSknLCAncmdiKDIzLDE5MCwyMjcpJ10sXG4gICAgJ2xpbGFjX2JsdWUnOiBbJ3JnYigxMjQsMTAyLDIxMSknLCAncmdiKDE0OSwxMzQsMjE3KScsICdyZ2IoOTcsIDgxLCAxNTApJ10sXG4gICAgJ2RhcmtfZ3JlZW4nOiBbJ3JnYigyMywxMDMsNTcpJywgJ3JnYigzMCwxMTAsOTYpJywgJ3JnYig2MCwxMzEsOTUpJywgJ3JnYigyNCwxMTAsNzkpJ10sXG4gICAgJ2dyZWVuJzogWydyZ2IoNDQsMTYwLDQ0KScsICdyZ2IoNzQsMTYwLDc0KSddLFxuICAgICdsaWdodF9ncmVlbic6IFsncmdiKDE1MiwyMjMsMTM4KScsICdyZ2IoMTgyLCAyMjMsIDEzOCknLCAncmdiKDE1MiwgMTkzLCAxMzgpJ10sXG4gICAgJ3N0X2dyZWVuJzogWydyZ2IoNDQsMTYwLDQ0KScsICdyZ2IoMTUyLDIyMywxMzgpJywgJ3JnYigzOSwgMTc0LCA5NiknLCAncmdiKDc0LDE2MCw3NCknXSxcbiAgICAncGluayc6IFsncmdiKDI0NywxODIsMjEwKSddLFxuICAgICdicm93bic6IFsncmdiKDE0MCw4Niw3NSknLCAncmdiKDEwMiwgNjIsIDU0KSddLFxuICAgICdncmF5JzogWydyZ2IoMTI3LDEyNywxMjcpJywgJ3JnYigxOTksMTk5LDE5OSknLCAncmdiKDE5NiwxNTYsMTQ4KScsICdyZ2IoMjIyLCAyMjIsIDE4MCknXSxcbiAgICAneWVsbG93JzogWydyZ2IoMTg4LDE4OSwzNCknXSxcbiAgICAnd2hpdGUnOiBbJ3JnYigyMzAsMjMwLDIzMCknXSxcbiAgfTtcblxuICBwcm90ZWN0ZWQgc3RhdGljIG1ha2VQYWxldHRlKGR0OiBbc3RyaW5nW10sIHN0cmluZ11bXSwgc2ltcGxpZmllZCA9IGZhbHNlKSB7XG4gICAgY29uc3QgcGFsZXR0ZTogeyBba2V5OiBzdHJpbmddOiBzdHJpbmcgfSA9IHt9O1xuICAgIGR0LmZvckVhY2goKGNwKSA9PiB7XG4gICAgICBjb25zdCBvYmpMaXN0ID0gY3BbMF07XG4gICAgICBjb25zdCBjb2xvdXIgPSBjcFsxXTtcbiAgICAgIG9iakxpc3QuZm9yRWFjaCgob2JqLCBpbmQpID0+IHtcbiAgICAgICAgcGFsZXR0ZVtvYmpdID0gdGhpcy5jb2xvdXJQYWxldHRlW2NvbG91cl1bc2ltcGxpZmllZCA/IDAgOiBpbmRdO1xuICAgICAgfSk7XG4gICAgfSk7XG4gICAgcmV0dXJuIHBhbGV0dGU7XG4gIH1cbn1cbiJdfQ==
@@ -1,62 +1,62 @@
1
- declare type SideChainScale = {
2
- [name: string]: number;
3
- };
4
- /**
5
- * Class to categorial encode/decode aligned amino acid residues sequence.
6
- *
7
- * @export
8
- * @class AlignedSequenceEncoder
9
- */
10
- export declare class AlignedSequenceEncoder {
11
- protected aa2num: SideChainScale;
12
- protected num2aa: {
13
- [code: number]: string;
14
- };
15
- constructor(scale?: string);
16
- /**
17
- * Truncate NH2 and -COOH terminals of the given sequence.
18
- *
19
- * @static
20
- * @param {string} seq The sequence provided.
21
- * @return {string} Truncated sequence.
22
- * @memberof AlignedSequenceEncoder
23
- */
24
- static _truncateSequence(seq: string): string;
25
- /**
26
- * Cuts auxiliary defises before a residue.
27
- *
28
- * @static
29
- * @param {string} seq The sequence to process.
30
- * @return {string} Processed sequence.
31
- * @memberof AlignedSequenceEncoder
32
- */
33
- static _dropDefises(seq: string): string;
34
- /**
35
- * Performs truncation and cutting auxiliary defises.
36
- *
37
- * @static
38
- * @param {string} sequence The sequence work under process.
39
- * @return {string} Result of cleaning.
40
- * @memberof AlignedSequenceEncoder
41
- */
42
- static clean(sequence: string): string;
43
- /**
44
- * Categorial encode of the sequence provided.
45
- *
46
- * @param {string} sequence The sequence.
47
- * @return {number[]} Encoded vector.
48
- * @memberof AlignedSequenceEncoder
49
- */
50
- encode(sequence: string): number[];
51
- encodeLettter(letter: string): number;
52
- /**
53
- * Decode the encoded vector into the sequence back.
54
- *
55
- * @param {number[]} value The vector encoded.
56
- * @return {string} Decoded sequence.
57
- * @memberof AlignedSequenceEncoder
58
- */
59
- decode(value: number[]): string;
60
- }
61
- export {};
1
+ declare type SideChainScale = {
2
+ [name: string]: number;
3
+ };
4
+ /**
5
+ * Class to categorial encode/decode aligned amino acid residues sequence.
6
+ *
7
+ * @export
8
+ * @class AlignedSequenceEncoder
9
+ */
10
+ export declare class AlignedSequenceEncoder {
11
+ protected aa2num: SideChainScale;
12
+ protected num2aa: {
13
+ [code: number]: string;
14
+ };
15
+ constructor(scale?: string);
16
+ /**
17
+ * Truncate NH2 and -COOH terminals of the given sequence.
18
+ *
19
+ * @static
20
+ * @param {string} seq The sequence provided.
21
+ * @return {string} Truncated sequence.
22
+ * @memberof AlignedSequenceEncoder
23
+ */
24
+ static _truncateSequence(seq: string): string;
25
+ /**
26
+ * Cuts auxiliary defises before a residue.
27
+ *
28
+ * @static
29
+ * @param {string} seq The sequence to process.
30
+ * @return {string} Processed sequence.
31
+ * @memberof AlignedSequenceEncoder
32
+ */
33
+ static _dropDefises(seq: string): string;
34
+ /**
35
+ * Performs truncation and cutting auxiliary defises.
36
+ *
37
+ * @static
38
+ * @param {string} sequence The sequence work under process.
39
+ * @return {string} Result of cleaning.
40
+ * @memberof AlignedSequenceEncoder
41
+ */
42
+ static clean(sequence: string): string;
43
+ /**
44
+ * Categorial encode of the sequence provided.
45
+ *
46
+ * @param {string} sequence The sequence.
47
+ * @return {number[]} Encoded vector.
48
+ * @memberof AlignedSequenceEncoder
49
+ */
50
+ encode(sequence: string): number[];
51
+ encodeLettter(letter: string): number;
52
+ /**
53
+ * Decode the encoded vector into the sequence back.
54
+ *
55
+ * @param {number[]} value The vector encoded.
56
+ * @return {string} Decoded sequence.
57
+ * @memberof AlignedSequenceEncoder
58
+ */
59
+ decode(value: number[]): string;
60
+ }
61
+ export {};
62
62
  //# sourceMappingURL=sequence-encoder.d.ts.map
@@ -1,155 +1,155 @@
1
- import { assert } from '@datagrok-libraries/utils/src/operations';
2
- class SideChainScales {
3
- static getAvailableScales() {
4
- return Object.entries(this.scales).map(([k, _]) => k);
5
- }
6
- static getScale(name) {
7
- assert(!(this.scales[name] === undefined), `Scale '${name}' was not found.`);
8
- return this.scales[name];
9
- }
10
- }
11
- SideChainScales.scales = {
12
- // Wimley-White interfacial hydrophobicity scale
13
- 'WimleyWhite': {
14
- '-': 0,
15
- 'A': 0.17,
16
- 'C': -0.24,
17
- 'D': -0.07,
18
- 'E': -0.01,
19
- 'F': -1.13,
20
- 'G': 0.01,
21
- 'H': 0.17,
22
- 'I': -0.31,
23
- 'K': 0.99,
24
- 'L': -0.56,
25
- 'M': -0.23,
26
- 'N': 0.42,
27
- 'P': 0.45,
28
- 'Q': 0.58,
29
- 'R': 0.81,
30
- 'S': 0.13,
31
- 'T': 0.14,
32
- 'V': 0.07,
33
- 'W': -1.85,
34
- 'Y': -0.94,
35
- },
36
- 'categorial': {
37
- '-': 0,
38
- 'A': 1,
39
- 'C': 2,
40
- 'D': 3,
41
- 'E': 4,
42
- 'F': 5,
43
- 'G': 6,
44
- 'H': 7,
45
- 'I': 8,
46
- 'K': 9,
47
- 'L': 10,
48
- 'M': 11,
49
- 'N': 12,
50
- 'P': 13,
51
- 'Q': 14,
52
- 'R': 15,
53
- 'S': 16,
54
- 'T': 17,
55
- 'V': 18,
56
- 'W': 19,
57
- 'Y': 20,
58
- },
59
- };
60
- /**
61
- * Class to categorial encode/decode aligned amino acid residues sequence.
62
- *
63
- * @export
64
- * @class AlignedSequenceEncoder
65
- */
66
- export class AlignedSequenceEncoder {
67
- constructor(scale = 'categorial') {
68
- this.aa2num = SideChainScales.getScale(scale);
69
- this.num2aa = {};
70
- Object.entries(this.aa2num).forEach(([k, v]) => (this.num2aa[v] = k));
71
- }
72
- /**
73
- * Truncate NH2 and -COOH terminals of the given sequence.
74
- *
75
- * @static
76
- * @param {string} seq The sequence provided.
77
- * @return {string} Truncated sequence.
78
- * @memberof AlignedSequenceEncoder
79
- */
80
- static _truncateSequence(seq) {
81
- let start = 0;
82
- let end = seq.length;
83
- const termina = ['NH2', 'COOH'];
84
- if (seq.startsWith(termina[0])) {
85
- const l = termina[0].length; // Cut only 'NH2' without following '-'.
86
- assert(seq[l] == '-', `Wrong sequence format: ${termina[0]} without following '-' in '${seq}'.`);
87
- start = l;
88
- }
89
- if (seq.endsWith(termina[1])) {
90
- const l = termina[1].length + 1; // Cut both 'COOH' and precending '-'.
91
- assert(seq[end - l] == '-', `Wrong sequence format: ${termina[1]} without '-' precending in '${seq}'.`);
92
- end -= l;
93
- }
94
- return seq.substring(start, end);
95
- }
96
- /**
97
- * Cuts auxiliary defises before a residue.
98
- *
99
- * @static
100
- * @param {string} seq The sequence to process.
101
- * @return {string} Processed sequence.
102
- * @memberof AlignedSequenceEncoder
103
- */
104
- static _dropDefises(seq) {
105
- return seq.replace(/(-)([^-]+)/g, '$2');
106
- }
107
- /**
108
- * Performs truncation and cutting auxiliary defises.
109
- *
110
- * @static
111
- * @param {string} sequence The sequence work under process.
112
- * @return {string} Result of cleaning.
113
- * @memberof AlignedSequenceEncoder
114
- */
115
- static clean(sequence) {
116
- return AlignedSequenceEncoder._dropDefises(AlignedSequenceEncoder._truncateSequence(sequence));
117
- }
118
- /**
119
- * Categorial encode of the sequence provided.
120
- *
121
- * @param {string} sequence The sequence.
122
- * @return {number[]} Encoded vector.
123
- * @memberof AlignedSequenceEncoder
124
- */
125
- encode(sequence) {
126
- const nItems = sequence.length;
127
- const values = new Array(nItems).fill(0);
128
- for (let i = 0; i < nItems; ++i) {
129
- const char = sequence[i];
130
- assert(char in this.aa2num, `Unknown char '${char}' found in sequence '${sequence}'`);
131
- values[i] = this.encodeLettter(char);
132
- }
133
- return values;
134
- }
135
- encodeLettter(letter) {
136
- return this.aa2num[letter];
137
- }
138
- /**
139
- * Decode the encoded vector into the sequence back.
140
- *
141
- * @param {number[]} value The vector encoded.
142
- * @return {string} Decoded sequence.
143
- * @memberof AlignedSequenceEncoder
144
- */
145
- decode(value) {
146
- let s = '';
147
- for (let i = 0; i < value.length; ++i) {
148
- const code = value[i];
149
- assert(code in this.num2aa, `Unknown code '${code}' found in vector '${value}'`);
150
- s += this.num2aa[code];
151
- }
152
- return s;
153
- }
154
- }
155
- //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"sequence-encoder.js","sourceRoot":"","sources":["sequence-encoder.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,MAAM,EAAC,MAAM,0CAA0C,CAAC;AAKhE,MAAM,eAAe;IAmDnB,MAAM,CAAC,kBAAkB;QACvB,OAAO,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC;IACxD,CAAC;IAED,MAAM,CAAC,QAAQ,CAAC,IAAY;QAC1B,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,KAAK,SAAS,CAAC,EAAE,UAAU,IAAI,kBAAkB,CAAC,CAAC;QAC7E,OAAO,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;IAC3B,CAAC;;AAzDM,sBAAM,GAA6B;IACxC,gDAAgD;IAChD,aAAa,EAAE;QACb,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;KACX;IACD,YAAY,EAAE;QACZ,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;KACR;CACF,CAAC;AAYJ;;;;;GAKG;AACH,MAAM,OAAO,sBAAsB;IAIjC,YAAY,QAAgB,YAAY;QACtC,IAAI,CAAC,MAAM,GAAG,eAAe,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;QAC9C,IAAI,CAAC,MAAM,GAAG,EAAE,CAAC;QACjB,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;IACxE,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,iBAAiB,CAAC,GAAW;QAClC,IAAI,KAAK,GAAG,CAAC,CAAC;QACd,IAAI,GAAG,GAAG,GAAG,CAAC,MAAM,CAAC;QACrB,MAAM,OAAO,GAAG,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC;QAEhC,IAAI,GAAG,CAAC,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE;YAC9B,MAAM,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,wCAAwC;YACrE,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,GAAG,EAAE,0BAA0B,OAAO,CAAC,CAAC,CAAC,8BAA8B,GAAG,IAAI,CAAC,CAAC;YACjG,KAAK,GAAG,CAAC,CAAC;SACX;QACD,IAAI,GAAG,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE;YAC5B,MAAM,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,MAAM,GAAC,CAAC,CAAC,CAAC,sCAAsC;YACrE,MAAM,CAAC,GAAG,CAAC,GAAG,GAAC,CAAC,CAAC,IAAI,GAAG,EAAE,0BAA0B,OAAO,CAAC,CAAC,CAAC,+BAA+B,GAAG,IAAI,CAAC,CAAC;YACtG,GAAG,IAAI,CAAC,CAAC;SACV;QACD,OAAO,GAAG,CAAC,SAAS,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC;IACnC,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,YAAY,CAAC,GAAW;QAC7B,OAAO,GAAG,CAAC,OAAO,CAAC,aAAa,EAAE,IAAI,CAAC,CAAC;IAC1C,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,KAAK,CAAC,QAAgB;QAC3B,OAAO,sBAAsB,CAAC,YAAY,CAAC,sBAAsB,CAAC,iBAAiB,CAAC,QAAQ,CAAC,CAAC,CAAC;IACjG,CAAC;IAED;;;;;;SAMK;IACE,MAAM,CAAC,QAAgB;QAC5B,MAAM,MAAM,GAAG,QAAQ,CAAC,MAAM,CAAC;QAC/B,MAAM,MAAM,GAAG,IAAI,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;QAEzC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,EAAE,EAAE,CAAC,EAAE;YAC/B,MAAM,IAAI,GAAG,QAAQ,CAAC,CAAC,CAAC,CAAC;YAEzB,MAAM,CAAC,IAAI,IAAI,IAAI,CAAC,MAAM,EAAE,iBAAiB,IAAI,wBAAwB,QAAQ,GAAG,CAAC,CAAC;YAEtF,MAAM,CAAC,CAAC,CAAC,GAAG,IAAI,CAAC,aAAa,CAAC,IAAI,CAAC,CAAC;SACtC;QACD,OAAO,MAAM,CAAC;IAChB,CAAC;IAEM,aAAa,CAAC,MAAc;QACjC,OAAO,IAAI,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;IAC7B,CAAC;IAED;;;;;;SAMK;IACE,MAAM,CAAC,KAAe;QAC3B,IAAI,CAAC,GAAW,EAAE,CAAC;QAEnB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,EAAE,EAAE,CAAC,EAAE;YACrC,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YAEtB,MAAM,CAAC,IAAI,IAAI,IAAI,CAAC,MAAM,EAAE,iBAAiB,IAAI,sBAAsB,KAAK,GAAG,CAAC,CAAC;YAEjF,CAAC,IAAI,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;SACxB;QACD,OAAO,CAAC,CAAC;IACX,CAAC;CACF","sourcesContent":["import {assert} from '@datagrok-libraries/utils/src/operations';\r\n\r\ntype SideChainScale = {[name: string]: number};\r\ntype SideChainScaleCollection = {[name: string]: SideChainScale};\r\n\r\nclass SideChainScales {\r\n  static scales: SideChainScaleCollection = {\r\n    // Wimley-White interfacial hydrophobicity scale\r\n    'WimleyWhite': {\r\n      '-': 0,\r\n      'A': 0.17,\r\n      'C': -0.24,\r\n      'D': -0.07, // Asp-: 1.23\r\n      'E': -0.01, // Glu-: 2.02\r\n      'F': -1.13, //\r\n      'G': 0.01,\r\n      'H': 0.17, // His+: 0.96\r\n      'I': -0.31,\r\n      'K': 0.99, // Lys+\r\n      'L': -0.56,\r\n      'M': -0.23,\r\n      'N': 0.42,\r\n      'P': 0.45,\r\n      'Q': 0.58,\r\n      'R': 0.81, // Arg+\r\n      'S': 0.13,\r\n      'T': 0.14,\r\n      'V': 0.07,\r\n      'W': -1.85,\r\n      'Y': -0.94,\r\n    },\r\n    'categorial': {\r\n      '-': 0,\r\n      'A': 1,\r\n      'C': 2,\r\n      'D': 3,\r\n      'E': 4,\r\n      'F': 5,\r\n      'G': 6,\r\n      'H': 7,\r\n      'I': 8,\r\n      'K': 9,\r\n      'L': 10,\r\n      'M': 11,\r\n      'N': 12,\r\n      'P': 13,\r\n      'Q': 14,\r\n      'R': 15,\r\n      'S': 16,\r\n      'T': 17,\r\n      'V': 18,\r\n      'W': 19,\r\n      'Y': 20,\r\n    },\r\n  };\r\n\r\n  static getAvailableScales(): string[] {\r\n    return Object.entries(this.scales).map(([k, _]) => k);\r\n  }\r\n\r\n  static getScale(name: string): SideChainScale {\r\n    assert(!(this.scales[name] === undefined), `Scale '${name}' was not found.`);\r\n    return this.scales[name];\r\n  }\r\n}\r\n\r\n/**\r\n * Class to categorial encode/decode aligned amino acid residues sequence.\r\n *\r\n * @export\r\n * @class AlignedSequenceEncoder\r\n */\r\nexport class AlignedSequenceEncoder {\r\n  protected aa2num: SideChainScale;\r\n  protected num2aa: {[code: number]: string};\r\n\r\n  constructor(scale: string = 'categorial') {\r\n    this.aa2num = SideChainScales.getScale(scale);\r\n    this.num2aa = {};\r\n    Object.entries(this.aa2num).forEach(([k, v]) => (this.num2aa[v] = k));\r\n  }\r\n\r\n  /**\r\n     * Truncate NH2 and -COOH terminals of the given sequence.\r\n     *\r\n     * @static\r\n     * @param {string} seq The sequence provided.\r\n     * @return {string} Truncated sequence.\r\n     * @memberof AlignedSequenceEncoder\r\n     */\r\n  static _truncateSequence(seq: string): string {\r\n    let start = 0;\r\n    let end = seq.length;\r\n    const termina = ['NH2', 'COOH'];\r\n\r\n    if (seq.startsWith(termina[0])) {\r\n      const l = termina[0].length; // Cut only 'NH2' without following '-'.\r\n      assert(seq[l] == '-', `Wrong sequence format: ${termina[0]} without following '-' in '${seq}'.`);\r\n      start = l;\r\n    }\r\n    if (seq.endsWith(termina[1])) {\r\n      const l = termina[1].length+1; // Cut both 'COOH' and precending '-'.\r\n      assert(seq[end-l] == '-', `Wrong sequence format: ${termina[1]} without '-' precending in '${seq}'.`);\r\n      end -= l;\r\n    }\r\n    return seq.substring(start, end);\r\n  }\r\n\r\n  /**\r\n     * Cuts auxiliary defises before a residue.\r\n     *\r\n     * @static\r\n     * @param {string} seq The sequence to process.\r\n     * @return {string} Processed sequence.\r\n     * @memberof AlignedSequenceEncoder\r\n     */\r\n  static _dropDefises(seq: string): string {\r\n    return seq.replace(/(-)([^-]+)/g, '$2');\r\n  }\r\n\r\n  /**\r\n     * Performs truncation and cutting auxiliary defises.\r\n     *\r\n     * @static\r\n     * @param {string} sequence The sequence work under process.\r\n     * @return {string} Result of cleaning.\r\n     * @memberof AlignedSequenceEncoder\r\n     */\r\n  static clean(sequence: string): string {\r\n    return AlignedSequenceEncoder._dropDefises(AlignedSequenceEncoder._truncateSequence(sequence));\r\n  }\r\n\r\n  /**\r\n     * Categorial encode of the sequence provided.\r\n     *\r\n     * @param {string} sequence The sequence.\r\n     * @return {number[]} Encoded vector.\r\n     * @memberof AlignedSequenceEncoder\r\n     */\r\n  public encode(sequence: string): number[] {\r\n    const nItems = sequence.length;\r\n    const values = new Array(nItems).fill(0);\r\n\r\n    for (let i = 0; i < nItems; ++i) {\r\n      const char = sequence[i];\r\n\r\n      assert(char in this.aa2num, `Unknown char '${char}' found in sequence '${sequence}'`);\r\n\r\n      values[i] = this.encodeLettter(char);\r\n    }\r\n    return values;\r\n  }\r\n\r\n  public encodeLettter(letter: string): number {\r\n    return this.aa2num[letter];\r\n  }\r\n\r\n  /**\r\n     * Decode the encoded vector into the sequence back.\r\n     *\r\n     * @param {number[]} value The vector encoded.\r\n     * @return {string} Decoded sequence.\r\n     * @memberof AlignedSequenceEncoder\r\n     */\r\n  public decode(value: number[]): string {\r\n    let s: string = '';\r\n\r\n    for (let i = 0; i < value.length; ++i) {\r\n      const code = value[i];\r\n\r\n      assert(code in this.num2aa, `Unknown code '${code}' found in vector '${value}'`);\r\n\r\n      s += this.num2aa[code];\r\n    }\r\n    return s;\r\n  }\r\n}\r\n"]}
1
+ import { assert } from '@datagrok-libraries/utils/src/vector-operations';
2
+ class SideChainScales {
3
+ static getAvailableScales() {
4
+ return Object.entries(this.scales).map(([k, _]) => k);
5
+ }
6
+ static getScale(name) {
7
+ assert(!(this.scales[name] === undefined), `Scale '${name}' was not found.`);
8
+ return this.scales[name];
9
+ }
10
+ }
11
+ SideChainScales.scales = {
12
+ // Wimley-White interfacial hydrophobicity scale
13
+ 'WimleyWhite': {
14
+ '-': 0,
15
+ 'A': 0.17,
16
+ 'C': -0.24,
17
+ 'D': -0.07,
18
+ 'E': -0.01,
19
+ 'F': -1.13,
20
+ 'G': 0.01,
21
+ 'H': 0.17,
22
+ 'I': -0.31,
23
+ 'K': 0.99,
24
+ 'L': -0.56,
25
+ 'M': -0.23,
26
+ 'N': 0.42,
27
+ 'P': 0.45,
28
+ 'Q': 0.58,
29
+ 'R': 0.81,
30
+ 'S': 0.13,
31
+ 'T': 0.14,
32
+ 'V': 0.07,
33
+ 'W': -1.85,
34
+ 'Y': -0.94,
35
+ },
36
+ 'categorial': {
37
+ '-': 0,
38
+ 'A': 1,
39
+ 'C': 2,
40
+ 'D': 3,
41
+ 'E': 4,
42
+ 'F': 5,
43
+ 'G': 6,
44
+ 'H': 7,
45
+ 'I': 8,
46
+ 'K': 9,
47
+ 'L': 10,
48
+ 'M': 11,
49
+ 'N': 12,
50
+ 'P': 13,
51
+ 'Q': 14,
52
+ 'R': 15,
53
+ 'S': 16,
54
+ 'T': 17,
55
+ 'V': 18,
56
+ 'W': 19,
57
+ 'Y': 20,
58
+ },
59
+ };
60
+ /**
61
+ * Class to categorial encode/decode aligned amino acid residues sequence.
62
+ *
63
+ * @export
64
+ * @class AlignedSequenceEncoder
65
+ */
66
+ export class AlignedSequenceEncoder {
67
+ constructor(scale = 'categorial') {
68
+ this.aa2num = SideChainScales.getScale(scale);
69
+ this.num2aa = {};
70
+ Object.entries(this.aa2num).forEach(([k, v]) => (this.num2aa[v] = k));
71
+ }
72
+ /**
73
+ * Truncate NH2 and -COOH terminals of the given sequence.
74
+ *
75
+ * @static
76
+ * @param {string} seq The sequence provided.
77
+ * @return {string} Truncated sequence.
78
+ * @memberof AlignedSequenceEncoder
79
+ */
80
+ static _truncateSequence(seq) {
81
+ let start = 0;
82
+ let end = seq.length;
83
+ const termina = ['NH2', 'COOH'];
84
+ if (seq.startsWith(termina[0])) {
85
+ const l = termina[0].length; // Cut only 'NH2' without following '-'.
86
+ assert(seq[l] == '-', `Wrong sequence format: ${termina[0]} without following '-' in '${seq}'.`);
87
+ start = l;
88
+ }
89
+ if (seq.endsWith(termina[1])) {
90
+ const l = termina[1].length + 1; // Cut both 'COOH' and precending '-'.
91
+ assert(seq[end - l] == '-', `Wrong sequence format: ${termina[1]} without '-' precending in '${seq}'.`);
92
+ end -= l;
93
+ }
94
+ return seq.substring(start, end);
95
+ }
96
+ /**
97
+ * Cuts auxiliary defises before a residue.
98
+ *
99
+ * @static
100
+ * @param {string} seq The sequence to process.
101
+ * @return {string} Processed sequence.
102
+ * @memberof AlignedSequenceEncoder
103
+ */
104
+ static _dropDefises(seq) {
105
+ return seq.replace(/(-)([^-]+)/g, '$2');
106
+ }
107
+ /**
108
+ * Performs truncation and cutting auxiliary defises.
109
+ *
110
+ * @static
111
+ * @param {string} sequence The sequence work under process.
112
+ * @return {string} Result of cleaning.
113
+ * @memberof AlignedSequenceEncoder
114
+ */
115
+ static clean(sequence) {
116
+ return AlignedSequenceEncoder._dropDefises(AlignedSequenceEncoder._truncateSequence(sequence));
117
+ }
118
+ /**
119
+ * Categorial encode of the sequence provided.
120
+ *
121
+ * @param {string} sequence The sequence.
122
+ * @return {number[]} Encoded vector.
123
+ * @memberof AlignedSequenceEncoder
124
+ */
125
+ encode(sequence) {
126
+ const nItems = sequence.length;
127
+ const values = new Array(nItems).fill(0);
128
+ for (let i = 0; i < nItems; ++i) {
129
+ const char = sequence[i];
130
+ assert(char in this.aa2num, `Unknown char '${char}' found in sequence '${sequence}'`);
131
+ values[i] = this.encodeLettter(char);
132
+ }
133
+ return values;
134
+ }
135
+ encodeLettter(letter) {
136
+ return this.aa2num[letter];
137
+ }
138
+ /**
139
+ * Decode the encoded vector into the sequence back.
140
+ *
141
+ * @param {number[]} value The vector encoded.
142
+ * @return {string} Decoded sequence.
143
+ * @memberof AlignedSequenceEncoder
144
+ */
145
+ decode(value) {
146
+ let s = '';
147
+ for (let i = 0; i < value.length; ++i) {
148
+ const code = value[i];
149
+ assert(code in this.num2aa, `Unknown code '${code}' found in vector '${value}'`);
150
+ s += this.num2aa[code];
151
+ }
152
+ return s;
153
+ }
154
+ }
155
+ //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"sequence-encoder.js","sourceRoot":"","sources":["sequence-encoder.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,MAAM,EAAC,MAAM,iDAAiD,CAAC;AAKvE,MAAM,eAAe;IAmDnB,MAAM,CAAC,kBAAkB;QACvB,OAAO,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC;IACxD,CAAC;IAED,MAAM,CAAC,QAAQ,CAAC,IAAY;QAC1B,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,KAAK,SAAS,CAAC,EAAE,UAAU,IAAI,kBAAkB,CAAC,CAAC;QAC7E,OAAO,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;IAC3B,CAAC;;AAzDM,sBAAM,GAA6B;IACxC,gDAAgD;IAChD,aAAa,EAAE;QACb,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,IAAI;QACT,GAAG,EAAE,CAAC,IAAI;QACV,GAAG,EAAE,CAAC,IAAI;KACX;IACD,YAAY,EAAE;QACZ,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,CAAC;QACN,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;QACP,GAAG,EAAE,EAAE;KACR;CACF,CAAC;AAYJ;;;;;GAKG;AACH,MAAM,OAAO,sBAAsB;IAIjC,YAAY,QAAgB,YAAY;QACtC,IAAI,CAAC,MAAM,GAAG,eAAe,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;QAC9C,IAAI,CAAC,MAAM,GAAG,EAAE,CAAC;QACjB,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;IACxE,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,iBAAiB,CAAC,GAAW;QAClC,IAAI,KAAK,GAAG,CAAC,CAAC;QACd,IAAI,GAAG,GAAG,GAAG,CAAC,MAAM,CAAC;QACrB,MAAM,OAAO,GAAG,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC;QAEhC,IAAI,GAAG,CAAC,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE;YAC9B,MAAM,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,wCAAwC;YACrE,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,GAAG,EAAE,0BAA0B,OAAO,CAAC,CAAC,CAAC,8BAA8B,GAAG,IAAI,CAAC,CAAC;YACjG,KAAK,GAAG,CAAC,CAAC;SACX;QACD,IAAI,GAAG,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE;YAC5B,MAAM,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,MAAM,GAAC,CAAC,CAAC,CAAC,sCAAsC;YACrE,MAAM,CAAC,GAAG,CAAC,GAAG,GAAC,CAAC,CAAC,IAAI,GAAG,EAAE,0BAA0B,OAAO,CAAC,CAAC,CAAC,+BAA+B,GAAG,IAAI,CAAC,CAAC;YACtG,GAAG,IAAI,CAAC,CAAC;SACV;QACD,OAAO,GAAG,CAAC,SAAS,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC;IACnC,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,YAAY,CAAC,GAAW;QAC7B,OAAO,GAAG,CAAC,OAAO,CAAC,aAAa,EAAE,IAAI,CAAC,CAAC;IAC1C,CAAC;IAED;;;;;;;SAOK;IACL,MAAM,CAAC,KAAK,CAAC,QAAgB;QAC3B,OAAO,sBAAsB,CAAC,YAAY,CAAC,sBAAsB,CAAC,iBAAiB,CAAC,QAAQ,CAAC,CAAC,CAAC;IACjG,CAAC;IAED;;;;;;SAMK;IACE,MAAM,CAAC,QAAgB;QAC5B,MAAM,MAAM,GAAG,QAAQ,CAAC,MAAM,CAAC;QAC/B,MAAM,MAAM,GAAG,IAAI,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;QAEzC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,EAAE,EAAE,CAAC,EAAE;YAC/B,MAAM,IAAI,GAAG,QAAQ,CAAC,CAAC,CAAC,CAAC;YAEzB,MAAM,CAAC,IAAI,IAAI,IAAI,CAAC,MAAM,EAAE,iBAAiB,IAAI,wBAAwB,QAAQ,GAAG,CAAC,CAAC;YAEtF,MAAM,CAAC,CAAC,CAAC,GAAG,IAAI,CAAC,aAAa,CAAC,IAAI,CAAC,CAAC;SACtC;QACD,OAAO,MAAM,CAAC;IAChB,CAAC;IAEM,aAAa,CAAC,MAAc;QACjC,OAAO,IAAI,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;IAC7B,CAAC;IAED;;;;;;SAMK;IACE,MAAM,CAAC,KAAe;QAC3B,IAAI,CAAC,GAAW,EAAE,CAAC;QAEnB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,EAAE,EAAE,CAAC,EAAE;YACrC,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YAEtB,MAAM,CAAC,IAAI,IAAI,IAAI,CAAC,MAAM,EAAE,iBAAiB,IAAI,sBAAsB,KAAK,GAAG,CAAC,CAAC;YAEjF,CAAC,IAAI,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;SACxB;QACD,OAAO,CAAC,CAAC;IACX,CAAC;CACF","sourcesContent":["import {assert} from '@datagrok-libraries/utils/src/vector-operations';\n\ntype SideChainScale = {[name: string]: number};\ntype SideChainScaleCollection = {[name: string]: SideChainScale};\n\nclass SideChainScales {\n  static scales: SideChainScaleCollection = {\n    // Wimley-White interfacial hydrophobicity scale\n    'WimleyWhite': {\n      '-': 0,\n      'A': 0.17,\n      'C': -0.24,\n      'D': -0.07, // Asp-: 1.23\n      'E': -0.01, // Glu-: 2.02\n      'F': -1.13, //\n      'G': 0.01,\n      'H': 0.17, // His+: 0.96\n      'I': -0.31,\n      'K': 0.99, // Lys+\n      'L': -0.56,\n      'M': -0.23,\n      'N': 0.42,\n      'P': 0.45,\n      'Q': 0.58,\n      'R': 0.81, // Arg+\n      'S': 0.13,\n      'T': 0.14,\n      'V': 0.07,\n      'W': -1.85,\n      'Y': -0.94,\n    },\n    'categorial': {\n      '-': 0,\n      'A': 1,\n      'C': 2,\n      'D': 3,\n      'E': 4,\n      'F': 5,\n      'G': 6,\n      'H': 7,\n      'I': 8,\n      'K': 9,\n      'L': 10,\n      'M': 11,\n      'N': 12,\n      'P': 13,\n      'Q': 14,\n      'R': 15,\n      'S': 16,\n      'T': 17,\n      'V': 18,\n      'W': 19,\n      'Y': 20,\n    },\n  };\n\n  static getAvailableScales(): string[] {\n    return Object.entries(this.scales).map(([k, _]) => k);\n  }\n\n  static getScale(name: string): SideChainScale {\n    assert(!(this.scales[name] === undefined), `Scale '${name}' was not found.`);\n    return this.scales[name];\n  }\n}\n\n/**\n * Class to categorial encode/decode aligned amino acid residues sequence.\n *\n * @export\n * @class AlignedSequenceEncoder\n */\nexport class AlignedSequenceEncoder {\n  protected aa2num: SideChainScale;\n  protected num2aa: {[code: number]: string};\n\n  constructor(scale: string = 'categorial') {\n    this.aa2num = SideChainScales.getScale(scale);\n    this.num2aa = {};\n    Object.entries(this.aa2num).forEach(([k, v]) => (this.num2aa[v] = k));\n  }\n\n  /**\n     * Truncate NH2 and -COOH terminals of the given sequence.\n     *\n     * @static\n     * @param {string} seq The sequence provided.\n     * @return {string} Truncated sequence.\n     * @memberof AlignedSequenceEncoder\n     */\n  static _truncateSequence(seq: string): string {\n    let start = 0;\n    let end = seq.length;\n    const termina = ['NH2', 'COOH'];\n\n    if (seq.startsWith(termina[0])) {\n      const l = termina[0].length; // Cut only 'NH2' without following '-'.\n      assert(seq[l] == '-', `Wrong sequence format: ${termina[0]} without following '-' in '${seq}'.`);\n      start = l;\n    }\n    if (seq.endsWith(termina[1])) {\n      const l = termina[1].length+1; // Cut both 'COOH' and precending '-'.\n      assert(seq[end-l] == '-', `Wrong sequence format: ${termina[1]} without '-' precending in '${seq}'.`);\n      end -= l;\n    }\n    return seq.substring(start, end);\n  }\n\n  /**\n     * Cuts auxiliary defises before a residue.\n     *\n     * @static\n     * @param {string} seq The sequence to process.\n     * @return {string} Processed sequence.\n     * @memberof AlignedSequenceEncoder\n     */\n  static _dropDefises(seq: string): string {\n    return seq.replace(/(-)([^-]+)/g, '$2');\n  }\n\n  /**\n     * Performs truncation and cutting auxiliary defises.\n     *\n     * @static\n     * @param {string} sequence The sequence work under process.\n     * @return {string} Result of cleaning.\n     * @memberof AlignedSequenceEncoder\n     */\n  static clean(sequence: string): string {\n    return AlignedSequenceEncoder._dropDefises(AlignedSequenceEncoder._truncateSequence(sequence));\n  }\n\n  /**\n     * Categorial encode of the sequence provided.\n     *\n     * @param {string} sequence The sequence.\n     * @return {number[]} Encoded vector.\n     * @memberof AlignedSequenceEncoder\n     */\n  public encode(sequence: string): number[] {\n    const nItems = sequence.length;\n    const values = new Array(nItems).fill(0);\n\n    for (let i = 0; i < nItems; ++i) {\n      const char = sequence[i];\n\n      assert(char in this.aa2num, `Unknown char '${char}' found in sequence '${sequence}'`);\n\n      values[i] = this.encodeLettter(char);\n    }\n    return values;\n  }\n\n  public encodeLettter(letter: string): number {\n    return this.aa2num[letter];\n  }\n\n  /**\n     * Decode the encoded vector into the sequence back.\n     *\n     * @param {number[]} value The vector encoded.\n     * @return {string} Decoded sequence.\n     * @memberof AlignedSequenceEncoder\n     */\n  public decode(value: number[]): string {\n    let s: string = '';\n\n    for (let i = 0; i < value.length; ++i) {\n      const code = value[i];\n\n      assert(code in this.num2aa, `Unknown code '${code}' found in vector '${value}'`);\n\n      s += this.num2aa[code];\n    }\n    return s;\n  }\n}\n"]}
@@ -0,0 +1,67 @@
1
+ import * as DG from 'datagrok-api/dg';
2
+ import { StringDictionary } from '@datagrok-libraries/utils/src/type-declarations';
3
+ declare module 'datagrok-api/src/grid' {
4
+ interface Rect {
5
+ contains(x: number, y: number): boolean;
6
+ }
7
+ }
8
+ declare global {
9
+ interface HTMLCanvasElement {
10
+ getCursorPosition(event: MouseEvent): DG.Point;
11
+ }
12
+ }
13
+ export declare class PositionMonomerInfo {
14
+ /** Sequences count with monomer in position
15
+ */
16
+ count: number;
17
+ /** Remember screen coords rect
18
+ */
19
+ bounds: DG.Rect;
20
+ constructor();
21
+ }
22
+ export declare class PositionInfo {
23
+ readonly name: string;
24
+ freq: {
25
+ [m: string]: PositionMonomerInfo;
26
+ };
27
+ rowCount: number;
28
+ /** freq = {}, rowCount = 0
29
+ * @param {string} name Name of position ('111A', '111.1', etc)
30
+ */
31
+ constructor(name: string);
32
+ }
33
+ export declare class WebLogo extends DG.JsViewer {
34
+ static residuesSet: string;
35
+ protected cp: StringDictionary | null;
36
+ private canvas?;
37
+ private slider?;
38
+ private textBaseline;
39
+ private axisHeight;
40
+ private positionWidth;
41
+ private seqCol;
42
+ private positions;
43
+ private rowsMasked;
44
+ private rowsNull;
45
+ minHeight: number;
46
+ maxHeight: number;
47
+ considerNullSequences: boolean;
48
+ sequenceColumnName: string;
49
+ startPositionName: string;
50
+ endPositionName: string;
51
+ private positionNames;
52
+ private startPosition;
53
+ private endPosition;
54
+ private get Length();
55
+ constructor();
56
+ init(): Promise<void>;
57
+ rootOnSizeChanged(args: any): void;
58
+ /** Assigns {@link seqCol} and {@link cp} based on {@link sequenceColumnName} and calls {@link render}().
59
+ */
60
+ updateSeqCol(): void;
61
+ onPropertyChanged(property: DG.Property): void;
62
+ onTableAttached(): void;
63
+ protected _nullSequence(fillerResidue?: string): string;
64
+ protected _calculate(): void;
65
+ render(recalc?: boolean): void;
66
+ }
67
+ //# sourceMappingURL=web-logo.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"web-logo.d.ts","sourceRoot":"","sources":["web-logo.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,MAAM,iBAAiB,CAAC;AAItC,OAAO,EAAC,gBAAgB,EAAC,MAAM,iDAAiD,CAAC;AAOjF,OAAO,QAAQ,uBAAuB,CAAC;IACrC,UAAU,IAAI;QACZ,QAAQ,CAAC,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC;KACzC;CACF;AAED,OAAO,CAAC,MAAM,CAAC;IACb,UAAU,iBAAiB;QACzB,iBAAiB,CAAC,KAAK,EAAE,UAAU,GAAG,EAAE,CAAC,KAAK,CAAC;KAChD;CACF;AAWD,qBAAa,mBAAmB;IAC9B;OACG;IACH,KAAK,EAAE,MAAM,CAAC;IAEd;OACG;IACH,MAAM,EAAE,EAAE,CAAC,IAAI,CAAC;;CAMjB;AAED,qBAAa,YAAY;IACvB,SAAgB,IAAI,EAAE,MAAM,CAAC;IAC7B,IAAI,EAAE;QAAE,CAAC,CAAC,EAAE,MAAM,GAAG,mBAAmB,CAAA;KAAE,CAAC;IAC3C,QAAQ,EAAE,MAAM,CAAC;IAEjB;;OAEG;gBACS,IAAI,EAAE,MAAM;CAKzB;AAED,qBAAa,OAAQ,SAAQ,EAAE,CAAC,QAAQ;IACtC,OAAc,WAAW,SAAiB;IAG1C,SAAS,CAAC,EAAE,EAAE,gBAAgB,GAAG,IAAI,CAAQ;IAG7C,OAAO,CAAC,MAAM,CAAC,CAAoB;IACnC,OAAO,CAAC,MAAM,CAAC,CAAiB;IAChC,OAAO,CAAC,YAAY,CAAqB;IAEzC,OAAO,CAAC,UAAU,CAAc;IAChC,OAAO,CAAC,aAAa,CAAc;IAEnC,OAAO,CAAC,MAAM,CAA0B;IAExC,OAAO,CAAC,SAAS,CAAsB;IAEvC,OAAO,CAAC,UAAU,CAAa;IAC/B,OAAO,CAAC,QAAQ,CAAa;IAGtB,SAAS,EAAE,MAAM,CAAC;IAClB,SAAS,EAAE,MAAM,CAAC;IAClB,qBAAqB,EAAE,OAAO,CAAC;IAC/B,kBAAkB,EAAE,MAAM,CAAC;IAC3B,iBAAiB,EAAE,MAAM,CAAC;IAC1B,eAAe,EAAE,MAAM,CAAC;IAE/B,OAAO,CAAC,aAAa,CAAgB;IAErC,OAAO,CAAC,aAAa,CAAc;IAEnC,OAAO,CAAC,WAAW,CAAc;IAEjC,OAAO,KAAK,MAAM,GAAgE;;IAiB5E,IAAI,IAAI,OAAO,CAAC,IAAI,CAAC;IAmF3B,iBAAiB,CAAC,IAAI,EAAE,GAAG;IAmB3B;OACG;IACH,YAAY,IAAI,IAAI;IAuCpB,iBAAiB,CAAC,QAAQ,EAAE,EAAE,CAAC,QAAQ,GAAG,IAAI;IAyB9C,eAAe;IAiBf,SAAS,CAAC,aAAa,CAAC,aAAa,SAAM,GAAG,MAAM;IAOpD,SAAS,CAAC,UAAU;IAoFpB,MAAM,CAAC,MAAM,UAAO;CA8DrB"}