@datagrok/peptides 0.4.2 → 0.6.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/detectors.js +1 -1
- package/package.json +5 -3
- package/src/describe.ts +36 -40
- package/src/package.ts +27 -44
- package/src/peptides.ts +70 -6
- package/src/styles.css +37 -0
- package/src/utils/cell-renderer.ts +126 -19
- package/src/utils/chem-palette.ts +317 -214
- package/src/utils/correlation-analysis.ts +149 -71
- package/src/utils/peptide-similarity-space.ts +23 -19
- package/src/utils/split-aligned.ts +8 -1
- package/src/viewers/logo-viewer.ts +48 -5
- package/src/viewers/model.ts +27 -0
- package/src/viewers/sar-viewer.ts +99 -38
- package/src/viewers/spiral-plot.ts +97 -0
- package/src/viewers/stacked-barchart-viewer.ts +82 -7
- package/src/viewers/subst-viewer.ts +276 -0
- package/src/widgets/analyze-peptides.ts +14 -4
- package/src/widgets/manual-alignment.ts +11 -4
- package/src/widgets/peptide-molecule.ts +7 -0
- package/webpack.config.js +4 -0
|
@@ -0,0 +1,276 @@
|
|
|
1
|
+
// import * as grok from 'datagrok-api/grok';
|
|
2
|
+
import * as ui from 'datagrok-api/ui';
|
|
3
|
+
import * as DG from 'datagrok-api/dg';
|
|
4
|
+
|
|
5
|
+
import $ from 'cash-dom';
|
|
6
|
+
|
|
7
|
+
// import {aarGroups} from '../describe';
|
|
8
|
+
import {setAARRenderer} from '../utils/cell-renderer';
|
|
9
|
+
|
|
10
|
+
export class SubstViewer extends DG.JsViewer {
|
|
11
|
+
viewerGrid: DG.Grid | null;
|
|
12
|
+
maxSubstitutions: number;
|
|
13
|
+
activityLimit: number;
|
|
14
|
+
activityColumnName: string;
|
|
15
|
+
casesGrid: DG.Grid | null;
|
|
16
|
+
|
|
17
|
+
constructor() {
|
|
18
|
+
super();
|
|
19
|
+
|
|
20
|
+
this.activityColumnName = this.string('activityColumnName');
|
|
21
|
+
|
|
22
|
+
this.maxSubstitutions = this.int('maxSubstitutions', 1);
|
|
23
|
+
this.activityLimit = this.float('activityLimit', 2);
|
|
24
|
+
|
|
25
|
+
this.viewerGrid = null;
|
|
26
|
+
this.casesGrid = null;
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
onPropertyChanged(property: DG.Property): void {
|
|
30
|
+
this.calcSubstitutions();
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
calcSubstitutions() {
|
|
34
|
+
const aarColName = 'AAR';
|
|
35
|
+
const df: DG.DataFrame = this.dataFrame!;
|
|
36
|
+
const col: DG.Column = df.columns.bySemType('alignedSequence');
|
|
37
|
+
// let values: number[] = df.columns.byName('IC50').toList();
|
|
38
|
+
const values = df.getCol(this.activityColumnName).toList().map((x) => -Math.log10(x));
|
|
39
|
+
// values = values;
|
|
40
|
+
const splitedMatrix = this.split(col);
|
|
41
|
+
|
|
42
|
+
const tableValues: { [aar: string]: number[] } = {};
|
|
43
|
+
const tableTooltips: { [aar: string]: {[index: string]: string}[][] } = {};
|
|
44
|
+
const tableCases: { [aar: string]: number[][][] } = {};
|
|
45
|
+
|
|
46
|
+
const nRows = splitedMatrix.length;
|
|
47
|
+
const nCols = splitedMatrix[0].length;
|
|
48
|
+
const nColsArray = Array(nCols);
|
|
49
|
+
|
|
50
|
+
for (let i = 0; i < nRows - 1; i++) {
|
|
51
|
+
for (let j = i + 1; j < nRows; j++) {
|
|
52
|
+
let substCounter = 0;
|
|
53
|
+
const subst1: { [pos: number]: [string, {[index: string]: string}] } = {};
|
|
54
|
+
const subst2: { [pos: number]: [string, {[index: string]: string}] } = {};
|
|
55
|
+
const delta = values[i] - values[j];
|
|
56
|
+
|
|
57
|
+
for (let k = 0; k < nCols; k++) {
|
|
58
|
+
const smik = splitedMatrix[i][k];
|
|
59
|
+
const smjk = splitedMatrix[j][k];
|
|
60
|
+
if (smik != smjk && Math.abs(delta) >= this.activityLimit) {
|
|
61
|
+
const vi = values[i].toFixed(2);
|
|
62
|
+
const vj = values[j].toFixed(2);
|
|
63
|
+
substCounter++;
|
|
64
|
+
subst1[k] = [
|
|
65
|
+
smik,
|
|
66
|
+
{key: `${smik === '-' ? 'Empty' : smik} → ${smjk === '-' ? 'Empty' : smjk}`, value: `${vi} → ${vj}`},
|
|
67
|
+
];
|
|
68
|
+
subst2[k] = [
|
|
69
|
+
smjk,
|
|
70
|
+
{key: `${smjk === '-' ? 'Empty' : smjk} → ${smik === '-' ? 'Empty' : smik}`, value: `${vj} → ${vi}`},
|
|
71
|
+
];
|
|
72
|
+
}
|
|
73
|
+
}
|
|
74
|
+
|
|
75
|
+
if (substCounter <= this.maxSubstitutions && substCounter > 0) {
|
|
76
|
+
Object.keys(subst1).forEach((pos) => {
|
|
77
|
+
const posInt = parseInt(pos);
|
|
78
|
+
const aar = subst1[posInt][0];
|
|
79
|
+
if (!Object.keys(tableValues).includes(aar)) {
|
|
80
|
+
tableValues[aar] = Array.apply(null, nColsArray).map(function() {
|
|
81
|
+
return DG.INT_NULL;
|
|
82
|
+
});
|
|
83
|
+
tableTooltips[aar] = Array.apply(null, nColsArray).map(function() {
|
|
84
|
+
return [];
|
|
85
|
+
});
|
|
86
|
+
tableCases[aar] = Array.apply(null, nColsArray).map(function() {
|
|
87
|
+
return [];
|
|
88
|
+
});
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
tableValues[aar][posInt] = tableValues[aar][posInt] === DG.INT_NULL ? 1 : tableValues[aar][posInt] + 1;
|
|
92
|
+
tableTooltips[aar][posInt] = !tableTooltips[aar][posInt].length ?
|
|
93
|
+
[{key: 'Substitution', value: 'Values'}] : tableTooltips[aar][posInt];
|
|
94
|
+
tableTooltips[aar][posInt].push(subst1[posInt][1]);
|
|
95
|
+
tableCases[aar][posInt].push([i, j, delta]);
|
|
96
|
+
});
|
|
97
|
+
Object.keys(subst2).forEach((pos) => {
|
|
98
|
+
const posInt = parseInt(pos);
|
|
99
|
+
const aar = subst2[posInt][0];
|
|
100
|
+
if (!Object.keys(tableValues).includes(aar)) {
|
|
101
|
+
tableValues[aar] = Array.apply(null, nColsArray).map(function() {
|
|
102
|
+
return DG.INT_NULL;
|
|
103
|
+
});
|
|
104
|
+
tableTooltips[aar] = Array.apply(null, nColsArray).map(function() {
|
|
105
|
+
return [];
|
|
106
|
+
});
|
|
107
|
+
tableCases[aar] = Array.apply(null, nColsArray).map(function() {
|
|
108
|
+
return [];
|
|
109
|
+
});
|
|
110
|
+
}
|
|
111
|
+
|
|
112
|
+
tableValues[aar][posInt] = tableValues[aar][posInt] === DG.INT_NULL ? 1 : tableValues[aar][posInt] + 1;
|
|
113
|
+
// tableValues[aar][posInt]++;
|
|
114
|
+
tableTooltips[aar][posInt] = !tableTooltips[aar][posInt].length ?
|
|
115
|
+
[{key: 'Substitution', value: 'Values'}] : tableTooltips[aar][posInt];
|
|
116
|
+
tableTooltips[aar][posInt].push(subst2[posInt][1]);
|
|
117
|
+
tableCases[aar][posInt].push([j, i, -delta]);
|
|
118
|
+
});
|
|
119
|
+
}
|
|
120
|
+
}
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
const tableValuesKeys = Object.keys(tableValues);
|
|
124
|
+
const dfLength = tableValuesKeys.length;
|
|
125
|
+
const cols = [...nColsArray.keys()].map((v) => DG.Column.int(v.toString(), dfLength));
|
|
126
|
+
const aarCol = DG.Column.string(aarColName, dfLength);
|
|
127
|
+
cols.splice(0, 1, aarCol);
|
|
128
|
+
const table = DG.DataFrame.fromColumns(cols);
|
|
129
|
+
|
|
130
|
+
for (let i = 0; i < dfLength; i++) {
|
|
131
|
+
const aar = tableValuesKeys[i];
|
|
132
|
+
tableValues[aar].splice(0, 1);
|
|
133
|
+
table.rows.setValues(i, [aar, ...tableValues[aar]]);
|
|
134
|
+
}
|
|
135
|
+
|
|
136
|
+
// let groupMapping: { [key: string]: string } = {};
|
|
137
|
+
|
|
138
|
+
//TODO: enable grouping
|
|
139
|
+
// Object.keys(aarGroups).forEach((value) => groupMapping[value] = value);
|
|
140
|
+
|
|
141
|
+
this.viewerGrid = table.plot.grid();
|
|
142
|
+
|
|
143
|
+
setAARRenderer(aarCol, this.viewerGrid);
|
|
144
|
+
|
|
145
|
+
this.viewerGrid.onCellTooltip(
|
|
146
|
+
(gCell, x, y) => {
|
|
147
|
+
if (gCell.cell.value !== DG.INT_NULL && gCell.tableColumn !== null && gCell.tableRowIndex !== null) {
|
|
148
|
+
const colName = gCell.tableColumn.name;
|
|
149
|
+
if (colName !== aarColName) {
|
|
150
|
+
const aar = this.viewerGrid!.table.get(aarColName, gCell.tableRowIndex);
|
|
151
|
+
const pos = parseInt(colName);
|
|
152
|
+
const tooltipText = tableTooltips[aar][pos].length ?
|
|
153
|
+
DG.HtmlTable.create(
|
|
154
|
+
tableTooltips[aar][pos], (item: {[index: string]: string}, idx: number) => [item.key, item.value],
|
|
155
|
+
).root : ui.divText('No substitutions');
|
|
156
|
+
ui.tooltip.show(tooltipText, x, y);
|
|
157
|
+
}
|
|
158
|
+
}
|
|
159
|
+
return true;
|
|
160
|
+
},
|
|
161
|
+
);
|
|
162
|
+
|
|
163
|
+
for (const col of table.columns.names()) {
|
|
164
|
+
this.viewerGrid.col(col)!.width = this.viewerGrid.props.rowHeight;
|
|
165
|
+
}
|
|
166
|
+
|
|
167
|
+
this.viewerGrid.onCellRender.subscribe((args) => {
|
|
168
|
+
if (args.cell.isRowHeader && args.cell.gridColumn.visible) {
|
|
169
|
+
args.cell.gridColumn.visible = false;
|
|
170
|
+
args.preventDefault();
|
|
171
|
+
}
|
|
172
|
+
});
|
|
173
|
+
|
|
174
|
+
this.viewerGrid.props.allowEdit = false;
|
|
175
|
+
|
|
176
|
+
table.onCurrentCellChanged.subscribe((_) => {
|
|
177
|
+
if (table.currentCol !== null && table.currentCol.name !== aarColName && table.currentCell.value !== null) {
|
|
178
|
+
const aar = table.get(aarColName, table.currentRowIdx);
|
|
179
|
+
const pos = parseInt(table.currentCol.name);
|
|
180
|
+
const currentCase = tableCases[aar][pos];
|
|
181
|
+
const tempDfLength = currentCase.length;
|
|
182
|
+
const initCol = DG.Column.string('Initial', tempDfLength);
|
|
183
|
+
const subsCol = DG.Column.string('Substituted', tempDfLength);
|
|
184
|
+
|
|
185
|
+
const tempDf = DG.DataFrame.fromColumns([
|
|
186
|
+
initCol,
|
|
187
|
+
subsCol,
|
|
188
|
+
DG.Column.float('Difference', tempDfLength),
|
|
189
|
+
]);
|
|
190
|
+
|
|
191
|
+
for (let i = 0; i < tempDfLength; i++) {
|
|
192
|
+
const row = currentCase[i];
|
|
193
|
+
tempDf.rows.setValues(i, [col.get(row[0]), col.get(row[1]), row[2]]);
|
|
194
|
+
}
|
|
195
|
+
|
|
196
|
+
initCol.semType = 'alignedSequence';
|
|
197
|
+
initCol.setTag('isAnalysisApplicable', 'false');
|
|
198
|
+
subsCol.semType = 'alignedSequence';
|
|
199
|
+
subsCol.setTag('isAnalysisApplicable', 'false');
|
|
200
|
+
|
|
201
|
+
this.casesGrid = tempDf.plot.grid();
|
|
202
|
+
this.casesGrid.props.allowEdit = false;
|
|
203
|
+
} else {
|
|
204
|
+
this.casesGrid = null;
|
|
205
|
+
}
|
|
206
|
+
this.render();
|
|
207
|
+
});
|
|
208
|
+
|
|
209
|
+
this.render();
|
|
210
|
+
}
|
|
211
|
+
|
|
212
|
+
render() {
|
|
213
|
+
$(this.root).empty();
|
|
214
|
+
this.root.appendChild(this.casesGrid === null ?
|
|
215
|
+
this.viewerGrid!.root : ui.splitH([this.viewerGrid!.root, this.casesGrid.root]),
|
|
216
|
+
);
|
|
217
|
+
}
|
|
218
|
+
|
|
219
|
+
split(peptideColumn: DG.Column, filter: boolean = true): string[][] {
|
|
220
|
+
const splitPeptidesArray: string[][] = [];
|
|
221
|
+
let currentSplitPeptide: string[];
|
|
222
|
+
let modeMonomerCount = 0;
|
|
223
|
+
let currentLength;
|
|
224
|
+
const colLength = peptideColumn.length;
|
|
225
|
+
|
|
226
|
+
// splitting data
|
|
227
|
+
const monomerLengths: { [index: string]: number } = {};
|
|
228
|
+
for (let i = 0; i < colLength; i++) {
|
|
229
|
+
currentSplitPeptide = peptideColumn.get(i).split('-').map((value: string) => value ? value : '-');
|
|
230
|
+
splitPeptidesArray.push(currentSplitPeptide);
|
|
231
|
+
currentLength = currentSplitPeptide.length;
|
|
232
|
+
monomerLengths[currentLength + ''] =
|
|
233
|
+
monomerLengths[currentLength + ''] ? monomerLengths[currentLength + ''] + 1 : 1;
|
|
234
|
+
}
|
|
235
|
+
//@ts-ignore: what I do here is converting string to number the most effective way I could find. parseInt is slow
|
|
236
|
+
modeMonomerCount = 1 * Object.keys(monomerLengths).reduce((a, b) => monomerLengths[a] > monomerLengths[b] ? a : b);
|
|
237
|
+
|
|
238
|
+
// making sure all of the sequences are of the same size
|
|
239
|
+
// and marking invalid sequences
|
|
240
|
+
let nTerminal: string;
|
|
241
|
+
const invalidIndexes: number[] = [];
|
|
242
|
+
let splitColumns: string[][] = Array.from({length: modeMonomerCount}, (_) => []);
|
|
243
|
+
modeMonomerCount--; // minus N-terminal
|
|
244
|
+
for (let i = 0; i < colLength; i++) {
|
|
245
|
+
currentSplitPeptide = splitPeptidesArray[i];
|
|
246
|
+
nTerminal = currentSplitPeptide.pop()!; // it is guaranteed that there will be at least one element
|
|
247
|
+
currentLength = currentSplitPeptide.length;
|
|
248
|
+
if (currentLength !== modeMonomerCount) {
|
|
249
|
+
invalidIndexes.push(i);
|
|
250
|
+
}
|
|
251
|
+
for (let j = 0; j < modeMonomerCount; j++) {
|
|
252
|
+
splitColumns[j].push(j < currentLength ? currentSplitPeptide[j] : '-');
|
|
253
|
+
}
|
|
254
|
+
splitColumns[modeMonomerCount].push(nTerminal);
|
|
255
|
+
}
|
|
256
|
+
modeMonomerCount--; // minus C-terminal
|
|
257
|
+
|
|
258
|
+
//create column names list
|
|
259
|
+
const columnNames = Array.from({length: modeMonomerCount}, (_, index) => `${index + 1 < 10 ? 0 : ''}${index + 1}`);
|
|
260
|
+
columnNames.splice(0, 0, 'N-terminal');
|
|
261
|
+
columnNames.push('C-terminal');
|
|
262
|
+
|
|
263
|
+
// filter out the columns with the same values
|
|
264
|
+
if (filter) {
|
|
265
|
+
splitColumns = splitColumns.filter((positionArray, index) => {
|
|
266
|
+
const isRetained = new Set(positionArray).size > 1;
|
|
267
|
+
if (!isRetained) {
|
|
268
|
+
columnNames.splice(index, 1);
|
|
269
|
+
}
|
|
270
|
+
return isRetained;
|
|
271
|
+
});
|
|
272
|
+
}
|
|
273
|
+
|
|
274
|
+
return splitPeptidesArray;
|
|
275
|
+
}
|
|
276
|
+
}
|
|
@@ -3,6 +3,16 @@ import * as ui from 'datagrok-api/ui';
|
|
|
3
3
|
import * as DG from 'datagrok-api/dg';
|
|
4
4
|
import {Peptides} from '../peptides';
|
|
5
5
|
|
|
6
|
+
/**
|
|
7
|
+
* Peptide analysis widget.
|
|
8
|
+
*
|
|
9
|
+
* @export
|
|
10
|
+
* @param {DG.Column} col Aligned sequence column.
|
|
11
|
+
* @param {DG.TableView} view Working view.
|
|
12
|
+
* @param {DG.Grid} tableGrid Working table grid.
|
|
13
|
+
* @param {DG.DataFrame} currentDf Working table.
|
|
14
|
+
* @return {Promise<DG.Widget>} Widget containing peptide analysis.
|
|
15
|
+
*/
|
|
6
16
|
export async function analyzePeptidesWidget(
|
|
7
17
|
col: DG.Column, view: DG.TableView, tableGrid: DG.Grid, currentDf: DG.DataFrame,
|
|
8
18
|
): Promise<DG.Widget> {
|
|
@@ -16,7 +26,7 @@ export async function analyzePeptidesWidget(
|
|
|
16
26
|
let hist: DG.Viewer;
|
|
17
27
|
|
|
18
28
|
const activityScalingMethod = ui.choiceInput(
|
|
19
|
-
'
|
|
29
|
+
'Scaling',
|
|
20
30
|
'none',
|
|
21
31
|
['none', 'lg', '-lg'],
|
|
22
32
|
async (currentMethod: string) => {
|
|
@@ -54,7 +64,7 @@ export async function analyzePeptidesWidget(
|
|
|
54
64
|
activityScalingMethod.fireChanged();
|
|
55
65
|
};
|
|
56
66
|
const activityColumnChoice = ui.columnInput(
|
|
57
|
-
'Activity
|
|
67
|
+
'Activity',
|
|
58
68
|
currentDf,
|
|
59
69
|
defaultColumn,
|
|
60
70
|
activityScalingMethodState,
|
|
@@ -66,8 +76,8 @@ export async function analyzePeptidesWidget(
|
|
|
66
76
|
if (activityColumnChoice.value.type === DG.TYPE.FLOAT) {
|
|
67
77
|
const progress = DG.TaskBarProgressIndicator.create('Loading SAR...');
|
|
68
78
|
const options: {[key: string]: string} = {
|
|
69
|
-
'
|
|
70
|
-
'
|
|
79
|
+
'activityColumnName': activityColumnChoice.value.name,
|
|
80
|
+
'scaling': activityScalingMethod.value,
|
|
71
81
|
};
|
|
72
82
|
|
|
73
83
|
const peptides = new Peptides();
|
|
@@ -4,11 +4,18 @@ import * as DG from 'datagrok-api/dg';
|
|
|
4
4
|
import $ from 'cash-dom';
|
|
5
5
|
import {model} from '../viewers/model';
|
|
6
6
|
import {splitAlignedPeptides} from '../utils/split-aligned';
|
|
7
|
+
import '../styles.css';
|
|
7
8
|
|
|
9
|
+
/**
|
|
10
|
+
* Manual sequence alignment widget.
|
|
11
|
+
*
|
|
12
|
+
* @param {DG.Column} alignedSequenceCol Aligned sequence column.
|
|
13
|
+
* @param {DG.DataFrame} currentDf Working table.
|
|
14
|
+
* @return {DG.Widget} Widget for manual sequence alignment.
|
|
15
|
+
*/
|
|
8
16
|
export function manualAlignmentWidget(alignedSequenceCol: DG.Column, currentDf: DG.DataFrame) {
|
|
9
17
|
const sequenceInput = ui.textInput('', alignedSequenceCol.get(currentDf.currentRowIdx));
|
|
10
|
-
(sequenceInput.
|
|
11
|
-
(sequenceInput.input as HTMLElement).style.overflow = 'hidden';
|
|
18
|
+
$(sequenceInput.root).addClass('pep-textinput');
|
|
12
19
|
|
|
13
20
|
const applyChangesBtn = ui.button('Apply', async () => {
|
|
14
21
|
const newSequence = sequenceInput.value;
|
|
@@ -30,7 +37,7 @@ export function manualAlignmentWidget(alignedSequenceCol: DG.Column, currentDf:
|
|
|
30
37
|
() => sequenceInput.value = alignedSequenceCol.get(currentDf.currentRowIdx),
|
|
31
38
|
'Reset',
|
|
32
39
|
);
|
|
33
|
-
$(resetBtn).addClass('
|
|
40
|
+
$(resetBtn).addClass('pep-snippet-editor-icon pep-reset-icon');
|
|
34
41
|
|
|
35
|
-
return new DG.Widget(ui.divV([resetBtn, sequenceInput.root, applyChangesBtn], '
|
|
42
|
+
return new DG.Widget(ui.divV([resetBtn, sequenceInput.root, applyChangesBtn], 'pep-textarea-box'));
|
|
36
43
|
}
|
|
@@ -3,6 +3,13 @@ import * as ui from 'datagrok-api/ui';
|
|
|
3
3
|
import * as DG from 'datagrok-api/dg';
|
|
4
4
|
import {ChemPalette} from '../utils/chem-palette';
|
|
5
5
|
|
|
6
|
+
/**
|
|
7
|
+
* 3D representation widget of peptide molecule.
|
|
8
|
+
*
|
|
9
|
+
* @export
|
|
10
|
+
* @param {string} pep Peptide string.
|
|
11
|
+
* @return {Promise<DG.Widget>} Widget.
|
|
12
|
+
*/
|
|
6
13
|
export async function peptideMoleculeWidget(pep: string): Promise<DG.Widget> {
|
|
7
14
|
const pi = DG.TaskBarProgressIndicator.create('Creating NGL view');
|
|
8
15
|
|