npm - @datagrok/peptides - Versions diffs - 1.19.1 → 1.21.0 - Mend

@datagrok/peptides 1.19.1 → 1.21.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

package/CHANGELOG.md +4 -0
package/dist/package-test.js +1 -1
package/dist/package-test.js.map +1 -1
package/dist/package.js +1 -1
package/dist/package.js.map +1 -1
package/package.json +10 -9
package/src/model.ts +69 -62
package/src/viewers/cluster-max-activity-viewer.ts +4 -4
package/src/widgets/mutation-cliffs.ts +4 -2
package/src/widgets/peptides.ts +28 -20
package/test-console-output-1.log +156 -92
package/test-record-1.mp4 +0 -0
package/dist/111.js +0 -2
package/dist/111.js.map +0 -1
package/dist/501.js +0 -2
package/dist/501.js.map +0 -1
package/dist/51.js +0 -2
package/dist/51.js.map +0 -1
package/dist/603.js +0 -2
package/dist/603.js.map +0 -1
package/dist/778.js +0 -2
package/dist/778.js.map +0 -1
package/dist/801.js +0 -2
package/dist/801.js.map +0 -1
package/dist/950.js +0 -2
package/dist/950.js.map +0 -1

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@datagrok/peptides",
   "friendlyName": "Peptides",
-  "version": "1.19.1",
+  "version": "1.21.0",
   "author": {
     "name": "Davit Rizhinashvili",
     "email": "drizhinashvili@datagrok.ai"
@@ -14,12 +14,12 @@
   },
   "dependencies": {
     "@datagrok-libraries/bio": "^5.46.1",
-    "@datagrok-libraries/math": "^1.2.3",
-    "@datagrok-libraries/ml": "^6.7.5",
+    "@datagrok-libraries/math": "^1.2.4",
+    "@datagrok-libraries/ml": "^6.7.6",
     "@datagrok-libraries/statistics": "^1.2.12",
     "@datagrok-libraries/tutorials": "^1.4.2",
-    "@datagrok-libraries/utils": "^4.3.10",
-    "datagrok-api": "^1.22.0",
+    "@datagrok-libraries/utils": "^4.4.0",
+    "datagrok-api": "^1.23.0",
     "@webgpu/types": "^0.1.40",
     "cash-dom": "^8.1.5",
     "file-loader": "^6.2.0",
@@ -30,10 +30,11 @@
   "devDependencies": {
     "@datagrok-libraries/helm-web-editor": "^1.1.7",
     "@datagrok-libraries/js-draw-lite": "^0.0.5",
-    "@datagrok/bio": "^2.16.9",
-    "@datagrok/chem": "^1.12.0",
+    "@datagrok/eda": "^1.3.1",
+    "@datagrok/bio": "^2.18.0",
+    "@datagrok/chem": "^1.13.0",
     "@datagrok/dendrogram": "^1.2.33",
-    "@datagrok/helm": "^2.5.9",
+    "@datagrok/helm": "^2.7.0",
     "@types/uuid": "^10.0.0",
     "@types/wu": "^2.1.44",
     "@typescript-eslint/eslint-plugin": "^8.8.1",
@@ -79,4 +80,4 @@
     "All users"
   ],
   "category": "Bioinformatics"
-}
+}

package/src/model.ts CHANGED Viewed

@@ -51,11 +51,12 @@ import {DimReductionMethods} from '@datagrok-libraries/ml/src/multi-column-dimen
 import {AggregationColumns, MonomerPositionStats} from './utils/statistics';
 import {splitAlignedSequences} from '@datagrok-libraries/bio/src/utils/splitter';
 import {getDbscanWorker} from '@datagrok-libraries/math';
-import {markovCluster} from '@datagrok-libraries/ml/src/MCL/clustering-view';
 import {DistanceAggregationMethods} from '@datagrok-libraries/ml/src/distance-matrix/types';
 import {ClusterMaxActivityViewer, IClusterMaxActivity} from './viewers/cluster-max-activity-viewer';
-import {MCL_OPTIONS_TAG, MCLSerializableOptions} from '@datagrok-libraries/ml/src/MCL';
+import {MCLSerializableOptions} from '@datagrok-libraries/ml/src/MCL';
 import {PeptideUtils} from './peptideUtils';
+import {getGPUAdapterDescription} from '@datagrok-libraries/math/src/webGPU/getGPUDevice';
+import {MCLViewer} from '@datagrok-libraries/ml/src/MCL/mcl-viewer';
 export enum VIEWER_TYPE {
   SEQUENCE_VARIABILITY_MAP = 'Sequence Variability Map',
@@ -63,6 +64,7 @@ export enum VIEWER_TYPE {
   LOGO_SUMMARY_TABLE = 'Logo Summary Table',
   DENDROGRAM = 'Dendrogram',
   CLUSTER_MAX_ACTIVITY = 'Active peptide selection',
+  MCL = 'MCL',
 }
 export type CachedWebLogoTooltip = { bar: string, tooltip: HTMLDivElement | null };
@@ -106,7 +108,7 @@ export class PeptidesModel {
   // sequence space viewer
   _sequenceSpaceViewer: DG.ScatterPlotViewer | null = null;
   //MCL viewer
-  _mclViewer: DG.ScatterPlotViewer | null = null;
+  _mclViewer: MCLViewer | null = null;
   /**
    * @param {DG.DataFrame}dataFrame - DataFrame to use for analysis
    */
@@ -143,7 +145,7 @@ export class PeptidesModel {
    */
   get analysisView(): DG.TableView {
     if (this._analysisView === undefined) {
-      this._analysisView = wu(grok.shell.tableViews).find(({dataFrame}) => dataFrame?.getTag(DG.TAGS.ID) === this.id);
+      this._analysisView = this.id ? wu(grok.shell.tableViews).find(({dataFrame}) => dataFrame?.getTag(DG.TAGS.ID) === this.id) : undefined;
       if (typeof this._analysisView === 'undefined')
         this._analysisView = grok.shell.addTableView(this.df);
     }
@@ -166,11 +168,13 @@ export class PeptidesModel {
    */
   get settings(): type.PeptidesSettings | null {
     const settingsStr = this.df.getTag(C.TAGS.SETTINGS);
-    if (settingsStr == null)
+    if (!settingsStr)
       return null;
     this._settings ??= JSON.parse(settingsStr);
+    if (this._settings?.mclSettings && !(this._settings.mclSettings.webGPUDescriptionPromise instanceof Promise))
+      this._settings.mclSettings.webGPUDescriptionPromise = getGPUAdapterDescription();
     return this._settings!;
   }
@@ -358,7 +362,14 @@ export class PeptidesModel {
       dataFrame.getCol(C.COLUMNS_NAMES.ACTIVITY_SCALED).name = C.COLUMNS_NAMES.ACTIVITY;
-    dataFrame.temp[PeptidesModel.modelName] ??= new PeptidesModel(dataFrame);
+    //dataFrame.temp[PeptidesModel.modelName] ??= new PeptidesModel(dataFrame);
+    if (!dataFrame.temp[PeptidesModel.modelName]) {
+      const model = dataFrame.temp[PeptidesModel.modelName] = new PeptidesModel(dataFrame);
+      const settings = model.settings;
+      // this is important bit. settings are written by startAnalysis function or other viewers, but separate viewers will not init the peptides model
+      if (settings)
+        model.init(settings);
+    }
     return dataFrame.temp[PeptidesModel.modelName] as PeptidesModel;
   }
@@ -690,20 +701,23 @@ export class PeptidesModel {
     const cols = this.df.columns;
     const splitSeqDf = splitAlignedSequences(this.df.getCol(this.settings!.sequenceColumnName), PeptideUtils.getSeqHelper());
     const positionColumns = splitSeqDf.columns.names();
-    for (const colName of positionColumns) {
-      let col = this.df.col(colName);
-      const newCol = splitSeqDf.getCol(colName);
-      if (col !== null)
-        cols.remove(colName);
-      const newColCat = newCol.categories;
-      const newColData = newCol.getRawData();
-      col = cols.addNew(newCol.name, newCol.type).init((i) => newColCat[newColData[i]]);
-      col.setTag(C.TAGS.ANALYSIS_COL, `${true}`);
-      col.setTag(C.TAGS.POSITION_COL, `${true}`);
-      CR.setMonomerRenderer(col, this.alphabet);
+    if (positionColumns.every((colName) => cols.contains(colName)))
+      positionColumns.forEach((colName) => CR.setMonomerRenderer(this.df.col(colName)!, this.alphabet));
+    else {
+      for (const colName of positionColumns) {
+        let col = this.df.col(colName);
+        const newCol = splitSeqDf.getCol(colName);
+        if (col !== null)
+          cols.remove(colName);
+        const newColCat = newCol.categories;
+        const newColData = newCol.getRawData();
+        col = cols.addNew(newCol.name, newCol.type).init((i) => newColCat[newColData[i]]);
+        col.setTag(C.TAGS.ANALYSIS_COL, `${true}`);
+        col.setTag(C.TAGS.POSITION_COL, `${true}`);
+        CR.setMonomerRenderer(col, this.alphabet);
+      }
     }
     this.df.name = name;
   }
@@ -1133,7 +1147,7 @@ export class PeptidesModel {
       activityColumnName: this.settings!.activityColumnName,
       clusterColumnName: potentialClusterCol ?? wu(this.df.columns.categorical).next().value?.name,
       activityTarget: C.ACTIVITY_TARGET.HIGH,
-      connectivityColumnName: this._mclCols.find((colName) => colName.toLowerCase().startsWith('connectivity')),
+      connectivityColumnName: this._mclCols.find((colName) => colName.toLowerCase().startsWith('connectivity')) ?? this.df.columns.names().find((colName) => colName.toLowerCase().includes('connectivity') && this.df.col(colName)?.isNumerical) ?? '',
       clusterSizeThreshold: 20,
       activityThreshold: 1000,
     };
@@ -1296,51 +1310,44 @@ export class PeptidesModel {
       }
     });
-    const bioPreprocessingFunc = DG.Func.find({package: 'Bio', name: 'macromoleculePreprocessingFunction'})[0];
-    const mclViewer = await markovCluster(
-      this.df, [seqCol], [mclParams!.distanceF], [1],
-      DistanceAggregationMethods.MANHATTAN, [bioPreprocessingFunc], [{
+    const serializedOptions: string = JSON.stringify({
+      cols: [seqCol].map((col) => col.name),
+      metrics: [mclParams!.distanceF],
+      weights: [1],
+      aggregationMethod: DistanceAggregationMethods.MANHATTAN,
+      preprocessingFuncs: ['macromoleculePreprocessingFunction'],
+      preprocessingFuncArgs: [{
         gapOpen: mclParams!.gapOpen, gapExtend: mclParams!.gapExtend,
         fingerprintType: mclParams!.fingerprintType,
       }],
-      mclParams!.threshold, mclParams!.maxIterations, mclParams.useWebGPU,
-      mclParams!.inflation, mclParams.minClusterSize,
-    );
-    mclAdditionSub.unsubscribe();
-    // find logo summery viewer and make it rerender
-    const lstViewer = this.findViewer(VIEWER_TYPE.LOGO_SUMMARY_TABLE) as LogoSummaryTable | null;
-    if (lstViewer) { // beware, this is accessing private things
-      lstViewer._clusterStats = null;
-      lstViewer._clusterSelection = null;
-      lstViewer._viewerGrid = null;
-      lstViewer._logoSummaryTable = null;
-      lstViewer.render();
-    }
-    if (mclViewer?.sc) {
-      const serializedOptions: string = JSON.stringify({
-        cols: [seqCol].map((col) => col.name),
-        metrics: [mclParams!.distanceF],
-        weights: [1],
-        aggregationMethod: DistanceAggregationMethods.MANHATTAN,
-        preprocessingFuncs: [bioPreprocessingFunc].map((func) => func?.name ?? null),
-        preprocessingFuncArgs: [{
-          gapOpen: mclParams!.gapOpen, gapExtend: mclParams!.gapExtend,
-          fingerprintType: mclParams!.fingerprintType,
-        }],
-        threshold: mclParams!.threshold,
-        maxIterations: mclParams!.maxIterations,
-        useWebGPU: mclParams.useWebGPU,
-        inflate: mclParams!.inflation,
-        minClusterSize: mclParams.minClusterSize,
-      } satisfies MCLSerializableOptions);
-      this.df.setTag(MCL_OPTIONS_TAG, serializedOptions);
-      //@ts-ignore
-      mclViewer.sc.props['initializationFunction'] = 'EDA:MCLInitializationFunction';
-      this._mclViewer = mclViewer?.sc ?? null;
+      threshold: mclParams!.threshold,
+      maxIterations: mclParams!.maxIterations,
+      useWebGPU: mclParams.useWebGPU,
+      inflate: mclParams!.inflation,
+      minClusterSize: mclParams.minClusterSize,
+    } satisfies MCLSerializableOptions);
+    const tv = grok.shell.getTableView(this.df.name);
+    if (tv) {
+      const func = DG.Func.find({package: 'EDA', name: 'markovClusteringViewer'})[0];
+      if (!func)
+        throw new Error('Markov clustering function is not found');
+      // make sure eda is loaded
+      await func.apply();
+      tv.addViewer(VIEWER_TYPE.MCL, {mclProps: serializedOptions}) as MCLViewer;
+      //tv.addViewer(VIEWER_TYPE.MCL, {mclProps: serializedOptions});
+      // the addviewer method goes through dart, so it returns JSViewer instead of MCLViewer, so also need to wait a bit
+      await DG.delay(500);
+      this._mclViewer = this.findViewer(VIEWER_TYPE.MCL) as MCLViewer;
+      await this._mclViewer.initPromise;
+      const lstViewer = this.findViewer(VIEWER_TYPE.LOGO_SUMMARY_TABLE) as LogoSummaryTable | null;
+      if (lstViewer) { // beware, this is accessing private things
+        lstViewer._clusterStats = null;
+        lstViewer._clusterSelection = null;
+        lstViewer._viewerGrid = null;
+        lstViewer._logoSummaryTable = null;
+        lstViewer.render();
+      }
     }
   }

package/src/viewers/cluster-max-activity-viewer.ts CHANGED Viewed

@@ -112,7 +112,7 @@ export class ClusterMaxActivityViewer extends DG.JsViewer implements IClusterMax
       return null;
     }
     const clusterSizeCol = this.dataFrame.columns.getOrCreate(ClusterMaxActivityViewer.clusterSizeColName,
-      DG.TYPE.INT, this.dataFrame.rowCount);
+      DG.TYPE.INT);
     const clusterSizeMap: {[key: number | string]: number} = {};
     for (let i = 0; i < this.dataFrame.rowCount; i++) {
       const cluster: string | number = clusterCol.get(i);
@@ -156,7 +156,7 @@ export class ClusterMaxActivityViewer extends DG.JsViewer implements IClusterMax
     }
     const maxAtivityInClusterSizeCol = this.dataFrame.columns.getOrCreate(
-      ClusterMaxActivityViewer.maxActivityInClusterColName, DG.COLUMN_TYPE.INT, this.dataFrame.rowCount);
+      ClusterMaxActivityViewer.maxActivityInClusterColName, DG.COLUMN_TYPE.INT);
     maxAtivityInClusterSizeCol.init((i) => {
       if (clusterCol.isNone(i))
         return 0;
@@ -164,7 +164,7 @@ export class ClusterMaxActivityViewer extends DG.JsViewer implements IClusterMax
     });
     const maxConnectivityInClusterSizeCol = this.dataFrame.columns.getOrCreate(
-      ClusterMaxActivityViewer.maxConnectivityInClusterColName, DG.COLUMN_TYPE.INT, this.dataFrame.rowCount);
+      ClusterMaxActivityViewer.maxConnectivityInClusterColName, DG.COLUMN_TYPE.INT);
     maxConnectivityInClusterSizeCol.init((i) => {
       if (clusterCol.isNone(i))
         return 0;
@@ -172,7 +172,7 @@ export class ClusterMaxActivityViewer extends DG.JsViewer implements IClusterMax
     });
     const synSelectionCol = this.dataFrame.columns.getOrCreate(
-      ClusterMaxActivityViewer.synSelectionColName, DG.TYPE.STRING, this.dataFrame.rowCount);
+      ClusterMaxActivityViewer.synSelectionColName, DG.TYPE.STRING);
     synSelectionCol.init((i) => {
       if (clusterCol.isNone(i))

package/src/widgets/mutation-cliffs.ts CHANGED Viewed

@@ -243,8 +243,10 @@ function cliffsPairsWidgetParts(table: DG.DataFrame, options: MutationCliffsOpti
     pairsGrid.root.style.setProperty('width', '100%');
     uniqueSequencesGrid.root.style.removeProperty('width');
     uniqueSequencesGrid.root.style.setProperty('width', '100%');
-    pairsGrid.root.style.minHeight = '250px';
-    uniqueSequencesGrid.root.style.minHeight = '250px';
+    pairsGrid.root.style.minHeight = '200px';
+    uniqueSequencesGrid.root.style.minHeight = '200px';
+    pairsGrid.root.style.height = 'unset';
+    uniqueSequencesGrid.root.style.height = 'unset';
   }, 200);
   return {pairsGrid, uniqueSequencesGrid, aminoToInput};

package/src/widgets/peptides.ts CHANGED Viewed

@@ -263,20 +263,28 @@ export async function startAnalysis(activityColumn: DG.Column<number>, peptidesC
   const progress = DG.TaskBarProgressIndicator.create('Loading SAR...');
   // Prepare new DF
-  const newDf = DG.DataFrame.create(sourceDf.rowCount);
-  newDf.name = 'Peptides analysis';
-  const newDfCols = newDf.columns;
-  newDfCols.add(scaledCol);
-  for (const col of sourceDf.columns) {
-    if (col.getTag(C.TAGS.ANALYSIS_COL) !== `${true}`) {
-      if (col.name.toLowerCase() === scaledCol.name.toLowerCase())
-        col.name = sourceDf.columns.getUnusedName(col.name);
-      newDfCols.add(col);
-    }
-  }
+  // const newDf = DG.DataFrame.create(sourceDf.rowCount);
+  // newDf.name = 'Peptides analysis';
+  // const newDfCols = newDf.columns;
+  // newDfCols.add(scaledCol);
+  // for (const col of sourceDf.columns) {
+  //   if (col.getTag(C.TAGS.ANALYSIS_COL) !== `${true}`) {
+  //     if (col.name.toLowerCase() === scaledCol.name.toLowerCase())
+  //       col.name = sourceDf.columns.getUnusedName(col.name);
+  //     newDfCols.add(col);
+  //   }
+  // }
+  //make sure the data sync is turned off for the dataframe:
+  sourceDf.tags.delete && sourceDf.tags.delete('.script');
+  const sourceCols = sourceDf.columns;
+  const oldActivityCol = sourceDf.col(scaledCol.name);
+  if (oldActivityCol)
+    oldActivityCol.name = sourceCols.getUnusedName(oldActivityCol.name);
+  const scaleColRawData = scaledCol.getRawData();
+  sourceDf.columns.addNew(scaledCol.name, scaledCol.type).init((i) => scaleColRawData[i]);
+  sourceCols.setOrder([scaledCol.name, peptidesCol.name, ...sourceCols.names().filter((name) => name !== peptidesCol.name && name !== scaledCol.name)]);
   const settings: type.PeptidesSettings = {
     sequenceColumnName: peptidesCol.name, activityColumnName: activityColumn.name, activityScaling: scaling,
     columns: {}, showDendrogram: false, showSequenceSpace: false,
@@ -285,18 +293,18 @@ export async function startAnalysis(activityColumn: DG.Column<number>, peptidesC
   };
   if (clustersColumn) {
-    const clusterCol = newDf.getCol(clustersColumn.name);
+    const clusterCol = sourceDf.getCol(clustersColumn.name);
     if (clusterCol.type !== DG.COLUMN_TYPE.STRING)
-      newDfCols.replace(clusterCol, clusterCol.convertTo(DG.COLUMN_TYPE.STRING));
+      sourceCols.replace(clusterCol, clusterCol.convertTo(DG.COLUMN_TYPE.STRING));
   }
-  newDf.setTag(C.TAGS.SETTINGS, JSON.stringify(settings));
+  sourceDf.setTag(C.TAGS.SETTINGS, JSON.stringify(settings));
-  const bitset = DG.BitSet.create(sourceDf.rowCount,
-    (i) => !activityColumn.isNone(i) && !peptidesCol.isNone(i) && sourceDf.filter.get(i));
+  // const bitset = DG.BitSet.create(sourceDf.rowCount,
+  //   (i) => !activityColumn.isNone(i) && !peptidesCol.isNone(i) && sourceDf.filter.get(i));
   // Cloning dataframe with applied filter. If filter is not applied, cloning is
   // needed anyway to allow filtering on the original dataframe
-  model = PeptidesModel.getInstance(newDf.clone(bitset));
+  model = PeptidesModel.getInstance(sourceDf);
   model.init(settings);
   if (clustersColumn) {
     const lstProps: ILogoSummaryTable = {