npm - @datagrok/sequence-translator - Versions diffs - 1.0.16 → 1.0.17 - Mend

@datagrok/sequence-translator 1.0.16 → 1.0.17

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the respective public registry.

Files changed (34)

package/detectors.js +0 -28
package/dist/package-test.js +3830 -3738
package/dist/package.js +3826 -3734
package/package.json +3 -1
package/setup-unlink-clean.sh +21 -0
package/src/autostart/calculations.ts +2 -2
package/src/autostart/registration.ts +102 -37
package/src/{axolabs/define-pattern.ts → axolabs-tab/axolabs-tab.ts} +2 -2
package/src/axolabs-tab/define-pattern.ts +874 -0
package/src/{axolabs → axolabs-tab}/draw-svg.ts +1 -1
package/src/{axolabs → axolabs-tab}/helpers.ts +2 -2
package/src/{autostart → hardcode-to-be-eliminated}/ICDs.ts +0 -0
package/src/{autostart → hardcode-to-be-eliminated}/IDPs.ts +0 -0
package/src/{structures-works → hardcode-to-be-eliminated}/const.ts +0 -0
package/src/{axolabs → hardcode-to-be-eliminated}/constants.ts +0 -0
package/src/{structures-works → hardcode-to-be-eliminated}/converters.ts +1 -1
package/src/{structures-works → hardcode-to-be-eliminated}/map.ts +2 -2
package/src/{autostart → hardcode-to-be-eliminated}/salts.ts +0 -0
package/src/{autostart → hardcode-to-be-eliminated}/sources.ts +0 -0
package/src/{autostart → hardcode-to-be-eliminated}/users.ts +0 -0
package/src/{main/main-view.ts → main-tab/main-tab.ts} +27 -79
package/src/package.ts +40 -23
package/src/sdf-tab/sdf-tab.ts +163 -0
package/src/{structures-works → sdf-tab}/sequence-codes-tools.ts +8 -5
package/src/tests/smiles-tests.ts +2 -2
package/src/utils/const.ts +0 -0
package/src/{helpers.ts → utils/helpers.ts} +3 -3
package/src/utils/sdf-add-columns.ts +3 -3
package/src/utils/sdf-save-table.ts +4 -4
package/src/utils/structures-works/draw-molecule.ts +84 -0
package/src/{structures-works → utils/structures-works}/from-monomers.ts +15 -16
package/src/{structures-works → utils/structures-works}/mol-transformations.ts +34 -52
package/{test-SequenceTranslator-6288c2fbe346-cce4ac1d.html → test-SequenceTranslator-6288c2fbe346-695b7b55.html} +10 -10
package/src/structures-works/save-sense-antisense.ts +0 -91

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@datagrok/sequence-translator",
   "friendlyName": "Sequence Translator",
-  "version": "1.0.16",
+  "version": "1.0.17",
   "author": {
     "name": "Alexey Choposky",
     "email": "achopovsky@datagrok.ai"
@@ -16,6 +16,8 @@
     "@datagrok-libraries/utils": "^1.17.2",
     "@types/react": "^18.0.15",
     "@datagrok-libraries/bio": "^5.11.1",
+    "@deck.gl/core": "8.8.12",
+    "@luma.gl/core": "8.5.17",
     "datagrok-api": "^1.8.2",
     "datagrok-tools": "^4.1.2",
     "npm": "^8.11.0",

package/setup-unlink-clean.sh ADDED Viewed

@@ -0,0 +1,21 @@
+#!/bin/bash
+package_dir=$(pwd)
+GREEN='\e[0;32m'
+NO_COLOR='\e[0m'
+dirs=(
+  "../../js-api/"
+  "../../libraries/utils/"
+  "../../libraries/bio/"
+)
+npm uninstall --location=global datagrok-api @datagrok-libraries/utils @datagrok-libraries/ml @datagrok-libraries/bio
+for dir in ${dirs[@]}; do
+  cd $package_dir
+  cd $dir
+  echo -e $GREEN Removing node_modules and dist in $(pwd) $NO_COLOR
+  rm -rf node_modules dist
+  # rm package-lock.json
+done

package/src/autostart/calculations.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 import * as DG from 'datagrok-api/dg';
-import {sortByStringLengthInDescendingOrder} from '../helpers';
-import {MODIFICATIONS} from '../structures-works/map';
+import {sortByStringLengthInDescendingOrder} from '../utils/helpers';
+import {MODIFICATIONS} from '../hardcode-to-be-eliminated/map';
 export function saltMass(
   saltNames: string[], saltsMolWeightList: number[], equivalentsCol: DG.Column, i: number, saltCol: DG.Column

package/src/autostart/registration.ts CHANGED Viewed

@@ -4,24 +4,31 @@ import * as DG from 'datagrok-api/dg';
 import {
   siRnaBioSpringToGcrs, siRnaAxolabsToGcrs, gcrsToNucleotides, asoGapmersBioSpringToGcrs, gcrsToMermade12,
   siRnaNucleotidesToGcrs
-} from '../structures-works/converters';
-import {weightsObj, SYNTHESIZERS} from '../structures-works/map';
+} from '../hardcode-to-be-eliminated/converters';
+import {weightsObj, SYNTHESIZERS} from '../hardcode-to-be-eliminated/map';
 import {SEQUENCE_TYPES, COL_NAMES, GENERATED_COL_NAMES} from './constants';
 import {saltMass, saltMolWeigth, molecularWeight, batchMolWeight} from './calculations';
-import {isValidSequence} from '../structures-works/sequence-codes-tools';
-import {sequenceToMolV3000} from '../structures-works/from-monomers';
-import {linkStrandsV3000} from '../structures-works/mol-transformations';
-import {stringify, download, removeEmptyRows, differenceOfTwoArrays} from '../helpers';
+import {isValidSequence} from '../sdf-tab/sequence-codes-tools';
+import {sequenceToMolV3000} from '../utils/structures-works/from-monomers';
+import {linkStrandsV3000} from '../utils/structures-works/mol-transformations';
+import {stringify, download, removeEmptyRows, differenceOfTwoArrays} from '../utils/helpers';
-import {SALTS_CSV} from './salts';
-import {USERS_CSV} from './users';
-import {ICDS} from './ICDs';
-import {SOURCES} from './sources';
-import {IDPS} from './IDPs';
+import {SALTS_CSV} from '../hardcode-to-be-eliminated/salts';
+import {USERS_CSV} from '../hardcode-to-be-eliminated/users';
+import {ICDS} from '../hardcode-to-be-eliminated/ICDs';
+import {SOURCES} from '../hardcode-to-be-eliminated/sources';
+import {IDPS} from '../hardcode-to-be-eliminated/IDPs';
 import {sdfAddColumns} from '../utils/sdf-add-columns';
 import {sdfSaveTable} from '../utils/sdf-save-table';
+const enum PREFIXES {
+  AS = 'AS',
+  SS = 'SS',
+  AS1 = 'AS1',
+  AS2 = 'AS2'
+}
 const enum SEQ_TYPE {
   AS = 'AS',
   SS = 'SS',
@@ -29,20 +36,38 @@ const enum SEQ_TYPE {
   DIMER = 'Dimer',
 }
-/** Computable classes of sequence types */
-const enum SEQ_TYPE_CLASS {
+/** Computable categories of sequence types */
+const enum SEQ_TYPE_CATEGORY {
   AS_OR_SS,
   DUPLEX,
   DIMER,
 }
-/** Style used for a cell with invalid value  */
-const errorStyle = {
-  'background-color': '#ff8080',
+/** Map between types and their categories inferrable from 'Sequence' column */
+const typeCategoryMap = {
+  [SEQ_TYPE.AS]: SEQ_TYPE_CATEGORY.AS_OR_SS,
+  [SEQ_TYPE.SS]: SEQ_TYPE_CATEGORY.AS_OR_SS,
+  [SEQ_TYPE.DIMER]: SEQ_TYPE_CATEGORY.DIMER,
+  [SEQ_TYPE.DUPLEX]: SEQ_TYPE_CATEGORY.DUPLEX,
+};
+/** Style used for cells in 'Type' column  */
+const typeColCellStyle = {
+  'display': 'flex',
+  'justify-content': 'center',
+  'align-items': 'center',
+  'text-color': 'var(--grey-5)', // --grey-6 does not match other cells
   'width': '100%',
   'height': '100%',
 };
+const pinkBackground = {
+  'background-color': '#ff8080',
+};
+/** Style used for a cell with invalid value  */
+const typeColErrorStyle = Object.assign({}, pinkBackground, typeColCellStyle);
 export function sdfHandleErrorUI(msgPrefix: string, df: DG.DataFrame, rowI: number, err: any) {
   const errStr: string = err.toString();
   const errMsg: string = msgPrefix + `row #${rowI + 1}, name: '${df.get('Chemistry Name', rowI)}', ` +
@@ -50,34 +75,61 @@ export function sdfHandleErrorUI(msgPrefix: string, df: DG.DataFrame, rowI: numb
   grok.shell.warning(errMsg);
 }
-// todo: use a dictionary instead?
-function getActualTypeClass(actualType: string): SEQ_TYPE_CLASS {
-  if (actualType === SEQ_TYPE.AS || actualType === SEQ_TYPE.SS)
-    return SEQ_TYPE_CLASS.AS_OR_SS;
-  else if (actualType === SEQ_TYPE.DIMER)
-    return SEQ_TYPE_CLASS.DIMER;
-  else if (actualType === SEQ_TYPE.DUPLEX)
-    return SEQ_TYPE_CLASS.DUPLEX;
+/** Determine the category of the value specified in 'Types' column  */
+function getActualTypeClass(actualType: string): SEQ_TYPE_CATEGORY {
+  if (Object.keys(typeCategoryMap).includes(actualType))
+    return typeCategoryMap[actualType as SEQ_TYPE];
   else
     throw new Error('Some types in \'Types\' column are invalid ');
 }
-function inferTypeClassFromSequence(seq: string): SEQ_TYPE_CLASS {
+function isASorSS(splittedLines: string[][]): boolean {
+  return splittedLines.length === 1 && splittedLines[0].length === 1;
+}
+/** Check whether the number of lines and prefixes in the 'Sequence' string
+ * are valid  */
+function verifyPrefixes(splittedLines: string[][], allowedPrefixes: Set<PREFIXES>, allowedLength: number): boolean {
+  const lengthCriterion = splittedLines.length === allowedLength;
+  let prefixCriterion = true;
+  for (const line of splittedLines) {
+    const prefix = line[0];
+    prefixCriterion &&= (allowedPrefixes.has(prefix as PREFIXES));
+  }
+  return lengthCriterion && prefixCriterion;
+}
+function isDuplex(splittedLines: string[][]): boolean {
+  const allowedPrefixes = new Set([PREFIXES.SS, PREFIXES.AS]);
+  return verifyPrefixes(splittedLines, allowedPrefixes, 2);
+}
+function isDimer(splittedLines: string[][]): boolean {
+  const allowedPrefixes = new Set([PREFIXES.SS, PREFIXES.AS1, PREFIXES.AS2]);
+  return verifyPrefixes(splittedLines, allowedPrefixes, 3);
+}
+function inferTypeClassFromSequence(seq: string): SEQ_TYPE_CATEGORY {
   const lines = seq.split('\n');
-  if (lines.length === 1)
-    return SEQ_TYPE_CLASS.AS_OR_SS;
-  else if (lines.length === 2)
-    return SEQ_TYPE_CLASS.DUPLEX;
-  else if (lines.length === 3)
-    return SEQ_TYPE_CLASS.DIMER;
+  const splittedLines = [];
+  for (const line of lines)
+    splittedLines.push(line.split(' '));
+  if (isASorSS(splittedLines))
+    return SEQ_TYPE_CATEGORY.AS_OR_SS;
+  else if (isDuplex(splittedLines))
+    return SEQ_TYPE_CATEGORY.DUPLEX;
+  else if (isDimer(splittedLines))
+    return SEQ_TYPE_CATEGORY.DIMER;
   else
-    throw new Error('Wrong formatting of sequences in \'Sequence\' column');
-  //todo: throw in the case of wrong formatting
+    throw new Error('Some cells in \'Sequence\' column have wrong formatting');
 }
 /** Compare type specified in 'Type' column to that computed from 'Sequence' column  */
 function validateType(actualType: string, seq: string): boolean {
-  return getActualTypeClass(actualType) === inferTypeClassFromSequence(seq);
+  if (actualType === '' && seq === '')
+    return true;
+  else
+    return getActualTypeClass(actualType) === inferTypeClassFromSequence(seq);
 }
 function oligoSdFileGrid(view: DG.TableView): void {
@@ -90,8 +142,21 @@ function oligoSdFileGrid(view: DG.TableView): void {
   const seqCol = df.getCol(seqColName);
   grid.onCellPrepare((gridCell: DG.GridCell) => {
     if (gridCell.isTableCell && gridCell.gridColumn.column!.name === typeColName) {
-      const isValidType = validateType(gridCell.cell.value, seqCol.get(gridCell.tableRow!.idx));
-      gridCell.style.element = ui.div(gridCell.cell.value, isValidType ? {} : {style: errorStyle});
+      let isValidType = false;
+      let formattingError = false;
+      try {
+        isValidType = validateType(gridCell.cell.value, seqCol.get(gridCell.tableRow!.idx));
+      } catch {
+        formattingError = true;
+      }
+      const el = ui.div(
+        gridCell.cell.value, isValidType ? {style: typeColCellStyle} : {style: typeColErrorStyle}
+      );
+      gridCell.style.element = el;
+      const msg = formattingError ? 'Sequence pattern or Type value has wrong formatting' :
+        'Input in Type column doesn\'t match the Sequence pattern';
+      if (!isValidType)
+        ui.tooltip.bind(el, msg);
     }
   });
 }
@@ -126,7 +191,7 @@ export function autostartOligoSdFileSubscription() {
             });
           }); // /^[fmpsACGU]{6,}$/
         } else if (DG.Detector.sampleCategories(seqCol,
-            (s) => /(\(invabasic\)|\(GalNAc-2-JNJ\)|f|m|ps|A|C|G|U){6,}$/.test(s)) ||
+          (s) => /(\(invabasic\)|\(GalNAc-2-JNJ\)|f|m|ps|A|C|G|U){6,}$/.test(s)) ||
           DG.Detector.sampleCategories(seqCol, (s) => /^(?=.*moe)(?=.*5mC)(?=.*ps){6,}/.test(s))) {
           menu.item('Convert GCRS to raw', () => {
             grid.table.columns.addNewString(seqCol.name + ' to raw').init((i: number) => {

package/src/{axolabs/define-pattern.ts → axolabs-tab/axolabs-tab.ts} RENAMED Viewed

@@ -6,7 +6,7 @@ import * as svg from 'save-svg-as-png';
 import $ from 'cash-dom';
 import {drawAxolabsPattern} from './draw-svg';
-import {AXOLABS_MAP} from './constants';
+import {AXOLABS_MAP} from '../hardcode-to-be-eliminated/constants';
 import {isOverhang} from './helpers';
 const baseChoices: string[] = Object.keys(AXOLABS_MAP);
@@ -114,7 +114,7 @@ function addColumnWithTranslatedSequences(
   });
 }
-export function defineAxolabsPattern() {
+export function getAxolabsTab() {
   const enumerateModifications = [defaultBase];
   let maximalSsLength = defaultSequenceLength;
   let maximalAsLength = defaultSequenceLength;