npm - @teselagen/sequence-utils - Versions diffs - 0.3.9 → 0.3.11 - Mend

@teselagen/sequence-utils 0.3.9 → 0.3.11

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (12)

package/bioData.d.ts +1 -1
package/filterSequenceString.d.ts +2 -4
package/index.js +15 -17
package/index.mjs +15 -17
package/index.umd.js +15 -17
package/package.json +1 -1
package/src/bioData.js +2 -3
package/src/filterSequenceString.js +7 -11
package/src/filterSequenceString.test.js +24 -8
package/src/insertSequenceDataAtPositionOrRange.test.js +2 -2
package/src/tidyUpSequenceData.js +2 -3
package/src/tidyUpSequenceData.test.js +25 -82

package/bioData.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 export const protein_letters: "ACDEFGHIKLMNPQRSTVWY";
 export const protein_letters_withUandX: "ACDEFGHIKLMNPQRSTVWYUX";
-export const extended_protein_letters: "ACDEFGHIKLMNPQRSTVWYBXZJUO.*-";
+export const extended_protein_letters: "ACDEFGHIKLMNPQRSTVWYBXZJUO";
 export const ambiguous_dna_letters: "GATCRYWSMKHBVDN";
 export const unambiguous_dna_letters: "GATC";
 export const ambiguous_rna_letters: "GAUCRYWSMKHBVDN";

package/filterSequenceString.d.ts CHANGED Viewed

@@ -1,18 +1,16 @@
-export default function filterSequenceString(sequenceString: any, { additionalValidChars, isOligo, name, isProtein, isRna, isMixedRnaAndDna, includeStopCodon }?: {
+export default function filterSequenceString(sequenceString: any, { additionalValidChars, isOligo, name, isProtein, isRna, isMixedRnaAndDna }?: {
     additionalValidChars?: string | undefined;
     isOligo: any;
     name: any;
     isProtein: any;
     isRna: any;
     isMixedRnaAndDna: any;
-    includeStopCodon: any;
 }): (string | string[])[];
-export function getAcceptedChars({ isOligo, isProtein, isRna, isMixedRnaAndDna, includeStopCodon }?: {
+export function getAcceptedChars({ isOligo, isProtein, isRna, isMixedRnaAndDna }?: {
     isOligo: any;
     isProtein: any;
     isRna: any;
     isMixedRnaAndDna: any;
-    includeStopCodon: any;
 }): string;
 export function getReplaceChars({ isOligo, isProtein, isRna, isMixedRnaAndDna }?: {
     isOligo: any;

package/index.js CHANGED Viewed

@@ -6000,7 +6000,7 @@ lodash.exports;
 var lodashExports = lodash.exports;
 const protein_letters = "ACDEFGHIKLMNPQRSTVWY";
 const protein_letters_withUandX = "ACDEFGHIKLMNPQRSTVWYUX";
-const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO.*-";
+const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO";
 const ambiguous_dna_letters = "GATCRYWSMKHBVDN";
 const unambiguous_dna_letters = "GATC";
 const ambiguous_rna_letters = "GAUCRYWSMKHBVDN";
@@ -6056,7 +6056,7 @@ const extended_protein_values = {
   Y: "Y",
   Z: "QE",
   "*": "\\*\\.",
-  ".": "\\.\\.",
+  ".": "\\.",
   "-": "\\-"
 };
 const bioData = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
@@ -12329,15 +12329,13 @@ function filterSequenceString(sequenceString, {
   name,
   isProtein,
   isRna,
-  isMixedRnaAndDna,
-  includeStopCodon
+  isMixedRnaAndDna
 } = {}) {
   const acceptedChars = getAcceptedChars({
     isOligo,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   });
   const replaceChars = getReplaceChars({
     isOligo,
@@ -12387,10 +12385,9 @@ function getAcceptedChars({
   isOligo,
   isProtein,
   isRna,
-  isMixedRnaAndDna,
-  includeStopCodon
+  isMixedRnaAndDna
 } = {}) {
-  return isProtein ? `${protein_letters_withUandX.toLowerCase()}${includeStopCodon ? "*." : ""}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
+  return isProtein ? `${extended_protein_letters.toLowerCase()}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
     //just plain old dna
     ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase()
   );
@@ -12402,9 +12399,12 @@ function getReplaceChars({
   isRna,
   isMixedRnaAndDna
 } = {}) {
-  return isProtein ? {} : isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
-    //just plain old dna
-    {}
+  return isProtein ? {} : (
+    // {".": "*"}
+    isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
+      //just plain old dna
+      {}
+    )
   );
 }
 __name(getReplaceChars, "getReplaceChars");
@@ -12544,7 +12544,7 @@ function tidyUpSequenceData(pSeqData, options = {}) {
   const {
     annotationsAsObjects,
     logMessages,
-    removeUnwantedChars,
+    doNotRemoveInvalidChars,
     additionalValidChars,
     noTranslationData,
     doNotProvideIdsForAnnotations,
@@ -12578,11 +12578,9 @@ function tidyUpSequenceData(pSeqData, options = {}) {
   if (seqData.isRna) {
     seqData.sequence = seqData.sequence.replace(/t/gi, "u");
   }
-  if (removeUnwantedChars) {
+  if (!doNotRemoveInvalidChars) {
     if (seqData.isProtein) {
-      const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({
-        includeStopCodon: true
-      }, topLevelSeqData || seqData));
+      const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({}, topLevelSeqData || seqData));
       seqData.proteinSequence = newSeq;
     } else {
       const [newSeq] = filterSequenceString(seqData.sequence, __spreadValues({

package/index.mjs CHANGED Viewed

@@ -5998,7 +5998,7 @@ lodash.exports;
 var lodashExports = lodash.exports;
 const protein_letters = "ACDEFGHIKLMNPQRSTVWY";
 const protein_letters_withUandX = "ACDEFGHIKLMNPQRSTVWYUX";
-const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO.*-";
+const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO";
 const ambiguous_dna_letters = "GATCRYWSMKHBVDN";
 const unambiguous_dna_letters = "GATC";
 const ambiguous_rna_letters = "GAUCRYWSMKHBVDN";
@@ -6054,7 +6054,7 @@ const extended_protein_values = {
   Y: "Y",
   Z: "QE",
   "*": "\\*\\.",
-  ".": "\\.\\.",
+  ".": "\\.",
   "-": "\\-"
 };
 const bioData = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
@@ -12327,15 +12327,13 @@ function filterSequenceString(sequenceString, {
   name,
   isProtein,
   isRna,
-  isMixedRnaAndDna,
-  includeStopCodon
+  isMixedRnaAndDna
 } = {}) {
   const acceptedChars = getAcceptedChars({
     isOligo,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   });
   const replaceChars = getReplaceChars({
     isOligo,
@@ -12385,10 +12383,9 @@ function getAcceptedChars({
   isOligo,
   isProtein,
   isRna,
-  isMixedRnaAndDna,
-  includeStopCodon
+  isMixedRnaAndDna
 } = {}) {
-  return isProtein ? `${protein_letters_withUandX.toLowerCase()}${includeStopCodon ? "*." : ""}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
+  return isProtein ? `${extended_protein_letters.toLowerCase()}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
     //just plain old dna
     ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase()
   );
@@ -12400,9 +12397,12 @@ function getReplaceChars({
   isRna,
   isMixedRnaAndDna
 } = {}) {
-  return isProtein ? {} : isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
-    //just plain old dna
-    {}
+  return isProtein ? {} : (
+    // {".": "*"}
+    isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
+      //just plain old dna
+      {}
+    )
   );
 }
 __name(getReplaceChars, "getReplaceChars");
@@ -12542,7 +12542,7 @@ function tidyUpSequenceData(pSeqData, options = {}) {
   const {
     annotationsAsObjects,
     logMessages,
-    removeUnwantedChars,
+    doNotRemoveInvalidChars,
     additionalValidChars,
     noTranslationData,
     doNotProvideIdsForAnnotations,
@@ -12576,11 +12576,9 @@ function tidyUpSequenceData(pSeqData, options = {}) {
   if (seqData.isRna) {
     seqData.sequence = seqData.sequence.replace(/t/gi, "u");
   }
-  if (removeUnwantedChars) {
+  if (!doNotRemoveInvalidChars) {
     if (seqData.isProtein) {
-      const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({
-        includeStopCodon: true
-      }, topLevelSeqData || seqData));
+      const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({}, topLevelSeqData || seqData));
       seqData.proteinSequence = newSeq;
     } else {
       const [newSeq] = filterSequenceString(seqData.sequence, __spreadValues({

package/index.umd.js CHANGED Viewed

@@ -6002,7 +6002,7 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
   var lodashExports = lodash.exports;
   const protein_letters = "ACDEFGHIKLMNPQRSTVWY";
   const protein_letters_withUandX = "ACDEFGHIKLMNPQRSTVWYUX";
-  const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO.*-";
+  const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO";
   const ambiguous_dna_letters = "GATCRYWSMKHBVDN";
   const unambiguous_dna_letters = "GATC";
   const ambiguous_rna_letters = "GAUCRYWSMKHBVDN";
@@ -6058,7 +6058,7 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     Y: "Y",
     Z: "QE",
     "*": "\\*\\.",
-    ".": "\\.\\.",
+    ".": "\\.",
     "-": "\\-"
   };
   const bioData = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
@@ -12331,15 +12331,13 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     name,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   } = {}) {
     const acceptedChars = getAcceptedChars({
       isOligo,
       isProtein,
       isRna,
-      isMixedRnaAndDna,
-      includeStopCodon
+      isMixedRnaAndDna
     });
     const replaceChars = getReplaceChars({
       isOligo,
@@ -12389,10 +12387,9 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     isOligo,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   } = {}) {
-    return isProtein ? `${protein_letters_withUandX.toLowerCase()}${includeStopCodon ? "*." : ""}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
+    return isProtein ? `${extended_protein_letters.toLowerCase()}}` : isOligo ? ambiguous_rna_letters.toLowerCase() + "t" : isRna ? ambiguous_rna_letters.toLowerCase() + "t" : isMixedRnaAndDna ? ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase() : (
       //just plain old dna
       ambiguous_rna_letters.toLowerCase() + ambiguous_dna_letters.toLowerCase()
     );
@@ -12404,9 +12401,12 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     isRna,
     isMixedRnaAndDna
   } = {}) {
-    return isProtein ? {} : isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
-      //just plain old dna
-      {}
+    return isProtein ? {} : (
+      // {".": "*"}
+      isOligo ? {} : isRna ? { t: "u" } : isMixedRnaAndDna ? {} : (
+        //just plain old dna
+        {}
+      )
     );
   }
   __name(getReplaceChars, "getReplaceChars");
@@ -12546,7 +12546,7 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     const {
       annotationsAsObjects,
       logMessages,
-      removeUnwantedChars,
+      doNotRemoveInvalidChars,
       additionalValidChars,
       noTranslationData,
       doNotProvideIdsForAnnotations,
@@ -12580,11 +12580,9 @@ var __name = (target, value) => __defProp(target, "name", { value, configurable:
     if (seqData.isRna) {
       seqData.sequence = seqData.sequence.replace(/t/gi, "u");
     }
-    if (removeUnwantedChars) {
+    if (!doNotRemoveInvalidChars) {
       if (seqData.isProtein) {
-        const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({
-          includeStopCodon: true
-        }, topLevelSeqData || seqData));
+        const [newSeq] = filterSequenceString(seqData.proteinSequence, __spreadValues({}, topLevelSeqData || seqData));
         seqData.proteinSequence = newSeq;
       } else {
         const [newSeq] = filterSequenceString(seqData.sequence, __spreadValues({

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@teselagen/sequence-utils",
-  "version": "0.3.9",
+  "version": "0.3.11",
   "dependencies": {
     "@teselagen/range-utils": "0.3.7",
     "bson-objectid": "^2.0.4",

package/src/bioData.js CHANGED Viewed

@@ -2,8 +2,7 @@
 export const protein_letters = "ACDEFGHIKLMNPQRSTVWY";
 export const protein_letters_withUandX = "ACDEFGHIKLMNPQRSTVWYUX";
-export const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO.*-";
+export const extended_protein_letters = "ACDEFGHIKLMNPQRSTVWYBXZJUO";
 export const ambiguous_dna_letters = "GATCRYWSMKHBVDN";
 export const unambiguous_dna_letters = "GATC";
 export const ambiguous_rna_letters = "GAUCRYWSMKHBVDN";
@@ -61,6 +60,6 @@ export const extended_protein_values = {
   Y: "Y",
   Z: "QE",
   "*": "\\*\\.",
-  ".": "\\.\\.",
+  ".": "\\.",
   "-": "\\-"
 };

package/src/filterSequenceString.js CHANGED Viewed

@@ -1,7 +1,7 @@
 import {
   ambiguous_dna_letters,
   ambiguous_rna_letters,
-  protein_letters_withUandX
+  extended_protein_letters
 } from "./bioData";
 export default function filterSequenceString(
@@ -12,16 +12,14 @@ export default function filterSequenceString(
     name,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   } = {}
 ) {
   const acceptedChars = getAcceptedChars({
     isOligo,
     isProtein,
     isRna,
-    isMixedRnaAndDna,
-    includeStopCodon
+    isMixedRnaAndDna
   });
   const replaceChars = getReplaceChars({
     isOligo,
@@ -82,13 +80,10 @@ export function getAcceptedChars({
   isOligo,
   isProtein,
   isRna,
-  isMixedRnaAndDna,
-  includeStopCodon
+  isMixedRnaAndDna
 } = {}) {
   return isProtein
-    ? `${protein_letters_withUandX.toLowerCase()}${
-        includeStopCodon ? "*." : ""
-      }}`
+    ? `${extended_protein_letters.toLowerCase()}}`
     : isOligo
     ? ambiguous_rna_letters.toLowerCase() + "t"
     : isRna
@@ -106,7 +101,8 @@ export function getReplaceChars({
 } = {}) {
   return isProtein
     ? {}
-    : isOligo
+    : // {".": "*"}
+    isOligo
     ? {}
     : isRna
     ? { t: "u" }

package/src/filterSequenceString.test.js CHANGED Viewed

@@ -49,10 +49,11 @@ describe("filterSequenceString", () => {
         isProtein: true
       }
     );
+    // expect(warnings[0]).toBe(`Replaced "." with "*" 2 times`);
     expect(warnings[0]).toBe(
-      'Invalid character(s) detected and removed: b, b, b, 3, 4, 2, ", ", ", ,, ,, ., ., / '
+      'Invalid character(s) detected and removed: 3, 4, 2, ", ", ", ,, ,, ., ., / '
     );
-    expect(str).toBe("xtgalmfwkqespvicyhrnd");
+    expect(str).toBe("bbbxtgalmfwkqespvicyhrnd");
   });
   it("when isProtein: true, should handle upper case letters", () => {
     const [str, warnings] = filterSequenceString("xtgalmfWKQEspvicyhrnd", {
@@ -61,12 +62,27 @@ describe("filterSequenceString", () => {
     expect(warnings.length).toBe(0);
     expect(str).toBe("xtgalmfWKQEspvicyhrnd");
   });
-  it("when isProtein: true, should handle the option to includeStopCodon by allowing periods", () => {
-    const [str] = filterSequenceString('bbb342"""xtgalmfwkqespvicyhrnd,,../', {
-      isProtein: true,
-      includeStopCodon: true
-    });
-    expect(str).toBe("xtgalmfwkqespvicyhrnd..");
+  it("when isProtein: true it should not filter this aa seq", () => {
+    const [str] = filterSequenceString(
+      "mhhhhhhgsgsmledlkrqvleanlalpkhnlasgssghvsavdrergvfviapsgvdfrimtaddmvvvsietgevvegekppaedtpthrllyqafpsiggivhthsrhatiwaqagqsipatgtthadhfygtipctrkmtdaeingeyewetgnvivetfekqgidaaqmpgvlvhshgpfawgknaedavhnaivleevaymgifcrqlapqlpdmqqtllnkhylrkhgakayygq",
+      {
+        isProtein: true
+      }
+    );
+    expect(str).toBe(
+      `mhhhhhhgsgsmledlkrqvleanlalpkhnlasgssghvsavdrergvfviapsgvdfrimtaddmvvvsietgevvegekppaedtpthrllyqafpsiggivhthsrhatiwaqagqsipatgtthadhfygtipctrkmtdaeingeyewetgnvivetfekqgidaaqmpgvlvhshgpfawgknaedavhnaivleevaymgifcrqlapqlpdmqqtllnkhylrkhgakayygq`
+    );
+  });
+  it("when isProtein: true, it should convert . to *", () => {
+    const [str] = filterSequenceString(
+      'BXZJUO*bbb342"""xtgalbmfwkqespvicyhrnd,,../',
+      {
+        isProtein: true
+      }
+    );
+    expect(str).toBe("BXZJUObbbxtgalbmfwkqespvicyhrnd");
   });
 });

package/src/insertSequenceDataAtPositionOrRange.test.js CHANGED Viewed

@@ -135,7 +135,7 @@ describe("insertSequenceData", () => {
   });
   it("inserts characters at correct origin spanning range with {maintainOriginSplit: true} option", () => {
     const sequenceToInsert = {
-      sequence: "xrrrrry",
+      sequence: "crrrrry",
       //         fffffff
       features: [{ name: "feat1", start: 0, end: 6 }]
     };
@@ -154,7 +154,7 @@ describe("insertSequenceData", () => {
         maintainOriginSplit: true
       }
     );
-    postInsertSeq.sequence.should.equal("rrrryagagaxr");
+    postInsertSeq.sequence.should.equal("rrrryagagacr");
     //                                   fffff fff ff
     postInsertSeq.features.should.containSubset([
       { name: "feat1", start: 10, end: 4 },

package/src/tidyUpSequenceData.js CHANGED Viewed

@@ -13,7 +13,7 @@ export default function tidyUpSequenceData(pSeqData, options = {}) {
   const {
     annotationsAsObjects,
     logMessages,
-    removeUnwantedChars,
+    doNotRemoveInvalidChars,
     additionalValidChars,
     noTranslationData,
     doNotProvideIdsForAnnotations,
@@ -52,10 +52,9 @@ export default function tidyUpSequenceData(pSeqData, options = {}) {
     //flip all t's to u's
     seqData.sequence = seqData.sequence.replace(/t/gi, "u");
   }
-  if (removeUnwantedChars) {
+  if (!doNotRemoveInvalidChars) {
     if (seqData.isProtein) {
       const [newSeq] = filterSequenceString(seqData.proteinSequence, {
-        includeStopCodon: true,
         ...(topLevelSeqData || seqData)
       });
       seqData.proteinSequence = newSeq;

package/src/tidyUpSequenceData.test.js CHANGED Viewed

@@ -5,29 +5,26 @@ import chaiSubset from "chai-subset";
 chai.use(chaiSubset);
 chai.should();
 describe("tidyUpSequenceData", () => {
-  it("should remove unwanted chars if passed that option, while handling annotation start,end (and location start,end) truncation correctly", () => {
-    const res = tidyUpSequenceData(
-      {
-        sequence: "http://localhost:3344/Standalone",
-        features: [
-          {
-            start: 3,
-            end: 20,
-            locations: [
-              {
-                start: "3", //this should be converted to an int :)
-                end: 5
-              },
-              {
-                start: 10,
-                end: 20
-              }
-            ]
-          }
-        ]
-      },
-      { removeUnwantedChars: true }
-    );
+  it("should remove invalid chars by default, while handling annotation start,end (and location start,end) truncation correctly", () => {
+    const res = tidyUpSequenceData({
+      sequence: "http://localhost:3344/Standalone",
+      features: [
+        {
+          start: 3,
+          end: 20,
+          locations: [
+            {
+              start: "3", //this should be converted to an int :)
+              end: 5
+            },
+            {
+              start: 10,
+              end: 20
+            }
+          ]
+        }
+      ]
+    });
     res.should.containSubset({
       sequence: "httcahstStandan",
       circular: false,
@@ -49,15 +46,6 @@ describe("tidyUpSequenceData", () => {
       ]
     });
   });
-  // const res = tidyUpSequenceData(
-  //   {
-  //     isProtein: true,
-  //     circular: true,
-  //     proteinSequence: "gagiuhwgagalasjglj*.",
-  //     features: [{ start: 3, end: 10 }, { start: 10, end: 20 }]
-  //   },
-  //   { convertAnnotationsFromAAIndices: true, removeUnwantedChars: true }
-  // );
   it("should handle a protein sequence being passed in with isProtein set to true", () => {
     const res = tidyUpSequenceData(
@@ -71,61 +59,16 @@ describe("tidyUpSequenceData", () => {
           { name: "iDon'tFit", start: 25, end: 35 }
         ]
       },
-      { convertAnnotationsFromAAIndices: true, removeUnwantedChars: true }
+      { convertAnnotationsFromAAIndices: true }
     );
     res.should.containSubset({
-      aminoAcidDataForEachBaseOfDNA: [
-        {
-          aminoAcid: {
-            value: ".",
-            name: "Gap",
-            threeLettersName: "Gap"
-          },
-          positionInCodon: 0,
-          aminoAcidIndex: 17,
-          sequenceIndex: 51,
-          codonRange: {
-            start: 51,
-            end: 53
-          },
-          fullCodon: true
-        },
-        {
-          aminoAcid: {
-            value: ".",
-            name: "Gap",
-            threeLettersName: "Gap"
-          },
-          positionInCodon: 1,
-          aminoAcidIndex: 17,
-          sequenceIndex: 52,
-          codonRange: {
-            start: 51,
-            end: 53
-          },
-          fullCodon: true
-        },
-        {
-          aminoAcid: {
-            value: ".",
-            name: "Gap",
-            threeLettersName: "Gap"
-          },
-          positionInCodon: 2,
-          aminoAcidIndex: 17,
-          sequenceIndex: 53,
-          codonRange: {
-            start: 51,
-            end: 53
-          },
-          fullCodon: true
-        }
-      ],
+      aminoAcidDataForEachBaseOfDNA: [],
       isProtein: true,
       size: 54, //size should refer to the DNA length
       proteinSize: 18, //proteinSize should refer to the amino acid length
-      sequence: "ggngcnggnathtgacaytggggngcnggngcnytngcnwsnggnytntrr...", //degenerate sequence
-      proteinSequence: "gagiuhwgagalasgl*.",
+      sequence: "ggngcnggnathtgacaytggggngcnggngcnytngcnwsnhtnggnytnhtn", //degenerate sequence
+      proteinSequence: "gagiuhwgagalasjglj",
       circular: false,
       features: [
         { start: 9, end: 32, forward: true },