opencloning 0.3.8__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "sequences": [
3
3
  {
4
- "id": 2,
4
+ "id": 1,
5
5
  "type": "TextFileSequence",
6
6
  "sequence_file_format": "genbank",
7
7
  "overhang_crick_3prime": 0,
@@ -9,7 +9,7 @@
9
9
  "file_content": "LOCUS pHEE401E 17112 bp DNA circular SYN 25-AUG-2024\nDEFINITION Egg cell-specific promoter-controlled expression of\n 3\u00d7FLAG-NLS-zCas9-NLS. Contains gRNA scaffold for insertion of target\n sequence (U6-26 promoter), Hyg resistance.\nACCESSION .\nVERSION .\nKEYWORDS .\nSOURCE synthetic DNA construct\n ORGANISM synthetic DNA construct\n .\nREFERENCE 1 (bases 1 to 17112)\n AUTHORS Wang ZP, Xing HL, Dong L, Zhang HY, Han CY, Wang XC, Chen QJ\n TITLE Egg cell-specific promoter-controlled CRISPR/Cas9 efficiently\n generates homozygous mutants for multiple target genes in\n Arabidopsis in a single generation.\n JOURNAL Genome Biol. 2015 Jul 21;16:144. doi: 10.1186/s13059-015-0715-0.\n PUBMED 26193878\nREFERENCE 2 (bases 1 to 17112)\n AUTHORS .\n TITLE Direct Submission\n JOURNAL Exported Aug 25, 2024 from SnapGene Server 7.0.3\n https://www.snapgene.com\nCOMMENT SGRef: number: 1; type: \"Journal Article\"; journalName: \"Genome\n Biol.\"; date: \"2015-07-21\"; volume: \"16:144. doi\"; pages: \"\n 10.1186/s13059-015-0715-0\"\nFEATURES Location/Qualifiers\n source 1..17112\n /mol_type=\"other DNA\"\n /organism=\"synthetic DNA construct\"\n promoter 104..780\n /label=\"CaMV 35S promoter (enhanced)\"\n /note=\"cauliflower mosaic virus 35S promoter with a\n duplicated enhancer region\"\n primer_bind 717..737\n /label=\"35S promoter\"\n /note=\"CaMV 35S promoter, forward primer\"\n CDS 847..1872\n /codon_start=1\n /product=\"hygromycin B phosphotransferase\"\n /label=\"HygR\"\n /note=\"confers resistance to hygromycin\"\n /translation=\"MKKPELTATSVEKFLIEKFDSVSDLMQLSEGEESRAFSFDVGGRG\n YVLRVNSCADGFYKDRYVYRHFASAALPIPEVLDIGEFSESLTYCISRRSQGVTLQDLP\n ETELPAVLQPVAEAMDAIAAADLSQTSGFGPFGPQGIGQYTTWRDFICAIADPHVYHWQ\n TVMDDTVSASVAQALDELMLWAEDCPEVRHLVHADFGSNNVLTDNGRITAVIDWSEAMF\n GDSQYEVANIFFWRPWLACMEQQTRYFERRHPELAGSPRLRAYMLRIGLDQLYQSLVDG\n NFDDAAWAQGRCDAIVRSGAGTVGRTQIARRSAAVWTDGCVEVLADSGNRRPSTRPRAK\n K\"\n polyA_signal 1913..2087\n /label=\"CaMV poly(A) signal\"\n /note=\"cauliflower mosaic virus polyadenylation signal\"\n misc_feature 2165..2189\n /label=\"LB T-DNA repeat\"\n /note=\"left border repeat from nopaline C58 T-DNA\"\n CDS 2614..3408\n /codon_start=1\n /gene=\"aphA-3\"\n /product=\"aminoglycoside phosphotransferase\"\n /label=\"KanR\"\n /note=\"confers resistance to kanamycin\"\n /translation=\"MAKMRISPELKKLIEKYRCVKDTEGMSPAKVYKLVGENENLYLKM\n TDSRYKGTTYDVEREKDMMLWLEGKLPVPKVLHFERHDGWSNLLMSEADGVLCSEEYED\n EQSPEKIIELYAECIRLFHSIDISDCPYTNSLDSRLAELDYLLNNDLADVDCENWEEDT\n PFKDPRELYDFLKTEKPEEELVFSHGDLGDSNIFVKDGKVSGFIDLGRSGRADKWYDIA\n FCVRSIREDIGEEQYVELFFDLLGIKPDWEKIKYYILLDELF\"\n rep_origin 3495..4083\n /direction=RIGHT\n /label=\"ori\"\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n primer_bind 3984..4003\n /label=\"pBR322ori-F\"\n /note=\"pBR322 origin, forward primer\"\n primer_bind 4237..4254\n /label=\"L4440\"\n /note=\"L4440 vector, forward primer\"\n misc_feature 4269..4409\n /label=\"bom\"\n /note=\"basis of mobility region from pBR322\"\n primer_bind complement(4335..4354)\n /label=\"pRS-marker\"\n /note=\"pRS vectors, use to sequence yeast selectable\n marker\"\n primer_bind 4495..4517\n /label=\"pGEX 3'\"\n /note=\"pGEX vectors, reverse primer\"\n rep_origin 4753..4947\n /label=\"pVS1 oriV\"\n /note=\"origin of replication for the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n CDS complement(5013..6086)\n /codon_start=1\n /product=\"replication protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 RepA\"\n /translation=\"MSGRKPSGPVQIGAALGDDLVEKLKAAQAAQRQRIEAEARPGESW\n QAAADRIRKESRQPPAAGAPSIRKPPKGDEQPDFFVPMLYDVGTRDSRSIMDVAVFRLS\n KRDRRAGEVIRYELPDGHVEVSAGPAGMASVWDYDLVLMAVSHLTESMNRYREGKGDKP\n GRVFRPHVADVLKFCRRADGGKQKDDLVETCIRLNTTHVAMQRTKKAKNGRLVTVSEGE\n ALISRYKIVKSETGRPEYIEIELADWMYREITEGKNPDVLTVHPDYFLIDPGIGRFLYR\n LARRAAGKAEARWLFKTIYERSGSAGEFKKFCFTVRKLIGSNDLPEYDLKEEAGQAGPI\n LVMRYRNLIEGEASAGS\"\n CDS complement(6515..7144)\n /codon_start=1\n /product=\"stability protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 StaA\"\n /translation=\"MKVIAVLNQKGGSGKTTIATHLARALQLAGADVLLVDSDPQGSAR\n DWAAVREDQPLTVVGIDRPTIDRDVKAIGRRDFVVIDGAPQAADLAVSAIKAADFVLIP\n VQPSPYDIWATADLVELVKQRIEVTDGRLQAAFVVSRAIKGTRIGGEVAEALAGYELPI\n LESRITQRVSYPGTAAAGTTVLESEPEGDAAREVQALAAEIKSKLI\"\n misc_feature 8445..8469\n /label=\"RB T-DNA repeat\"\n /note=\"right border repeat from nopaline C58 T-DNA\"\n primer_bind 8657..8679\n /label=\"M13/pUC Forward\"\n /note=\"In lacZ gene\"\n primer_bind 8671..8688\n /label=\"M13 Forward\"\n /note=\"In lacZ gene. Also called M13-F20 or M13 (-21)\n Forward\"\n primer_bind 8672..8688\n /label=\"M13 fwd\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n CDS 9401..10192\n /codon_start=1\n /gene=\"aadA\"\n /product=\"aminoglycoside adenylyltransferase (Murphy,\n 1985)\"\n /label=\"SmR\"\n /note=\"confers resistance to spectinomycin and\n streptomycin\"\n /translation=\"MGEAVIAEVSTQLSEVVGVIERHLEPTLLAVHLYGSAVDGGLKPH\n SDIDLLVTVTVRLDETTRRALINDLLETSASPGESEILRAVEVTIVVHDDIIPWRYPAK\n RELQFGEWQRNDILAGIFEPATIDIDLAILLTKAREHSVALVGPAAEELFDPVPEQDLF\n EALNETLTLWNSPPDWAGDERNVVLTLSRIWYSAVTGKIAPKDVAADWAMERLPAQYQP\n VILEARQAYLGQEEDRLASRADQLEEFVHYVKGEITKVVGK\"\n misc_RNA 10344..10419\n /label=\"gRNA scaffold\"\n /note=\"guide RNA scaffold for the Streptococcus pyogenes\n CRISPR/Cas9 system\"\n CDS 11989..12054\n /codon_start=1\n /product=\"three tandem FLAG(R) epitope tags, followed by an\n enterokinase cleavage site\"\n /label=\"3xFLAG\"\n /translation=\"DYKDHDGDYKDHDIDYKDDDDK\"\n CDS 12061..12081\n /codon_start=1\n /product=\"nuclear localization signal of SV40 (simian virus\n 40) large T antigen\"\n /label=\"SV40 NLS\"\n /translation=\"PKKKRKV\"\n CDS 12106..16206\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n CDS 12106..16206\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n RBS 16119..16127\n /label=\"Shine-Dalgarno sequence\"\n /note=\"full consensus sequence for ribosome-binding sites\n upstream of start codons in E. coli; complementary to a\n region in the 3' end of the 16S rRNA (Chen et al., 1994)\"\n CDS 16207..16254\n /codon_start=1\n /product=\"bipartite nuclear localization signal from\n nucleoplasmin\"\n /label=\"nucleoplasmin NLS\"\n /translation=\"KRPAATKKAGQAKKKK\"\n primer_bind complement(16911..16927)\n /label=\"M13 rev\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n primer_bind complement(16911..16927)\n /label=\"M13 Reverse\"\n /note=\"In lacZ gene. Also called M13-rev\"\n primer_bind complement(16924..16946)\n /label=\"M13/pUC Reverse\"\n /note=\"In lacZ gene\"\n protein_bind 16935..16951\n /label=\"lac operator\"\n /bound_moiety=\"lac repressor encoded by lacI\"\n /note=\"The lac repressor binds to the lac operator to\n inhibit transcription in E. coli. This inhibition can be\n relieved by adding lactose or\n isopropyl-beta-D-thiogalactopyranoside (IPTG).\"\n promoter complement(16959..16989)\n /label=\"lac promoter\"\n /note=\"promoter for the E. coli lac operon\"\n protein_bind 17004..17025\n /label=\"CAP binding site\"\n /bound_moiety=\"E. coli catabolite activator protein\"\n /note=\"CAP binding activates transcription in the presence\n of cAMP.\"\nORIGIN\n 1 ggtttgcgta ttggctagag cagcttgcca acatggtgga gcacgacact ctcgtctact\n 61 ccaagaatat caaagataca gtctcagaag accaaagggc tattgagact tttcaacaaa\n 121 gggtaatatc gggaaacctc ctcggattcc attgcccagc tatctgtcac ttcatcaaaa\n 181 ggacagtaga aaaggaaggt ggcacctaca aatgccatca ttgcgataaa ggaaaggcta\n 241 tcgttcaaga tgcctctgcc gacagtggtc ccaaagatgg acccccaccc acgaggagca\n 301 tcgtggaaaa agaagacgtt ccaaccacgt cttcaaagca agtggattga tgtgaacatg\n 361 gtggagcacg acactctcgt ctactccaag aatatcaaag atacagtctc agaagaccaa\n 421 agggctattg agacttttca acaaagggta atatcgggaa acctcctcgg attccattgc\n 481 ccagctatct gtcacttcat caaaaggaca gtagaaaagg aaggtggcac ctacaaatgc\n 541 catcattgcg ataaaggaaa ggctatcgtt caagatgcct ctgccgacag tggtcccaaa\n 601 gatggacccc cacccacgag gagcatcgtg gaaaaagaag acgttccaac cacgtcttca\n 661 aagcaagtgg attgatgtga tatctccact gacgtaaggg atgacgcaca atcccactat\n 721 ccttcgcaag acccttcctc tatataagga agttcatttc atttggagag gacacgctga\n 781 aatcaccagt ctctctctac aaatctatct ctctcgagct ttcgcagatc cggggggcaa\n 841 tgagatatga aaaagcctga actcaccgcg acgtctgtcg agaagtttct gatcgaaaag\n 901 ttcgacagcg tctccgacct gatgcagctc tcggagggcg aagaatctcg tgctttcagc\n 961 ttcgatgtag gagggcgtgg atatgtcctg cgggtaaata gctgcgccga tggtttctac\n 1021 aaagatcgtt atgtttatcg gcactttgca tcggccgcgc tcccgattcc ggaagtgctt\n 1081 gacattgggg agtttagcga gagcctgacc tattgcatct cccgccgttc acagggtgtc\n 1141 acgttgcaag acctgcctga aaccgaactg cccgctgttc tacaaccggt cgcggaggct\n 1201 atggatgcga tcgctgcggc cgatcttagc cagacgagcg ggttcggccc attcggaccg\n 1261 caaggaatcg gtcaatacac tacatggcgt gatttcatat gcgcgattgc tgatccccat\n 1321 gtgtatcact ggcaaactgt gatggacgac accgtcagtg cgtccgtcgc gcaggctctc\n 1381 gatgagctga tgctttgggc cgaggactgc cccgaagtcc ggcacctcgt gcacgcggat\n 1441 ttcggctcca acaatgtcct gacggacaat ggccgcataa cagcggtcat tgactggagc\n 1501 gaggcgatgt tcggggattc ccaatacgag gtcgccaaca tcttcttctg gaggccgtgg\n 1561 ttggcttgta tggagcagca gacgcgctac ttcgagcgga ggcatccgga gcttgcagga\n 1621 tcgccacgac tccgggcgta tatgctccgc attggtcttg accaactcta tcagagcttg\n 1681 gttgacggca atttcgatga tgcagcttgg gcgcagggtc gatgcgacgc aatcgtccga\n 1741 tccggagccg ggactgtcgg gcgtacacaa atcgcccgca gaagcgcggc cgtctggacc\n 1801 gatggctgtg tagaagtact cgccgatagt ggaaaccgac gccccagcac tcgtccgagg\n 1861 gcaaagaaat agagtagatg ccgaccggga tctgtcgatc gacaagctcg agtttctcca\n 1921 taataatgtg tgagtagttc ccagataagg gaattagggt tcctataggg tttcgctcat\n 1981 gtgttgagca tataagaaac ccttagtatg tatttgtatt tgtaaaatac ttctatcaat\n 2041 aaaatttcta attcctaaaa ccaaaatcca gtactaaaat ccagatcccc cgaattaatt\n 2101 cggcgttaat tcagtacatt aaaaacgtcc gcaatgtgtt attaagttgt ctaagcgtca\n 2161 atttgtttac accacaatat atcctgccac cagccagcca acagctcccc gaccggcagc\n 2221 tcggcacaaa atcaccactc gatacaggca gcccatcagt ccgggacggc gtcagcggga\n 2281 gagccgttgt aaggcggcag actttgctca tgttaccgat gctattcgga agaacggcaa\n 2341 ctaagctgcc gggtttgaaa cacggatgat ctcgcggagg gtagcatgtt gattgtaacg\n 2401 atgacagagc gttgctgcct gtgatcaccg cggtttcaaa atcggctccg tcgatactat\n 2461 gttatacgcc aactttgaaa acaactttga aaaagctgtt ttctggtatt taaggtttta\n 2521 gaatgcaagg aacagtgaat tggagttcgt cttgttataa ttagcttctt ggggtatctt\n 2581 taaatactgt agaaaagagg aaggaaataa taaatggcta aaatgagaat atcaccggaa\n 2641 ttgaaaaaac tgatcgaaaa ataccgctgc gtaaaagata cggaaggaat gtctcctgct\n 2701 aaggtatata agctggtggg agaaaatgaa aacctatatt taaaaatgac ggacagccgg\n 2761 tataaaggga ccacctatga tgtggaacgg gaaaaggaca tgatgctatg gctggaagga\n 2821 aagctgcctg ttccaaaggt cctgcacttt gaacggcatg atggctggag caatctgctc\n 2881 atgagtgagg ccgatggcgt cctttgctcg gaagagtatg aagatgaaca aagccctgaa\n 2941 aagattatcg agctgtatgc ggagtgcatc aggctctttc actccatcga catatcggat\n 3001 tgtccctata cgaatagctt agacagccgc ttagccgaat tggattactt actgaataac\n 3061 gatctggccg atgtggattg cgaaaactgg gaagaagaca ctccatttaa agatccgcgc\n 3121 gagctgtatg attttttaaa gacggaaaag cccgaagagg aacttgtctt ttcccacggc\n 3181 gacctgggag acagcaacat ctttgtgaaa gatggcaaag taagtggctt tattgatctt\n 3241 gggagaagcg gcagggcgga caagtggtat gacattgcct tctgcgtccg gtcgatcagg\n 3301 gaggatatcg gggaagaaca gtatgtcgag ctattttttg acttactggg gatcaagcct\n 3361 gattgggaga aaataaaata ttatatttta ctggatgaat tgttttagta cctagaatgc\n 3421 atgaccaaaa tcccttaacg tgagttttcg ttccactgag cgtcagaccc cgtagaaaag\n 3481 atcaaaggat cttcttgaga tccttttttt ctgcgcgtaa tctgctgctt gcaaacaaaa\n 3541 aaaccaccgc taccagcggt ggtttgtttg ccggatcaag agctaccaac tctttttccg\n 3601 aaggtaactg gcttcagcag agcgcagata ccaaatactg tccttctagt gtagccgtag\n 3661 ttaggccacc acttcaagaa ctctgtagca ccgcctacat acctcgctct gctaatcctg\n 3721 ttaccagtgg ctgctgccag tggcgataag tcgtgtctta ccgggttgga ctcaagacga\n 3781 tagttaccgg ataaggcgca gcggtcgggc tgaacggggg gttcgtgcac acagcccagc\n 3841 ttggagcgaa cgacctacac cgaactgaga tacctacagc gtgagctatg agaaagcgcc\n 3901 acgcttcccg aagggagaaa ggcggacagg tatccggtaa gcggcagggt cggaacagga\n 3961 gagcgcacga gggagcttcc agggggaaac gcctggtatc tttatagtcc tgtcgggttt\n 4021 cgccacctct gacttgagcg tcgatttttg tgatgctcgt caggggggcg gagcctatgg\n 4081 aaaaacgcca gcaacgcggc ctttttacgg ttcctggcct tttgctggcc ttttgctcac\n 4141 atgttctttc ctgcgttatc ccctgattct gtggataacc gtattaccgc ctttgagtga\n 4201 gctgataccg ctcgccgcag ccgaacgacc gagcgcagcg agtcagtgag cgaggaagcg\n 4261 gaagagcgcc tgatgcggta ttttctcctt acgcatctgt gcggtatttc acaccgcata\n 4321 tggtgcactc tcagtacaat ctgctctgat gccgcatagt taagccagta tacactccgc\n 4381 tatcgctacg tgactgggtc atggctgcgc cccgacaccc gccaacaccc gctgacgcgc\n 4441 cctgacgggc ttgtctgctc ccggcatccg cttacagaca agctgtgacc gtctccggga\n 4501 gctgcatgtg tcagaggttt tcaccgtcat caccgaaacg cgcgaggcag ggtgccttga\n 4561 tgtgggcgcc ggcggtcgag tggcgacggc gcggcttgtc cgcgccctgg tagattgcct\n 4621 ggccgtaggc cagccatttt tgagcggcca gcggccgcga taggccgacg cgaagcggcg\n 4681 gggcgtaggg agcgcagcga ccgaagggta ggcgcttttt gcagctcttc ggctgtgcgc\n 4741 tggccagaca gttatgcaca ggccaggcgg gttttaagag ttttaataag ttttaaagag\n 4801 ttttaggcgg aaaaatcgcc ttttttctct tttatatcag tcacttacat gtgtgaccgg\n 4861 ttcccaatgt acggctttgg gttcccaatg tacgggttcc ggttcccaat gtacggcttt\n 4921 gggttcccaa tgtacgtgct atccacagga aacagacctt ttcgaccttt ttcccctgct\n 4981 agggcaattt gccctagcat ctgctccgta cattaggaac cggcggatgc ttcgccctcg\n 5041 atcaggttgc ggtagcgcat gactaggatc gggccagcct gccccgcctc ctccttcaaa\n 5101 tcgtactccg gcaggtcatt tgacccgatc agcttgcgca cggtgaaaca gaacttcttg\n 5161 aactctccgg cgctgccact gcgttcgtag atcgtcttga acaaccatct ggcttctgcc\n 5221 ttgcctgcgg cgcggcgtgc caggcggtag agaaaacggc cgatgccggg atcgatcaaa\n 5281 aagtaatcgg ggtgaaccgt cagcacgtcc gggttcttgc cttctgtgat ctcgcggtac\n 5341 atccaatcag ctagctcgat ctcgatgtac tccggccgcc cggtttcgct ctttacgatc\n 5401 ttgtagcggc taatcaaggc ttcaccctcg gataccgtca ccaggcggcc gttcttggcc\n 5461 ttcttcgtac gctgcatggc aacgtgcgtg gtgtttaacc gaatgcaggt ttctaccagg\n 5521 tcgtctttct gctttccgcc atcggctcgc cggcagaact tgagtacgtc cgcaacgtgt\n 5581 ggacggaaca cgcggccggg cttgtctccc ttcccttccc ggtatcggtt catggattcg\n 5641 gttagatggg aaaccgccat cagtaccagg tcgtaatccc acacactggc catgccggcc\n 5701 ggccctgcgg aaacctctac gtgcccgtct ggaagctcgt agcggatcac ctcgccagct\n 5761 cgtcggtcac gcttcgacag acggaaaacg gccacgtcca tgatgctgcg actatcgcgg\n 5821 gtgcccacgt catagagcat cggaacgaaa aaatctggtt gctcgtcgcc cttgggcggc\n 5881 ttcctaatcg acggcgcacc ggctgccggc ggttgccggg attctttgcg gattcgatca\n 5941 gcggccgctt gccacgattc accggggcgt gcttctgcct cgatgcgttg ccgctgggcg\n 6001 gcctgcgcgg ccttcaactt ctccaccagg tcatcaccca gcgccgcgcc gatttgtacc\n 6061 gggccggatg gtttgcgacc gctcacgccg attcctcggg cttgggggtt ccagtgccat\n 6121 tgcagggccg gcaggcaacc cagccgctta cgcctggcca accgcccgtt cctccacaca\n 6181 tggggcattc cacggcgtcg gtgcctggtt gttcttgatt ttccatgccg cctcctttag\n 6241 ccgctaaaat tcatctactc atttattcat ttgctcattt actctggtag ctgcgcgatg\n 6301 tattcagata gcagctcggt aatggtcttg ccttggcgta ccgcgtacat cttcagcttg\n 6361 gtgtgatcct ccgccggcaa ctgaaagttg acccgcttca tggctggcgt gtctgccagg\n 6421 ctggccaacg ttgcagcctt gctgctgcgt gcgctcggac ggccggcact tagcgtgttt\n 6481 gtgcttttgc tcattttctc tttacctcat taactcaaat gagttttgat ttaatttcag\n 6541 cggccagcgc ctggacctcg cgggcagcgt cgccctcggg ttctgattca agaacggttg\n 6601 tgccggcggc ggcagtgcct gggtagctca cgcgctgcgt gatacgggac tcaagaatgg\n 6661 gcagctcgta cccggccagc gcctcggcaa cctcaccgcc gatgcgcgtg cctttgatcg\n 6721 cccgcgacac gacaaaggcc gcttgtagcc ttccatccgt gacctcaatg cgctgcttaa\n 6781 ccagctccac caggtcggcg gtggcccata tgtcgtaagg gcttggctgc accggaatca\n 6841 gcacgaagtc ggctgccttg atcgcggaca cagccaagtc cgccgcctgg ggcgctccgt\n 6901 cgatcactac gaagtcgcgc cggccgatgg ccttcacgtc gcggtcaatc gtcgggcggt\n 6961 cgatgccgac aacggttagc ggttgatctt cccgcacggc cgcccaatcg cgggcactgc\n 7021 cctggggatc ggaatcgact aacagaacat cggccccggc gagttgcagg gcgcgggcta\n 7081 gatgggttgc gatggtcgtc ttgcctgacc cgcctttctg gttaagtaca gcgataacct\n 7141 tcatgcgttc cccttgcgta tttgtttatt tactcatcgc atcatatacg cagcgaccgc\n 7201 atgacgcaag ctgttttact caaatacaca tcaccttttt agacggcggc gctcggtttc\n 7261 ttcagcggcc aagctggccg gccaggccgc cagcttggca tcagacaaac cggccaggat\n 7321 ttcatgcagc cgcacggttg agacgtgcgc gggcggctcg aacacgtacc cggccgcgat\n 7381 catctccgcc tcgatctctt cggtaatgaa aaacggttcg tcctggccgt cctggtgcgg\n 7441 tttcatgctt gttcctcttg gcgttcattc tcggcggccg ccagggcgtc ggcctcggtc\n 7501 aatgcgtcct cacggaaggc accgcgccgc ctggcctcgg tgggcgtcac ttcctcgctg\n 7561 cgctcaagtg cgcggtacag ggtcgagcga tgcacgccaa gcagtgcagc cgcctctttc\n 7621 acggtgcggc cttcctggtc gatcagctcg cgggcgtgcg cgatctgtgc cggggtgagg\n 7681 gtagggcggg ggccaaactt cacgcctcgg gccttggcgg cctcgcgccc gctccgggtg\n 7741 cggtcgatga ttagggaacg ctcgaactcg gcaatgccgg cgaacacggt caacaccatg\n 7801 cggccggccg gcgtggtggt gtcggcccac ggctctgcca ggctacgcag gcccgcgccg\n 7861 gcctcctgga tgcgctcggc aatgtccagt aggtcgcggg tgctgcgggc caggcggtct\n 7921 agcctggtca ctgtcacaac gtcgccaggg cgtaggtggt caagcatcct ggccagctcc\n 7981 gggcggtcgc gcctggtgcc ggtgatcttc tcggaaaaca gcttggtgca gccggccgcg\n 8041 tgcagttcgg cccgttggtt ggtcaagtcc tggtcgtcgg tgctgacgcg ggcatagccc\n 8101 agcaggccag cggcggcgct cttgttcatg gcgtaatgtc tccggttcta gtcgcaagta\n 8161 ttctacttta tgcgactaaa acacgcgaca agaaaacgcc aggaaaaggg cagggcggca\n 8221 gcctgtcgcg taacttagga cttgtgcgac atgtcgtttt cagaagacgg ctgcactgaa\n 8281 cgtcagaagc cgactgcact atagcagcgg aggggttgga tcaaagtact ttgatcccga\n 8341 ggggaaccct gtggttggca tgcacataca aatggacgaa cggataaacc ttttcacgcc\n 8401 cttttaaata tccgattatt ctaataaacg ctcttttctc ttaggtttac ccgccaatat\n 8461 atcctgtcaa acactgatag tttaaactga aggcgggaaa cgacaatctg atccaagctc\n 8521 aagctgctct agcattcgcc attcaggctg cgcaactgtt gggaagggcg atcggtgcgg\n 8581 gcctcttcgc tattacgcca gctggcgaaa gggggatgtg ctgcaaggcg attaagttgg\n 8641 gtaacgccag ggttttccca gtcacgacgt tgtaaaacga cggccagtgc caagcttcga\n 8701 cttgccttcc gcacaataca tcatttcttc ttagcttttt ttcttcttct tcgttcatac\n 8761 agtttttttt tgtttatcag cttacatttt cttgaaccgt agctttcgtt ttcttctttt\n 8821 taactttcca ttcggagttt ttgtatcttg tttcatagtt tgtcccagga ttagaatgat\n 8881 taggcatcga accttcaaga atttgattga ataaaacatc ttcattctta agatatgaag\n 8941 ataatcttca aaaggcccct gggaatctga aagaagagaa gcaggcccat ttatatggga\n 9001 aagaacaata gtatttctta tataggccca tttaagttga aaacaatctt caaaagtccc\n 9061 acatcgctta gataagaaaa cgaagctgag tttatataca gctagagtcg aagtagtgat\n 9121 tgggagacca acccagtgga cataagcctg ttcggttcgt aagctgtaat gcaagtagcg\n 9181 tatgcgctca cgcaactggt ccagaacctt gaccgaacgc agcggtggta acggcgcagt\n 9241 ggcggttttc atggcttgtt atgactgttt ttttggggta cagtctatgc ctcgggcatc\n 9301 caagcagcaa gcgcgttacg ccgtgggtcg atgtttgatg ttatggagca gcaacgatgt\n 9361 tacgcagcag ggcagtcgcc ctaaaacaaa gttaaacatc atgggggaag cggtgatcgc\n 9421 cgaagtatcg actcaactat cagaggtagt tggcgtcatc gagcgccatc tcgaaccgac\n 9481 gttgctggcc gtacatttgt acggctccgc agtggatggc ggcctgaagc cacacagtga\n 9541 tattgatttg ctggttacgg tgaccgtaag gcttgatgaa acaacgcggc gagctttgat\n 9601 caacgacctt ttggaaactt cggcttcccc tggagagagc gagattctcc gcgctgtaga\n 9661 agtcaccatt gttgtgcacg acgacatcat tccgtggcgt tatccagcta agcgcgaact\n 9721 gcaatttgga gaatggcagc gcaatgacat tcttgcaggt atcttcgagc cagccacgat\n 9781 cgacattgat ctggctatct tgctgacaaa agcaagagaa catagcgttg ccttggtagg\n 9841 tccagcggcg gaggaactct ttgatccggt tcctgaacag gatctatttg aggcgctaaa\n 9901 tgaaacctta acgctatgga actcgccgcc cgactgggct ggcgatgagc gaaatgtagt\n 9961 gcttacgttg tcccgcattt ggtacagcgc agtaaccggc aaaatcgcgc cgaaggatgt\n 10021 cgctgccgac tgggcaatgg agcgcctgcc ggcccagtat cagcccgtca tacttgaagc\n 10081 tagacaggct tatcttggac aagaagaaga tcgcttggcc tcgcgcgcag atcagttgga\n 10141 agaatttgtc cactacgtga aaggcgagat caccaaggta gtcggcaaat aatgtctagc\n 10201 tagaaattcg ttcaagccga cgccgcttcg cggcgcggct taactcaagc gttagatgca\n 10261 ctaagcacat aattgctcac agccaaacta tcaggtcaag tctgctttta ttatttttaa\n 10321 gcgtgcataa taagccggtc tcggttttag agctagaaat agcaagttaa aataaggcta\n 10381 gtccgttatc aacttgaaaa agtggcaccg agtcggtgct tttttttgca aaattttcca\n 10441 gatcgatttc ttcttcctct gttcttcggc gttcaatttc tggggttttc tcttcgtttt\n 10501 ctgtaactga aacctaaaat ttgacctaaa aaaaatctca aataatatga ttcagtggtt\n 10561 ttgtactttt cagttagttg agttttgcag ttccgatgag ataaaccaat accatggtta\n 10621 tactagtgaa taaaagcatt tgcgtttggt ttatcattgc gtttatacaa ggacagagat\n 10681 ccactgagct ggaatagctt aaaaccatta tcagaacaaa ataaaccatt ttttgttaag\n 10741 aatcagagca tagtaaacaa cagaaacaac ctaagagagg taacttgtcc aagaagatag\n 10801 ctaattatat ctattttata aaagttatca tagtttgtaa gtcacaaaag atgcaaataa\n 10861 cagagaaact aggagacttg agaatataca ttcttgtata tttgtattcg agattgtgaa\n 10921 aatttgacca taagtttaaa ttcttaaaaa gatatatctg atctaggtga tggttataga\n 10981 ctgtaatttt accacatgtt taatgatgga tagtgacaca catgacacat cgacaacact\n 11041 atagcatctt atttagatta caacatgaaa tttttctgta atacatgtct ttgtacataa\n 11101 tttaaaagta attcctaaga aatatattta tacaaggagt ttaaagaaaa catagcataa\n 11161 agttcaatga gtagtaaaaa ccatatacag tatatagcat aaagttcaat gagtttatta\n 11221 caaaagcatt ggttcacttt ctgtaacacg acgttaaacc ttcgtctcca ataggagcgc\n 11281 tactgattca acatgccaat atatactaaa tacgtttcta cagtcaaatg ctttaacgtt\n 11341 tcatgattaa gtgactattt accgtcaatc ctttcccatt cctcccacta atccaacttt\n 11401 ttaattactc ttaaatcacc actaagctag taacgcctat catgaattag ctctactaaa\n 11461 tctagcaacc tttcaaattt gcagtattgc aggtgtctct gtgtctttaa aatagttgcc\n 11521 ttatgatttc ttcggtttca agatgatcaa atagttatag atttcatgct cacacatgct\n 11581 cattagatgt gtacatactt tacttaccca aatctatttt ctcgcaaaga ttttgatggt\n 11641 aaagctgatt tggttctatt gaactaaatc aaacgagttt cagactgagt gattctaatc\n 11701 cggcccatta gcccctaaac agacccacta attacgcagc ttttaataga gtaattacac\n 11761 ctagtttacc cactaaacca ctaagcacta attatctcac aatctaatga gcttccctcg\n 11821 taattacttg ggctttcact ctaccattta tttgtaacag tcaagtctct actgtctcta\n 11881 tataaactct ctaaagttaa cacacaattc tcatcacaaa caaatcaacc aaagcaactt\n 11941 ctactctttc ttctttcgac cttatcaatc tgttgagaaa tctagatgga ttacaaggac\n 12001 cacgacgggg attacaagga ccacgacatt gattacaagg atgatgatga caagatggct\n 12061 ccgaagaaga agaggaaggt tggcatccac ggggtgccag ctgctgacaa gaagtactcg\n 12121 atcggcctcg atattgggac taactctgtt ggctgggccg tgatcaccga cgagtacaag\n 12181 gtgccctcaa agaagttcaa ggtcctgggc aacaccgatc ggcattccat caagaagaat\n 12241 ctcattggcg ctctcctgtt cgacagcggc gagacggctg aggctacgcg gctcaagcgc\n 12301 accgcccgca ggcggtacac gcgcaggaag aatcgcatct gctacctgca ggagattttc\n 12361 tccaacgaga tggcgaaggt tgacgattct ttcttccaca ggctggagga gtcattcctc\n 12421 gtggaggagg ataagaagca cgagcggcat ccaatcttcg gcaacattgt cgacgaggtt\n 12481 gcctaccacg agaagtaccc tacgatctac catctgcgga agaagctcgt ggactccaca\n 12541 gataaggcgg acctccgcct gatctacctc gctctggccc acatgattaa gttcaggggc\n 12601 catttcctga tcgaggggga tctcaacccg gacaatagcg atgttgacaa gctgttcatc\n 12661 cagctcgtgc agacgtacaa ccagctcttc gaggagaacc ccattaatgc gtcaggcgtc\n 12721 gacgcgaagg ctatcctgtc cgctaggctc tcgaagtctc ggcgcctcga gaacctgatc\n 12781 gcccagctgc cgggcgagaa gaagaacggc ctgttcggga atctcattgc gctcagcctg\n 12841 gggctcacgc ccaacttcaa gtcgaatttc gatctcgctg aggacgccaa gctgcagctc\n 12901 tccaaggaca catacgacga tgacctggat aacctcctgg cccagatcgg cgatcagtac\n 12961 gcggacctgt tcctcgctgc caagaatctg tcggacgcca tcctcctgtc tgatattctc\n 13021 agggtgaaca ccgagattac gaaggctccg ctctcagcct ccatgatcaa gcgctacgac\n 13081 gagcaccatc aggatctgac cctcctgaag gcgctggtca ggcagcagct ccccgagaag\n 13141 tacaaggaga tcttcttcga tcagtcgaag aacggctacg ctgggtacat tgacggcggg\n 13201 gcctctcagg aggagttcta caagttcatc aagccgattc tggagaagat ggacggcacg\n 13261 gaggagctgc tggtgaagct caatcgcgag gacctcctga ggaagcagcg gacattcgat\n 13321 aacggcagca tcccacacca gattcatctc ggggagctgc acgctatcct gaggaggcag\n 13381 gaggacttct accctttcct caaggataac cgcgagaaga tcgagaagat tctgactttc\n 13441 aggatcccgt actacgtcgg cccactcgct aggggcaact cccgcttcgc ttggatgacc\n 13501 cgcaagtcag aggagacgat cacgccgtgg aacttcgagg aggtggtcga caagggcgct\n 13561 agcgctcagt cgttcatcga gaggatgacg aatttcgaca agaacctgcc aaatgagaag\n 13621 gtgctcccta agcactcgct cctgtacgag tacttcacag tctacaacga gctgactaag\n 13681 gtgaagtatg tgaccgaggg catgaggaag ccggctttcc tgtctgggga gcagaagaag\n 13741 gccatcgtgg acctcctgtt caagaccaac cggaaggtca cggttaagca gctcaaggag\n 13801 gactacttca agaagattga gtgcttcgat tcggtcgaga tctctggcgt tgaggaccgc\n 13861 ttcaacgcct ccctggggac ctaccacgat ctcctgaaga tcattaagga taaggacttc\n 13921 ctggacaacg aggagaatga ggatatcctc gaggacattg tgctgacact cactctgttc\n 13981 gaggaccggg agatgatcga ggagcgcctg aagacttacg cccatctctt cgatgacaag\n 14041 gtcatgaagc agctcaagag gaggaggtac accggctggg ggaggctgag caggaagctc\n 14101 atcaacggca ttcgggacaa gcagtccggg aagacgatcc tcgacttcct gaagagcgat\n 14161 ggcttcgcga accgcaattt catgcagctg attcacgatg acagcctcac attcaaggag\n 14221 gatatccaga aggctcaggt gagcggccag ggggactcgc tgcacgagca tatcgcgaac\n 14281 ctcgctggct cgccagctat caagaagggg attctgcaga ccgtgaaggt tgtggacgag\n 14341 ctggtgaagg tcatgggcag gcacaagcct gagaacatcg tcattgagat ggcccgggag\n 14401 aatcagacca cgcagaaggg ccagaagaac tcacgcgaga ggatgaagag gatcgaggag\n 14461 ggcattaagg agctggggtc ccagatcctc aaggagcacc cggtggagaa cacgcagctg\n 14521 cagaatgaga agctctacct gtactacctc cagaatggcc gcgatatgta tgtggaccag\n 14581 gagctggata ttaacaggct cagcgattac gacgtcgatc atatcgttcc acagtcattc\n 14641 ctgaaggatg actccattga caacaaggtc ctcaccaggt cggacaagaa ccggggcaag\n 14701 tctgataatg ttccttcaga ggaggtcgtt aagaagatga agaactactg gcgccagctc\n 14761 ctgaatgcca agctgatcac gcagcggaag ttcgataacc tcacaaaggc tgagaggggc\n 14821 gggctctctg agctggacaa ggcgggcttc atcaagaggc agctggtcga gacacggcag\n 14881 atcactaagc acgttgcgca gattctcgac tcacggatga acactaagta cgatgagaat\n 14941 gacaagctga tccgcgaggt gaaggtcatc accctgaagt caaagctcgt ctccgacttc\n 15001 aggaaggatt tccagttcta caaggttcgg gagatcaaca attaccacca tgcccatgac\n 15061 gcgtacctga acgcggtggt cggcacagct ctgatcaaga agtacccaaa gctcgagagc\n 15121 gagttcgtgt acggggacta caaggtttac gatgtgagga agatgatcgc caagtcggag\n 15181 caggagattg gcaaggctac cgccaagtac ttcttctact ctaacattat gaatttcttc\n 15241 aagacagaga tcactctggc caatggcgag atccggaagc gccccctcat cgagacgaac\n 15301 ggcgagacgg gggagatcgt gtgggacaag ggcagggatt tcgcgaccgt caggaaggtt\n 15361 ctctccatgc cacaagtgaa tatcgtcaag aagacagagg tccagactgg cgggttctct\n 15421 aaggagtcaa ttctgcctaa gcggaacagc gacaagctca tcgcccgcaa gaaggactgg\n 15481 gatccgaaga agtacggcgg gttcgacagc cccactgtgg cctactcggt cctggttgtg\n 15541 gcgaaggttg agaagggcaa gtccaagaag ctcaagagcg tgaaggagct gctggggatc\n 15601 acgattatgg agcgctccag cttcgagaag aacccgatcg atttcctgga ggcgaagggc\n 15661 tacaaggagg tgaagaagga cctgatcatt aagctcccca agtactcact cttcgagctg\n 15721 gagaacggca ggaagcggat gctggcttcc gctggcgagc tgcagaaggg gaacgagctg\n 15781 gctctgccgt ccaagtatgt gaacttcctc tacctggcct cccactacga gaagctcaag\n 15841 ggcagccccg aggacaacga gcagaagcag ctgttcgtcg agcagcacaa gcattacctc\n 15901 gacgagatca ttgagcagat ttccgagttc tccaagcgcg tgatcctggc cgacgcgaat\n 15961 ctggataagg tcctctccgc gtacaacaag caccgcgaca agccaatcag ggagcaggct\n 16021 gagaatatca ttcatctctt caccctgacg aacctcggcg cccctgctgc tttcaagtac\n 16081 ttcgacacaa ctatcgatcg caagaggtac acaagcacta aggaggtcct ggacgcgacc\n 16141 ctcatccacc agtcgattac cggcctctac gagacgcgca tcgacctgtc tcagctcggg\n 16201 ggcgacaagc ggccagcggc gacgaagaag gcggggcagg cgaagaagaa gaagtgagct\n 16261 cagagctttc gttcgtatca tcggtttcga caacgttcgt caagttcaat gcatcagttt\n 16321 cattgcgcac acaccagaat cctactgagt ttgagtatta tggcattggg aaaactgttt\n 16381 ttcttgtacc atttgttgtg cttgtaattt actgtgtttt ttattcggtt ttcgctatcg\n 16441 aactgtgaaa tggaaatgga tggagaagag ttaatgaatg atatggtcct tttgttcatt\n 16501 ctcaaattaa tattatttgt tttttctctt atttgttgtg tgttgaattt gaaattataa\n 16561 gagatatgca aacattttgt tttgagtaaa aatgtgtcaa atcgtggcct ctaatgaccg\n 16621 aagttaatat gaggagtaaa acacttgtag ttgtaccatt atgcttattc actaggcaac\n 16681 aaatatattt tcagacctag aaaagctgca aatgttactg aatacaagta tgtcctcttg\n 16741 tgttttagac atttatgaac tttcctttat gtaattttcc agaatccttg tcagattcta\n 16801 atcattgctt tataattata gttatactca tggatttgta gttgagtatg aaaatatttt\n 16861 ttaatgcatt ttatgacttg ccaattgatt gacaacgaat tcgtaatcat gtcatagctg\n 16921 tttcctgtgt gaaattgtta tccgctcaca attccacaca acatacgagc cggaagcata\n 16981 aagtgtaaag cctggggtgc ctaatgagtg agctaactca cattaattgc gttgcgctca\n 17041 ctgcccgctt tccagtcggg aaacctgtcg tgccagctgc attaatgaat cggccaacgc\n 17101 gcggggagag gc\n//"
10
10
  },
11
11
  {
12
- "id": 4,
12
+ "id": 2,
13
13
  "type": "TextFileSequence",
14
14
  "sequence_file_format": "genbank",
15
15
  "overhang_crick_3prime": 0,
@@ -17,7 +17,7 @@
17
17
  "file_content": "LOCUS pHEE401E 17112 bp DNA circular SYN 25-AUG-2024\nDEFINITION Egg cell-specific promoter-controlled expression of\n 3\u00d7FLAG-NLS-zCas9-NLS. Contains gRNA scaffold for insertion of target\n sequence (U6-26 promoter), Hyg resistance.\nACCESSION .\nVERSION .\nKEYWORDS .\nSOURCE synthetic DNA construct\n ORGANISM synthetic DNA construct\n .\nREFERENCE 1 (bases 1 to 17112)\n AUTHORS Wang ZP, Xing HL, Dong L, Zhang HY, Han CY, Wang XC, Chen QJ\n TITLE Egg cell-specific promoter-controlled CRISPR/Cas9 efficiently\n generates homozygous mutants for multiple target genes in\n Arabidopsis in a single generation.\n JOURNAL Genome Biol. 2015 Jul 21;16:144. doi: 10.1186/s13059-015-0715-0.\n PUBMED 26193878\nREFERENCE 2 (bases 1 to 17112)\n AUTHORS .\n TITLE Direct Submission\n JOURNAL Exported Aug 25, 2024 from SnapGene Server 7.0.3\n https://www.snapgene.com\nCOMMENT SGRef: number: 1; type: \"Journal Article\"; journalName: \"Genome\n Biol.\"; date: \"2015-07-21\"; volume: \"16:144. doi\"; pages: \"\n 10.1186/s13059-015-0715-0\"\nFEATURES Location/Qualifiers\n source 1..17112\n /mol_type=\"other DNA\"\n /organism=\"synthetic DNA construct\"\n promoter 104..780\n /label=\"CaMV 35S promoter (enhanced)\"\n /note=\"cauliflower mosaic virus 35S promoter with a\n duplicated enhancer region\"\n primer_bind 717..737\n /label=\"35S promoter\"\n /note=\"CaMV 35S promoter, forward primer\"\n CDS 847..1872\n /codon_start=1\n /product=\"hygromycin B phosphotransferase\"\n /label=\"HygR\"\n /note=\"confers resistance to hygromycin\"\n /translation=\"MKKPELTATSVEKFLIEKFDSVSDLMQLSEGEESRAFSFDVGGRG\n YVLRVNSCADGFYKDRYVYRHFASAALPIPEVLDIGEFSESLTYCISRRSQGVTLQDLP\n ETELPAVLQPVAEAMDAIAAADLSQTSGFGPFGPQGIGQYTTWRDFICAIADPHVYHWQ\n TVMDDTVSASVAQALDELMLWAEDCPEVRHLVHADFGSNNVLTDNGRITAVIDWSEAMF\n GDSQYEVANIFFWRPWLACMEQQTRYFERRHPELAGSPRLRAYMLRIGLDQLYQSLVDG\n NFDDAAWAQGRCDAIVRSGAGTVGRTQIARRSAAVWTDGCVEVLADSGNRRPSTRPRAK\n K\"\n polyA_signal 1913..2087\n /label=\"CaMV poly(A) signal\"\n /note=\"cauliflower mosaic virus polyadenylation signal\"\n misc_feature 2165..2189\n /label=\"LB T-DNA repeat\"\n /note=\"left border repeat from nopaline C58 T-DNA\"\n CDS 2614..3408\n /codon_start=1\n /gene=\"aphA-3\"\n /product=\"aminoglycoside phosphotransferase\"\n /label=\"KanR\"\n /note=\"confers resistance to kanamycin\"\n /translation=\"MAKMRISPELKKLIEKYRCVKDTEGMSPAKVYKLVGENENLYLKM\n TDSRYKGTTYDVEREKDMMLWLEGKLPVPKVLHFERHDGWSNLLMSEADGVLCSEEYED\n EQSPEKIIELYAECIRLFHSIDISDCPYTNSLDSRLAELDYLLNNDLADVDCENWEEDT\n PFKDPRELYDFLKTEKPEEELVFSHGDLGDSNIFVKDGKVSGFIDLGRSGRADKWYDIA\n FCVRSIREDIGEEQYVELFFDLLGIKPDWEKIKYYILLDELF\"\n rep_origin 3495..4083\n /direction=RIGHT\n /label=\"ori\"\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n primer_bind 3984..4003\n /label=\"pBR322ori-F\"\n /note=\"pBR322 origin, forward primer\"\n primer_bind 4237..4254\n /label=\"L4440\"\n /note=\"L4440 vector, forward primer\"\n misc_feature 4269..4409\n /label=\"bom\"\n /note=\"basis of mobility region from pBR322\"\n primer_bind complement(4335..4354)\n /label=\"pRS-marker\"\n /note=\"pRS vectors, use to sequence yeast selectable\n marker\"\n primer_bind 4495..4517\n /label=\"pGEX 3'\"\n /note=\"pGEX vectors, reverse primer\"\n rep_origin 4753..4947\n /label=\"pVS1 oriV\"\n /note=\"origin of replication for the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n CDS complement(5013..6086)\n /codon_start=1\n /product=\"replication protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 RepA\"\n /translation=\"MSGRKPSGPVQIGAALGDDLVEKLKAAQAAQRQRIEAEARPGESW\n QAAADRIRKESRQPPAAGAPSIRKPPKGDEQPDFFVPMLYDVGTRDSRSIMDVAVFRLS\n KRDRRAGEVIRYELPDGHVEVSAGPAGMASVWDYDLVLMAVSHLTESMNRYREGKGDKP\n GRVFRPHVADVLKFCRRADGGKQKDDLVETCIRLNTTHVAMQRTKKAKNGRLVTVSEGE\n ALISRYKIVKSETGRPEYIEIELADWMYREITEGKNPDVLTVHPDYFLIDPGIGRFLYR\n LARRAAGKAEARWLFKTIYERSGSAGEFKKFCFTVRKLIGSNDLPEYDLKEEAGQAGPI\n LVMRYRNLIEGEASAGS\"\n CDS complement(6515..7144)\n /codon_start=1\n /product=\"stability protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 StaA\"\n /translation=\"MKVIAVLNQKGGSGKTTIATHLARALQLAGADVLLVDSDPQGSAR\n DWAAVREDQPLTVVGIDRPTIDRDVKAIGRRDFVVIDGAPQAADLAVSAIKAADFVLIP\n VQPSPYDIWATADLVELVKQRIEVTDGRLQAAFVVSRAIKGTRIGGEVAEALAGYELPI\n LESRITQRVSYPGTAAAGTTVLESEPEGDAAREVQALAAEIKSKLI\"\n misc_feature 8445..8469\n /label=\"RB T-DNA repeat\"\n /note=\"right border repeat from nopaline C58 T-DNA\"\n primer_bind 8657..8679\n /label=\"M13/pUC Forward\"\n /note=\"In lacZ gene\"\n primer_bind 8671..8688\n /label=\"M13 Forward\"\n /note=\"In lacZ gene. Also called M13-F20 or M13 (-21)\n Forward\"\n primer_bind 8672..8688\n /label=\"M13 fwd\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n CDS 9401..10192\n /codon_start=1\n /gene=\"aadA\"\n /product=\"aminoglycoside adenylyltransferase (Murphy,\n 1985)\"\n /label=\"SmR\"\n /note=\"confers resistance to spectinomycin and\n streptomycin\"\n /translation=\"MGEAVIAEVSTQLSEVVGVIERHLEPTLLAVHLYGSAVDGGLKPH\n SDIDLLVTVTVRLDETTRRALINDLLETSASPGESEILRAVEVTIVVHDDIIPWRYPAK\n RELQFGEWQRNDILAGIFEPATIDIDLAILLTKAREHSVALVGPAAEELFDPVPEQDLF\n EALNETLTLWNSPPDWAGDERNVVLTLSRIWYSAVTGKIAPKDVAADWAMERLPAQYQP\n VILEARQAYLGQEEDRLASRADQLEEFVHYVKGEITKVVGK\"\n misc_RNA 10344..10419\n /label=\"gRNA scaffold\"\n /note=\"guide RNA scaffold for the Streptococcus pyogenes\n CRISPR/Cas9 system\"\n CDS 11989..12054\n /codon_start=1\n /product=\"three tandem FLAG(R) epitope tags, followed by an\n enterokinase cleavage site\"\n /label=\"3xFLAG\"\n /translation=\"DYKDHDGDYKDHDIDYKDDDDK\"\n CDS 12061..12081\n /codon_start=1\n /product=\"nuclear localization signal of SV40 (simian virus\n 40) large T antigen\"\n /label=\"SV40 NLS\"\n /translation=\"PKKKRKV\"\n CDS 12106..16206\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n CDS 12106..16206\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n RBS 16119..16127\n /label=\"Shine-Dalgarno sequence\"\n /note=\"full consensus sequence for ribosome-binding sites\n upstream of start codons in E. coli; complementary to a\n region in the 3' end of the 16S rRNA (Chen et al., 1994)\"\n CDS 16207..16254\n /codon_start=1\n /product=\"bipartite nuclear localization signal from\n nucleoplasmin\"\n /label=\"nucleoplasmin NLS\"\n /translation=\"KRPAATKKAGQAKKKK\"\n primer_bind complement(16911..16927)\n /label=\"M13 rev\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n primer_bind complement(16911..16927)\n /label=\"M13 Reverse\"\n /note=\"In lacZ gene. Also called M13-rev\"\n primer_bind complement(16924..16946)\n /label=\"M13/pUC Reverse\"\n /note=\"In lacZ gene\"\n protein_bind 16935..16951\n /label=\"lac operator\"\n /bound_moiety=\"lac repressor encoded by lacI\"\n /note=\"The lac repressor binds to the lac operator to\n inhibit transcription in E. coli. This inhibition can be\n relieved by adding lactose or\n isopropyl-beta-D-thiogalactopyranoside (IPTG).\"\n promoter complement(16959..16989)\n /label=\"lac promoter\"\n /note=\"promoter for the E. coli lac operon\"\n protein_bind 17004..17025\n /label=\"CAP binding site\"\n /bound_moiety=\"E. coli catabolite activator protein\"\n /note=\"CAP binding activates transcription in the presence\n of cAMP.\"\nORIGIN\n 1 ggtttgcgta ttggctagag cagcttgcca acatggtgga gcacgacact ctcgtctact\n 61 ccaagaatat caaagataca gtctcagaag accaaagggc tattgagact tttcaacaaa\n 121 gggtaatatc gggaaacctc ctcggattcc attgcccagc tatctgtcac ttcatcaaaa\n 181 ggacagtaga aaaggaaggt ggcacctaca aatgccatca ttgcgataaa ggaaaggcta\n 241 tcgttcaaga tgcctctgcc gacagtggtc ccaaagatgg acccccaccc acgaggagca\n 301 tcgtggaaaa agaagacgtt ccaaccacgt cttcaaagca agtggattga tgtgaacatg\n 361 gtggagcacg acactctcgt ctactccaag aatatcaaag atacagtctc agaagaccaa\n 421 agggctattg agacttttca acaaagggta atatcgggaa acctcctcgg attccattgc\n 481 ccagctatct gtcacttcat caaaaggaca gtagaaaagg aaggtggcac ctacaaatgc\n 541 catcattgcg ataaaggaaa ggctatcgtt caagatgcct ctgccgacag tggtcccaaa\n 601 gatggacccc cacccacgag gagcatcgtg gaaaaagaag acgttccaac cacgtcttca\n 661 aagcaagtgg attgatgtga tatctccact gacgtaaggg atgacgcaca atcccactat\n 721 ccttcgcaag acccttcctc tatataagga agttcatttc atttggagag gacacgctga\n 781 aatcaccagt ctctctctac aaatctatct ctctcgagct ttcgcagatc cggggggcaa\n 841 tgagatatga aaaagcctga actcaccgcg acgtctgtcg agaagtttct gatcgaaaag\n 901 ttcgacagcg tctccgacct gatgcagctc tcggagggcg aagaatctcg tgctttcagc\n 961 ttcgatgtag gagggcgtgg atatgtcctg cgggtaaata gctgcgccga tggtttctac\n 1021 aaagatcgtt atgtttatcg gcactttgca tcggccgcgc tcccgattcc ggaagtgctt\n 1081 gacattgggg agtttagcga gagcctgacc tattgcatct cccgccgttc acagggtgtc\n 1141 acgttgcaag acctgcctga aaccgaactg cccgctgttc tacaaccggt cgcggaggct\n 1201 atggatgcga tcgctgcggc cgatcttagc cagacgagcg ggttcggccc attcggaccg\n 1261 caaggaatcg gtcaatacac tacatggcgt gatttcatat gcgcgattgc tgatccccat\n 1321 gtgtatcact ggcaaactgt gatggacgac accgtcagtg cgtccgtcgc gcaggctctc\n 1381 gatgagctga tgctttgggc cgaggactgc cccgaagtcc ggcacctcgt gcacgcggat\n 1441 ttcggctcca acaatgtcct gacggacaat ggccgcataa cagcggtcat tgactggagc\n 1501 gaggcgatgt tcggggattc ccaatacgag gtcgccaaca tcttcttctg gaggccgtgg\n 1561 ttggcttgta tggagcagca gacgcgctac ttcgagcgga ggcatccgga gcttgcagga\n 1621 tcgccacgac tccgggcgta tatgctccgc attggtcttg accaactcta tcagagcttg\n 1681 gttgacggca atttcgatga tgcagcttgg gcgcagggtc gatgcgacgc aatcgtccga\n 1741 tccggagccg ggactgtcgg gcgtacacaa atcgcccgca gaagcgcggc cgtctggacc\n 1801 gatggctgtg tagaagtact cgccgatagt ggaaaccgac gccccagcac tcgtccgagg\n 1861 gcaaagaaat agagtagatg ccgaccggga tctgtcgatc gacaagctcg agtttctcca\n 1921 taataatgtg tgagtagttc ccagataagg gaattagggt tcctataggg tttcgctcat\n 1981 gtgttgagca tataagaaac ccttagtatg tatttgtatt tgtaaaatac ttctatcaat\n 2041 aaaatttcta attcctaaaa ccaaaatcca gtactaaaat ccagatcccc cgaattaatt\n 2101 cggcgttaat tcagtacatt aaaaacgtcc gcaatgtgtt attaagttgt ctaagcgtca\n 2161 atttgtttac accacaatat atcctgccac cagccagcca acagctcccc gaccggcagc\n 2221 tcggcacaaa atcaccactc gatacaggca gcccatcagt ccgggacggc gtcagcggga\n 2281 gagccgttgt aaggcggcag actttgctca tgttaccgat gctattcgga agaacggcaa\n 2341 ctaagctgcc gggtttgaaa cacggatgat ctcgcggagg gtagcatgtt gattgtaacg\n 2401 atgacagagc gttgctgcct gtgatcaccg cggtttcaaa atcggctccg tcgatactat\n 2461 gttatacgcc aactttgaaa acaactttga aaaagctgtt ttctggtatt taaggtttta\n 2521 gaatgcaagg aacagtgaat tggagttcgt cttgttataa ttagcttctt ggggtatctt\n 2581 taaatactgt agaaaagagg aaggaaataa taaatggcta aaatgagaat atcaccggaa\n 2641 ttgaaaaaac tgatcgaaaa ataccgctgc gtaaaagata cggaaggaat gtctcctgct\n 2701 aaggtatata agctggtggg agaaaatgaa aacctatatt taaaaatgac ggacagccgg\n 2761 tataaaggga ccacctatga tgtggaacgg gaaaaggaca tgatgctatg gctggaagga\n 2821 aagctgcctg ttccaaaggt cctgcacttt gaacggcatg atggctggag caatctgctc\n 2881 atgagtgagg ccgatggcgt cctttgctcg gaagagtatg aagatgaaca aagccctgaa\n 2941 aagattatcg agctgtatgc ggagtgcatc aggctctttc actccatcga catatcggat\n 3001 tgtccctata cgaatagctt agacagccgc ttagccgaat tggattactt actgaataac\n 3061 gatctggccg atgtggattg cgaaaactgg gaagaagaca ctccatttaa agatccgcgc\n 3121 gagctgtatg attttttaaa gacggaaaag cccgaagagg aacttgtctt ttcccacggc\n 3181 gacctgggag acagcaacat ctttgtgaaa gatggcaaag taagtggctt tattgatctt\n 3241 gggagaagcg gcagggcgga caagtggtat gacattgcct tctgcgtccg gtcgatcagg\n 3301 gaggatatcg gggaagaaca gtatgtcgag ctattttttg acttactggg gatcaagcct\n 3361 gattgggaga aaataaaata ttatatttta ctggatgaat tgttttagta cctagaatgc\n 3421 atgaccaaaa tcccttaacg tgagttttcg ttccactgag cgtcagaccc cgtagaaaag\n 3481 atcaaaggat cttcttgaga tccttttttt ctgcgcgtaa tctgctgctt gcaaacaaaa\n 3541 aaaccaccgc taccagcggt ggtttgtttg ccggatcaag agctaccaac tctttttccg\n 3601 aaggtaactg gcttcagcag agcgcagata ccaaatactg tccttctagt gtagccgtag\n 3661 ttaggccacc acttcaagaa ctctgtagca ccgcctacat acctcgctct gctaatcctg\n 3721 ttaccagtgg ctgctgccag tggcgataag tcgtgtctta ccgggttgga ctcaagacga\n 3781 tagttaccgg ataaggcgca gcggtcgggc tgaacggggg gttcgtgcac acagcccagc\n 3841 ttggagcgaa cgacctacac cgaactgaga tacctacagc gtgagctatg agaaagcgcc\n 3901 acgcttcccg aagggagaaa ggcggacagg tatccggtaa gcggcagggt cggaacagga\n 3961 gagcgcacga gggagcttcc agggggaaac gcctggtatc tttatagtcc tgtcgggttt\n 4021 cgccacctct gacttgagcg tcgatttttg tgatgctcgt caggggggcg gagcctatgg\n 4081 aaaaacgcca gcaacgcggc ctttttacgg ttcctggcct tttgctggcc ttttgctcac\n 4141 atgttctttc ctgcgttatc ccctgattct gtggataacc gtattaccgc ctttgagtga\n 4201 gctgataccg ctcgccgcag ccgaacgacc gagcgcagcg agtcagtgag cgaggaagcg\n 4261 gaagagcgcc tgatgcggta ttttctcctt acgcatctgt gcggtatttc acaccgcata\n 4321 tggtgcactc tcagtacaat ctgctctgat gccgcatagt taagccagta tacactccgc\n 4381 tatcgctacg tgactgggtc atggctgcgc cccgacaccc gccaacaccc gctgacgcgc\n 4441 cctgacgggc ttgtctgctc ccggcatccg cttacagaca agctgtgacc gtctccggga\n 4501 gctgcatgtg tcagaggttt tcaccgtcat caccgaaacg cgcgaggcag ggtgccttga\n 4561 tgtgggcgcc ggcggtcgag tggcgacggc gcggcttgtc cgcgccctgg tagattgcct\n 4621 ggccgtaggc cagccatttt tgagcggcca gcggccgcga taggccgacg cgaagcggcg\n 4681 gggcgtaggg agcgcagcga ccgaagggta ggcgcttttt gcagctcttc ggctgtgcgc\n 4741 tggccagaca gttatgcaca ggccaggcgg gttttaagag ttttaataag ttttaaagag\n 4801 ttttaggcgg aaaaatcgcc ttttttctct tttatatcag tcacttacat gtgtgaccgg\n 4861 ttcccaatgt acggctttgg gttcccaatg tacgggttcc ggttcccaat gtacggcttt\n 4921 gggttcccaa tgtacgtgct atccacagga aacagacctt ttcgaccttt ttcccctgct\n 4981 agggcaattt gccctagcat ctgctccgta cattaggaac cggcggatgc ttcgccctcg\n 5041 atcaggttgc ggtagcgcat gactaggatc gggccagcct gccccgcctc ctccttcaaa\n 5101 tcgtactccg gcaggtcatt tgacccgatc agcttgcgca cggtgaaaca gaacttcttg\n 5161 aactctccgg cgctgccact gcgttcgtag atcgtcttga acaaccatct ggcttctgcc\n 5221 ttgcctgcgg cgcggcgtgc caggcggtag agaaaacggc cgatgccggg atcgatcaaa\n 5281 aagtaatcgg ggtgaaccgt cagcacgtcc gggttcttgc cttctgtgat ctcgcggtac\n 5341 atccaatcag ctagctcgat ctcgatgtac tccggccgcc cggtttcgct ctttacgatc\n 5401 ttgtagcggc taatcaaggc ttcaccctcg gataccgtca ccaggcggcc gttcttggcc\n 5461 ttcttcgtac gctgcatggc aacgtgcgtg gtgtttaacc gaatgcaggt ttctaccagg\n 5521 tcgtctttct gctttccgcc atcggctcgc cggcagaact tgagtacgtc cgcaacgtgt\n 5581 ggacggaaca cgcggccggg cttgtctccc ttcccttccc ggtatcggtt catggattcg\n 5641 gttagatggg aaaccgccat cagtaccagg tcgtaatccc acacactggc catgccggcc\n 5701 ggccctgcgg aaacctctac gtgcccgtct ggaagctcgt agcggatcac ctcgccagct\n 5761 cgtcggtcac gcttcgacag acggaaaacg gccacgtcca tgatgctgcg actatcgcgg\n 5821 gtgcccacgt catagagcat cggaacgaaa aaatctggtt gctcgtcgcc cttgggcggc\n 5881 ttcctaatcg acggcgcacc ggctgccggc ggttgccggg attctttgcg gattcgatca\n 5941 gcggccgctt gccacgattc accggggcgt gcttctgcct cgatgcgttg ccgctgggcg\n 6001 gcctgcgcgg ccttcaactt ctccaccagg tcatcaccca gcgccgcgcc gatttgtacc\n 6061 gggccggatg gtttgcgacc gctcacgccg attcctcggg cttgggggtt ccagtgccat\n 6121 tgcagggccg gcaggcaacc cagccgctta cgcctggcca accgcccgtt cctccacaca\n 6181 tggggcattc cacggcgtcg gtgcctggtt gttcttgatt ttccatgccg cctcctttag\n 6241 ccgctaaaat tcatctactc atttattcat ttgctcattt actctggtag ctgcgcgatg\n 6301 tattcagata gcagctcggt aatggtcttg ccttggcgta ccgcgtacat cttcagcttg\n 6361 gtgtgatcct ccgccggcaa ctgaaagttg acccgcttca tggctggcgt gtctgccagg\n 6421 ctggccaacg ttgcagcctt gctgctgcgt gcgctcggac ggccggcact tagcgtgttt\n 6481 gtgcttttgc tcattttctc tttacctcat taactcaaat gagttttgat ttaatttcag\n 6541 cggccagcgc ctggacctcg cgggcagcgt cgccctcggg ttctgattca agaacggttg\n 6601 tgccggcggc ggcagtgcct gggtagctca cgcgctgcgt gatacgggac tcaagaatgg\n 6661 gcagctcgta cccggccagc gcctcggcaa cctcaccgcc gatgcgcgtg cctttgatcg\n 6721 cccgcgacac gacaaaggcc gcttgtagcc ttccatccgt gacctcaatg cgctgcttaa\n 6781 ccagctccac caggtcggcg gtggcccata tgtcgtaagg gcttggctgc accggaatca\n 6841 gcacgaagtc ggctgccttg atcgcggaca cagccaagtc cgccgcctgg ggcgctccgt\n 6901 cgatcactac gaagtcgcgc cggccgatgg ccttcacgtc gcggtcaatc gtcgggcggt\n 6961 cgatgccgac aacggttagc ggttgatctt cccgcacggc cgcccaatcg cgggcactgc\n 7021 cctggggatc ggaatcgact aacagaacat cggccccggc gagttgcagg gcgcgggcta\n 7081 gatgggttgc gatggtcgtc ttgcctgacc cgcctttctg gttaagtaca gcgataacct\n 7141 tcatgcgttc cccttgcgta tttgtttatt tactcatcgc atcatatacg cagcgaccgc\n 7201 atgacgcaag ctgttttact caaatacaca tcaccttttt agacggcggc gctcggtttc\n 7261 ttcagcggcc aagctggccg gccaggccgc cagcttggca tcagacaaac cggccaggat\n 7321 ttcatgcagc cgcacggttg agacgtgcgc gggcggctcg aacacgtacc cggccgcgat\n 7381 catctccgcc tcgatctctt cggtaatgaa aaacggttcg tcctggccgt cctggtgcgg\n 7441 tttcatgctt gttcctcttg gcgttcattc tcggcggccg ccagggcgtc ggcctcggtc\n 7501 aatgcgtcct cacggaaggc accgcgccgc ctggcctcgg tgggcgtcac ttcctcgctg\n 7561 cgctcaagtg cgcggtacag ggtcgagcga tgcacgccaa gcagtgcagc cgcctctttc\n 7621 acggtgcggc cttcctggtc gatcagctcg cgggcgtgcg cgatctgtgc cggggtgagg\n 7681 gtagggcggg ggccaaactt cacgcctcgg gccttggcgg cctcgcgccc gctccgggtg\n 7741 cggtcgatga ttagggaacg ctcgaactcg gcaatgccgg cgaacacggt caacaccatg\n 7801 cggccggccg gcgtggtggt gtcggcccac ggctctgcca ggctacgcag gcccgcgccg\n 7861 gcctcctgga tgcgctcggc aatgtccagt aggtcgcggg tgctgcgggc caggcggtct\n 7921 agcctggtca ctgtcacaac gtcgccaggg cgtaggtggt caagcatcct ggccagctcc\n 7981 gggcggtcgc gcctggtgcc ggtgatcttc tcggaaaaca gcttggtgca gccggccgcg\n 8041 tgcagttcgg cccgttggtt ggtcaagtcc tggtcgtcgg tgctgacgcg ggcatagccc\n 8101 agcaggccag cggcggcgct cttgttcatg gcgtaatgtc tccggttcta gtcgcaagta\n 8161 ttctacttta tgcgactaaa acacgcgaca agaaaacgcc aggaaaaggg cagggcggca\n 8221 gcctgtcgcg taacttagga cttgtgcgac atgtcgtttt cagaagacgg ctgcactgaa\n 8281 cgtcagaagc cgactgcact atagcagcgg aggggttgga tcaaagtact ttgatcccga\n 8341 ggggaaccct gtggttggca tgcacataca aatggacgaa cggataaacc ttttcacgcc\n 8401 cttttaaata tccgattatt ctaataaacg ctcttttctc ttaggtttac ccgccaatat\n 8461 atcctgtcaa acactgatag tttaaactga aggcgggaaa cgacaatctg atccaagctc\n 8521 aagctgctct agcattcgcc attcaggctg cgcaactgtt gggaagggcg atcggtgcgg\n 8581 gcctcttcgc tattacgcca gctggcgaaa gggggatgtg ctgcaaggcg attaagttgg\n 8641 gtaacgccag ggttttccca gtcacgacgt tgtaaaacga cggccagtgc caagcttcga\n 8701 cttgccttcc gcacaataca tcatttcttc ttagcttttt ttcttcttct tcgttcatac\n 8761 agtttttttt tgtttatcag cttacatttt cttgaaccgt agctttcgtt ttcttctttt\n 8821 taactttcca ttcggagttt ttgtatcttg tttcatagtt tgtcccagga ttagaatgat\n 8881 taggcatcga accttcaaga atttgattga ataaaacatc ttcattctta agatatgaag\n 8941 ataatcttca aaaggcccct gggaatctga aagaagagaa gcaggcccat ttatatggga\n 9001 aagaacaata gtatttctta tataggccca tttaagttga aaacaatctt caaaagtccc\n 9061 acatcgctta gataagaaaa cgaagctgag tttatataca gctagagtcg aagtagtgat\n 9121 tgggagacca acccagtgga cataagcctg ttcggttcgt aagctgtaat gcaagtagcg\n 9181 tatgcgctca cgcaactggt ccagaacctt gaccgaacgc agcggtggta acggcgcagt\n 9241 ggcggttttc atggcttgtt atgactgttt ttttggggta cagtctatgc ctcgggcatc\n 9301 caagcagcaa gcgcgttacg ccgtgggtcg atgtttgatg ttatggagca gcaacgatgt\n 9361 tacgcagcag ggcagtcgcc ctaaaacaaa gttaaacatc atgggggaag cggtgatcgc\n 9421 cgaagtatcg actcaactat cagaggtagt tggcgtcatc gagcgccatc tcgaaccgac\n 9481 gttgctggcc gtacatttgt acggctccgc agtggatggc ggcctgaagc cacacagtga\n 9541 tattgatttg ctggttacgg tgaccgtaag gcttgatgaa acaacgcggc gagctttgat\n 9601 caacgacctt ttggaaactt cggcttcccc tggagagagc gagattctcc gcgctgtaga\n 9661 agtcaccatt gttgtgcacg acgacatcat tccgtggcgt tatccagcta agcgcgaact\n 9721 gcaatttgga gaatggcagc gcaatgacat tcttgcaggt atcttcgagc cagccacgat\n 9781 cgacattgat ctggctatct tgctgacaaa agcaagagaa catagcgttg ccttggtagg\n 9841 tccagcggcg gaggaactct ttgatccggt tcctgaacag gatctatttg aggcgctaaa\n 9901 tgaaacctta acgctatgga actcgccgcc cgactgggct ggcgatgagc gaaatgtagt\n 9961 gcttacgttg tcccgcattt ggtacagcgc agtaaccggc aaaatcgcgc cgaaggatgt\n 10021 cgctgccgac tgggcaatgg agcgcctgcc ggcccagtat cagcccgtca tacttgaagc\n 10081 tagacaggct tatcttggac aagaagaaga tcgcttggcc tcgcgcgcag atcagttgga\n 10141 agaatttgtc cactacgtga aaggcgagat caccaaggta gtcggcaaat aatgtctagc\n 10201 tagaaattcg ttcaagccga cgccgcttcg cggcgcggct taactcaagc gttagatgca\n 10261 ctaagcacat aattgctcac agccaaacta tcaggtcaag tctgctttta ttatttttaa\n 10321 gcgtgcataa taagccggtc tcggttttag agctagaaat agcaagttaa aataaggcta\n 10381 gtccgttatc aacttgaaaa agtggcaccg agtcggtgct tttttttgca aaattttcca\n 10441 gatcgatttc ttcttcctct gttcttcggc gttcaatttc tggggttttc tcttcgtttt\n 10501 ctgtaactga aacctaaaat ttgacctaaa aaaaatctca aataatatga ttcagtggtt\n 10561 ttgtactttt cagttagttg agttttgcag ttccgatgag ataaaccaat accatggtta\n 10621 tactagtgaa taaaagcatt tgcgtttggt ttatcattgc gtttatacaa ggacagagat\n 10681 ccactgagct ggaatagctt aaaaccatta tcagaacaaa ataaaccatt ttttgttaag\n 10741 aatcagagca tagtaaacaa cagaaacaac ctaagagagg taacttgtcc aagaagatag\n 10801 ctaattatat ctattttata aaagttatca tagtttgtaa gtcacaaaag atgcaaataa\n 10861 cagagaaact aggagacttg agaatataca ttcttgtata tttgtattcg agattgtgaa\n 10921 aatttgacca taagtttaaa ttcttaaaaa gatatatctg atctaggtga tggttataga\n 10981 ctgtaatttt accacatgtt taatgatgga tagtgacaca catgacacat cgacaacact\n 11041 atagcatctt atttagatta caacatgaaa tttttctgta atacatgtct ttgtacataa\n 11101 tttaaaagta attcctaaga aatatattta tacaaggagt ttaaagaaaa catagcataa\n 11161 agttcaatga gtagtaaaaa ccatatacag tatatagcat aaagttcaat gagtttatta\n 11221 caaaagcatt ggttcacttt ctgtaacacg acgttaaacc ttcgtctcca ataggagcgc\n 11281 tactgattca acatgccaat atatactaaa tacgtttcta cagtcaaatg ctttaacgtt\n 11341 tcatgattaa gtgactattt accgtcaatc ctttcccatt cctcccacta atccaacttt\n 11401 ttaattactc ttaaatcacc actaagctag taacgcctat catgaattag ctctactaaa\n 11461 tctagcaacc tttcaaattt gcagtattgc aggtgtctct gtgtctttaa aatagttgcc\n 11521 ttatgatttc ttcggtttca agatgatcaa atagttatag atttcatgct cacacatgct\n 11581 cattagatgt gtacatactt tacttaccca aatctatttt ctcgcaaaga ttttgatggt\n 11641 aaagctgatt tggttctatt gaactaaatc aaacgagttt cagactgagt gattctaatc\n 11701 cggcccatta gcccctaaac agacccacta attacgcagc ttttaataga gtaattacac\n 11761 ctagtttacc cactaaacca ctaagcacta attatctcac aatctaatga gcttccctcg\n 11821 taattacttg ggctttcact ctaccattta tttgtaacag tcaagtctct actgtctcta\n 11881 tataaactct ctaaagttaa cacacaattc tcatcacaaa caaatcaacc aaagcaactt\n 11941 ctactctttc ttctttcgac cttatcaatc tgttgagaaa tctagatgga ttacaaggac\n 12001 cacgacgggg attacaagga ccacgacatt gattacaagg atgatgatga caagatggct\n 12061 ccgaagaaga agaggaaggt tggcatccac ggggtgccag ctgctgacaa gaagtactcg\n 12121 atcggcctcg atattgggac taactctgtt ggctgggccg tgatcaccga cgagtacaag\n 12181 gtgccctcaa agaagttcaa ggtcctgggc aacaccgatc ggcattccat caagaagaat\n 12241 ctcattggcg ctctcctgtt cgacagcggc gagacggctg aggctacgcg gctcaagcgc\n 12301 accgcccgca ggcggtacac gcgcaggaag aatcgcatct gctacctgca ggagattttc\n 12361 tccaacgaga tggcgaaggt tgacgattct ttcttccaca ggctggagga gtcattcctc\n 12421 gtggaggagg ataagaagca cgagcggcat ccaatcttcg gcaacattgt cgacgaggtt\n 12481 gcctaccacg agaagtaccc tacgatctac catctgcgga agaagctcgt ggactccaca\n 12541 gataaggcgg acctccgcct gatctacctc gctctggccc acatgattaa gttcaggggc\n 12601 catttcctga tcgaggggga tctcaacccg gacaatagcg atgttgacaa gctgttcatc\n 12661 cagctcgtgc agacgtacaa ccagctcttc gaggagaacc ccattaatgc gtcaggcgtc\n 12721 gacgcgaagg ctatcctgtc cgctaggctc tcgaagtctc ggcgcctcga gaacctgatc\n 12781 gcccagctgc cgggcgagaa gaagaacggc ctgttcggga atctcattgc gctcagcctg\n 12841 gggctcacgc ccaacttcaa gtcgaatttc gatctcgctg aggacgccaa gctgcagctc\n 12901 tccaaggaca catacgacga tgacctggat aacctcctgg cccagatcgg cgatcagtac\n 12961 gcggacctgt tcctcgctgc caagaatctg tcggacgcca tcctcctgtc tgatattctc\n 13021 agggtgaaca ccgagattac gaaggctccg ctctcagcct ccatgatcaa gcgctacgac\n 13081 gagcaccatc aggatctgac cctcctgaag gcgctggtca ggcagcagct ccccgagaag\n 13141 tacaaggaga tcttcttcga tcagtcgaag aacggctacg ctgggtacat tgacggcggg\n 13201 gcctctcagg aggagttcta caagttcatc aagccgattc tggagaagat ggacggcacg\n 13261 gaggagctgc tggtgaagct caatcgcgag gacctcctga ggaagcagcg gacattcgat\n 13321 aacggcagca tcccacacca gattcatctc ggggagctgc acgctatcct gaggaggcag\n 13381 gaggacttct accctttcct caaggataac cgcgagaaga tcgagaagat tctgactttc\n 13441 aggatcccgt actacgtcgg cccactcgct aggggcaact cccgcttcgc ttggatgacc\n 13501 cgcaagtcag aggagacgat cacgccgtgg aacttcgagg aggtggtcga caagggcgct\n 13561 agcgctcagt cgttcatcga gaggatgacg aatttcgaca agaacctgcc aaatgagaag\n 13621 gtgctcccta agcactcgct cctgtacgag tacttcacag tctacaacga gctgactaag\n 13681 gtgaagtatg tgaccgaggg catgaggaag ccggctttcc tgtctgggga gcagaagaag\n 13741 gccatcgtgg acctcctgtt caagaccaac cggaaggtca cggttaagca gctcaaggag\n 13801 gactacttca agaagattga gtgcttcgat tcggtcgaga tctctggcgt tgaggaccgc\n 13861 ttcaacgcct ccctggggac ctaccacgat ctcctgaaga tcattaagga taaggacttc\n 13921 ctggacaacg aggagaatga ggatatcctc gaggacattg tgctgacact cactctgttc\n 13981 gaggaccggg agatgatcga ggagcgcctg aagacttacg cccatctctt cgatgacaag\n 14041 gtcatgaagc agctcaagag gaggaggtac accggctggg ggaggctgag caggaagctc\n 14101 atcaacggca ttcgggacaa gcagtccggg aagacgatcc tcgacttcct gaagagcgat\n 14161 ggcttcgcga accgcaattt catgcagctg attcacgatg acagcctcac attcaaggag\n 14221 gatatccaga aggctcaggt gagcggccag ggggactcgc tgcacgagca tatcgcgaac\n 14281 ctcgctggct cgccagctat caagaagggg attctgcaga ccgtgaaggt tgtggacgag\n 14341 ctggtgaagg tcatgggcag gcacaagcct gagaacatcg tcattgagat ggcccgggag\n 14401 aatcagacca cgcagaaggg ccagaagaac tcacgcgaga ggatgaagag gatcgaggag\n 14461 ggcattaagg agctggggtc ccagatcctc aaggagcacc cggtggagaa cacgcagctg\n 14521 cagaatgaga agctctacct gtactacctc cagaatggcc gcgatatgta tgtggaccag\n 14581 gagctggata ttaacaggct cagcgattac gacgtcgatc atatcgttcc acagtcattc\n 14641 ctgaaggatg actccattga caacaaggtc ctcaccaggt cggacaagaa ccggggcaag\n 14701 tctgataatg ttccttcaga ggaggtcgtt aagaagatga agaactactg gcgccagctc\n 14761 ctgaatgcca agctgatcac gcagcggaag ttcgataacc tcacaaaggc tgagaggggc\n 14821 gggctctctg agctggacaa ggcgggcttc atcaagaggc agctggtcga gacacggcag\n 14881 atcactaagc acgttgcgca gattctcgac tcacggatga acactaagta cgatgagaat\n 14941 gacaagctga tccgcgaggt gaaggtcatc accctgaagt caaagctcgt ctccgacttc\n 15001 aggaaggatt tccagttcta caaggttcgg gagatcaaca attaccacca tgcccatgac\n 15061 gcgtacctga acgcggtggt cggcacagct ctgatcaaga agtacccaaa gctcgagagc\n 15121 gagttcgtgt acggggacta caaggtttac gatgtgagga agatgatcgc caagtcggag\n 15181 caggagattg gcaaggctac cgccaagtac ttcttctact ctaacattat gaatttcttc\n 15241 aagacagaga tcactctggc caatggcgag atccggaagc gccccctcat cgagacgaac\n 15301 ggcgagacgg gggagatcgt gtgggacaag ggcagggatt tcgcgaccgt caggaaggtt\n 15361 ctctccatgc cacaagtgaa tatcgtcaag aagacagagg tccagactgg cgggttctct\n 15421 aaggagtcaa ttctgcctaa gcggaacagc gacaagctca tcgcccgcaa gaaggactgg\n 15481 gatccgaaga agtacggcgg gttcgacagc cccactgtgg cctactcggt cctggttgtg\n 15541 gcgaaggttg agaagggcaa gtccaagaag ctcaagagcg tgaaggagct gctggggatc\n 15601 acgattatgg agcgctccag cttcgagaag aacccgatcg atttcctgga ggcgaagggc\n 15661 tacaaggagg tgaagaagga cctgatcatt aagctcccca agtactcact cttcgagctg\n 15721 gagaacggca ggaagcggat gctggcttcc gctggcgagc tgcagaaggg gaacgagctg\n 15781 gctctgccgt ccaagtatgt gaacttcctc tacctggcct cccactacga gaagctcaag\n 15841 ggcagccccg aggacaacga gcagaagcag ctgttcgtcg agcagcacaa gcattacctc\n 15901 gacgagatca ttgagcagat ttccgagttc tccaagcgcg tgatcctggc cgacgcgaat\n 15961 ctggataagg tcctctccgc gtacaacaag caccgcgaca agccaatcag ggagcaggct\n 16021 gagaatatca ttcatctctt caccctgacg aacctcggcg cccctgctgc tttcaagtac\n 16081 ttcgacacaa ctatcgatcg caagaggtac acaagcacta aggaggtcct ggacgcgacc\n 16141 ctcatccacc agtcgattac cggcctctac gagacgcgca tcgacctgtc tcagctcggg\n 16201 ggcgacaagc ggccagcggc gacgaagaag gcggggcagg cgaagaagaa gaagtgagct\n 16261 cagagctttc gttcgtatca tcggtttcga caacgttcgt caagttcaat gcatcagttt\n 16321 cattgcgcac acaccagaat cctactgagt ttgagtatta tggcattggg aaaactgttt\n 16381 ttcttgtacc atttgttgtg cttgtaattt actgtgtttt ttattcggtt ttcgctatcg\n 16441 aactgtgaaa tggaaatgga tggagaagag ttaatgaatg atatggtcct tttgttcatt\n 16501 ctcaaattaa tattatttgt tttttctctt atttgttgtg tgttgaattt gaaattataa\n 16561 gagatatgca aacattttgt tttgagtaaa aatgtgtcaa atcgtggcct ctaatgaccg\n 16621 aagttaatat gaggagtaaa acacttgtag ttgtaccatt atgcttattc actaggcaac\n 16681 aaatatattt tcagacctag aaaagctgca aatgttactg aatacaagta tgtcctcttg\n 16741 tgttttagac atttatgaac tttcctttat gtaattttcc agaatccttg tcagattcta\n 16801 atcattgctt tataattata gttatactca tggatttgta gttgagtatg aaaatatttt\n 16861 ttaatgcatt ttatgacttg ccaattgatt gacaacgaat tcgtaatcat gtcatagctg\n 16921 tttcctgtgt gaaattgtta tccgctcaca attccacaca acatacgagc cggaagcata\n 16981 aagtgtaaag cctggggtgc ctaatgagtg agctaactca cattaattgc gttgcgctca\n 17041 ctgcccgctt tccagtcggg aaacctgtcg tgccagctgc attaatgaat cggccaacgc\n 17101 gcggggagag gc\n//"
18
18
  },
19
19
  {
20
- "id": 6,
20
+ "id": 3,
21
21
  "type": "TextFileSequence",
22
22
  "sequence_file_format": "genbank",
23
23
  "overhang_crick_3prime": 0,
@@ -25,7 +25,7 @@
25
25
  "file_content": "LOCUS p4P1R_EC1.2en-EC1.1p 3998 bp DNA circular SYN 27-AUG-2024\nDEFINITION Entry clone containing Egg cell-specific promoter (EC1.1p) fused to\n EC1.2 enhancer (EC1.2en). For use in plants and compatible with the\n MultiSite Gateway system.\nACCESSION .\nVERSION .\nKEYWORDS .\nSOURCE synthetic DNA construct\n ORGANISM synthetic DNA construct\n .\nREFERENCE 1 (bases 1 to 3998)\n AUTHORS Ziqiang P. Li, Jennifer Huard, Emmanuelle M. Bayer, Valerie\n Wattelet-Boyer\n TITLE Versatile Cloning Strategy for Efficient Multigene Editing in\n Arabidopsis\n JOURNAL Bio Protocol, Vol 14, Iss 13, Jul 5, 2024\nREFERENCE 2 (bases 1 to 3998)\n AUTHORS .\n TITLE Direct Submission\n JOURNAL Exported Aug 27, 2024 from SnapGene Server 7.0.3\n https://www.snapgene.com\nCOMMENT SGRef: number: 1; type: \"Journal Article\"; journalName: \"Bio\n Protocol, Vol 14, Iss 13, Jul 5, 2024\"\nFEATURES Location/Qualifiers\n source 1..3998\n /mol_type=\"other DNA\"\n /organism=\"synthetic DNA construct\"\n primer_bind complement(189..208)\n /label=\"T7\"\n /note=\"T7 promoter, forward primer\"\n promoter complement(190..208)\n /label=\"T7 promoter\"\n /note=\"promoter for bacteriophage T7 RNA polymerase\"\n primer_bind complement(213..229)\n /label=\"M13 rev\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n primer_bind complement(213..229)\n /label=\"M13 Reverse\"\n /note=\"In lacZ gene. Also called M13-rev\"\n primer_bind complement(331..350)\n /label=\"pENTR-R\"\n /note=\"pENTR vectors, reverse primer\"\n CDS 342..1151\n /codon_start=1\n /gene=\"aph(3')-Ia\"\n /product=\"aminoglycoside phosphotransferase\"\n /label=\"KanR\"\n /note=\"confers resistance to kanamycin in bacteria or G418\n (Geneticin(R)) in eukaryotes\"\n /translation=\"MSHIQRETSRPRLNSNMDADLYGYKWARDNVGQSGATIYRLYGKP\n DAPELFLKHGKGSVANDVTDEMVRLNWLTEFMPLPTIKHFIRTPDDAWLLTTAIPGKTA\n FQVLEEYPDSGENIVDALAVFLRRLHSIPVCNCPFNSDRVFRLAQAQSRMNNGLVDASD\n FDDERNGWPVEQVWKEMHKLLPFSPDSVVTHGDFSLDNLIFDEGKLIGCIDVGRVGIAD\n RYQDLAILWNCLGEFSPSLQKRLFQKYGIDNPDMNKLQFHLMLDEFF\"\n primer_bind complement(409..428)\n /label=\"Kan-R\"\n /note=\"Kanamycin resistance gene, reverse primer\"\n rep_origin 1298..1886\n /direction=RIGHT\n /label=\"ori\"\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n primer_bind 1787..1806\n /label=\"pBR322ori-F\"\n /note=\"pBR322 origin, forward primer\"\n primer_bind 2040..2057\n /label=\"L4440\"\n /note=\"L4440 vector, forward primer\"\n terminator complement(2216..2243)\n /label=\"rrnB T2 terminator\"\n /note=\"transcription terminator T2 from the E. coli rrnB\n gene\"\n terminator complement(2335..2421)\n /gene=\"Escherichia coli rrnB\"\n /label=\"rrnB T1 terminator\"\n /note=\"transcription terminator T1 from the E. coli rrnB\n gene\"\n primer_bind 2470..2492\n /label=\"M13/pUC Forward\"\n /note=\"In lacZ gene\"\n primer_bind 2484..2501\n /label=\"M13 Forward\"\n /note=\"In lacZ gene. Also called M13-F20 or M13 (-21)\n Forward\"\n primer_bind 2485..2501\n /label=\"M13 fwd\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n protein_bind 2541..2636\n /gene=\"mutant version of attL\"\n /label=\"attL4\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\n protein_bind join(3991..3998,1..117)\n /gene=\"mutant version of attR\"\n /label=\"attR1\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\nORIGIN\n 1 gtacaaaaaa gttgaacgag aaacgtaaaa tgatataaat atcaatatat taaattagat\n 61 tttgcataaa aaacagacta cataatactg taaaacacaa catatgcagt cactatgaac\n 121 caactactta gatggtatta gtgacctgta gaattcgagc tctagagctg cagggcggcc\n 181 gcgatatccc ctatagtgag tcgtattaca tggtcatagc tgtttcctgg cagctctggc\n 241 ccgtgtctca aaatctctga tgttacattg cacaagataa aaatatatca tcatgaacaa\n 301 taaaactgtc tgcttacata aacagtaata caaggggtgt tatgagccat attcaacggg\n 361 aaacgtcgag gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg\n 421 ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg cttgtatggg aagcccgatg\n 481 cgccagagtt gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga\n 541 tggtcagact aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc\n 601 gtactcctga tgatgcatgg ttactcacca ctgcgatccc cggaaaaaca gcattccagg\n 661 tattagaaga atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc\n 721 gccggttgca ttcgattcct gtttgtaatt gtccttttaa cagcgatcgc gtatttcgtc\n 781 tcgctcaggc gcaatcacga atgaataacg gtttggttga tgcgagtgat tttgatgacg\n 841 agcgtaatgg ctggcctgtt gaacaagtct ggaaagaaat gcataaactt ttgccattct\n 901 caccggattc agtcgtcact catggtgatt tctcacttga taaccttatt tttgacgagg\n 961 ggaaattaat aggttgtatt gatgttggac gagtcggaat cgcagaccga taccaggatc\n 1021 ttgccatcct atggaactgc ctcggtgagt tttctccttc attacagaaa cggctttttc\n 1081 aaaaatatgg tattgataat cctgatatga ataaattgca gtttcatttg atgctcgatg\n 1141 agtttttcta atcagaattg gttaattggt tgtaacactg gcagagcatt acgctgactt\n 1201 gacgggacgg cgcaagctca tgaccaaaat cccttaacgt gagttacgcg tcgttccact\n 1261 gagcgtcaga ccccgtagaa aagatcaaag gatcttcttg agatcctttt tttctgcgcg\n 1321 taatctgctg cttgcaaaca aaaaaaccac cgctaccagc ggtggtttgt ttgccggatc\n 1381 aagagctacc aactcttttt ccgaaggtaa ctggcttcag cagagcgcag ataccaaata\n 1441 ctgttcttct agtgtagccg tagttaggcc accacttcaa gaactctgta gcaccgccta\n 1501 catacctcgc tctgctaatc ctgttaccag tggctgctgc cagtggcgat aagtcgtgtc\n 1561 ttaccgggtt ggactcaaga cgatagttac cggataaggc gcagcggtcg ggctgaacgg\n 1621 ggggttcgtg cacacagccc agcttggagc gaacgaccta caccgaactg agatacctac\n 1681 agcgtgagct atgagaaagc gccacgcttc ccgaagggag aaaggcggac aggtatccgg\n 1741 taagcggcag ggtcggaaca ggagagcgca cgagggagct tccaggggga aacgcctggt\n 1801 atctttatag tcctgtcggg tttcgccacc tctgacttga gcgtcgattt ttgtgatgct\n 1861 cgtcaggggg gcggagccta tggaaaaacg ccagcaacgc ggccttttta cggttcctgg\n 1921 ccttttgctg gccttttgct cacatgttct ttcctgcgtt atcccctgat tctgtggata\n 1981 accgtattac cgcctttgag tgagctgata ccgctcgccg cagccgaacg accgagcgca\n 2041 gcgagtcagt gagcgaggaa gcggaagagc gcccaatacg caaaccgcct ctccccgcgc\n 2101 gttggccgat tcattaatgc agctggcacg acaggtttcc cgactggaaa gcgggcagtg\n 2161 agcgcaacgc aattaatacg cgtaccgcta gccaggaaga gtttgtagaa acgcaaaaag\n 2221 gccatccgtc aggatggcct tctgcttagt ttgatgcctg gcagtttatg gcgggcgtcc\n 2281 tgcccgccac cctccgggcc gttgcttcac aacgttcaaa tccgctcccg gcggatttgt\n 2341 cctactcagg agagcgttca ccgacaaaca acagataaaa cgaaaggccc agtcttccga\n 2401 ctgagccttt cgttttattt gatgcctggc agttccctac tctcgcgtta acgctagcat\n 2461 ggatgttttc ccagtcacga cgttgtaaaa cgacggccag tcttaagctc gggcccgagt\n 2521 taacgctacc atggagctcc aaataatgat tttattttga ctgatagtga cctgttcgtt\n 2581 gcaacaaatt gataagcaat gcttttttat aatgccaact ttgtatagaa aagttgaaga\n 2641 ataaaagcat ttgcgtttgg tttatcattg cgtttataca aggacagaga tccactgagc\n 2701 tggaatagct taaaaccatt atcagaacaa aataaaccat tttttgttaa gaatcagagc\n 2761 atagtaaaca acagaaacaa cctaagagag gtaacttgtc caagaagata gctaattata\n 2821 tctattttat aaaagttatc atagtttgta agtcacaaaa gatgcaaata acagagaaac\n 2881 taggagactt gagaatatac attcttgtat atttgtattc gagattgtga aaatttgacc\n 2941 ataagtttaa attcttaaaa agatatatct gatctaggtg atggttatag actgtaattt\n 3001 taccacatgt ttaatgatgg atagtgacac acatgacaca tcgacaacac tatagcatct\n 3061 tatttagatt acaacatgaa atttttctgt aatacatgtc tttgtacata atttaaaagt\n 3121 aattcctaag aaatatattt atacaaggag tttaaagaaa acatagcata aagttcaatg\n 3181 agtagtaaaa accatataca gtatatagca taaagttcaa tgagtttatt acaaaagcat\n 3241 tggttcactt tctgtaacac gacgttaaac cttcgtctcc aataggagcg ctactgattc\n 3301 aacatgccaa tatatactaa atacgtttct acagtcaaat gctttaacgt ttcatgatta\n 3361 agtgactatt taccgtcaat cctttcccat tcctcccact aatccaactt tttaattact\n 3421 cttaaatcac cactaagcta gtaacgccta tcatgaatta gctctactaa atctagcaac\n 3481 ctttcaaatt tgcagtattg caggtgtctc tgtgtcttta aaatagttgc cttatgattt\n 3541 cttcggtttc aagatgatca aatagttata gatttcatgc tcacacatgc tcattagatg\n 3601 tgtacatact ttacttaccc aaatctattt tctcgcaaag attttgatgg taaagctgat\n 3661 ttggttctat tgaactaaat caaacgagtt tcagactgag tgattctaat ccggcccatt\n 3721 agcccctaaa cagacccact aattacgcag cttttaatag agtaattaca cctagtttac\n 3781 ccactaaacc actaagcact aattatctca caatctaatg agcttccctc gtaattactt\n 3841 gggctttcac tctaccattt atttgtaaca gtcaagtctc tactgtctct atataaactc\n 3901 tctaaagtta acacacaatt ctcatcacaa acaaatcaac caaagcaact tctactcttt\n 3961 cttctttcga ccttatcaat ctgttgagaa acaagttt\n//"
26
26
  },
27
27
  {
28
- "id": 8,
28
+ "id": 4,
29
29
  "type": "TextFileSequence",
30
30
  "sequence_file_format": "genbank",
31
31
  "overhang_crick_3prime": 0,
@@ -33,7 +33,7 @@
33
33
  "file_content": "LOCUS pDONR221_zCas9 7458 bp DNA circular SYN 27-AUG-2024\nDEFINITION Entry clone containing 3\u00d7FLAG-NLS-zCas9-NLS encoding sequence, Pisum\n sativum rbcS E9 terminator. For use in plants and compatible with\n the MultiSite Gateway system.\nACCESSION .\nVERSION .\nKEYWORDS .\nSOURCE synthetic DNA construct\n ORGANISM synthetic DNA construct\n .\nREFERENCE 1 (bases 1 to 7458)\n AUTHORS Ziqiang P. Li, Jennifer Huard, Emmanuelle M. Bayer, Valerie\n Wattelet-Boyer\n TITLE Versatile Cloning Strategy for Efficient Multigene Editing in\n Arabidopsis\n JOURNAL Bio Protocol, Vol 14, Iss 13, Jul 5, 2024\nREFERENCE 2 (bases 1 to 7458)\n AUTHORS .\n TITLE Direct Submission\n JOURNAL Exported Aug 27, 2024 from SnapGene Server 7.0.3\n https://www.snapgene.com\nCOMMENT SGRef: number: 1; type: \"Journal Article\"; journalName: \"Bio\n Protocol, Vol 14, Iss 13, Jul 5, 2024\"\nFEATURES Location/Qualifiers\n source 1..7458\n /mol_type=\"other DNA\"\n /organism=\"synthetic DNA construct\"\n primer_bind 92..109\n /label=\"L4440\"\n /note=\"L4440 vector, forward primer\"\n terminator complement(268..295)\n /label=\"rrnB T2 terminator\"\n /note=\"transcription terminator T2 from the E. coli rrnB\n gene\"\n terminator complement(387..473)\n /gene=\"Escherichia coli rrnB\"\n /label=\"rrnB T1 terminator\"\n /note=\"transcription terminator T1 from the E. coli rrnB\n gene\"\n primer_bind 522..544\n /label=\"M13/pUC Forward\"\n /note=\"In lacZ gene\"\n primer_bind 536..553\n /label=\"M13 Forward\"\n /note=\"In lacZ gene. Also called M13-F20 or M13 (-21)\n Forward\"\n primer_bind 537..553\n /label=\"M13 fwd\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n protein_bind 569..668\n /gene=\"mutant version of attL\"\n /label=\"attL1\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\n CDS 674..739\n /codon_start=1\n /product=\"three tandem FLAG(R) epitope tags, followed by an\n enterokinase cleavage site\"\n /label=\"3xFLAG\"\n /translation=\"DYKDHDGDYKDHDIDYKDDDDK\"\n CDS 746..766\n /codon_start=1\n /product=\"nuclear localization signal of SV40 (simian virus\n 40) large T antigen\"\n /label=\"SV40 NLS\"\n /translation=\"PKKKRKV\"\n CDS 791..4891\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n CDS 791..4891\n /codon_start=1\n /product=\"Cas9 (Csn1) endonuclease from the Streptococcus\n pyogenes Type II CRISPR/Cas system\"\n /label=\"Cas9\"\n /note=\"generates RNA-guided double strand breaks in DNA\"\n /translation=\"DKKYSIGLDIGTNSVGWAVITDEYKVPSKKFKVLGNTDRHSIKKN\n LIGALLFDSGETAEATRLKRTARRRYTRRKNRICYLQEIFSNEMAKVDDSFFHRLEESF\n LVEEDKKHERHPIFGNIVDEVAYHEKYPTIYHLRKKLVDSTDKADLRLIYLALAHMIKF\n RGHFLIEGDLNPDNSDVDKLFIQLVQTYNQLFEENPINASGVDAKAILSARLSKSRRLE\n NLIAQLPGEKKNGLFGNLIALSLGLTPNFKSNFDLAEDAKLQLSKDTYDDDLDNLLAQI\n GDQYADLFLAAKNLSDAILLSDILRVNTEITKAPLSASMIKRYDEHHQDLTLLKALVRQ\n QLPEKYKEIFFDQSKNGYAGYIDGGASQEEFYKFIKPILEKMDGTEELLVKLNREDLLR\n KQRTFDNGSIPHQIHLGELHAILRRQEDFYPFLKDNREKIEKILTFRIPYYVGPLARGN\n SRFAWMTRKSEETITPWNFEEVVDKGASAQSFIERMTNFDKNLPNEKVLPKHSLLYEYF\n TVYNELTKVKYVTEGMRKPAFLSGEQKKAIVDLLFKTNRKVTVKQLKEDYFKKIECFDS\n VEISGVEDRFNASLGTYHDLLKIIKDKDFLDNEENEDILEDIVLTLTLFEDREMIEERL\n KTYAHLFDDKVMKQLKRRRYTGWGRLSRKLINGIRDKQSGKTILDFLKSDGFANRNFMQ\n LIHDDSLTFKEDIQKAQVSGQGDSLHEHIANLAGSPAIKKGILQTVKVVDELVKVMGRH\n KPENIVIEMARENQTTQKGQKNSRERMKRIEEGIKELGSQILKEHPVENTQLQNEKLYL\n YYLQNGRDMYVDQELDINRLSDYDVDHIVPQSFLKDDSIDNKVLTRSDKNRGKSDNVPS\n EEVVKKMKNYWRQLLNAKLITQRKFDNLTKAERGGLSELDKAGFIKRQLVETRQITKHV\n AQILDSRMNTKYDENDKLIREVKVITLKSKLVSDFRKDFQFYKVREINNYHHAHDAYLN\n AVVGTALIKKYPKLESEFVYGDYKVYDVRKMIAKSEQEIGKATAKYFFYSNIMNFFKTE\n ITLANGEIRKRPLIETNGETGEIVWDKGRDFATVRKVLSMPQVNIVKKTEVQTGGFSKE\n SILPKRNSDKLIARKKDWDPKKYGGFDSPTVAYSVLVVAKVEKGKSKKLKSVKELLGIT\n IMERSSFEKNPIDFLEAKGYKEVKKDLIIKLPKYSLFELENGRKRMLASAGELQKGNEL\n ALPSKYVNFLYLASHYEKLKGSPEDNEQKQLFVEQHKHYLDEIIEQISEFSKRVILADA\n NLDKVLSAYNKHRDKPIREQAENIIHLFTLTNLGAPAAFKYFDTTIDRKRYTSTKEVLD\n ATLIHQSITGLYETRIDLSQLGGD\"\n RBS 4804..4812\n /label=\"Shine-Dalgarno sequence\"\n /note=\"full consensus sequence for ribosome-binding sites\n upstream of start codons in E. coli; complementary to a\n region in the 3' end of the 16S rRNA (Chen et al., 1994)\"\n CDS 4892..4939\n /codon_start=1\n /product=\"bipartite nuclear localization signal from\n nucleoplasmin\"\n /label=\"nucleoplasmin NLS\"\n /translation=\"KRPAATKKAGQAKKKK\"\n protein_bind complement(5583..5682)\n /gene=\"mutant version of attL\"\n /label=\"attL2\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\n primer_bind complement(5699..5718)\n /label=\"T7\"\n /note=\"T7 promoter, forward primer\"\n promoter complement(5700..5718)\n /label=\"T7 promoter\"\n /note=\"promoter for bacteriophage T7 RNA polymerase\"\n primer_bind complement(5723..5739)\n /label=\"M13 rev\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n primer_bind complement(5723..5739)\n /label=\"M13 Reverse\"\n /note=\"In lacZ gene. Also called M13-rev\"\n primer_bind complement(5841..5860)\n /label=\"pENTR-R\"\n /note=\"pENTR vectors, reverse primer\"\n CDS 5852..6661\n /codon_start=1\n /gene=\"aph(3')-Ia\"\n /product=\"aminoglycoside phosphotransferase\"\n /label=\"KanR\"\n /note=\"confers resistance to kanamycin in bacteria or G418\n (Geneticin(R)) in eukaryotes\"\n /translation=\"MSHIQRETSRPRLNSNMDADLYGYKWARDNVGQSGATIYRLYGKP\n DAPELFLKHGKGSVANDVTDEMVRLNWLTEFMPLPTIKHFIRTPDDAWLLTTAIPGKTA\n FQVLEEYPDSGENIVDALAVFLRRLHSIPVCNCPFNSDRVFRLAQAQSRMNNGLVDASD\n FDDERNGWPVEQVWKEMHKLLPFSPDSVVTHGDFSLDNLIFDEGKLIGCIDVGRVGIAD\n RYQDLAILWNCLGEFSPSLQKRLFQKYGIDNPDMNKLQFHLMLDEFF\"\n primer_bind complement(5919..5938)\n /label=\"Kan-R\"\n /note=\"Kanamycin resistance gene, reverse primer\"\n rep_origin 6808..7396\n /direction=RIGHT\n /label=\"ori\"\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n primer_bind 7297..7316\n /label=\"pBR322ori-F\"\n /note=\"pBR322 origin, forward primer\"\nORIGIN\n 1 ctttcctgcg ttatcccctg attctgtgga taaccgtatt accgcctttg agtgagctga\n 61 taccgctcgc cgcagccgaa cgaccgagcg cagcgagtca gtgagcgagg aagcggaaga\n 121 gcgcccaata cgcaaaccgc ctctccccgc gcgttggccg attcattaat gcagctggca\n 181 cgacaggttt cccgactgga aagcgggcag tgagcgcaac gcaattaata cgcgtaccgc\n 241 tagccaggaa gagtttgtag aaacgcaaaa aggccatccg tcaggatggc cttctgctta\n 301 gtttgatgcc tggcagttta tggcgggcgt cctgcccgcc accctccggg ccgttgcttc\n 361 acaacgttca aatccgctcc cggcggattt gtcctactca ggagagcgtt caccgacaaa\n 421 caacagataa aacgaaaggc ccagtcttcc gactgagcct ttcgttttat ttgatgcctg\n 481 gcagttccct actctcgcgt taacgctagc atggatgttt tcccagtcac gacgttgtaa\n 541 aacgacggcc agtcttaagc tcgggcccca aataatgatt ttattttgac tgatagtgac\n 601 ctgttcgttg caacaaattg atgagcaatg cttttttata atgccaactt tgtacaaaaa\n 661 agcaggcttc atggattaca aggaccacga cggggattac aaggaccacg acattgatta\n 721 caaggatgat gatgacaaga tggctccgaa gaagaagagg aaggttggca tccacggggt\n 781 gccagctgct gacaagaagt actcgatcgg cctcgatatt gggactaact ctgttggctg\n 841 ggccgtgatc accgacgagt acaaggtgcc ctcaaagaag ttcaaggtcc tgggcaacac\n 901 cgatcggcat tccatcaaga agaatctcat tggcgctctc ctgttcgaca gcggcgagac\n 961 ggctgaggct acgcggctca agcgcaccgc ccgcaggcgg tacacgcgca ggaagaatcg\n 1021 catctgctac ctgcaggaga ttttctccaa cgagatggcg aaggttgacg attctttctt\n 1081 ccacaggctg gaggagtcat tcctcgtgga ggaggataag aagcacgagc ggcatccaat\n 1141 cttcggcaac attgtcgacg aggttgccta ccacgagaag taccctacga tctaccatct\n 1201 gcggaagaag ctcgtggact ccacagataa ggcggacctc cgcctgatct acctcgctct\n 1261 ggcccacatg attaagttca ggggccattt cctgatcgag ggggatctca acccggacaa\n 1321 tagcgatgtt gacaagctgt tcatccagct cgtgcagacg tacaaccagc tcttcgagga\n 1381 gaaccccatt aatgcgtcag gcgtcgacgc gaaggctatc ctgtccgcta ggctctcgaa\n 1441 gtctcggcgc ctcgagaacc tgatcgccca gctgccgggc gagaagaaga acggcctgtt\n 1501 cgggaatctc attgcgctca gcctggggct cacgcccaac ttcaagtcga atttcgatct\n 1561 cgctgaggac gccaagctgc agctctccaa ggacacatac gacgatgacc tggataacct\n 1621 cctggcccag atcggcgatc agtacgcgga cctgttcctc gctgccaaga atctgtcgga\n 1681 cgccatcctc ctgtctgata ttctcagggt gaacaccgag attacgaagg ctccgctctc\n 1741 agcctccatg atcaagcgct acgacgagca ccatcaggat ctgaccctcc tgaaggcgct\n 1801 ggtcaggcag cagctccccg agaagtacaa ggagatcttc ttcgatcagt cgaagaacgg\n 1861 ctacgctggg tacattgacg gcggggcctc tcaggaggag ttctacaagt tcatcaagcc\n 1921 gattctggag aagatggacg gcacggagga gctgctggtg aagctcaatc gcgaggacct\n 1981 cctgaggaag cagcggacat tcgataacgg cagcatccca caccagattc atctcgggga\n 2041 gctgcacgct atcctgagga ggcaggagga cttctaccct ttcctcaagg ataaccgcga\n 2101 gaagatcgag aagattctga ctttcaggat cccgtactac gtcggcccac tcgctagggg\n 2161 caactcccgc ttcgcttgga tgacccgcaa gtcagaggag acgatcacgc cgtggaactt\n 2221 cgaggaggtg gtcgacaagg gcgctagcgc tcagtcgttc atcgagagga tgacgaattt\n 2281 cgacaagaac ctgccaaatg agaaggtgct ccctaagcac tcgctcctgt acgagtactt\n 2341 cacagtctac aacgagctga ctaaggtgaa gtatgtgacc gagggcatga ggaagccggc\n 2401 tttcctgtct ggggagcaga agaaggccat cgtggacctc ctgttcaaga ccaaccggaa\n 2461 ggtcacggtt aagcagctca aggaggacta cttcaagaag attgagtgct tcgattcggt\n 2521 cgagatctct ggcgttgagg accgcttcaa cgcctccctg gggacctacc acgatctcct\n 2581 gaagatcatt aaggataagg acttcctgga caacgaggag aatgaggata tcctcgagga\n 2641 cattgtgctg acactcactc tgttcgagga ccgggagatg atcgaggagc gcctgaagac\n 2701 ttacgcccat ctcttcgatg acaaggtcat gaagcagctc aagaggagga ggtacaccgg\n 2761 ctgggggagg ctgagcagga agctcatcaa cggcattcgg gacaagcagt ccgggaagac\n 2821 gatcctcgac ttcctgaaga gcgatggctt cgcgaaccgc aatttcatgc agctgattca\n 2881 cgatgacagc ctcacattca aggaggatat ccagaaggct caggtgagcg gccaggggga\n 2941 ctcgctgcac gagcatatcg cgaacctcgc tggctcgcca gctatcaaga aggggattct\n 3001 gcagaccgtg aaggttgtgg acgagctggt gaaggtcatg ggcaggcaca agcctgagaa\n 3061 catcgtcatt gagatggccc gggagaatca gaccacgcag aagggccaga agaactcacg\n 3121 cgagaggatg aagaggatcg aggagggcat taaggagctg gggtcccaga tcctcaagga\n 3181 gcacccggtg gagaacacgc agctgcagaa tgagaagctc tacctgtact acctccagaa\n 3241 tggccgcgat atgtatgtgg accaggagct ggatattaac aggctcagcg attacgacgt\n 3301 cgatcatatc gttccacagt cattcctgaa ggatgactcc attgacaaca aggtcctcac\n 3361 caggtcggac aagaaccggg gcaagtctga taatgttcct tcagaggagg tcgttaagaa\n 3421 gatgaagaac tactggcgcc agctcctgaa tgccaagctg atcacgcagc ggaagttcga\n 3481 taacctcaca aaggctgaga ggggcgggct ctctgagctg gacaaggcgg gcttcatcaa\n 3541 gaggcagctg gtcgagacac ggcagatcac taagcacgtt gcgcagattc tcgactcacg\n 3601 gatgaacact aagtacgatg agaatgacaa gctgatccgc gaggtgaagg tcatcaccct\n 3661 gaagtcaaag ctcgtctccg acttcaggaa ggatttccag ttctacaagg ttcgggagat\n 3721 caacaattac caccatgccc atgacgcgta cctgaacgcg gtggtcggca cagctctgat\n 3781 caagaagtac ccaaagctcg agagcgagtt cgtgtacggg gactacaagg tttacgatgt\n 3841 gaggaagatg atcgccaagt cggagcagga gattggcaag gctaccgcca agtacttctt\n 3901 ctactctaac attatgaatt tcttcaagac agagatcact ctggccaatg gcgagatccg\n 3961 gaagcgcccc ctcatcgaga cgaacggcga gacgggggag atcgtgtggg acaagggcag\n 4021 ggatttcgcg accgtcagga aggttctctc catgccacaa gtgaatatcg tcaagaagac\n 4081 agaggtccag actggcgggt tctctaagga gtcaattctg cctaagcgga acagcgacaa\n 4141 gctcatcgcc cgcaagaagg actgggatcc gaagaagtac ggcgggttcg acagccccac\n 4201 tgtggcctac tcggtcctgg ttgtggcgaa ggttgagaag ggcaagtcca agaagctcaa\n 4261 gagcgtgaag gagctgctgg ggatcacgat tatggagcgc tccagcttcg agaagaaccc\n 4321 gatcgatttc ctggaggcga agggctacaa ggaggtgaag aaggacctga tcattaagct\n 4381 ccccaagtac tcactcttcg agctggagaa cggcaggaag cggatgctgg cttccgctgg\n 4441 cgagctgcag aaggggaacg agctggctct gccgtccaag tatgtgaact tcctctacct\n 4501 ggcctcccac tacgagaagc tcaagggcag ccccgaggac aacgagcaga agcagctgtt\n 4561 cgtcgagcag cacaagcatt acctcgacga gatcattgag cagatttccg agttctccaa\n 4621 gcgcgtgatc ctggccgacg cgaatctgga taaggtcctc tccgcgtaca acaagcaccg\n 4681 cgacaagcca atcagggagc aggctgagaa tatcattcat ctcttcaccc tgacgaacct\n 4741 cggcgcccct gctgctttca agtacttcga cacaactatc gatcgcaaga ggtacacaag\n 4801 cactaaggag gtcctggacg cgaccctcat ccaccagtcg attaccggcc tctacgagac\n 4861 gcgcatcgac ctgtctcagc tcgggggcga caagcggcca gcggcgacga agaaggcggg\n 4921 gcaggcgaag aagaagaagt gagctcagag ctttcgttcg tatcatcggt ttcgacaacg\n 4981 ttcgtcaagt tcaatgcatc agtttcattg cgcacacacc agaatcctac tgagtttgag\n 5041 tattatggca ttgggaaaac tgtttttctt gtaccatttg ttgtgcttgt aatttactgt\n 5101 gttttttatt cggttttcgc tatcgaactg tgaaatggaa atggatggag aagagttaat\n 5161 gaatgatatg gtccttttgt tcattctcaa attaatatta tttgtttttt ctcttatttg\n 5221 ttgtgtgttg aatttgaaat tataagagat atgcaaacat tttgttttga gtaaaaatgt\n 5281 gtcaaatcgt ggcctctaat gaccgaagtt aatatgagga gtaaaacact tgtagttgta\n 5341 ccattatgct tattcactag gcaacaaata tattttcaga cctagaaaag ctgcaaatgt\n 5401 tactgaatac aagtatgtcc tcttgtgttt tagacattta tgaactttcc tttatgtaat\n 5461 tttccagaat ccttgtcaga ttctaatcat tgctttataa ttatagttat actcatggat\n 5521 ttgtagttga gtatgaaaat attttttaat gcattttatg acttgccaat tgattgacaa\n 5581 cgacccagct ttcttgtaca aagttggcat tataagaaag cattgcttat caatttgttg\n 5641 caacgaacag gtcactatca gtcaaaataa aatcattatt tgccatccag ctgatatccc\n 5701 ctatagtgag tcgtattaca tggtcatagc tgtttcctgg cagctctggc ccgtgtctca\n 5761 aaatctctga tgttacattg cacaagataa aaatatatca tcatgaacaa taaaactgtc\n 5821 tgcttacata aacagtaata caaggggtgt tatgagccat attcaacggg aaacgtcgag\n 5881 gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa\n 5941 tgtcgggcaa tcaggtgcga caatctatcg cttgtatggg aagcccgatg cgccagagtt\n 6001 gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcagact\n 6061 aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga\n 6121 tgatgcatgg ttactcacca ctgcgatccc cggaaaaaca gcattccagg tattagaaga\n 6181 atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca\n 6241 ttcgattcct gtttgtaatt gtccttttaa cagcgatcgc gtatttcgtc tcgctcaggc\n 6301 gcaatcacga atgaataacg gtttggttga tgcgagtgat tttgatgacg agcgtaatgg\n 6361 ctggcctgtt gaacaagtct ggaaagaaat gcataaactt ttgccattct caccggattc\n 6421 agtcgtcact catggtgatt tctcacttga taaccttatt tttgacgagg ggaaattaat\n 6481 aggttgtatt gatgttggac gagtcggaat cgcagaccga taccaggatc ttgccatcct\n 6541 atggaactgc ctcggtgagt tttctccttc attacagaaa cggctttttc aaaaatatgg\n 6601 tattgataat cctgatatga ataaattgca gtttcatttg atgctcgatg agtttttcta\n 6661 atcagaattg gttaattggt tgtaacactg gcagagcatt acgctgactt gacgggacgg\n 6721 cgcaagctca tgaccaaaat cccttaacgt gagttacgcg tcgttccact gagcgtcaga\n 6781 ccccgtagaa aagatcaaag gatcttcttg agatcctttt tttctgcgcg taatctgctg\n 6841 cttgcaaaca aaaaaaccac cgctaccagc ggtggtttgt ttgccggatc aagagctacc\n 6901 aactcttttt ccgaaggtaa ctggcttcag cagagcgcag ataccaaata ctgttcttct\n 6961 agtgtagccg tagttaggcc accacttcaa gaactctgta gcaccgccta catacctcgc\n 7021 tctgctaatc ctgttaccag tggctgctgc cagtggcgat aagtcgtgtc ttaccgggtt\n 7081 ggactcaaga cgatagttac cggataaggc gcagcggtcg ggctgaacgg ggggttcgtg\n 7141 cacacagccc agcttggagc gaacgaccta caccgaactg agatacctac agcgtgagct\n 7201 atgagaaagc gccacgcttc ccgaagggag aaaggcggac aggtatccgg taagcggcag\n 7261 ggtcggaaca ggagagcgca cgagggagct tccaggggga aacgcctggt atctttatag\n 7321 tcctgtcggg tttcgccacc tctgacttga gcgtcgattt ttgtgatgct cgtcaggggg\n 7381 gcggagccta tggaaaaacg ccagcaacgc ggccttttta cggttcctgg ccttttgctg\n 7441 gccttttgct cacatgtt\n//"
34
34
  },
35
35
  {
36
- "id": 10,
36
+ "id": 5,
37
37
  "type": "TextFileSequence",
38
38
  "sequence_file_format": "genbank",
39
39
  "overhang_crick_3prime": 0,
@@ -41,7 +41,7 @@
41
41
  "file_content": "LOCUS pFRm43GW 11666 bp DNA circular SYN 25-AUG-2024\nDEFINITION Three-fragment Multisite Gateway vector construction for red\n fluorescent seed selection in Arabidopsis thaliana.\nACCESSION .\nVERSION .\nKEYWORDS .\nSOURCE synthetic DNA construct\n ORGANISM synthetic DNA construct\n .\nREFERENCE 1 (bases 1 to 11666)\n AUTHORS Wang X, Ye L, Lyu M, Ursache R, Loytynoja A, Mahonen AP\n TITLE An inducible genome editing system for plants.\n JOURNAL Nat Plants. 2020 Jun 29. pii: 10.1038/s41477-020-0695-2. doi:\n 10.1038/s41477-020-0695-2.\n PUBMED 32601420\nREFERENCE 2 (bases 1 to 11666)\n AUTHORS .\n TITLE Direct Submission\n JOURNAL Exported Aug 25, 2024 from SnapGene Server 7.0.3\n https://www.snapgene.com\nCOMMENT SGRef: number: 1; type: \"Journal Article\"; journalName: \"Nat Plants.\n 2020 Jun 29. pii: 10.1038/s41477-020-0695-2. doi:\n 10.1038/s41477-020-0695-2.\"\nFEATURES Location/Qualifiers\n source 1..11666\n /mol_type=\"other DNA\"\n /organism=\"synthetic DNA construct\"\n CDS 2142..2837\n /codon_start=1\n /product=\"monomeric far-red fluorescent protein (Shcherbo\n et al., 2009)\"\n /label=\"mKate2\"\n /note=\"mammalian codon-optimized\"\n /translation=\"MSELIKENMHMKLYMEGTVNNHHFKCTSEGEGKPYEGTQTMRIKV\n VEGGPLPFAFDILATSFMYGSRTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGVLTA\n TQDTSLQDGCLIYNVKIRGVNFPSNGPVMQKKTLGWEANTEMLYPADGGLEGRSDMALK\n LVGGGHLICNFKTTYRSKKPAKNLKMPGVYYVDHRLERIKEADKETYVEQHEVAVARYC\n DLPSKLGHK\"\n terminator complement(2836..3087)\n /label=\"NOS terminator\"\n /note=\"nopaline synthase terminator and poly(A) signal\"\n misc_feature 3183..3207\n /label=\"LB T-DNA repeat\"\n /note=\"left border repeat from nopaline C58 T-DNA\"\n CDS 3728..4519\n /codon_start=1\n /gene=\"aadA\"\n /product=\"aminoglycoside adenylyltransferase (Murphy,\n 1985)\"\n /label=\"SmR\"\n /note=\"confers resistance to spectinomycin and\n streptomycin\"\n /translation=\"MGEAVIAEVSTQLSEVVGVIERHLEPTLLAVHLYGSAVDGGLKPH\n SDIDLLVTVTVRLDETTRRALINDLLETSASPGESEILRAVEVTIVVHDDIIPWRYPAK\n RELQFGEWQRNDILAGIFEPATIDIDLAILLTKAREHSVALVGPAAEELFDPVPEQDLF\n EALNETLTLWNSPPDWAGDERNVVLTLSRIWYSAVTGKIAPKDVAADWAMERLPAQYQP\n VILEARQAYLGQEEDRLASRADQLEEFVHYVKGEITKVVGK\"\n rep_origin 4765..5353\n /direction=RIGHT\n /label=\"ori\"\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n primer_bind 5254..5273\n /label=\"pBR322ori-F\"\n /note=\"pBR322 origin, forward primer\"\n primer_bind 5507..5524\n /label=\"L4440\"\n /note=\"L4440 vector, forward primer\"\n misc_feature 5539..5679\n /label=\"bom\"\n /note=\"basis of mobility region from pBR322\"\n primer_bind complement(5605..5624)\n /label=\"pRS-marker\"\n /note=\"pRS vectors, use to sequence yeast selectable\n marker\"\n primer_bind 5765..5787\n /label=\"pGEX 3'\"\n /note=\"pGEX vectors, reverse primer\"\n rep_origin 6023..6217\n /label=\"pVS1 oriV\"\n /note=\"origin of replication for the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n CDS complement(6283..7356)\n /codon_start=1\n /product=\"replication protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 RepA\"\n /translation=\"MSGRKPSGPVQIGAALGDDLVEKLKAAQAAQRQRIEAEARPGESW\n QAAADRIRKESRQPPAAGAPSIRKPPKGDEQPDFFVPMLYDVGTRDSRSIMDVAVFRLS\n KRDRRAGEVIRYELPDGHVEVSAGPAGMASVWDYDLVLMAVSHLTESMNRYREGKGDKP\n GRVFRPHVADVLKFCRRADGGKQKDDLVETCIRLNTTHVAMQRTKKAKNGRLVTVSEGE\n ALISRYKIVKSETGRPEYIEIELADWMYREITEGKNPDVLTVHPDYFLIDPGIGRFLYR\n LARRAAGKAEARWLFKTIYERSGSAGEFKKFCFTVRKLIGSNDLPEYDLKEEAGQAGPI\n LVMRYRNLIEGEASAGS\"\n CDS complement(7785..8414)\n /codon_start=1\n /product=\"stability protein from the Pseudomonas plasmid\n pVS1 (Heeb et al., 2000)\"\n /label=\"pVS1 StaA\"\n /translation=\"MKVIAVLNQKGGSGKTTIATHLARALQLAGADVLLVDSDPQGSAR\n DWAAVREDQPLTVVGIDRPTIDRDVKAIGRRDFVVIDGAPQAADLAVSAIKAADFVLIP\n VQPSPYDIWATADLVELVKQRIEVTDGRLQAAFVVSRAIKGTRIGGEVAEALAGYELPI\n LESRITQRVSYPGTAAAGTTVLESEPEGDAAREVQALAAEIKSKLI\"\n misc_feature 9745..9769\n /label=\"RB T-DNA repeat\"\n /note=\"right border repeat from nopaline C58 T-DNA\"\n primer_bind 9843..9865\n /label=\"M13/pUC Forward\"\n /note=\"In lacZ gene\"\n primer_bind 9857..9874\n /label=\"M13 Forward\"\n /note=\"In lacZ gene. Also called M13-F20 or M13 (-21)\n Forward\"\n primer_bind 9858..9874\n /label=\"M13 fwd\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n protein_bind 9882..10005\n /gene=\"mutant version of attR\"\n /label=\"attR3\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\n promoter 10030..10060\n /label=\"lac UV5 promoter\"\n /note=\"E. coli lac promoter with an \"\"up\"\" mutation\"\n CDS 10114..10794\n /codon_start=1\n /product=\"chloramphenicol acetyltransferase\"\n /label=\"CmR\"\n /note=\"confers resistance to chloramphenicol\"\n /translation=\"MEKKITGYTTVDISQWHRKEHFEAFQSVAQCTYNQTVQLDITAFL\n KTVKKNKHKFYPAFIHILARLMNAHPEFRMAMKDGELVIWDSVHPCYTVFHEQTETFSS\n LWSEYHDDFRQFLHIYSQDVACYGENLAYFPKGFIENMFFVSANPWVSFTSFDLNVANM\n DNFFAPVFTMGKYYTQGDKVLMPLAIQVHHAVCDGFHVGRMLNELQQYCDEWQAGRNLE\n DPAY\"\n primer_bind complement(10180..10199)\n /label=\"CAT-R\"\n /note=\"Chloramphenicol resistance gene, reverse primer\"\n CDS 11114..11419\n /codon_start=1\n /gene=\"ccdB\"\n /product=\"CcdB, a bacterial toxin that poisons DNA gyrase\"\n /label=\"ccdB\"\n /note=\"Plasmids containing the ccdB gene cannot be\n propagated in standard E. coli strains.\"\n /translation=\"MQFKVYTYKRESRYRLFVDVQSDIIDTPGRRMVIPLASARLLSDK\n VPRELYPVVHIGDESWRMMTTDMASVPVSVIGEEVADLSHRENDIKNAINLMFWGI\"\n primer_bind 11298..11317\n /label=\"ccdB-fwd\"\n /note=\"ccdB gene, forward primer\"\n protein_bind complement(11460..11583)\n /gene=\"mutant version of attR\"\n /label=\"attR4\"\n /bound_moiety=\"LR Clonase(TM)\"\n /note=\"recombination site for the Gateway(R) LR reaction\"\n primer_bind complement(11603..11619)\n /label=\"M13 rev\"\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n primer_bind complement(11603..11619)\n /label=\"M13 Reverse\"\n /note=\"In lacZ gene. Also called M13-rev\"\n primer_bind complement(11616..11638)\n /label=\"M13/pUC Reverse\"\n /note=\"In lacZ gene\"\nORIGIN\n 1 cttcaagtgt atgtaggtat agtaacatga acaagaacag actcaagtac aagatcgcat\n 61 acgaaaatgg aaatggcaat gtcacttcca cataatcaaa cacgaatcct catatcaaca\n 121 aggcctgaga ttctaactag ctcataacaa cttagccaat agttacttga gactaccaaa\n 181 tgtatgtaga actaaagact aagggacaga gagttcgtct aaacaggtga atctagtcgt\n 241 tgttatctaa taaacaattc agccccaaat gcagaacaca catagagctc tctattgatt\n 301 caaattacga tctgatactg ataacgtcta gatttttagg gttaaagcaa tcaatcacct\n 361 gacgattcaa ggtggttgga tcatgacgat tccagaaaac atcaagcaag ctctcaaagc\n 421 tacactcttt gggatcatac tgaactctaa caacctcgtt atgtcccgta gtgccagtac\n 481 agacatcctc gtaactcgga ttgtgcacga tgccatggct atacccaacc tcggtcttgg\n 541 tcacaccagg aactctctgg taagctagct ccactcccca gaaacaaccg gcgccaaatt\n 601 gcgcgaattg ctgacctgaa gacggaacat catcgtcggg tccttgggcg attgcggcgg\n 661 aagatgggtc agcttgggct tgaggacgag acccgaatcc gagtctgttg aaaaggttgt\n 721 tcattgggga tttgtatacg gagattggtc gtcgagaggt ttgagggaaa ggacaaatgg\n 781 gtttggctct ggagaaagag agtgcggctt tagagagaga attgagaggt ttagagagag\n 841 atgcggcggc gatgagcgga ggagagacga cgaggacctg cattatcaaa gcagtgacgt\n 901 ggtgaaattt ggaactttta agaggcagat agatttatta tttgtatcca ttttcttcat\n 961 tgttctagaa tgtcgcggaa caaattttaa aactaaatcc taaatttttc taattttgtt\n 1021 gccaatagtg gatatgtggg ccgtatagaa ggaatctatt gaaggcccaa acccatactg\n 1081 acgagcccaa aggttcgttt tgcgttttat gtttcggttc gatgccaacg ccacattctg\n 1141 agctaggcaa aaaacaaacg tgtctttgaa tagactcctc tcgttaacac atgcagcggc\n 1201 tgcatggtga cgccattaac acgtggccta caattgcatg atgtctccat tgacacgtga\n 1261 cttctcgtct cctttcttaa tatatctaac aaacactcct acctcttcca aaatatatac\n 1321 acatcttttt gatcaatctc tcattcaaaa tctcattctc tctagtaaac aagaacaaaa\n 1381 aaatggcgga tacagctaga ggaacccatc acgatatcat cggcagagac cagtacccga\n 1441 tgatgggccg agaccgagac cagtaccaga tgtccggacg aggatctgac tactccaagt\n 1501 ctaggcagat tgctaaagct gcaactgctg tcacagctgg tggttccctc cttgttctct\n 1561 ccagccttac ccttgttgga actgtcatag ctttgactgt tgcaacacct ctgctcgtta\n 1621 tcttcagccc aatccttgtc ccggctctca tcacagttgc actcctcatc accggttttc\n 1681 tttcctctgg agggtttggc attgccgcta taaccgtttt ctcttggatt tacaagtaag\n 1741 cacacattta tcatcttact tcataatttt gtgcaatatg tgcatgcatg tgttgagcca\n 1801 gtagctttgg atcaattttt ttggtcgaat aacaaatgta acaataagaa attgcaaatt\n 1861 ctagggaaca tttggttaac taaatacgaa atttgaccta gctagcttga atgtgtctgt\n 1921 gtatatcatc tatataggta aaatgcttgg tatgatacct attgattgtg aataggtacg\n 1981 caacgggaga gcacccacag ggatcagaca agttggacag tgcaaggatg aagttgggaa\n 2041 gcaaagctca ggatctgaaa gacagagctc agtactacgg acagcaacat actggtgggg\n 2101 aacatgaccg tgaccgtact cgtggtggcc agcacactac tatgagcgag ctgattaagg\n 2161 agaacatgca catgaagctg tacatggagg gcaccgtgaa caaccaccac ttcaagtgca\n 2221 catccgaggg cgaaggcaag ccctacgagg gcacccagac catgagaatc aaggtggtcg\n 2281 agggcggccc tctccccttc gccttcgaca tcctggctac cagcttcatg tacggcagca\n 2341 gaaccttcat caaccacacc cagggcatcc ccgacttctt taagcagtcc ttccctgagg\n 2401 gcttcacatg ggagagagtc accacatacg aagacggggg cgtgctgacc gctacccagg\n 2461 acaccagcct ccaggacggc tgcctcatct acaacgtcaa gatcagaggg gtgaacttcc\n 2521 catccaacgg ccctgtgatg cagaagaaaa cactcggctg ggaggccaac accgagatgc\n 2581 tgtaccccgc tgacggcggc ctggaaggca gaagcgacat ggccctgaag ctcgtgggcg\n 2641 ggggccacct gatctgcaac ttcaagacca catacagatc caagaaaccc gctaagaacc\n 2701 tcaagatgcc cggcgtctac tatgtggacc acagactgga aagaatcaag gaggccgaca\n 2761 aagagaccta cgtcgagcag cacgaggtgg ctgtggccag atactgcgac ctccctagca\n 2821 aactggggca caagtgatct agtaacatag atgacaccgc gcgcgataat ttatcctagt\n 2881 ttgcgcgcta tattttgttt tctatcgcgt attaaatgta taattgcggg actctaatca\n 2941 taaaaaccca tctcataaat aacgtcatgc attacatgtt aattattaca tgcttaacgt\n 3001 aattcaacag aaattatatg ataatcatcg caagaccggc aacaggattc aatcttaaga\n 3061 aactttattg ccaaatgttt gaacgatggt accctgcatg caagctgata attcaattcg\n 3121 gcgttaattc agtacattaa aaacgtccgc aatgtgttat taagttgtct aagcgtcaat\n 3181 ttgtttacac cacaatatat cctgccacca gccagccaac agctccccga ccggcagctc\n 3241 ggcacaaaat caccactcga tacaggcagc ccatcagtcc gggacggcgt cagcgggaga\n 3301 gccgttgtaa ggcggcagac tttgctcatg ttaccgatgc tattcggaag aacggcaact\n 3361 aagctgccgg gtttgaaaca cggatgatct cgcggagggt agcatgttga ttgtaacgat\n 3421 gacagagcgt tgctgcctgt gatcaattcg ggcacgaacc cagtggacat aagcctgttc\n 3481 ggttcgtaag ctgtaatgca agtagcgtat gcgctcacgc aactggtcca gaaccttgac\n 3541 cgaacgcagc ggtggtaacg gcgcagtggc ggttttcatg gcttgttatg actgtttttt\n 3601 tggggtacag tctatgcctc gggcatccaa gcagcaagcg cgttacgccg tgggtcgatg\n 3661 tttgatgtta tggagcagca acgatgttac gcagcagggc agtcgcccta aaacaaagtt\n 3721 aaacatcatg ggggaagcgg tgatcgccga agtatcgact caactatcag aggtagttgg\n 3781 cgtcatcgag cgccatctcg aaccgacgtt gctggccgta catttgtacg gctccgcagt\n 3841 ggatggcggc ctgaagccac acagtgatat tgatttgctg gttacggtga ccgtaaggct\n 3901 tgatgaaaca acgcggcgag ctttgatcaa cgaccttttg gaaacttcgg cttcccctgg\n 3961 agagagcgag attctccgcg ctgtagaagt caccattgtt gtgcacgacg acatcattcc\n 4021 gtggcgttat ccagctaagc gcgaactgca atttggagaa tggcagcgca atgacattct\n 4081 tgcaggtatc ttcgagccag ccacgatcga cattgatctg gctatcttgc tgacaaaagc\n 4141 aagagaacat agcgttgcct tggtaggtcc agcggcggag gaactctttg atccggttcc\n 4201 tgaacaggat ctatttgagg cgctaaatga aaccttaacg ctatggaact cgccgcccga\n 4261 ctgggctggc gatgagcgaa atgtagtgct tacgttgtcc cgcatttggt acagcgcagt\n 4321 aaccggcaaa atcgcgccga aggatgtcgc tgccgactgg gcaatggagc gcctgccggc\n 4381 ccagtatcag cccgtcatac ttgaagctag acaggcttat cttggacaag aagaagatcg\n 4441 cttggcctcg cgcgcagatc agttggaaga atttgtccac tacgtgaaag gcgagatcac\n 4501 caaggtagtc ggcaaataat gtctagctag aaattcgttc aagccgacgc cgcttcgcgg\n 4561 cgcggcttaa ctcaagcgtt agatgcacta agcacataat tgctcacagc caaactatca\n 4621 ggtcaagtct gcttttatta tttttaagcg tgcataataa gccctacaca aattgggaga\n 4681 tatatcatgc atgaccaaaa tcccttaacg tgagttttcg ttccactgag cgtcagaccc\n 4741 cgtagaaaag atcaaaggat cttcttgaga tccttttttt ctgcgcgtaa tctgctgctt\n 4801 gcaaacaaaa aaaccaccgc taccagcggt ggtttgtttg ccggatcaag agctaccaac\n 4861 tctttttccg aaggtaactg gcttcagcag agcgcagata ccaaatactg tccttctagt\n 4921 gtagccgtag ttaggccacc acttcaagaa ctctgtagca ccgcctacat acctcgctct\n 4981 gctaatcctg ttaccagtgg ctgctgccag tggcgataag tcgtgtctta ccgggttgga\n 5041 ctcaagacga tagttaccgg ataaggcgca gcggtcgggc tgaacggggg gttcgtgcac\n 5101 acagcccagc ttggagcgaa cgacctacac cgaactgaga tacctacagc gtgagctatg\n 5161 agaaagcgcc acgcttcccg aagggagaaa ggcggacagg tatccggtaa gcggcagggt\n 5221 cggaacagga gagcgcacga gggagcttcc agggggaaac gcctggtatc tttatagtcc\n 5281 tgtcgggttt cgccacctct gacttgagcg tcgatttttg tgatgctcgt caggggggcg\n 5341 gagcctatgg aaaaacgcca gcaacgcggc ctttttacgg ttcctggcct tttgctggcc\n 5401 ttttgctcac atgttctttc ctgcgttatc ccctgattct gtggataacc gtattaccgc\n 5461 ctttgagtga gctgataccg ctcgccgcag ccgaacgacc gagcgcagcg agtcagtgag\n 5521 cgaggaagcg gaagagcgcc tgatgcggta ttttctcctt acgcatctgt gcggtatttc\n 5581 acaccgcata tggtgcactc tcagtacaat ctgctctgat gccgcatagt taagccagta\n 5641 tacactccgc tatcgctacg tgactgggtc atggctgcgc cccgacaccc gccaacaccc\n 5701 gctgacgcgc cctgacgggc ttgtctgctc ccggcatccg cttacagaca agctgtgacc\n 5761 gtctccggga gctgcatgtg tcagaggttt tcaccgtcat caccgaaacg cgcgaggcag\n 5821 ggtgccttga tgtgggcgcc ggcggtcgag tggcgacggc gcggcttgtc cgcgccctgg\n 5881 tagattgcct ggccgtaggc cagccatttt tgagcggcca gcggccgcga taggccgacg\n 5941 cgaagcggcg gggcgtaggg agcgcagcga ccgaagggta ggcgcttttt gcagctcttc\n 6001 ggctgtgcgc tggccagaca gttatgcaca ggccaggcgg gttttaagag ttttaataag\n 6061 ttttaaagag ttttaggcgg aaaaatcgcc ttttttctct tttatatcag tcacttacat\n 6121 gtgtgaccgg ttcccaatgt acggctttgg gttcccaatg tacgggttcc ggttcccaat\n 6181 gtacggcttt gggttcccaa tgtacgtgct atccacagga aagagacctt ttcgaccttt\n 6241 ttcccctgct agggcaattt gccctagcat ctgctccgta cattaggaac cggcggatgc\n 6301 ttcgccctcg atcaggttgc ggtagcgcat gactaggatc gggccagcct gccccgcctc\n 6361 ctccttcaaa tcgtactccg gcaggtcatt tgacccgatc agcttgcgca cggtgaaaca\n 6421 gaacttcttg aactctccgg cgctgccact gcgttcgtag atcgtcttga acaaccatct\n 6481 ggcttctgcc ttgcctgcgg cgcggcgtgc caggcggtag agaaaacggc cgatgccggg\n 6541 atcgatcaaa aagtaatcgg ggtgaaccgt cagcacgtcc gggttcttgc cttctgtgat\n 6601 ctcgcggtac atccaatcag ctagctcgat ctcgatgtac tccggccgcc cggtttcgct\n 6661 ctttacgatc ttgtagcggc taatcaaggc ttcaccctcg gataccgtca ccaggcggcc\n 6721 gttcttggcc ttcttcgtac gctgcatggc aacgtgcgtg gtgtttaacc gaatgcaggt\n 6781 ttctaccagg tcgtctttct gctttccgcc atcggctcgc cggcagaact tgagtacgtc\n 6841 cgcaacgtgt ggacggaaca cgcggccggg cttgtctccc ttcccttccc ggtatcggtt\n 6901 catggattcg gttagatggg aaaccgccat cagtaccagg tcgtaatccc acacactggc\n 6961 catgccggcc ggccctgcgg aaacctctac gtgcccgtct ggaagctcgt agcggatcac\n 7021 ctcgccagct cgtcggtcac gcttcgacag acggaaaacg gccacgtcca tgatgctgcg\n 7081 actatcgcgg gtgcccacgt catagagcat cggaacgaaa aaatctggtt gctcgtcgcc\n 7141 cttgggcggc ttcctaatcg acggcgcacc ggctgccggc ggttgccggg attctttgcg\n 7201 gattcgatca gcggccgctt gccacgattc accggggcgt gcttctgcct cgatgcgttg\n 7261 ccgctgggcg gcctgcgcgg ccttcaactt ctccaccagg tcatcaccca gcgccgcgcc\n 7321 gatttgtacc gggccggatg gtttgcgacc gctcacgccg attcctcggg cttgggggtt\n 7381 ccagtgccat tgcagggccg gcagacaacc cagccgctta cgcctggcca accgcccgtt\n 7441 cctccacaca tggggcattc cacggcgtcg gtgcctggtt gttcttgatt ttccatgccg\n 7501 cctcctttag ccgctaaaat tcatctactc atttattcat ttgctcattt actctggtag\n 7561 ctgcgcgatg tattcagata gcagctcggt aatggtcttg ccttggcgta ccgcgtacat\n 7621 cttcagcttg gtgtgatcct ccgccggcaa ctgaaagttg acccgcttca tggctggcgt\n 7681 gtctgccagg ctggccaacg ttgcagcctt gctgctgcgt gcgctcggac ggccggcact\n 7741 tagcgtgttt gtgcttttgc tcattttctc tttacctcat taactcaaat gagttttgat\n 7801 ttaatttcag cggccagcgc ctggacctcg cgggcagcgt cgccctcggg ttctgattca\n 7861 agaacggttg tgccggcggc ggcagtgcct gggtagctca cgcgctgcgt gatacgggac\n 7921 tcaagaatgg gcagctcgta cccggccagc gcctcggcaa cctcaccgcc gatgcgcgtg\n 7981 cctttgatcg cccgcgacac gacaaaggcc gcttgtagcc ttccatccgt gacctcaatg\n 8041 cgctgcttaa ccagctccac caggtcggcg gtggcccata tgtcgtaagg gcttggctgc\n 8101 accggaatca gcacgaagtc ggctgccttg atcgcggaca cagccaagtc cgccgcctgg\n 8161 ggcgctccgt cgatcactac gaagtcgcgc cggccgatgg ccttcacgtc gcggtcaatc\n 8221 gtcgggcggt cgatgccgac aacggttagc ggttgatctt cccgcacggc cgcccaatcg\n 8281 cgggcactgc cctggggatc ggaatcgact aacagaacat cggccccggc gagttgcagg\n 8341 gcgcgggcta gatgggttgc gatggtcgtc ttgcctgacc cgcctttctg gttaagtaca\n 8401 gcgataacct tcatgcgttc cccttgcgta tttgtttatt tactcatcgc atcatatacg\n 8461 cagcgaccgc atgacgcaag ctgttttact caaatacaca tcaccttttt agacggcggc\n 8521 gctcggtttc ttcagcggcc aagctggccg gccaggccgc cagcttggca tcagacaaac\n 8581 cggccaggat ttcatgcagc cgcacggttg agacgtgcgc gggcggctcg aacacgtacc\n 8641 cggccgcgat catctccgcc tcgatctctt cggtaatgaa aaacggttcg tcctggccgt\n 8701 cctggtgcgg tttcatgctt gttcctcttg gcgttcattc tcggcggccg ccagggcgtc\n 8761 ggcctcggtc aatgcgtcct cacggaaggc accgcgccgc ctggcctcgg tgggcgtcac\n 8821 ttcctcgctg cgctcaagtg cgcggtacag ggtcgagcga tgcacgccaa gcagtgcagc\n 8881 cgcctctttc acggtgcggc cttcctggtc gatcagctcg cgggcgtgcg cgatctgtgc\n 8941 cggggtgagg gtagggcggg ggccaaactt cacgcctcgg gccttggcgg cctcgcgccc\n 9001 gctccgggtg cggtcgatga ttagggaacg ctcgaactcg gcaatgccgg cgaacacggt\n 9061 caacaccatg cggccggccg gcgtggtggt gtcggcccac ggctctgcca ggctacgcag\n 9121 gcccgcgccg gcctcctgga tgcgctcggc aatgtccagt aggtcgcggg tgctgcgggc\n 9181 caggcggtct agcctggtca ctgtcacaac gtcgccaggg cgtaggtggt caagcatcct\n 9241 ggccagctcc gggcggtcgc gcctggtgcc ggtgatcttc tcggaaaaca gcttggtgca\n 9301 gccggccgcg tgcagttcgg cccgttggtt ggtcaagtcc tggtcgtcgg tgctgacgcg\n 9361 ggcatagccc agcaggccag cggcggcgct cttgttcatg gcgtaatgtc tccggttcta\n 9421 gtcgcaagta ttctacttta tgcgactaaa acacgcgaca agaaaacgcc aggaaaaggg\n 9481 cagggcggca gcctgtcgcg taacttagga cttgtgcgac atgtcgtttt cagaagacgg\n 9541 ctgcactgaa cgtcagaagc cgactgcact atagcagcgg aggggttgga tcaaagtact\n 9601 ttaaagtact ttaaagtact ttaaagtact ttgatcccga ggggaaccct gtggttggca\n 9661 tgcacataca aatggacgaa cggataaacc ttttcacgcc cttttaaata tccgattatt\n 9721 ctaataaacg ctcttttctc ttaggtttac ccgccaatat atcctgtcaa acactgatag\n 9781 tttaaactga aggcgggaaa cgacaatctg atccaagctc aagctaagct tgagctcgtt\n 9841 ttcccagtca cgacgttgta aaacgacggc cagtgaatta tcaactatgt ataataaagt\n 9901 tgaacgagaa acgtaaaatg atataaatat caatatatta aattagattt tgcataaaaa\n 9961 acagactaca taatactgta aaacacaaca tatccagtca ctatggcggc cgcattaggc\n 10021 accccaggct ttacacttta tgcttccggc tcgtataatg tgtggatttt gagttaggat\n 10081 ccgtcgagat tttcaggagc taaggaagct aaaatggaga aaaaaatcac tggatatacc\n 10141 accgttgata tatcccaatg gcatcgtaaa gaacattttg aggcatttca gtcagttgct\n 10201 caatgtacct ataaccagac cgttcagctg gatattacgg cctttttaaa gaccgtaaag\n 10261 aaaaataagc acaagtttta tccggccttt attcacattc ttgcccgcct gatgaatgct\n 10321 catccggaat tccgtatggc aatgaaagac ggtgagctgg tgatatggga tagtgttcac\n 10381 ccttgttaca ccgttttcca tgagcaaact gaaacgtttt catcgctctg gagtgaatac\n 10441 cacgacgatt tccggcagtt tctacacata tattcgcaag atgtggcgtg ttacggtgaa\n 10501 aacctggcct atttccctaa agggtttatt gagaatatgt ttttcgtctc agccaatccc\n 10561 tgggtgagtt tcaccagttt tgatttaaac gtggccaata tggacaactt cttcgccccc\n 10621 gttttcacca tgggcaaata ttatacgcaa ggcgacaagg tgctgatgcc gctggcgatt\n 10681 caggttcatc atgccgtttg tgatggcttc catgtcggca gaatgcttaa tgaattacaa\n 10741 cagtactgcg atgagtggca ggcggggcgt aatctagagg atccggctta ctaaaagcca\n 10801 gataacagta tgcgtatttg cgcgctgatt tttgcggtat aagaatatat actgatatgt\n 10861 atacccgaag tatgtcaaaa agaggtatgc tatgaagcag cgtattacag tgacagttga\n 10921 cagcgacagc tatcagttgc tcaaggcata tatgatgtca gtatctccgg ttcggtaagc\n 10981 acaaccatgc agaatgaagc ccgtcgtctg cgtgccgaac gctggaaagc ggaaaatcaa\n 11041 gaagggatgg ctgaggtcgc ccggtttatt gaaatgaacg gctcttttgc cgacgagaac\n 11101 aggggctggt gaaatgcagt ttaaggttta cacctataaa agagagagcc gttatcgtct\n 11161 gtttgtggat gtacagagtg atattattga cacgcccggg cgacggatgg tgatccccct\n 11221 ggccagtgca cgtctgctgt cagataaagt cccccgtgaa ctttacccgg tggtgcatat\n 11281 cggggatgaa agctggcgca tgatgaccac cgatatggcc agtgtgccgg tctccgttat\n 11341 cggggaagaa gtggctgatc tcagccaccg cgaaaatgac atcaaaaacg ccattaacct\n 11401 gatgttctgg ggaatataaa tgtcaggctc ccttatacac agccagtctg caggtcgacc\n 11461 atagtgactg gatatgttgt gttttacagt attatgtagt ctgtttttta tgcaaaatct\n 11521 aatttaatat attgatattt atatcatttt acgtttctcg ttcaactttt ctatacaaag\n 11581 ttgatagctt ggcgtaatca tggtcatagc tgtttcctgt gtgaaattgt tatccgctcg\n 11641 ggccctctag aggatccccg ggtacc\n//"
42
42
  },
43
43
  {
44
- "id": 12,
44
+ "id": 6,
45
45
  "type": "TextFileSequence",
46
46
  "sequence_file_format": "genbank",
47
47
  "overhang_crick_3prime": 0,
@@ -49,7 +49,7 @@
49
49
  "file_content": "LOCUS pDONR_P2r-P3 4773 bp DNA circular SYN 06-MAR-2024\nDEFINITION .\nACCESSION <unknown id>\nVERSION <unknown id>\nKEYWORDS .\nSOURCE .\n ORGANISM .\n .\nFEATURES Location/Qualifiers\n CDS 3167..3976\n /codon_start=1\n /gene=\"aph(3')-Ia\"\n /note=\"confers resistance to kanamycin in bacteria or G418\n (Geneticin\u00ae) in eukaryotes\"\n /product=\"aminoglycoside phosphotransferase\"\n /transl_table=1\n /translation=\"MSHIQRETSRPRLNSNMDADLYGYKWARDNVGQSGATIYRLYGKP\n DAPELFLKHGKGSVANDVTDEMVRLNWLTEFMPLPTIKHFIRTPDDAWLLTTAIPGKTA\n FQVLEEYPDSGENIVDALAVFLRRLHSIPVCNCPFNSDRVFRLAQAQSRMNNGLVDASD\n FDDERNGWPVEQVWKEMHKLLPFSPDSVVTHGDFSLDNLIFDEGKLIGCIDVGRVGIAD\n RYQDLAILWNCLGEFSPSLQKRLFQKYGIDNPDMNKLQFHLMLDEFF*\"\n /label=\"KanR\"\n CDS 1083..1742\n /codon_start=1\n /gene=\"cat\"\n /note=\"confers resistance to chloramphenicol\"\n /product=\"chloramphenicol acetyltransferase\"\n /transl_table=1\n /translation=\"MEKKITGYTTVDISQWHRKEHFEAFQSVAQCTYNQTVQLDITAFL\n KTVKKNKHKFYPAFIHILARLMNAHPEFRMAMKDGELVIWDSVHPCYTVFHEQTETFSS\n LWSEYHDDFRQFLHIYSQDVACYGENLAYFPKGFIENMFFVSANPWVSFTSFDLNVANM\n DNFFAPVFTMGKYYTQGDKVLMPLAIQVHHAVCDGFHVGRMLNELQQYCDEWQGGA*\"\n /label=\"CmR\"\n rep_origin 4123..4711\n /direction=RIGHT\n /note=\"high-copy-number ColE1/pMB1/pBR322/pUC origin of\n replication\"\n /label=\"ori\"\n CDS 2084..2389\n /codon_start=1\n /gene=\"ccdB\"\n /note=\"Plasmids containing the ccdB gene cannot be\n propagated in standard E. coli strains.\"\n /product=\"CcdB, a bacterial toxin that poisons DNA gyrase\"\n /transl_table=1\n /translation=\"MQFKVYTYKRESRYRLFVDVQSDIIDTPGRRMVIPLASARLLSDK\n VSRELYPVVHIGDESWRMMTTDMASVPVSVIGEEVADLSHRENDIKNAINLMFWGI*\"\n /label=\"ccdB\"\n protein_bind complement(591..822)\n /bound_moiety=\"BP Clonase\u2122\"\n /gene=\"mutant version of attP\"\n /note=\"recombination site for the Gateway\u00ae BP reaction\"\n /label=\"attP2\"\n protein_bind complement(2746..2977)\n /bound_moiety=\"BP Clonase\u2122\"\n /gene=\"mutant version of attP\"\n /note=\"recombination site for the Gateway\u00ae BP reaction\"\n /label=\"attP3\"\n promoter 980..1082\n /note=\"promoter of the E. coli cat gene\"\n /label=\"cat promoter\"\n terminator 387..473\n /gene=\"Escherichia coli rrnB\"\n /note=\"transcription terminator T1 from the E. coli rrnB\n gene\"\n /label=\"rrnB T1 terminator\"\n terminator 268..295\n /note=\"transcription terminator T2 from the E. coli rrnB\n gene\"\n /label=\"rrnB T2 terminator\"\n primer_bind 537..553\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n /label=\"M13 fwd\"\n primer_bind complement(3038..3054)\n /note=\"common sequencing primer, one of multiple similar\n variants\"\n /label=\"M13 rev\"\nORIGIN\n 1 ctttcctgcg ttatcccctg attctgtgga taaccgtatt accgcctttg agtgagctga\n 61 taccgctcgc cgcagccgaa cgaccgagcg cagcgagtca gtgagcgagg aagcggaaga\n 121 gcgcccaata cgcaaaccgc ctctccccgc gcgttggccg attcattaat gcagctggca\n 181 cgacaggttt cccgactgga aagcgggcag tgagcgcaac gcaattaata cgcgtaccgc\n 241 tagccaggaa gagtttgtag aaacgcaaaa aggccatccg tcaggatggc cttctgctta\n 301 gtttgatgcc tggcagttta tggcgggcgt cctgcccgcc accctccggg ccgttgcttc\n 361 acaacgttca aatccgctcc cggcggattt gtcctactca ggagagcgtt caccgacaaa\n 421 caacagataa aacgaaaggc ccagtcttcc gactgagcct ttcgttttat ttgatgcctg\n 481 gcagttccct actctcgcgt taacgctagc atggatgttt tcccagtcac gacgttgtaa\n 541 aacgacggcc agtcttaagc tcgggccctg cagctctaga gctcgaattc tacaggtcac\n 601 taataccatc taagtagttg attcatagtg actgcatatg ttgtgtttta cagtattatg\n 661 tagtctgttt tttatgcaaa atctaattta atatattgat atttatatca ttttacgttt\n 721 ctcgttcaac tttcttgtac aaagttggca ttataaaaaa gcattgctta tcaatttgtt\n 781 gcaacgaaca ggtcactatc agtcaaaata aaatcattat ttggagctct agagcgtcga\n 841 ctaagttggc agcatcaccc gacgcacttt gcgccgaata aatacctgtg acggaagatc\n 901 acttcgcaga ataaataaat cctggtgtcc ctgttgatac cgggaagccc tgggccaact\n 961 tttggcgaaa atgagacgtt gatcggcacg taagaggttc caactttcac cataatgaaa\n 1021 taagatcact accgggcgta ttttttgagt tatcgagatt ttcaggagct aaggaagcta\n 1081 aaatggagaa aaaaatcact ggatatacca ccgttgatat atcccaatgg catcgtaaag\n 1141 aacattttga ggcatttcag tcagttgctc aatgtaccta taaccagacc gttcagctgg\n 1201 atattacggc ctttttaaag accgtaaaga aaaataagca caagttttat ccggccttta\n 1261 ttcacattct tgcccgcctg atgaatgctc atccggaatt ccgtatggca atgaaagacg\n 1321 gtgagctggt gatatgggat agtgttcacc cttgttacac cgttttccat gagcaaactg\n 1381 aaacgttttc atcgctctgg agtgaatacc acgacgattt ccggcagttt ctacacatat\n 1441 attcgcaaga tgtggcgtgt tacggtgaaa acctggccta tttccctaaa gggtttattg\n 1501 agaatatgtt tttcgtctca gccaatccct gggtgagttt caccagtttt gatttaaacg\n 1561 tggccaatat ggacaacttc ttcgcccccg ttttcaccat gggcaaatat tatacgcaag\n 1621 gcgacaaggt gctgatgccg ctggcgattc aggttcatca tgccgtctgt gatggcttcc\n 1681 atgtcggcag aatgcttaat gaattacaac agtactgcga tgagtggcag ggcggggcgt\n 1741 aatcgcgtgg atccggctta ctaaaagcca gataacagta tgcgtatttg cgcgctgatt\n 1801 tttgcggtat aagaatatat actgatatgt atacccgaag tatgtcaaaa agaggtgtgc\n 1861 tatgaagcag cgtattacag tgacagttga cagcgacagc tatcagttgc tcaaggcata\n 1921 tatgatgtca atatctccgg tctggtaagc acaaccatgc agaatgaagc ccgtcgtctg\n 1981 cgtgccgaac gctggaaagc ggaaaatcag gaagggatgg ctgaggtcgc ccggtttatt\n 2041 gaaatgaacg gctcttttgc tgacgagaac agggactggt gaaatgcagt ttaaggttta\n 2101 cacctataaa agagagagcc gttatcgtct gtttgtggat gtacagagtg atattattga\n 2161 cacgcccggg cgacggatgg tgatccccct ggccagtgca cgtctgctgt cagataaagt\n 2221 ctcccgtgaa ctttacccgg tggtgcatat cggggatgaa agctggcgca tgatgaccac\n 2281 cgatatggcc agtgtgccgg tctccgttat cggggaagaa gtggctgatc tcagccaccg\n 2341 cgaaaatgac atcaaaaacg ccattaacct gatgttctgg ggaatataaa tgtcaggctc\n 2401 ccttatacac agccagtctg caggtcgata cagtagaaat tacagaaact ttatcacgtt\n 2461 tagtaagtat agaggctgaa aatccagatg aagccgaacg acttgtaaga gaaaagtata\n 2521 agagttgtga aattgttctt gatgcagatg attttcagga ctatgacact agcgtatatg\n 2581 aataggtaga tgtttttatt ttgtcacaca aaaaagaggc tcgcacctct ttttcttatt\n 2641 tctttttatg atttaatacg gcattgagga caatagcgag taggctggat acgacgattc\n 2701 cgtttgagaa gaacatttgg aaggctgtcg gtcgagctcg aattctacag gtcactaata\n 2761 ccatctaagt agttgattca tagtgactgc atatgttgtg ttttacagta ttatgtagtc\n 2821 tgttttttat gcaaaatcta atttaatata ttgatattta tatcatttta cgtttctcgt\n 2881 tcaactttat tatacaaagt tggcattata aaaaagcatt gcttatcaat ttgttgcaac\n 2941 gaacaggtca ctatcagtca aaataaaatc attatttgga gctccatggt agcgttaacg\n 3001 cggccgcgat atcccctata gtgagtcgta ttacatggtc atagctgttt cctggcagct\n 3061 ctggcccgtg tctcaaaatc tctgatgtta cattgcacaa gataaaaata tatcatcatg\n 3121 aacaataaaa ctgtctgctt acataaacag taatacaagg ggtgttatga gccatattca\n 3181 acgggaaacg tcgaggccgc gattaaattc caacatggat gctgatttat atgggtataa\n 3241 atgggctcgc gataatgtcg ggcaatcagg tgcgacaatc tatcgcttgt atgggaagcc\n 3301 cgatgcgcca gagttgtttc tgaaacatgg caaaggtagc gttgccaatg atgttacaga\n 3361 tgagatggtc agactaaact ggctgacgga atttatgcct cttccgacca tcaagcattt\n 3421 tatccgtact cctgatgatg catggttact caccactgcg atccccggaa aaacagcatt\n 3481 ccaggtatta gaagaatatc ctgattcagg tgaaaatatt gttgatgcgc tggcagtgtt\n 3541 cctgcgccgg ttgcattcga ttcctgtttg taattgtcct tttaacagcg atcgcgtatt\n 3601 tcgtctcgct caggcgcaat cacgaatgaa taacggtttg gttgatgcga gtgattttga\n 3661 tgacgagcgt aatggctggc ctgttgaaca agtctggaaa gaaatgcata aacttttgcc\n 3721 attctcaccg gattcagtcg tcactcatgg tgatttctca cttgataacc ttatttttga\n 3781 cgaggggaaa ttaataggtt gtattgatgt tggacgagtc ggaatcgcag accgatacca\n 3841 ggatcttgcc atcctatgga actgcctcgg tgagttttct ccttcattac agaaacggct\n 3901 ttttcaaaaa tatggtattg ataatcctga tatgaataaa ttgcagtttc atttgatgct\n 3961 cgatgagttt ttctaatcag aattggttaa ttggttgtaa cactggcaga gcattacgct\n 4021 gacttgacgg gacggcgcaa gctcatgacc aaaatccctt aacgtgagtt acgcgtcgtt\n 4081 ccactgagcg tcagaccccg tagaaaagat caaaggatct tcttgagatc ctttttttct\n 4141 gcgcgtaatc tgctgcttgc aaacaaaaaa accaccgcta ccagcggtgg tttgtttgcc\n 4201 ggatcaagag ctaccaactc tttttccgaa ggtaactggc ttcagcagag cgcagatacc\n 4261 aaatactgtc cttctagtgt agccgtagtt aggccaccac ttcaagaact ctgtagcacc\n 4321 gcctacatac ctcgctctgc taatcctgtt accagtggct gctgccagtg gcgataagtc\n 4381 gtgtcttacc gggttggact caagacgata gttaccggat aaggcgcagc ggtcgggctg\n 4441 aacggggggt tcgtgcacac agcccagctt ggagcgaacg acctacaccg aactgagata\n 4501 cctacagcgt gagcattgag aaagcgccac gcttcccgaa gggagaaagg cggacaggta\n 4561 tccggtaagc ggcagggtcg gaacaggaga gcgcacgagg gagcttccag ggggaaacgc\n 4621 ctggtatctt tatagtcctg tcgggtttcg ccacctctga cttgagcgtc gatttttgtg\n 4681 atgctcgtca ggggggcgga gcctatggaa aaacgccagc aacgcggcct ttttacggtt\n 4741 cctggccttt tgctggcctt ttgctcacat gtt\n//"
50
50
  },
51
51
  {
52
- "id": 14,
52
+ "id": 7,
53
53
  "type": "TextFileSequence",
54
54
  "sequence_file_format": "genbank",
55
55
  "overhang_crick_3prime": 0,
@@ -57,7 +57,7 @@
57
57
  "file_content": "LOCUS U6-26_promoter 465 bp DNA linear UNK 01-JAN-1980\nDEFINITION description.\nACCESSION 14\nVERSION 14\nKEYWORDS .\nSOURCE \n ORGANISM .\n .\nFEATURES Location/Qualifiers\nORIGIN\n 1 ggggacagct ttcttgtaca aagtggaacg acttgccttc cgcacaatac atcatttctt\n 61 cttagctttt tttcttcttc ttcgttcata cagttttttt ttgtttatca gcttacattt\n 121 tcttgaaccg tagctttcgt tttcttcttt ttaactttcc attcggagtt tttgtatctt\n 181 gtttcatagt ttgtcccagg attagaatga ttaggcatcg aaccttcaag aatttgattg\n 241 aataaaacat cttcattctt aagatatgaa gataatcttc aaaaggcccc tgggaatctg\n 301 aaagaagaga agcaggccca tttatatggg aaagaacaat agtatttctt atataggccc\n 361 atttaagttg aaaacaatct tcaaaagtcc cacatcgctt agataagaaa acgaagctga\n 421 gtttatatac agctagagtc gaagtagtga ttaacatgag accat\n//"
58
58
  },
59
59
  {
60
- "id": 16,
60
+ "id": 8,
61
61
  "type": "TextFileSequence",
62
62
  "sequence_file_format": "genbank",
63
63
  "overhang_crick_3prime": 0,
@@ -65,7 +65,7 @@
65
65
  "file_content": "LOCUS U6-26_term 230 bp DNA linear UNK 01-JAN-1980\nDEFINITION description.\nACCESSION 16\nVERSION 16\nKEYWORDS .\nSOURCE \n ORGANISM .\n .\nFEATURES Location/Qualifiers\nORIGIN\n 1 taggtctccg cttttttttg caaaattttc cagatcgatt tcttcttcct ctgttcttcg\n 61 gcgttcaatt tctggggttt tctcttcgtt ttctgtaact gaaacctaaa atttgaccta\n 121 aaaaaaatct caaataatat gattcagtgg ttttgtactt ttcagttagt tgagttttgc\n 181 agttccgatg agataaacca atatcaactt tattatacaa agttgtcccc\n//"
66
66
  },
67
67
  {
68
- "id": 18,
68
+ "id": 9,
69
69
  "type": "TextFileSequence",
70
70
  "sequence_file_format": "genbank",
71
71
  "overhang_crick_3prime": 0,
@@ -76,145 +76,136 @@
76
76
  "sources": [
77
77
  {
78
78
  "id": 1,
79
- "input": [],
80
- "output": 2,
81
79
  "type": "AddgeneIdSource",
82
80
  "output_name": null,
83
81
  "database_id": null,
82
+ "input": [],
84
83
  "repository_id": "71287",
85
84
  "repository_name": "addgene",
86
85
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/352460/6c8b0369-e549-4517-95da-8d07146ca49d/addgene-plasmid-71287-sequence-352460.gbk",
87
86
  "addgene_sequence_type": "addgene-full"
88
87
  },
89
88
  {
90
- "id": 3,
91
- "input": [],
92
- "output": 4,
89
+ "id": 2,
93
90
  "type": "AddgeneIdSource",
94
91
  "output_name": null,
95
92
  "database_id": null,
93
+ "input": [],
96
94
  "repository_id": "71287",
97
95
  "repository_name": "addgene",
98
96
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/352460/6c8b0369-e549-4517-95da-8d07146ca49d/addgene-plasmid-71287-sequence-352460.gbk",
99
97
  "addgene_sequence_type": "addgene-full"
100
98
  },
101
99
  {
102
- "id": 5,
103
- "input": [],
104
- "output": 6,
100
+ "id": 3,
105
101
  "type": "AddgeneIdSource",
106
102
  "output_name": null,
107
103
  "database_id": null,
104
+ "input": [],
108
105
  "repository_id": "213912",
109
106
  "repository_name": "addgene",
110
107
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/437264/8bd82b44-a1c3-4f81-8936-ebcc16d171e9/addgene-plasmid-213912-sequence-437264.gbk",
111
108
  "addgene_sequence_type": "addgene-full"
112
109
  },
113
110
  {
114
- "id": 7,
115
- "input": [],
116
- "output": 8,
111
+ "id": 4,
117
112
  "type": "AddgeneIdSource",
118
113
  "output_name": null,
119
114
  "database_id": null,
115
+ "input": [],
120
116
  "repository_id": "213913",
121
117
  "repository_name": "addgene",
122
118
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/437263/af62d64e-1f22-4dce-aafa-7935d1665700/addgene-plasmid-213913-sequence-437263.gbk",
123
119
  "addgene_sequence_type": "addgene-full"
124
120
  },
125
121
  {
126
- "id": 9,
127
- "input": [],
128
- "output": 10,
122
+ "id": 5,
129
123
  "type": "AddgeneIdSource",
130
124
  "output_name": null,
131
125
  "database_id": null,
126
+ "input": [],
132
127
  "repository_id": "133748",
133
128
  "repository_name": "addgene",
134
129
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/271264/c0ae5f43-46e6-4175-a0c1-9a00cbb92034/addgene-plasmid-133748-sequence-271264.gbk",
135
130
  "addgene_sequence_type": "addgene-full"
136
131
  },
137
132
  {
138
- "id": 11,
139
- "input": [],
140
- "output": 12,
133
+ "id": 6,
141
134
  "type": "SnapGenePlasmidSource",
142
135
  "output_name": "pDONR_P2r-P3",
143
136
  "database_id": null,
137
+ "input": [],
144
138
  "repository_id": "gateway_cloning_vectors/pDONR_P2r-P3",
145
139
  "repository_name": "snapgene"
146
140
  },
147
141
  {
148
- "id": 13,
149
- "input": [
150
- 2
151
- ],
152
- "output": 14,
142
+ "id": 7,
153
143
  "type": "PCRSource",
154
144
  "output_name": "U6-26_promoter",
155
145
  "database_id": null,
156
- "circular": false,
157
- "assembly": [
146
+ "input": [
158
147
  {
159
- "sequence": 1,
148
+ "type": "AssemblyFragment",
149
+ "sequence": 10,
160
150
  "left_location": null,
161
151
  "right_location": "29..50",
162
152
  "reverse_complemented": false
163
153
  },
164
154
  {
165
- "sequence": 2,
155
+ "type": "AssemblyFragment",
156
+ "sequence": 1,
166
157
  "left_location": "8698..8719",
167
158
  "right_location": "9102..9121",
168
159
  "reverse_complemented": false
169
160
  },
170
161
  {
171
- "sequence": 2,
162
+ "type": "AssemblyFragment",
163
+ "sequence": 11,
172
164
  "left_location": "1..20",
173
165
  "right_location": null,
174
166
  "reverse_complemented": true
175
167
  }
176
168
  ],
169
+ "circular": false,
177
170
  "add_primer_features": false
178
171
  },
179
172
  {
180
- "id": 15,
181
- "input": [
182
- 4
183
- ],
184
- "output": 16,
173
+ "id": 8,
185
174
  "type": "PCRSource",
186
175
  "output_name": "U6-26_term",
187
176
  "database_id": null,
188
- "circular": false,
189
- "assembly": [
177
+ "input": [
190
178
  {
191
- "sequence": 13,
179
+ "type": "AssemblyFragment",
180
+ "sequence": 14,
192
181
  "left_location": null,
193
182
  "right_location": "10..37",
194
183
  "reverse_complemented": false
195
184
  },
196
185
  {
197
- "sequence": 4,
186
+ "type": "AssemblyFragment",
187
+ "sequence": 2,
198
188
  "left_location": "10418..10445",
199
189
  "right_location": "10590..10611",
200
190
  "reverse_complemented": false
201
191
  },
202
192
  {
203
- "sequence": 14,
193
+ "type": "AssemblyFragment",
194
+ "sequence": 15,
204
195
  "left_location": "1..22",
205
196
  "right_location": null,
206
197
  "reverse_complemented": true
207
198
  }
208
199
  ],
200
+ "circular": false,
209
201
  "add_primer_features": false
210
202
  },
211
203
  {
212
- "id": 17,
213
- "input": [],
214
- "output": 18,
204
+ "id": 9,
215
205
  "type": "AddgeneIdSource",
216
206
  "output_name": null,
217
207
  "database_id": null,
208
+ "input": [],
218
209
  "repository_id": "63143",
219
210
  "repository_name": "addgene",
220
211
  "sequence_file_url": "https://media.addgene.org/snapgene-media/v2.0.0/sequences/223326/8c81fe9a-fb57-40bc-93d6-e17d83502061/addgene-plasmid-63143-sequence-223326.gbk",
@@ -223,42 +214,42 @@
223
214
  ],
224
215
  "primers": [
225
216
  {
226
- "id": 1,
217
+ "id": 10,
227
218
  "type": "Primer",
228
219
  "name": "Fw-Primer1",
229
220
  "database_id": null,
230
221
  "sequence": "GGGGACAGCTTTCTTGTACAAAGTGGAACGACTTGCCTTCCGCACAATAC"
231
222
  },
232
223
  {
233
- "id": 2,
224
+ "id": 11,
234
225
  "type": "Primer",
235
226
  "name": "Rev-Primer2",
236
227
  "database_id": null,
237
228
  "sequence": "ATGGTCTCATGTTAATCACTACTTCGACTCTAG"
238
229
  },
239
230
  {
240
- "id": 3,
231
+ "id": 12,
241
232
  "type": "Primer",
242
233
  "name": "Fw-Primer3",
243
234
  "database_id": null,
244
235
  "sequence": "TAGGTCTCCAACAaagcaccagtggtctagtgg"
245
236
  },
246
237
  {
247
- "id": 12,
238
+ "id": 13,
248
239
  "type": "Primer",
249
240
  "name": "Rev-Primer12",
250
241
  "database_id": null,
251
242
  "sequence": "ATGGTCTCAAAGCaccgactcggtgccactttttc"
252
243
  },
253
244
  {
254
- "id": 13,
245
+ "id": 14,
255
246
  "type": "Primer",
256
247
  "name": "Fw-Primer13",
257
248
  "database_id": null,
258
249
  "sequence": "TAGGTCTCCGCTTTTTTTTGCAAAATTTTCCAGaTCG"
259
250
  },
260
251
  {
261
- "id": 14,
252
+ "id": 15,
262
253
  "type": "Primer",
263
254
  "name": "Rev-Primer14",
264
255
  "database_id": null,
@@ -267,7 +258,7 @@
267
258
  ],
268
259
  "description": "",
269
260
  "files": null,
270
- "schema_version": "0.2.9",
261
+ "schema_version": "0.4.3",
271
262
  "backend_version": null,
272
263
  "frontend_version": null
273
264
  }