From 9e19e2cdebf740cadace53949e4e2ace61b27ebd Mon Sep 17 00:00:00 2001 From: John SJ Anderson Date: Thu, 17 Oct 2024 10:30:28 -0700 Subject: [PATCH 1/2] Update nextclade files based on PR feedback Context: https://github.com/nextstrain/nextclade_data/pull/220 --- nextclade/defaults/nextclade-dataset/CHANGELOG.md | 2 +- nextclade/defaults/nextclade-dataset/README.md | 4 ++-- nextclade/defaults/nextclade-dataset/pathogen.json | 7 +++---- 3 files changed, 6 insertions(+), 7 deletions(-) diff --git a/nextclade/defaults/nextclade-dataset/CHANGELOG.md b/nextclade/defaults/nextclade-dataset/CHANGELOG.md index 3b67234..eb62595 100644 --- a/nextclade/defaults/nextclade-dataset/CHANGELOG.md +++ b/nextclade/defaults/nextclade-dataset/CHANGELOG.md @@ -1,3 +1,3 @@ ## Unreleased -Initial release of yellow fever virus dataset. +Initial release of yellow fever virus (prM-E region only) dataset. diff --git a/nextclade/defaults/nextclade-dataset/README.md b/nextclade/defaults/nextclade-dataset/README.md index 10bb176..1a22958 100644 --- a/nextclade/defaults/nextclade-dataset/README.md +++ b/nextclade/defaults/nextclade-dataset/README.md @@ -1,4 +1,4 @@ -# Yellow fever virus dataset +# Yellow fever virus (prM-E region only) dataset | Key | Value | | ----------------- | -----------------------------------------------------------------| @@ -36,7 +36,7 @@ following genotypes as described in the aforementioned two papers: (N.b., the reference sequence used in this data set is actually 672nt long, from bases 641-1312 of the genome reference. The 2 extra bases -make the reference an complete open reading frame.) +make the reference a complete open reading frame.) This dataset can be used to assign genotypes to any sequence that includes at least 500 bp of the prM-E region, including whole genome diff --git a/nextclade/defaults/nextclade-dataset/pathogen.json b/nextclade/defaults/nextclade-dataset/pathogen.json index 92213e6..b1d1212 100644 --- a/nextclade/defaults/nextclade-dataset/pathogen.json +++ b/nextclade/defaults/nextclade-dataset/pathogen.json @@ -15,8 +15,7 @@ }, "schemaVersion": "3.0.0", "alignmentParams": { - "minSeedCover": 0.01, - "minLength": 500 + "minSeedCover": 0.01 }, "qc": { "missingData": { @@ -36,8 +35,8 @@ }, "privateMutations": { "enabled": true, - "cutoff": 8, - "typical": 2, + "cutoff": 12, + "typical": 4, "weightLabeledSubstitutions": 1, "weightReversionSubstitutions": 1, "weightUnlabeledSubstitutions": 1 From 2e33696f513900bac145cdee9246de828a4a2166 Mon Sep 17 00:00:00 2001 From: John SJ Anderson Date: Thu, 17 Oct 2024 10:46:53 -0700 Subject: [PATCH 2/2] Add some Clade III example sequences Context: https://github.com/nextstrain/nextclade_data/pull/220 --- nextclade/defaults/sequences.fasta | 364 +++++++++++++++++++++++++++++ 1 file changed, 364 insertions(+) diff --git a/nextclade/defaults/sequences.fasta b/nextclade/defaults/sequences.fasta index e5d2170..1cb0f31 100644 --- a/nextclade/defaults/sequences.fasta +++ b/nextclade/defaults/sequences.fasta @@ -5839,3 +5839,367 @@ GTTTCTGGGACCTCCCACCCCAGAGTAAAAAGAACGGAGCCTCCGCTACCACCCTCCCAC GTGGTGGTAGAAAGACGGGGTCTAGAGGTTAGAGGAGACCCTCCAGGGAACAAATAGTGG GACCATATTGACGCCAGGGAAAGACCGGAGTGGTTCTCTGCTTTTCCTCCAGAGGTCTGT GAGCACAGTTTGCTCAAGAATAAGCAGACCTTTGGATGAAAAACACAAAAC +>JN620362 +AGTAAATCCTGTGTGCTAATTGAGGTGCATTGGTCTGCAAATCGAGTTGCTAGGCAATAA +ACACATTTGGATTAATTTTAATCGTTCTTTGAGCGATTAGCAGAGAACTGACCAGAGTAA +TGTCTGGTCGAAAAGCTCAGGGTAAAACCCTGGGCGTCAATATGGTAAGACGAGGAGTAC +GCTCCTTGTCAAACAAAATAAAACAAAAAACAAAACAGATTGGAAACAGACCTGGCCCTT +CAAGAGGTGTTCAAGGATTTATTTTCTTCTTTTTGTTCAACATCCTAACTGGGAAAAAAC +TAACTACCCACCTGAAAAGGCTCTGGAGAATGCTTGACCCCCGACAGGGACTTGCTGTTC +TAAGGAAAGTTAAGAGGGTGGTAGCCAGCTTGATGAGAGGGTTGTCATCTAGGAAGCGTC +GCTCTAATGAGATGACCATGATGCCACTTCTAATCTTGAGCATGGTGATCTTGGCTGGAG +GGGTGACACTCGTCCGGAAAAACCGATGGCTACTCTTGAATGTCACAGCTGAGGACTTGG +GAAAGACGTTCTCAGTGGGAACCGGGAACTGCACCACCAACATCCTTGAGGCAAAGTATT +GGTGTCCCGACTCAATGGAATACAATTGTCCCAATCTTAGCCCCAGAGAGGAGCCTGATG +ACATTGACTGTTGGTGTTATGGAGTGGAAAATGTCCGAGTAGCCTATGGAAGGTGTGATG +CAGTGGGAAGGTCAAAGAGATCTAGGAGAGCAATTGATCTGCCCACACATGAAAACCACG +GACTGAAAACTCGGCAGGAAAAATGGATGACAGGCAGAATGGGTGAGCGGCAACTCCAAA +AGATTGAGCGGTGGCTGGTGAGGAATCCGTTCTTCGCCATAACAGCCTTGGCCATTGCTT +ATTTGGTGGGCAATAATATGACACAACGTGTCGTCATAGCTCTGCTGGTTCTGGCAGTTG +GCCCAGCCTATTCTGCACATTGCATTGGGATAACTGACAGAGACTTCATTGAGGGTGTCC +ATGGGGGCACCTGGGTGTCAGCAACCCTGGAGCAGGATAAGTGCGTGACTGTCATGGCGC +CTGATAAACCATCACTGGACATCTCACTCCAAACAGTGGCAATAGATGGGCCAGCTGAAG +CGAGAAAGGTTTGCTACAGCGCGGTTCTCACCCATGTAAAAATCAATGATAAATGCCCGA +GCACTGGTGAGGCTCACCTTGCAGAGGAAAATGATGGTGACAACGCGTGCAAACGAACAT +ACTCAGATAGAGGCTGGGGCAATGGTTGTGGGCTCTTTGGAAAGGGGAGCATTGTGGCAT +GTGCTAAGTTCACGTGTGCCAAATCCATGAGCCTTTTTGAAGTGGACCAGACCAAAATCC +AGTATGTCATCAGAGCCCAGCTTCATGTAGGTGCCAAGCAGGAAAACTGGAACACAGACA +TAAAGACATTGAAATTTGATGCCTTATCTGGCTCTCAAGAGGCCGAATTTACTGGCTATG +GGAAAGCAACACTAGAGTGTCAGGTCCAGACTGCGGTGGACTTTGGAAACAGCTACATTG +CAGAGATGGAGAAAGACAGCTGGATTGTTGACCGCCAGTGGGCACAAGACTTGACACTAC +CATGGCAGAGTGGGAGTGGTGGAATATGGAGGGAAATGCATCATCTAGTTGAGTTTGAGC +CTCCTCATGCCGCCACAATCAGAGTGTTGGCCCTGGGAAACCAAGAGGGGTCTTTGAAAA +CAGCCCTTACAGGAGCCATGCGGGTCACTAAAGATGAAAATGACAACAACTTGTACAAGC +TGCATGGTGGTCATGTTTCTTGTAGGGTGAAACTCTCAGCTTTAACTCTCAAGGGAACAT +CCTACAAAATGTGCACAGATAAAATGTCATTTGTGAAAAATCCAACGGACACAGGTCATG +GCACTGTTGTCATGCAGGTGAAGGTCCCCAAAGGAGCTCCATGCAAGATCCCCGTGATTG +TGGCCGATGATCTAACAGCTGCAGTGAACAAGGGTATATTGGTCACTGTCAACCCCATAG +CATCCACAAATGACGATGAAGTTCTAATTGAAGTCAATCCCCCTTTTGGAGACAGCTACA +TTATTGTTGGGACTGGAGACTCAAGACTGACTTATCAGTGGCATAAAGAAGGAAGCTCAA +TAGGGAAATTGTTCACACAGACAATGAAGGGAGCTGAACGTCTTGCAGTGATGGGTGACG +CCGCCTGGGACTTTAGCTCTGCAGGTGGCTTCTTCACGTCAGTGGGAAAAGGAATTCATA +CTGTGTTTGGCTCAGCTTTCCAGGGGTTGTTTGGTGGCCTGAGCTGGATTACAAAGGTCA +TCATGGGAGCTGTTCTTATCTGGGTTGGAATTAACACACGTAACATGACTATGTCCATGT +CTATGATTCTGGTAGGAGTGATCATGATGTTTCTTTCCCTGGGTGTTGGGGCAGACCAAG +GATGTGCTGTCAACTTTGGGAAGCGAGAGCTTAAATGTGGAGATGGCATCTTTGTGTTCA +GAGACTCAGATGATTGGCTCACCAAGTACTCATATTATCCAGAAGACCCTGTTAAATTGG +CTTCTATCATTAAGGCCTCCTATGAAGAGGGCAAATGTGGACTGAATTCCGTGGACTCCC +TTGAGCATGAAATGTGGAGGAGTAGAGCTGATGAGATCAACGCCATATTTGAGGAAAATG +AAGTGGACATCTCGGTTGTTGTTCAAGACCCAAAGAACATCTACCAAAGAGGGACACATC +CTTTTTCTCGGATTCGTGATGGGTTGCAGTATGGATGGAAAACCTGGGGTAAAAATCTTA +TCTTCTCACCCGGAAGAAGAAATGGCAGTTTCATCATTGATGGGAAGTCAAGGAAGGAAT +GCCCTTTTTCAAACAGAGTGTGGAACTCTTTTCAAATTGAGGAGTTTGGCATGGGGGTTT +TTACGACACGGGTTTTTATGGATGCTGTCTTTGACTACTCAGTGGACTGTGATGGGGCCA +TACTAGGGGCAGCTGTGAATGGGAAGAAGAGCGCACACGGATCGCCCACCTTCTGGATGG +GAAGTCATGAGGTCAATGGAACATGGATGGTACACACACTTGAGACCCTTGATTACAAAG +AGTGTGAATGGCCTCTGACACACACCATAGGAACCTCAGTGGAAGAGAGTGACATGTTCA +TGCCCCGTTCCATTGGAGGCCCAGTGAGCTCCCATAACCACATTCCAGGTTACAAGGTCC +AAACGAACGGACCATGGATGCAAGTCCCTCTGGAAGTCAGAAGGGAGCCATGTCCGGGGA +CAAGTGTGGTGCTAGACACCGGCTGTGATGGACGTGGCAAATCAACCAGATCAACTACTG +ACAGTGGGAAAATAATTCCAGAATGGTGCTGTAGATCTTGCACCATGCCCCCAGTCAGCT +TTCACGGCAGTGATGGCTGCTGGTACCCCATGGAAATTAGACCCATGAAGACCCACGAGA +GCCATCTGGTGAGATCATGGGTTGCTGCAGGAGAAGTGCATGCGGTGCCTTTCGGTTTGG +TGAGCATGATGATTGCCATGGAGGTTGTCTTACGCAAAAGACAAGGACCAAAGCAAATGC +TGGTGGGAGGAATCATTTTACTTGGAGCAATGCTAGTAGGACAAGTCACGACATTGGATC +TAGTGAAACTTATTGTGGCAGTGGGCTTGCATTTTCACGAGATCAACAATGGAGGAGACG +CTATGTACATGGCTTTGATTGCGAGCTTTTCTATTCGCCCGGGCCTGCTCATAGGTTTTG +GACTGCGCACACTCTGGAGTCCTCGCGAACGTCTCGTGATGGCATTCGGAGCAGCCATGG +TTGAAGTGGCATTGGGCGGGATGATGGGTGGACTGTGGCAGTATTTGAACGCCGTCTCAC +TATGCGTCCTCACCATCAATGCAATTTCTTCAAGAAAGGCCTCAAATGCGGTCCTCCCTC +TTATGGCGCTCTTGACTCCTGTGACAATGCATGAAGTAAGGATGGCAACAATGTTGTTCT +GCACAGTGGTCATAGTGGGTGTGCTCTACCAGAATTCAAAAGACACGTCCATGCAAAAAG +CCATTCCCATTGTGGCTCTGACACTGACTTCATATATGGGTCTAACCCAACCTTTTCTTG +GACTGTGTGCCTACATGTCCACACAAGTGTTTGGTAGAAGAAGCATCCCCGTAAATGAAG +CTCTTGCAGCAGCTGGCCTGGTAGGAGTGTTGGCAGGCTTGGCCTTCCAAGACATGGAAA +ATTTTTTAGGGCCGATTGCTGTGGGCGGGATACTCATGATGCTAGTCAGTGTGGCAGGGA +AAGTTGATGGACTGGAACTCAAAAAGCTCGGTGAGGTTTCCTGGGAGGAGGAAGCTGAGA +TAAGTGGAAGCTCCAGCCGCTACGATGTGGCACTAAGTGAACAGGGAGAATTCAAGCTTC +TCTCAGAGGATAAAGTGCCCTGGGACCAGATTGTCATGACCTCCTTGGCTCTTGTTGGGG +CAGCAATACATCCATTTGCCCTATTGCTGGTTCTAGGAGGTTGGGTTTTACATATCAAAG +GAGCTAGAAGGAGCGGGGATGTCCTTTGGGACATTCCCACACCAAAAGTCATAGAGGAAT +GTGAGCACCTGGAAGATGGAATTTACGGCATATTCCAATCAACCTTTCTTGGAGCATCCC +AGAGAGGAGTTGGAGTGGCCCAAGGGGGTGTCTTCCACACGATGTGGCACGTCACCAGAG +GAGCGTTTCTCTTGAGGAACGGGAAGAAATTAGTGCCATCCTGGGCCTCTGTGAAGGAGG +ATTTGGTGGCCTATGGTGGATCTTGGAAGCTGGATGGAAAGTGGGATGGTGAGGAAGAGG +TACAACTCATAGCTGCTGTGCCAGGAAAAGCCGTTGTAAATGTGCAGACCAAGCCAAGTT +TGTTCAAAGTTAGAAATGGAGGTGAGATTGGGGCAGTAGCCCTGGACTATCCTAGCGGGA +CCTCTGGTTCACCCATTGTGAATCGCAGTGGTGAAGTGGTGGGGCTCTATGGCAACGGGA +TCTTGGTTGGTGATAATTCCTTTGTGTCCGCCATCTCACAAACTGAGGTGAAAGAGGAAT +CTAAAGAGGAACTGCAGGAAATACCAACAATGTTGAAAAAAGGAATGACAACCATCCTTG +ATTTCCACCCCGGCGCGGGAAAGACCCGCAGGTTCCTGCCCCAAATACTGGCAGAATGCG +CCAGGAGGCGCCTACGAACACTAGTGCTGGCGCCTACCCGGGTTGTCCTGTCAGAAATGA +AGGAAGCTTTTCATGGACTTGATGTGAAGTTTCACACGCAGGCTTTTTCGGCCCATGGGA +GTGGGAAAGAAGTCATTGATGCAATGTGCCATGCGACCCTCACGTACAGGATGCTGGAGC +CAACAAGAGCTGTCAACTGGGAGGTGATTATCATGGATGAGGCTCACTTCTTGGATCCTG +CCAGCATTGCAGCAAGAGGCTGGGCAGCCCATAGGGCAAGAGCAAACGAGAGTGCCACGA +TACTCATGACAGCCACTCCACCAGGCACAAGTGATGAATTTCCCCATTCCAATGGTGAAA +TTGAAGATGTCCAGACTGATATTCCAAGTGAACCATGGACTTCAGGCCATGAGTGGATTC +TAGCCGACAAACGACCAACGGCATGGTTTCTCCCATCGATCAGAGCAGCAAATGTCATGG +CTGCCTCTTTGCGGAAGGCCGGGAAGAGTGTGGTGGTGTTGAACAGGAAGACCTTTGAAA +AGGAATACCCCACCATTAAACAAAAGAGACCGGATTTCATCCTAGCCACAGACATTGCCG +AGATGGGAGCAAACTTGTGCGTTGAAAGAGTGCTGGACTGTAGGACTGCATACAAACCTG +TCCTGGTGGATGAAGGGAGGAAAGTGGCCATCAAAGGGCCATTACGGATTTCTGCATCAT +CGGCTGCTCAGAGAAGAGGGCGCATTGGACGAAACCCAAACAGAGATGGAGATTCCTACT +ACTATTCAGAACCCACTAGTGAGGATAATGCCCATCATGTGTGTTGGCTGGAAGCTTCCA +TGCTTCTTGACAACATGGAAGTTAGAGGGGGAATGGTTGCCCCGCTCTATGGAATTGAAG +GGACAAAGACTCCTGTTTCCCCTGGGGAAATGAGGCTGAGAGATGATCAAAGGAGAGTTT +TCAGGGAGTTGGTGCGTGGATGTGACCTGCCGGTCTGGCTATCCTGGCAGGTAGCAAAGG +CCGGTTTAAAAACCAATGACCGCAAGTGGTGCTTTGAAGGACCCGAGGAACACGAGATAC +TCAATGACAACGGTGAAACTGTGAAGTGTAGGTCACCTGGTGGAGCGAAAAAGGCACTGA +GACCTAGATGGTGTGATGAAAGAGTGTCCTCAGATCAGAGCGCTTTGGCTGACTTCATTA +AGTTTGCCGAAGGTAGAAGAGGAGCTGCTGAGATGCTTGTGGTTCTCACGGAACTGCCTG +ACTTCTTGATGCAAAAAGGGGGGGAGGCTATGGACACCATTAGTGTGTTTCTCCATTCTG +AGGAGGGATCAAGAGCTTATAGAAATGCTCTATCAATGATGCCTGAAGCCATGACCATCG +TGATGCTTTTCATACTGGCTGGTCTCTTGACCTCAGGAATGGTGATCTTCTTCATGTCGC +CCAAAGGCATGAGCAGAATGTCTATGGCAATGGGGACTATGGCTGGCAGCGGGTACCTCA +TGTTCCTAGGGGGAGTGAAACCAACACACATCTCATATGTCATGTTGATCTTTTTTGTCC +TCATGGTCGTCATAATTCCAGAGCCAGGACAACAGAGGTCCATCCAGGACAACCAAGTGG +CCTATCTCATCATTGGAATACTCACATTGCTGTCCATTGTGGCGGCTAATGAGTTAGGAA +TGCTGGAAAAGACCAAGGAAGACTTTTTTGGAAGAAGAAATGCTGCCACACCTGGGGGGA +CGATTCCATGGAGTTGGCCCGATTTGGATCTGAAACCTGGGGCTGCCTGGACCGTTTATG +TGGGAATTGTGACAATGCTGTCACCAATGCTTCATCACTGGATTAAAGTGGAGTATGGCA +ACCTCTCGTTGTCAGGGATAGCCCAGTCGGCCTCGGTCCTTTCATTTATGGATAAAGGAA +TCCCTTTCATGAAGATGAACATATCTGTGGTCATACTCCTAGTCAGTGGCTGGAACTCAA +TAACAGTGATCCCCCTGTTATGTGGTGTGGGTGGAGCCATGCTGCATTGGACACTGATTC +TTCCTGGAATCAAAGCCCAGCAGTCAAAACTAGCACAAAAAAGAGTTTTTCATGGAGTGG +CAAAAAATCCAGTCGTTGATGGCAATCCAACTGCTGACATTGAAGAAGCACCTGAAATGC +CTGCCCTGTACGAGAAGAAATTGGCACTGTATCTTCTCCTCGCCTTGAGCCTGATGTCGG +TAGCCATGTGCAGAACTCCTTTTTCCCTAGCCGAAGGCATAGTGCTGTCATCTGCTGCCC +TTGGGCCCCTAATAGAGGGAAACACAAGTCTGCTATGGAATGGTCCTATGGCCGTTTCCA +TGACTGGGGTTATGCGCGGCAATTACTACGCTTTTGTGGGTGTGATGTACAACCTCTGGA +AGATGAAAACAGGGCGTAGAGGGAGAGCAAGTGGCAAGACACTAGGTGAGGTCTGGAAGA +GGGAGCTCAACCTGCTAGACAAACAGCAATTTGAGCTGTACAAGAGAACAGATATCACCG +AGGTGGATCGCGACATGGCTAGGCGACATCTAGCAGAGGGGAAGGTGGACACTGGAGTGG +CCGTGTCGAGAGGGACAGCGAAGCTAAGGTGGTTCCACGAGCGTGGCTATGTAAAACTTG +AAGGAAGGGTCATGGATTTGGGATGTGGACGTGGAGGTTGGTGCTACTATGCAGCAGCTC +AGAAAGAGGTCAGTGGTGTGAAAGGTTACACCCTGGGCAGGGATGGCCATGAGAAGCCCA +TGAACGTGCAAAGCTTAGGATGGAACATTGTGACCTTCAAGGACAAGACTGACATCCACA +GGCTAGAGCCGGCCAAGTGTGAAACCCTCCTTTGTGACATTGGAGAATCCTCACCTTCCT +CGGTTACCGAGGGTGAGAGGACCTTGAGAGTTCTTGAAACAATTGAAAAGTGGCTGGCCT +GTGGAGTGGACAACTTTTGTGTCAAGGTTCTAGCACCATACATGCCTGATGTGATAGAGA +AACTGGAACTTCTCCAAAGAAGATTTGGTGGAACTGTTATCAGGAATCCCCTTTCCAGAA +ACTCAACCCATGAGATGTATTATGTGTCAGGAGCAAGAAGTAATATCACTTTCACAGTCA +ACCAAACGTCACGTCTGCTGATGAGGAGGATGAGACGCCCAACAGGCAAGGTCACCCTTG +AGCCCGATGTCATTCTTCCCATAGGCACACGCAGCGTAGAAACTGACAAGGGACCATTGG +ACAGGGATGCCATTGAAGAGAGGGTTGAGAGAATCAAGACCGAGTATGCCACTACATGGT +TCTATGACAATGACAACCCATACCGGACCTGGCATTACTGTGGCTCATATATCACTAAAA +CATCAGGCAGTGCAGCCAGCATGATAAATGGAGTCATCAAAATCTTGACTTTTCCATGGG +ATAGGATAGAAGAGGTCACCAGGATGGCAATGACTGACACTACGCCTTTTGGCCAACAAA +GAGTTTTCAAGGAAAAGGTGGACACGAGAGCCAAAGATCCTCCTGCTGGAACTAGGAAAA +TCATGAAGGTGGTAAACCGTTGGCTGTTCCGTCATCTGGCCCGGGAGAAGAACCCTAGGC +TGTGCACAAAGGAGGAATTCATAGCCAAGGTGCGCAGTCATGCTGCGGTAGGAGCCTTTC +TAGAAGAGCAGGAGCAATGGAAGACAGCCAATGAAGCAGTTCAAGACCCTAAGTTTTGGG +AGATGGTTGATGCTGAGCGCAAACTACATCAACAGGGGCGTTGCCAGTCTTGTGTCTATA +ACATGATGGGAAAGAGAGAGAAAAAACTGTCTGAGTTTGGGAAAGCAAAAGGAAGTCGTG +CGATCTGGTACATGTGGCTGGGGGCGCGTTTCCTTGAGTTCGAGGCTCTTGGGTTCTTGA +ATGAAGATCACTGGGCCTCCAGAGAGAACTCAGGAGGAGGTGTTGAAGGCATAGGACTCC +AATATCTGGGCTATGTAATCAAGGACCTATCCACCAAAGAAGGGGGAGGATTCTATGCAG +ATGACACGGCAGGATGGGACACACGCATCACGGAAGCTGACCTAGATGATGAACAGGAGA +TCATGAGCTACATGAATGCTGAGCAGAGGAAACTGGCCTGGGCAGTGATGGAAATGACAT +ACAAGAACAAAGTGGTCAAGGTCCTTCGACCAGCACCAGGTGGCAAGGCTTTCATGGACA +TCATCAGTAGGAGAGATCAAAGGGGGTCAGGGCAAGTGGTGACATACGCTCTCAACACTA +TCACCAATTTGAAAGTCCAGCTCATAAGGATGGCTGAAGCTGAGATGGTAATCAACCATC +AGCACGTGAATGAATGTGACGAGGGCGTTTTGGCACGGCTGGACGCATGGCTTGCTGAGA +ATGGATGTGACAGACTTGCCCGGATGGCTGTGAGTGGAGATGATTGTGTCGTGAGGCCTG +TGGATGACAGATTTGGCCTGGCTCTTTCCCATCTCAATGCCATGTCAAAAGTCAGGAAGG +ACATTTCAGAATGGCAGCCCTCCAAGGGGTGGACGGATTGGGAAAATGTTCCTTTCTGCT +CCCACCATTTCCATGAACTTGTGTTGAAAGATGGAAGGAAAGTTGTGGTGCCCTGTAGAG +ACCAAGATGAGTTGATAGGAAGAGGGAGAGTGTCTCCAGGAAATGGCTGGATGATCAAAG +AAACAGCCTGCCTCAGCAAGGCTTATGCAAACATGTGGTCACTGATGTATTTTCACAAGA +GGGACATGAGGCTGCTTTCATTTGCTGTCTCATCGGCCGTCCCAACGGCATGGGTACCCA +GTGGAAGAACAACATGGTCTGTTCATGGAAAAGGAGAATGGATGACCACCGAAGACATGT +TGGACGTCTGGAACAGAGTTTGGGTTTTAAACAACCCACACATGAAGGACAAGACTACCG +TGAAGGAGTGGAGAGATGTTCCTTACCTCACAAAAAGGCAAGACAAGCTCTGTGGGTCCC +TAATAGGAATGACAAACAGGGCCACATGGGCCTCACACATCCACCTGGTGATCCACCGAA +TTCGGACTTTAATCGGCCAAGAAAAATACACAGATTATCTCACTGTGATGGACAGGTACT +CGGTTGATGCTGACCTCCAACCAGGAGAGCTCATCTGAGACCAGCCATCGTAAATCAACC +GGGATAAAAACTACGGGTGGAGAACCGGACTCCCCACTTCCAAAGCATCAACAAGAAACC +GGTATAAAAACTACGGATGGAGAACCGGACTCCACACTTAAGAGGCCATTGACGTCAGCC +CAGGACCCTAGAATTAGGAGTCTTGCCACCGCTAAGCTGTGAGGCGGTGCGGGCTGGGAC +AGCCGTTTTCCAGATCACGACAGATCTGGTTTCTGGGACTTCCCAACCCAGAGTAAAATG +ATGGAGCCTCCGCCACCACCCACCCACGGGGTGGTGGAAAGATGGGGTCCAGAGGTTAGA +GGAGACCCTCCAGGGAAATTAGTGGGACCATATTGACGCCAGGGAAAGACCGGAGTGGTT +CTCTGCTTTTCCTCCAGGGGTCTGCGAGCACAGTTTGCTCTAGAAGAAGCAGACCTTTGG +ACGAAAAACACAAAACCACT +>MW960207 +ATTAAAATTAATCCTGTGTGCTAATTGAGGTGCATTGGTCTGCAAATCGAGTTGCTAGGC +AATAAACACATTTGGATTAATTTTAATCGTTCTTTGAGCGATTAGCAGAGAACTGACCAG +AACAATGTCTGGTCGAAAAGCTCAGGGTAAAACCCTGGGCGTCAATATGGTAAGACGAGG +AGTACGCTCCTTGTCAAACAAAATAAAACAAAAAACAAAACAGATTGGAAACAGACCTGG +CCCTTCAAGAGGTGTTCAAGGATTTATTTTCTTCTTTTTGTTCAACATCCTAACTGGGAA +AAAACTAACTACCCACCTGAAAAGGTTCTGGAGAATGCTTGACCCCCGACAGGGACTTGC +TGTTCTAAGGAAAGTCAAGAGGGTGGTAGCCAGCTTGATGAGAGGGTTGTCATCTAGGAA +GCGCCGCTCTAATGAGATGACCATGATGCCACTTCTAATCTTGAGCATGGTGATTTTGGC +TGGAGGGGTGACACTCGTCCGGAAAAATCGATGGCTACTCTTGAATGTCACAGCTGAGGA +CTTGGGAAAGACGTTCTCAGTGGGAACCGGGAACTGCACCACCAACATCCTTGAGGCAAA +GTATTGGTGTCCCGACTCAATGGAATACAACTGTCCCAATCTTAGCCCCAGAGAGGAGCC +TGATGACATTGACTGTTGGTGTTATGGAGTGGAAAATGTCAGAGTAGCCTATGGAAGGTG +TGATGCAGTGGGGAGGTCAAAGAGATCTAGGAGAGCAATTGATCTGCCCACACATGAAAA +CCACGGACTGAAAACCCGGCAGGAGAAATGGATGACAGGCAGAATGGGTGAGCGGCAACT +CCAAAAGATTGAGCGGTGGCTGGTGAGAAATCCGTTCTTCGCCATAACAGCCTTGGCCAT +TGCTTATCTGGTGGGCAACAATATGACACAACGTGTCGTCATAGCTCTGCTAGTTTTGGC +AGTTGGCCCAGCCTATTCTGCACATTGCATTGGGATAACTGACAGAGATTTCATTGAGGG +TGTCCATGGGGGCACATGGGTGTCAGCAACCCTGGAGCAGGACAAGTGCGTGACTGTCAT +GGCGCCTGATAAACCATCACTAGACATCTCGCTCCAAACAGTGGCAATAGATGGTCCTGC +TGAAGCGAGAAAGGTTTGCTACAGCGCGGTTCTCACCCATGTAAAAATCAATGATAAGTG +CCCGAGCACTGGTGAGGCTCACCTCGCAGAGGAAAAGGATGGTGACAACGCGTGCAAACG +AACATACTCAGATAGAGGCTGGGGTAATGGTTGTGGGCTCTTTGGAAAGGGGAGCATTGT +GGCATGTGCTAAGTTCACGTGTGCCAAATCCATGAGCCTTTTTGAAGTGGACCAGACCAA +AATCCAGTACGTTATCAGGGCCCAGCTTCATGTGGGTGCCAAGCAGGAGAACTGGAACAC +AGACATAAAGACACTGAAATTTGATGCCTTATCTGGCTCTCAAGAGGCCGAATTTACTGG +CTATGGGAAAGCAACACTAGAGTGTCAGGTCCAGACTGCGGTGGACTTTGGGAACAGCTA +CATTGCAGAGATGGAGAAAGACAGCTGGATTGTTGACCGCCAGTGGGCACAAGACTTGAC +ACTACCATGGCAGAGTGGGAGTGGTGGAATATGGAGGGAAATGCATCATCTAGTTGAGTT +TGAGCCTCCTCATGCCGCTACAATCAGAGTGTTAGCCCTGGGAAACCAAGAGGGGTCTTT +GAAAACAGCCCTTACAGGAGCCATGCGGGTCACTAAAGATGAAAATGACAACAACTTGTA +CAAGCTGCATGGTGGACATGTCTCTTGTAGGGTGAAACTCTCAGCCTTAACTCTCAAGGG +AACATCCTACAAAATGTGCACAGATAAAATGTCATTTGTGAAAAACCCAACGGACACAGG +TCATGGCACTGTTGTCATGCAGGTGAAGGTCCCCAAAGGAGCTCCATGCAAGATCCCCGT +GATTGTGGCCGATGATCTAACAGCTGCAGTGAACAAGGGTATACTGGTCACTGTCAACCC +CATAGCATCCACAAATGACGATGAAGTCCTAATTGAAGTTAATCCCCCTTTTGGAGACAG +CTACATCATTGTTGGGACTGGAGACTCAAGACTGACTTATCAGTGGCATAAAGAAGGAAG +CTCAATAGGGAAACTGTTCACACAGACAATGAAGGGAGCTGAACGTCTTGCAGTGATGGG +TGACGCCGCCTGGGACTTTAGCTCTGCAGGTGGTTTCTTCACGTCAGTAGGGAAAGGAAT +TCATACTGTGTTTGGCTCAGCTTTCCAAGGGTTGTTTGGTGGCCTGAGCTGGATTACAAA +GGTCATCATGGGAGCTGTTCTTATCTGGGTTGGAATTAACACACGTAACATGACCATGTC +CATGTCTATGATTCTGGTAGGAGTGATCATGATGTTTCTTTCCCTGGGTGTTGGGGCAGA +CCAAGGATGTGCTGTCAACTTTGGGAAGCGAGAGCTTAAATGTGGAGATGGCATCTTTGT +GTTTAGAGACTCAGATGACTGGCTCACCAAGTATTCATATTATCCAGAAGACCCTGTTAA +ATTGGCTTCTATCATCAAGGCCTCCTATGAAGAGGGCAAATGTGGACTGAACTCTGTGGA +CTCCCTTGAGCATGAAATGTGGAGGAGTAGAGCTGATGAGATCAACGCCATATTTGAGGA +AAATGAAGTGGACATCTCGGTTGTTGTTCAAGACCCAAAGAACATCTACCAAAGAGGGAC +ACATCCTTTTTCTCGGATTCGTGATGGGTTGCAGTATGGATGGAAAACCTGGGGTAAAAA +TCTCATCTTCTCACCCGGAAGAAGAAATGGCAGTTTCATCATTGATGGGAAGTCAAGGAA +GGAATGCCCTTTTTCAAACAGAGTGTGGAACTCTTTTCAAATTGAGGAGTTTGGCATGGG +GGTTTTCACAACACGGGTTTTTATGGATGCTGTCTTTGACTACTCAGTGGACTGTGATGG +GGCCATACTAGGGGCAGCTGTGAATGGGAAGAAGAGCGCACACGGATCGCCCACCTTCTG +GATGGGAAGCCATGAGGTCAATGGAACATGGATGGTACACACACTTGAGACCCTTGACTA +CAAAGAGTGTGAATGGCCTCTGACACACACCATAGGAACCTCAGTGGAAGAGAGTGACAT +GTTCATGCCCCGTTCCATTGGAGGCCCAGTGAGCTCCCATAACCACATTCCAGGTTACAA +GGTCCAGACGAATGGACCATGGATGCAAGTCCCTTTGGAAGTTAGAAGGGAGCCATGTCC +GGGGACAAGTGTGGTGCTGGATACCGGCTGTGATGGACGTGGCAAATCAACCAGATCAAC +TACTGACAGTGGGAAAATAATTCCAGAATGGTGCTGCAGATCTTGCACCATGCCCCCAGT +TAGCTTTCACGGCAGTGATGGCTGCTGGTATCCCATGGAAATTAGACCCATGAAAACCCA +CGAGAGCCATCTGGTGAGATCATGGGTTACCGCAGGAGAAGTGCACGCGGTGCCTTTCGG +ATTGGTGAGCATGATGATTGCCATGGAGGTTGTCCTACGCAAAAGACAAGGACCAAAGCA +AATGCTGGTGGGAGGAATCATTTTACTTGGAGCAATGCTAGTGGGACAAGTCACGATGCT +GGATCTAGTGAAACTCATTGTGGCAGTGGGCTTGCATTTTCATGAGATCAACAATGGAGG +AGACGCCATGTACATGGCTTTGATTGCGAGCTTTTCTATTCGCCCGGGCCTGCTCGTAGG +TTTTGGACTGCGCACACTCTGGAGTCCTCGCGAGCGTCTCGTGATGGCATTCGGGGCAGC +CATGGTTGAAGTGGCCTTGGGCGGGATGATGGGTGGACTGTGGCAGTACCTGAACGCCGT +CTCACTATGCGTCCTCACCATCAATGCAATTTCTTCAAGAAAGGCCTCAAATGCGGTCCT +CCCCTTGATGGCACTCTTGACCCCTGTAACAATGCATGAAGTAAGGATGGCAACAATGCT +GTTCTGCACAGTGGTCATAGTGGGGGTGCTCCACCAGAATTCAAAAGACACGTCCATGCG +AAAAGCCATTCCCATTGTGGCTCTGACACTGACCTCATATATGGGTCTAACTCAACCTTT +TCTTGGACTGTGTGCCTACATGTCCACACAAGTGTTTGGTAGAAGAAGCATCCCCGTAAA +TGAAGCTCTTGCAGCAGCTGGCCTGGTAGGAGTGTTGGCAGGCCTAGCTTTTCAAGACAT +GGAAAATTTTTTAGGGCCGATTGCTGTGGGCGGGATACTCATGATGCTGGTCAGTGTGGC +AGGGAAAGTTGATGGACTGGAACTTAAGAAGCTCGGTGAGGTTTCCTGGGAGGAGGAAGC +TGAGATAAGTGGAAGCTCCAGCCGCTACGATGTGGCACTAAGTGAACAGGGAGAATTTAA +GCTTCTCTCAGAGGATAAAGTGCCCTGGGACCAGATTGTCATGACTTCCTTGGCTCTCGT +TGGGGCAGCGATACATCCATTTGCCCTATTGTTGGTTCTAGGAGGTTGGGTTTTACATAT +CAAGGGAGCTAGGAGGAGCGGGGATGTCCTTTGGGACATTCCCACACCAAAAGTTATAGA +GGAATGTGAGCATCTGGAAGATGGAATCTACGGCATATTCCAGTCAACCTTTCTTGGAGC +ATCCCAGAGAGGAGTTGGAGTGGCCCAAGGGGGTGTCTTCCACACGATGTGGCACGTCAC +CAGAGGAGCGTTTCTCTTGAGGAACGGGAAGAAATTAGTACCATCCTGGGCCTCTGTGAA +GGAGGATTTGGTGGCCTATGGTGGATCTTGGAAGCTGGATGGAAAGTGGGATGGTGAGGA +AGAGGTACAACTCATAGCTGCTGTGCCAGGAAAAGCTGTTGTCAATGTGCAGACCAAGCC +AAGTTTGTTCAAAGTTAGAAATGGAGGTGAGATTGGGGCAGTTGCCTTGGACTATCCTAG +CGGGACCTCTGGTTCACCCATTGTGAATCGCAGTGGTGAGGTGGTGGGACTCTATGGCAA +CGGGATCCTGGTTGGTGACAATTCTTTTGTGTCTGCCATCTCACAAACTGAAGTGAAAGA +GGAATCCAAAGAGGAATTGCAGGAAATACCAACAATGTTGAAAAAAGGAATGACAACTAT +CCTTGATTTCCACCCCGGCGCGGGGAAGACCCGTAGGTTCTTGCCCCAAATACTGGCAGA +ATGCGCCAGGAGGCGCCTACGAACATTAGTGCTGGCGCCTACCCGGGTTGTCCTGTCAGA +AATGAAGGAAGCTTTCCATGGACTTGATGTGAAGTTTCACACGCAGGCTTTTTCAGCCCA +TGGGAGTGGGAAAGAAGTCATTGATGCAATGTGCCACGCAACCCTCACGTACAGGATGCT +GGAGCCAACAAGAGCTGTCAACTGGGAGGTGATTATCATGGATGAGGCTCACTTCTTGGA +TCCTGCCAGCATCGCAGCAAGGGGCTGGGCAGCCCATAGGGCAAGAGCAAATGAGAGTGC +CACAATACTCATGACAGCCACTCCACCAGGCACAAGTGATGAATTTCCCCATTCCAATGG +TGAGATTGAAGATGTCCAGACTGACATTCCAAGTGAACCATGGACTTCAGGCCATGAGTG +GATTCTAGCCGACAAACGACCAACGGCATGGTTTCTCCCATCGATCAGAGCAGCAAATGT +CATGGCGGCCTCTTTGCGGAAGGCCGGGAGGAGTGTGGTGGTGTTGAACAGGAAGACCTT +TGAAAAGGAATACCCCACCATTAAACAAAAGAGGCCGGATTTCATCCTAGCCACAGACAT +TGCCGAGATGGGAGCAAACTTGTGCGTTGAAAGAGTGCTGGACTGTAGGACTGCATACAA +ACCTGTTCTGGTGGATGAAGGGAGGAAAGTGGCCATCAAAGGGCCATTACGGATTTCTGC +ATCATCGGCTGCTCAGAGAAGAGGGCGCATTGGAAGAAACCCAAACAGAGATGGAGATTC +CTACTACTATTCAGAACCCACTAGTGAGGATAATGCCCATCACGTGTGCTGGCTGGAGGC +TTCCATGCTTCTTGACAACATGGAAGTTAGAGGAGGAATGGTTGCCCCGCTCTATGGAAT +TGAAGGGACAAAGACTCCTGTCTCCCCTGGGGAAATGAGGCTGAGAGATGATCAAAGGAG +AGTTTTCAGGGAGTTGGTGCGTGGATGTGACCTGCCGGTCTGGCTATCCTGGCAGGTAGC +AAAGGCCGGTTTAAAAACCAATGACCGCAAGTGGTGCTTTGAAGGACCCGAGGAACACGA +GATACTCAATGACAACGGTGAAACTGTGAAGTGCAGGTCACCCGGCGGAGCGAAAAAGGC +ACTGAGACCTAGATGGTGTGATGAAAGAGTGTCCTCAGATCAGAGCGCTTTGGCTGACTT +CATCAAGTTCGCCGAGGGTAGAAGAGGAGCTGCTGAGATGCTTGTGGTTCTCACGGAACT +GCCTGACTTCTTGATGAAAAAAGGGGGGGAGGCCATGGACACCATAAGTGTGTTTCTCCA +TTCTGAGGAGGGATCAAGAGCTTATAGAAATGCTTTATCAATGATGCCTGAAGCCATGAC +CATCGTGATGCTTTTCATACTGGCTGGCCTCCTGACCTCAGGAATGGTGATCTTCTTCAT +GTCGCCCAAAGGCATGAGCAGAATGTCTATGGCAATGGGGACCATGGCTGGCAGCGGGTA +CCTCATGTTCCTAGGGGGAGTGAAACCAACACACATCTCATATGTCATGTTGATCTTTTT +CGTCCTCATGGTCGTCATAATTCCAGAGCCAGGACAACAGAGGTCCATCCAGGACAACCA +AGTGGCCTATCTTATCATTGGAATACTCACATTGCTGTCCATTGTGGCAGCTAATGAGTT +GGGAATGCTGGAAAAGACCAAGGAAGACTTTTTTGGAAGAAGAAATACTGCCACACCTGG +TGGGACGATTCCATGGAGTTGGCCCGATTTAGATCTGAAACCTGGGGCTGCTTGGACCGT +TTATGTGGGAATTGTGACAATGCTGTCACCAATGCTTCATCACTGGATCAAAGTGGAGTA +TGGCAACCTTTCGTTGTCAGGGATAGCCCAGTCGGCCTCGGTCCTTTCATTTATGGATAA +AGGAATCCCTTTCATGAAGATGAACATATCTGTGGTCATACTCCTAGTCAGTGGCTGGAA +CTCAATAACAGTGATCCCCCTGTTATGTGGTGTGGGTGGAGCCATGCTGCATTGGACACT +GATTCTTCCTGGAATCAAAGCCCAGCAGTCAAAACTAGCACAAAAAAGAGTTTTTCATGG +AGTGGCAAAAAATCCAGTCGTTGATGGCAACCCAACCGCTGACATCGAAGAAGCACCTGA +AATGCCAGCCCTGTACGAGAAGAAATTGGCACTGTATCTTCTCCTCGCCTTGAGCCTGAT +GTCAGTAGCCATGTGCAGAACTCCTTTTTCCCTAGCCGAAGGCATAGTGTTGTCATCTGC +TGCCCTTGGGCCCCTAATAGAGGGAAACACAAGTTTGCTATGGAATGGTCCTATGGCCGT +TTCCATGACTGGGGTCATGCGCGGCAATTACTACGCTTTTGTGGGTGTGATGTACAACCT +CTGGAAGATGGAAACAGGGCGTAGAGGGAGAGCAAGTGGCAAGACACTAGGTGAGGTTTG +GAAGAGGGAGCTCAACTTGCTAGACAAACAGCAATTTGAGCTGTACAAGAGAACAGATAT +CACCGAGGTGGATCGCGACATGGCTAGGCGACATCTAGCAGAGGGGAAGGTGGACACTGG +AGTGGCCGTGTCGAGAGGGACAGCGAAGCTAAGGTGGTTCCACGAGCGTGGCTATGTAAA +ACTGGAAGGAAGGGTCATGGATTTGGGATGTGGACGTGGAGGTTGGTGCTATTATGCAGC +AGCTCAGAAAGAGGTCAGTGGTGTGAAGGGTTACACCCTGGGCAGGGATGGCCATGAAAA +GCCCATGAACGTGCAAAGCTTAGGATGGAATATTGTGACCTTCAAGGACAAGACTGACAT +CCACAGGCTAGAGCCGGCCAAGTGTGAAACCCTCCTTTGTGACATTGGAGAATCCTCACC +CTCCTCTGCGACCGAGGGTGAGAGGACCTTGAGAGTTCTTGAAACAATTGAAAAGTGGCT +GGCCTGTGGAGTGGACAACTTTTGTGTCAAGGTTCTAGCACCATACATGCCTGATGTGAT +AGAGAAACTGGAACTTCTCCAAAGAAGATTTGGCGGAACTGTTATCAGGAATCCCCTTTC +CAGAAACTCAACCCATGAGATGTATTATGTGTCAGGGGCAAGAAGTAACATCACCTTTAC +AGTCAACCAGACATCACGTCTGTTGATGAGGAGGATGAGACGACCAACAGGCAAAGTCAC +CCTTGAACCCGATGTCATTCTTCCCATAGGCACACGCAGCGTAGAAACTGACAAGGGACC +TTTGGACAGGGATGCCATTGAAGAGAGGGTTGAGAGAATCAAGACTGAGTATGCCACTAC +ATGGTTCTATGACAATGACAACCCGTATCGGACCTGGCATTACTGTGGCTCATATATCAC +TAAGACATCAGGCAGTGCAGCCAGCATGATAAATGGAGTCATCAAAATCTTGACCTTCCC +ATGGGATAGGATAGAAGAGGTCACCAGAATGGCAATGACTGACACCACGCCTTTTGGCCA +ACAAAGAGTCTTCAAGGAAAAGGTGGACACAAGAGCCAAAGATCCCCCTGCTGGAACCAG +GAAAATCATGAAGGTGGTAAATCGCTGGCTGTTCCGTCATCTGGCCCGGGAGAAGAACCC +CAGGCTGTGCACAAAGGAGGAATTCATAGCCAAGGTGCGCAGTCATGCTGCGGTTGGAGC +CTTTCTAGAGGAGCAGGAGCAATGGAAGACAGCCAATGAAGCTGTTCAAGACCCTAAGTT +TTGGGAGATGGTTGATGCTGAGCGCAAACTACACCAACAGGGGCGTTGCCAGTCTTGTGT +CTATAACATGATGGGAAAAAGAGAGAAAAAACTATCTGAGTTTGGGAAAGCAAAAGGAAG +TCGTGCGATCTGGTACATGTGGCTGGGGGCACGTTTCCTTGAGTTTGAGGCTCTTGGGTT +CTTGAATGAAGATCACTGGGCCTCCAGAGAGAACTCAGGAGGAGGTGTTGAAGGCATAGG +ACTCCAATATCTAGGCTATGTAATCAAGGACCTATCCACCAAAGAAGGGGGAGGATTCTA +TGCAGATGACACAGCAGGATGGGACACACGTATCACGGAAGCTGACCTAGATGATGAACA +GGAGATCATGAGCTACATGAATGCTGAGCAGAGGAAACTGGCCTGGGCAGTGATGGAAAT +GACATACAAGAACAAAGTGGTCAAGGTCCTTCGACCAGCACCAGGTGGCAAGGCTTTCAT +GGACATCATCAGTAGGAGAGATCAAAGGGGGTCAGGGCAAGTAGTGACATACGCTCTCAA +CACTATCACCAATTTGAAAGTCCAGCTCATAAGGATGGCTGAAGCTGAGATGGTAATCAA +CCATCAGCACGTGAATGAATGTGACGAGGGCGTTTTGGCACGGCTGGACGCATGGCTTGC +TGAGAATGGATGTGACAGACTTGCCCGGATGGCTGTGAGTGGAGATGATTGTGTCGTAAG +GCCTGTGGATGACAGATTCGGCTTGGCTCTTTCCCATCTCAATGCCATGTCAAAAGTCAG +GAAGGACATTTCAGAATGGCAGCCCTCCAAGGGGTGGACAGATTGGGAAAATGTTCCTTT +CTGCTCCCACCATTTCCATGAACTTGTGTTGAAAGATGGAAGGAAAGTTGTGGTGCCCTG +TAGAGACCAAGATGAGTTGATAGGAAGAGGGAGAGTGTCTCCAGGAAATGGCTGGATGAT +TAAAGAAACAGCTTGCCTTAGTAAGGCTTATGCAAACATGTGGTCACTGATGTATTTCCA +CAAGAGAGACATGAGGCTGCTCTCATTTGCTGTCTCATCGGCCGTTCCAACAGCATGGGT +CCCCAGTGGAAGAACAACATGGTCTGTTCATGGAAAAGGAGAGTGGATGACCACCGAAGA +CATGTTGGACGTCTGGAACAGAGTTTGGGTTTTAAACAACCCACACATGAAGGATAAGAC +TACCGTGAAGGAGTGGAGAGATGTTCCTTACCTCACAAAAAGGCAAGACAAACTCTGTGG +GTCCCTAATAGGAATGACAAACAGGGCCACATGGGCCTCACACATCCACCTGGTGATCCA +CCGAATTCGGACTTTGATCGGCCAAGAAAAATACACAGATTATCTCACTGTGATGGACAG +GTATTCGGTTGACGCTGACCTCCAACCAGGAGAGCTCATCTGAGACCAGCCATTGTGAAT +TAACCGGGATAAAAACTACGGGTGGAGAACCGGACTCCCCACTTCCAAAGCATCAACGAG +AAACCGGGATAAAAAACCACGGATGGAGAACCGGACTCCACACTTAAAAGGCTATTGACG +TCAGCCCAGGACNYCTAGAATTCTNWRGAGTCTTGCCACCGCTAAGCTGTGAGGCGGTGC +GGGCTGGGACAGCCGTTTTCCAGATCACGACAGATCTGGTTTCTGGGATTTCCCAACCCA +GAGTGAAATGATGGAGCCTCCGCCACCACCCACCCACGGGGTAGTGGAAAGATGGGGTCT +AGAGGTTAGAGGAGACCCTCCAGGGAAATTAGTGGGACCATATTGACGCCAGGGAAAGAC +CGGAGTGGTTCTCTGCTTTTCCTCCAGGGGTCTGCGAGCACAGTTTGCTCTAGAAGAAGC +AGACCTTTGGATGAAAAACACAAAACCACG