From 9754b1175e326f90cd9e96660cdc94aa889cffa1 Mon Sep 17 00:00:00 2001 From: Daniel Lundin Date: Mon, 14 Oct 2019 18:10:26 +0200 Subject: [PATCH] Handle empty fasta files (0.2.1) --- src/R-test/Makefile | 8 +- src/R-test/dada2idseq.02.expect | 648 ++++++++++++++++++++++++++++++++ src/R-test/dada2idseq.02.fna | 0 src/R/dada2idseq.R | 12 +- 4 files changed, 663 insertions(+), 5 deletions(-) create mode 100644 src/R-test/dada2idseq.02.expect create mode 100644 src/R-test/dada2idseq.02.fna diff --git a/src/R-test/Makefile b/src/R-test/Makefile index 2ba0d4a..f09c7b3 100644 --- a/src/R-test/Makefile +++ b/src/R-test/Makefile @@ -18,7 +18,7 @@ dada2cleanNmerge: dada2cleanNmerge.00 dada2bimeras: dada2bimeras.00 -dada2idseq: dada2idseq.00 dada2idseq.01 +dada2idseq: dada2idseq.00 dada2idseq.01 dada2idseq.02 dada2taxonomy: dada2taxonomy.00 @@ -57,6 +57,12 @@ dada2idseq.01: @gunzip -c $@.out.tsv.gz >> $@.out @$(CHECK) +dada2idseq.02: + @cp $@.fna $@.out + @../R/dada2idseq.R --verbose --prefix=S_ --fnafile=$@.out --outtable=$@.out.tsv.gz $@.tsv.gz + @gunzip -c $@.out.tsv.gz >> $@.out + @$(CHECK) + dada2taxonomy.00: @../R/dada2taxonomy.R --verbose --seed 42 \ --rdp_fasta ../../testdata/silva.fna.gz \ diff --git a/src/R-test/dada2idseq.02.expect b/src/R-test/dada2idseq.02.expect new file mode 100644 index 0000000..1620664 --- /dev/null +++ b/src/R-test/dada2idseq.02.expect @@ -0,0 +1,648 @@ +>S_000000001 +AACGTTATTCGGAATTACTGGGCTTAAAGGGTGCGTAGGCTGTGCGGAAAGTTAGGTGTGAAATCCCCCGGCTCAACCGGGGAATTGCGCTTAAAACTACCGTGCTAGAGGAAGACAGAGGTGAGCGGAACTTCGGGTGGAGCGGTGAAATGCGTTGATATCCGAAGGAACACCGGTGGCGAAAGCGGCTCACTGGGTCTTTTCTGACGCTGATGCACGAAAGCTAG +>S_000000002 +AACGTTATTCGGATTTACTGGGCTTAAAGAGTTCGTAGGCGGCGCAGAAAGTAGGGTGTGAAAGCCCTCGGCTCAACCGAGGAATTGCGCCCTAAACTACTGTGCTCGAGGAAGCTAGAGGTGAGCGGAACTGATGGTGGAGCGGTGAAATGCGTTGATATCATCAGGAACACCGGAGGCGAAGGCGGCTCACTGGGGCTTTTCTGACGCTGAGGAACGAAAGCCAG +>S_000000003 +AACGTTATTCGGATTTACTGGGCTTAAAGAGTTCGTAGGCGGCGCAGAAAGTAGGGTGTGAAAGCCCTCGGCTCAACCGAGGAATTGCGCCCTAAACTACTGTGCTTGAGGAAGCTAGAGGTGAGCGGAACTGATGGTGGAGCGGTGAAATGCGTTGATATCATCAGGAACACCGGAGGCGAAGGCGGCTCACTGGGGCTTTTCTGACGCTGAGGAACGAAAGCCAG +>S_000000004 +AACGTTGTTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGATCGGTAAGTCAGAGGTGAAATCCCGGGGCTCAACTCCGGGCCTGCCTCTGATACTGCCGTTCTAGAGTGCAGGAGAGGAAGGCGGAATTCCAGGTGTAGCGGTGGAATGCGTAGATATCTGGAAGAACACCAGTGGCGAAGGCGGCCTTCTGGACTGTTACTGACGCTGAGGCGCGAAAGCTAG +>S_000000005 +AACGTTGTTCGGAATCACTGGGCTTAAAGGGCGCGTAGGCGGGTCAGCAAGTCCGGGGTGAAATCTTTCGGCTCAACCGGAAAAGTGCCTTGGATACTGCTGGTCTAGAGGGAGGTAGGGGTCTGTGGAACTTCTGGTGGAGCGGTGAAATGCGTTGATATCAGAAGGAACGCCGGTGGCGAAAGCGACGGACTGGACCTCTTCTGACGCTGAGGCGCGAAAGCCAG +>S_000000006 +AACGTTGTTCGGAATTACTGGGCGTAAAGCGCGTGTAGGCGGCTATGCAAGTCGGATGTGAAAGCCCTCGGCTCAACCGGGGAAGGGCACCCGAAACTGCAAAGCTAGAGTCTCGGAGAGGATCGTGGAATTCTCGGTGTAGAGGTGAAATTCGTAGATATCGAGAGGAACACCGGTGGCGAAGGCGGCGATCTGGACGATGACTGACGCTGAGACGCGAAAGCGTG +>S_000000007 +AGCGTTAATCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGTTAGGTAAGTCGGATGTGAAAGCCCTGGGCTCAACCTGGGAATGGCATTCGAGACTGTCTATCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000008 +AGCGTTAATCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGTTAGGTAAGTCGGATGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGAGACTGTCTATCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000009 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGTAGGTGGCGATGTAAGTCGGGTGTGAAATCCCCGGGCTCAACCTGGGAATTGCATTCGAGACTGCATTGCTGGAGTACGGAAGAGGAAGGCGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACATCAGTGGCGAAGGCGGCCTTCTGGTCCAGTACTGACACTCAAGTGCGAAAGCGTG +>S_000000010 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTTTGCAAGTCGGGTGTGAAATCCCCAGGCTTAACCTGGGAACTGCATTCGAGACTGCATAGCTAGAGTATGGGAGAGGGAAGTGGAATTTCAGGTGTAGCGGTGAAATGCGTAGATATCTGAAGGAACATCAGTGGCGAAAGCGACTTCCTGGACCAATACTGACGCTCATGTGCGAAAGCGTG +>S_000000011 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTTTGCAAGTCGGGTGTGAAATCCCCAGGCTTAACCTGGGAACTGCATTCGAGACTGCATTGCTAGAGTATGGGAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGCGTAGATATCGGAAGGAACATCAGTGGCGAAAGCGACTTCCTGGACCAATACTGACGCTCATGTGCGAAAGCGTG +>S_000000012 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGCTTTGCAAGTCGGGTGTGAAATCCCCAGGCTTAACCTGGGAACTGCATTCGAGACTGCATTGCTAGAGTATGGGAGAGGGCAGTGGAATTTCCGGTGTAGCGGTGAAATGCGTAGATATCGGAAGGAACATCAGTGGCGAAAGCGACTGCCTGGACCAATACTGACGCTCATGTGCGAAAGCGTG +>S_000000013 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGTTTAGCAAGTCGGATGTGAAAGCCCCGGGCTTAACCTGGGAATTGCATTCGAGACTGCTTGGCTAGAGTTTGGTAGAGGAAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACATCAGTGGCGAAGGCGGCTTTCTGGACCAAAACTGACGCTGAGGTGCGAAAGCGTG +>S_000000014 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGCAGGCGGCGGCTTGTGTCAGGTGTGAAATCCCCGGGCTTAACCTGGGAATTGCGCTTGAAACTAAGCTGCTCGAGTTCAGTAGAGGGGGGTGGAATTCCAGGTGTAGCAGTGAAATGCGTAGAGATCTGGAGGAACACCAATGGCGAAGGCAGCCCCCTGGGCTGAAACTGACGCTCAGGCACGAAAGCGTG +>S_000000015 +AGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGTAGGCGGTTCGTTATGTCTGCTGTGAAAGCCCCGGGCTCAACCTGGGAATGGCAGTGGAAACTGGCGGGCTGGAGGGTGGCAGAGGGGGGTGGAATTCCGCGTGTAGCAGTGAAATGCGTAGAGATGCGGAGGAACACCGATGGCGAAGGCAGCCCCCTGGGCCGACCCTGACGCTCAGGCACGAAAGCGTG +>S_000000016 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTAAGTCGGGTGTGAAAGCCCCGGGCTCAACCTGGGAACTGCATCCGATACTGCTTCGCTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000017 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTAAGTCGGGTGTGAAAGCCCCGGGCTCAACCTGGGAACTGCATTCGATACTGCTTCGCTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000018 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTAAGTCGGGTGTGAAAGCCCCGGGCTCAACCTGGGAACTGCCTCCGATACTGCTTCGCTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000019 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTAAGTCGGGTGTGAAAGCCCTGGGCTCAACCTGGGAACTGCCTCCGATACTGCTTCACTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000020 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTCAGTCGGGTGTGAAAGCCCCGGGCTCAACCTGGGAACGGCATCCGATACTGCTTCGCTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000021 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTGAAGTCAGTCGGGTGTGAAAGCCCCGGGCTCAACCTGGGAACTGCATCCGATACTGCTTCGCTAGAGTATGGTAGAGGGAAGCGGAATTCCGGGTGTAGCGGTGAAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCAATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000022 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTCAGTGAGTCGGATGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGATACGGCTGGGCTAGAGTATGGTAGAGGGAAGTGGAATTTCCGGTGTAACGGTGAAATGTGTAGAGATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAATACTGACGCTCAAGCGCGAAAGCGTG +>S_000000023 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTCAGTGCGTTGGATGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGATACGGCTGGGCTAGAGTATGGTAGAGGGAAGTGGAATTTCCGGTGTAACGGTGAAATGTGTAGAGATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAATACTGACGCTCAAGCGCGAAAGCGTG +>S_000000024 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTGGGTAAGTCGGATGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGAGACTACCTATCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000025 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTGGGTAAGTCGGGTGTGAAAGCCCTGGGCTTAACCTGGGAACGGCATTCGAGACTACCTATCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000026 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTGGGTAAGTCGGGTGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGAGACCACCTATCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000027 +AGCGTTAATCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGTTGGGTAAGTCGGGTGTGAAAGCCCTGGGCTTAACCTGGGAATGGCATTCGAGACTACCTAGCTAGAGTCTGGTAGAGGGAAGTGGAATTTCCGGTGTAGCGGTGAAATGTGTAGATATCGGAAGGAACACCAGTGGCGAAGGCGACTTCCTGGACCAAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000028 +AGCGTTAATCGGAATTACTGGGCGTAAAGTGTGCGCAGGCGGCGTTGCAAGTCGAGTGTGAAAGCCCCGGGCTTAACTTGGGAATTGCGCTCGAAACTACGATGCTGGAGTGTGGCAGAGGAAGGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCGATGGCGAAGGCAGCCTTCTGGGCCAACACTGACGCTCATGCACGAAAGCGTG +>S_000000029 +AGCGTTACTCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTCTGTTAAGTCTGATGTGAAAGCCCTGGGCTCAACCTGGGAATTGCATTGGATACTGGCAGGCTAGAGTGCGGTAGAGGATGGCGGAATTCCCGGTGTAGCAGTGAAATGCGTAGAGATCGGGAGGAACATCTGTGGCGAAGGCGGCCATCTGGACCAGCACTGACACTGAGGCACGAAAGCGTG +>S_000000030 +AGCGTTAGGCGGAATCACTGGGCTTAAAGCGTGTGTAGGCGGATCGTTAAGTACCTTGTGAAATCCCACGGCTCAACCGTGGAACTGCTGGGTATACTGGCGGTCTTGAGCCACCTAGGGGCAACTGGAACAAGCGGTGGAGCGGTGAAATGCGTAGATATCGCTTGGAACGCCAACGGTGAAAACAGGTTGCTGGGGGTGTGCTGACGCTGAGACACGAAAGCCAG +>S_000000031 +AGCGTTATCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTCGCGTCTGCCGTGAAAGTCCGGGGCTCAACTCCGGATCTGCGGTGGGTACGGGCAGACTAGAGTGATGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTCTCTGGGCATTAACTGACGCTGAGGAGCGAAAGCATG +>S_000000032 +AGCGTTATCCGGATTCACTGGGCGTAAAGCGCGTGTAGGTGGCTCGCCAAGTCGAATGTGAAAGCCCCTGGCTCAACTGGGGGAGGTCATTCGATACTAGTGGGCTTGAGGGTAAGAGAGGAAGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAGGAACACCAGTGGCGAAGGCGGCCTTCTGGCTTACCCCTGACACTGAGACGCGAAAGCGTG +>S_000000033 +AGCGTTATCCGGATTCACTGGGCGTAAAGGGCGCGCAGGCGGTTACGTAAGTCCGGCGTGAAATCCCACGGCTTAACTGTGGAACTGCGTCGGATACTGCGTTGACTTGAGGATGGTAGAGGCCATTAGAACTAGCGGTGTAGCGGTGAAATGCGCAGATATCGCTAGGAATGCCGGTGGCGAAGGCGGATGGCTGGGCCACTCCTGACGCTGAGGCGCGAAAGCTAG +>S_000000034 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGATAGGTAAGTCCGTGGTGAAATCCTGCAGCTTAACTGCAGAACTGCCGTGGATACTATCTATCTTGAATATCGTGGAGGTTAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCCATTGCGAAGGCAGCTAACTACGCGATTATTGACGCTGATGCACGAAAGCGTG +>S_000000035 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGATTGGTAAGTCCGTGGTGAAATCTCCGAGCTTAACTCGGAAACTGCCATGGATACTATCAGTCTTGAATATCTTGGAGGTAAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTTACTACACGATAATTGACGCTGAGGCACGAAAGCGTG +>S_000000036 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGCGGGTTGGTAAGTCAGTGGTGAAATCTTCAAGCTTAACTTGGAAACTGCCGTTGATACTATCAATCTTGAATATTGTGGAGGTAAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCGATAGCGAAGGCAGCTTGCTACACAGTTATTGACGCTGAGGCACGAAAGCGTG +>S_000000037 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGTGGGCAGGTAAGTCAGTGGTGAAATCCCCGAGCTTAACTTGGGAACTGCCGTTGATACTATCTGTCTTGAATATCGCGTAGGTAAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTTACTTCACGATCATTGACACTGAGGCACGAAAGCGTG +>S_000000038 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGTGGGCAGGTAAGTCAGTGGTGAAATCTCCGGGCTTAACCCGGAAACTGCCATTGATACTATCTGTCTTGAATACCGTGGAGGTGAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTCACTACACGAATATTGACACTGAGGCACGAAAGCGTG +>S_000000039 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGTGGGTTGGTAAGTCAGTGGTGAAATCCCCGAGCTTAACTTGGGAACTGCCATTGATACTATCAGTCTTGAATACCGTGGAGGTTAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTGGCTACACGAATATTGACACTGAGGCACGAAAGCGTG +>S_000000040 +AGCGTTATCCGGATTCACTGGGTTTAAAGGGTGCGTAGGTGGGTTGGTAAGTCAGTGGTGAAATCTCCGTGCTTAACATGGAAACTGCCATTGATACTACTGGTCTTGAATTTTCTGGAGGATAGCGGAATATGTCATGTAGCGGTGAAATGCTTAGATATGACATAGAACACCAATTGCGAAGGCAGCTATCTACAGGGATATTGACACTGAGGCACGAAAGCGTG +>S_000000041 +AGCGTTATCCGGATTCATTGGGTTTAAAGGGTGCGTAGGCGGCCCGATAAGTCAGTGGTGAAAGCCTGTTGCTTAACAACAGAACTGCCATTGATACTGTCGGGCTTGAGTACAGATGCTGTGGGCGGAATATGACATGTAGTGGTGAAATACATAGAGATGTCATAGAACACCGATTGCGAAGGCAGCTCACAAAACTGTAACTGACGCTGAGGCACGAAAGTGCG +>S_000000042 +AGCGTTATCCGGATTTACTGGGCGTAAAGAGCGCGTAGGCGGTTCCGTAAGTTGGTTGTGAAAGTTCGAGGCTCAACCTCGAAACTGCGTCCAATACTGCGGGGCTGGAGTGCAAGAGAGGCAAGTGGAATTTGCGGTGTAGTAGTGAAATGCGTAGATATCGCAAGGAACACCAGTGGCGAAGGCGGCTTGCTAGCTTGTAACTGACGCTGAGGCGCGAAAGCTAG +>S_000000043 +AGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGCCTGTTAAGTCAGGGGTGAAAGGTTGCGGCTTAACCGCAGAATTGCCTTTGATACTGGCGGGCTTGAATAAAGTTGAGGTAGGCGGAATGTGGCAAGTAGCGGTGAAATGCATAGAGATGCCACAGAACACCGATTGCGAAGGCAGCTTACTAAGCTTTGATTGACGCTGAGGCACGAAAGCGTG +>S_000000044 +AGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGTGGCCTGTTAAGTCAGGGGTGAAAGACGGTAGCTTAACTATCGCAGTGCCTTTGATACTGACGGGCTTGAATACACTAGAGGTAGGCGGAATGTGACAAGTAGCGGTGAAATGCATAGATATGTCACAGAACACCAATTGCGAAGGCAGCTTACTATGGTGTCATTGACACTGAGGCACGAAAGCGTG +>S_000000045 +AGCGTTATTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGCACGACGTGTCCAAGGTGAAATCCCTCGGCTCAACTGAGGAACTGCCTTGGAAACTGTCGAGCTTGAGGCCGGGAGGGGGTAGCGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTGGGAGGAACACCAGTGGCGAAGGCGGCTACCTGGACCGGTTCTGACGCTGATGCGCGAAAGCGTG +>S_000000046 +AGCGTTATTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGCCCGGTAAGTCAAAGGTGAAATCCCTCGGCTCAACTGAGGAACTGCCTTTGAAACTGTCGGGCTTGAGGCCGGGAGGGGGTAGCGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTGGGAGGAACACCAGTGGCGAAGGCGGCTACCTGGACCGGTTCTGACGCTGATGCGCGAAAGCGTG +>S_000000047 +AGCGTTATTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGCCTGGCAAGTGGATGGTGAAATCCCTCGGCTTAACCGAGGAACTGCCATCCAGACTGCTTGGCTTGAGACCGGGAGAGGTGAGTGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTGGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGACCGGTACTGACGCTGATGCGCGAAAGCGTG +>S_000000048 +AGCGTTATTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGCTTGGCAAGTGGAAGGTGAAATCCCTCGGCTTAACCGAGGAACTGCCTTCCAGACTGCTTGGCTTGAGACCAGGAGAGGTGAGTGGAATTCCCAGTGTAGCGGTGAAATGCGTAGATATTGGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGACTGGTACTGACGCTGAGGCGCGAAAGCGTG +>S_000000049 +AGCGTTATTCGGATTCACTGGGCGTAAAGGGTGCGCAGGCGGCCAAGTGTGTGAGGCGTGAAAGCCTGGAGCTTAACTCCAGAATTGCACCTCAAACTACTTGGCTAGAGCATTGGAGAGGGTAGCAGAATTCATGGTGTAGCAGTGAAATGCGTAGATATCATGAGGAATACCAGAGGCGAAGGCGGCTACCTGGACAATTGCTGACGCTCAGGCACGAAAGCGTG +>S_000000050 +AGCGTTATTCGGATTCACTGGGCGTAAAGGGTGCGCAGGCGGCCATGTGTGTGAGGCGTGAAAGCCCGATGCTTAACATCGGAATTGCACCTCAAACTACATGGCTAGAGCATTGGAGAGGGAAGCGGAATTCACGGTGTAGCAGTGAAATGCGTAGATATCGTGAGGAACACCAGAGGCGAAGGCGGCTTCCTGGACAATTGCTGACGCTCAGGCACGAAAGCGTG +>S_000000051 +AGCGTTGCCCGGATTCACTGGGCGTAAAGCGGGTGTAGGCGGTTCCTTAAGTCAGATGTGAAATCCAGCGGCCCAACCGCTGAATTGCATCTGATACTGGGGAACTTGAGGACGGTAGAGGTCGGTGGAATTCCCGGTGTACCGGTGAAATGGGCAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCCGACTGGGCCGATCCTGACGCTGAGACCCGAAAGCCAG +>S_000000052 +AGCGTTGCCCGGATTCACTGGGCGTAAAGCGGGTGTAGGCGGTTCCTTAAGTCAGATGTGAAATCCTACGGCTCAACCGTGGAATTGCATCTGATACTGGGGAACTTGAGGACGGTAGAGGTCGGTGGAATTCCCGGTGTACCGGTGAAATGGGCAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCCGACTGGGCCGATCCTGACGCTGAGACCCGAAAGCCAG +>S_000000053 +AGCGTTGCCCGGATTTATTGGGCGTAAAGGGCGCGCAGGCGGCTCGGCACGTCCGTTGTGAAATCGCCCGGCTCAACTGGGCGGGGTCAGCGGATACGGCCGAGCTGGAGCAAGCTAGGGGGCAATGGAATTCCCGGTGTAGTGGTGGAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGTTGCCTGGAGCTTTGCTGACGCTGAGGCGCGAAAGCGTG +>S_000000054 +AGCGTTGCTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGGATGGCAAGTCAGTCGTGAAATCTCTCGGCTCAACCGAGAAACGTCGGCTGATACTGCCGTTCTTGAGGGATGCAGAGGAGACTGGAATTCCCGGTGTAGCGGTGAAATGTGTAGAGATCGGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCATTTCCTGACGCTGAGGCGCGAAAGCGTG +>S_000000055 +AGCGTTGCTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGGATGGCAAGTCGGTCGTGAAATCTCTCGGCTCAACCGAGAAACGTCGGCCGATACTGCCGTTCTTGAGGGATGCAGAGGAGACTGGAATTCCCGGTGTAGCGGTGAAATGTGTAGAGATCGGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCATTTCCTGACGCTGAGGCGCGAAAGCGTG +>S_000000056 +AGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAAGTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTG +>S_000000057 +AGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATGCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTG +>S_000000058 +AGCGTTGCTCGGAATCACTGGGCGTAAAGGGTGCGTAGGCGGGTCTTTAAGTCAGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTTGATACTGAAGATCTTGAGTTCGGGAGAGGTGAGTGGAACTGCGAGTGTAGAGGTGAAATTCGTAGATATTCGCAAGAACACCAGTGGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCACGAAAGCGTG +>S_000000059 +AGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTGATAAGTAGGGGGTGAAATCCTGCGGCTTAACCGCAGGGCTGCCTTCTAAACTGTCAGGCTCGAGCACAGTAGAGGCAGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAAGAACATCAGTGGCGAAGGCGGCCTGCTGGGCTGTTGCTGACGCTGAGGCGCGACAGCGTG +>S_000000060 +AGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTGATAAGTAGGGGGTGAAATCCTGCGGCTTAACCGCAGGGCTGCCTTCTAAACTGTCAGGCTTGAGCACAGTAGAGGCAGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAAGAACATCAGTGGCGAAGGCGGCCTGCTGGGCTGTTGCTGACGCTGAGGCGCGACAGCGTG +>S_000000061 +AGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTGATAAGTAGGGGGTGAAATCCTGCGGCTTAACCGCAGGGCTGCCTTCTAAACTGTCGGGCTCGAGCACAGTAGAGGCAGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAAGAACATCAGTGGCGAAGGCGGCCTGCTGGGCTGTTGCTGACGCTGAGGCGCGACAGCGTG +>S_000000062 +AGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCCTGATAAGTAGGGGGTGAAATCTTGCGGCTTAACCGCAAGGCTGCCTTCTAAACTGTCAGGCTAGAGCACAGTAGAGGCAGGTGGAATTCCCGGTGTAGCGGTGGAATGCGTAGAGATCGGGAAGAACATCAGTGGCGAAGGCGGCCTGCTGGGCTGTTGCTGACGCTGAGGCGCGACAGCGTG +>S_000000063 +AGCGTTGTCCGGAATCACTGGGCGTAAAGGGCGCGTAGGTGGTTTGATAAGGGTGTGGTGAAAGTCCGGGGCTCAACCCCGGATCTGCCGTGCCGACTGTCAAACTCGAGGACTGTAGAGGCAGACGGAATTCCGGGTGTAGCGGTGGAATGCGTAGAGATCCGGAGGAAGACCGGTGGCGAAGGCGGTCTGCTGGGCAGTTTCTGACACTGAGGCGCGACAGCGTG +>S_000000064 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGCGCAGGCGGCTTGGCAAGTCGGGTGTGAAATCCCGGGGCTCAACCCCGTGACTGCATCCGATACTGTCAGGCTAGAGGTAGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCTTACCTGACGCTCAGGCGCGAAAGCTAG +>S_000000065 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGCGTAGGCGGTCCGGTAAGTCTGCCGTGAAAGCCAGGGGCTCAACCCTTGGATGCCGGTGGATACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCTATGGCGAAGGCAGCTCGCTGGGACGGAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000066 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGCCCGGTAAGTCCGCTGTGAAAGTCGAGGGCTCAACCCTCGAATGCCGGCGGATACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000067 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCCGCTGTGAAAGCCAAGGGCTCAACCCTTGAATGCCGGCGGATACTGCCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000068 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000069 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACTCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000070 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTTAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTCCGGAAGAGGCAAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAATGGCGAAGGCAGCTTGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000071 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCCGCTGTGAAAGTCCAGGGCTCAACCCTGGAATGCCGGTGGATACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000072 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCTCGTAGGCGGCTCGGTAAGTCGGGTGTGAAACCCTCAGGCTCAACCTGGGGACGCCACCCGATACTGCCGTGGCTAGAGTCCAGTAGGGGAGTGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGCGGCGAAGGCGGCACTCTGGGCTGGTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000073 +AGCGTTGTCCGGAATCATTGGGCGTAAAGAGCTCGTAGGCGGCTCGGTAAGTCGGGTGTGAAACCCTCAGGCTCAACCTGGGGACGCCACCCGATACTGCTGTGGCTAGAGTCCAGTAGGGGAGTGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGCGGCGAAGGCGGCACTCTGGGCTGGTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000074 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGCGTAGGCGGCCCGATCAGTCTGCTGTGAAAGTCGGAGGCTCAACCTCCGAATGCCGGTGGATACTGTCGGGCTAGAGTCCGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATGGCGAAGGCAGCTCGCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000075 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGCCCGATAAGTCCGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTGGATACTGTCGGGCTCGAGTCCGGAAGAGGAGTGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATGGCGAAGGCAGCACTCTGGGACGTGACTGACGCTGAGACGCGAAAGCGTG +>S_000000076 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGCCCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAATGCCGGTGGATACTGTCGGGCTCGAGTACGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATTGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000077 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTCCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAAAGCCGGTGGATACTGTTGGGCTAGAGTACGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATTGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000078 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAATGGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000079 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000080 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTTCGGTAAGTCCGCTGTGAAAGTCGGGGGCTCAACCCTCGAAAGCCGGTGGATACTGTCGGGCTAGAGTACGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCAATTGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000081 +AGCGTTGTCCGGAATCATTGGGCGTAAAGCGCGTGTAGGCGGTTTGGTAAGTCCGCTCTGAAAGTCCGGGGCTCAACCCCGGAAGGCGGGTGGATACTGCCAGGCTAGAGTACGGAAGAGGCGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATTGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000082 +AGCGTTGTCCGGAATCATTGGGCGTAAAGGGCGCGTAGGTGGCCCGGTCAGTTCGTGGTGAAAGCGCGGGGCTCAACCCCGCGTCGGCCAGGAATACTGCGGGGCTGGAGCACTGTAGAGGCAGGCGGAATTCCGGGTGTAGCGGTGGAATGCGTAGAGATCCGGAAGAACACCGGTGGCGAAGGCGGCCTGCTGGGCAGTTGCTGACACTGAGGCGCGACAGCGTG +>S_000000083 +AGCGTTGTCCGGAATTACTGGGCGTAAAGAGCTCGTAGGTGGTTTGTCGCGTTGTTCGTGAAAACTCACAGCTTAACTGTGGGCGTGCGGGCGATACGGGCAGACTGGAGTACTGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCAGTAACTGACGCTGAGGAGCGAAAGCGTG +>S_000000084 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTCCGGTAAGTCGGCTGTGAAAGTCCAGGGCTCAACCCTGGGATGCCGGTCGATACTGCCGGACTAGAGTTCGGAAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCTATGGCGAAGGCAGCTCGCTGGGACGTTACTGACGCTGAGACGCGAAAGCGTG +>S_000000085 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGCCGTGAAAACCCAGGGCTCAACCCTGGGCGTGCGGTGGATACTGCCGGGCTAGAGGGTGGTAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCGCTGGGCCACACCTGACGCTGAGACGCGAAAGCGTG +>S_000000086 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGCCGTGAAAACCTGGGGCTCAACCCCAGGCGTGCGGTGGAAACTGTCGGACTAGAGGATGGTAGAGGGGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCCCTGGGCCATTCCTGACGCTGAGACGCGAAAGCGTG +>S_000000087 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGCCGTGAAAACCTGGGGCTCAACCCCGGGCGTGCGGTGGATACTGCCGGGCTAGAGGATGGTAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCGCTGGGCCATTCCTGACGCTGAGACGCGAAAGCTAG +>S_000000088 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGCCGTGAAAACCTGGGGCTCAACCCCGGGCGTGCGGTGGATACTGCCGGGCTAGAGGGTGGTAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCGCTGGGCCATTCCTGACGCTGAGACGCGAAAGCTAG +>S_000000089 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGCTGTGAAATCCTGGGGCTCAACCCCGGGCGTGCAGCGGATACTGCCGGGCTAGAGGATGGTAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCGCTGGGCCATTCCTGACGCTGAGACGCGAAAGCTAG +>S_000000090 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCGTGTAGGCGGTTCGGTAAGTCTGTCGTGAAATCCTGGGGCTCAACCCCGGGCGTGCGATGGATACTGCCGGGCTAGAGGGTGGTAGAGGCGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCAGTAGCGAAGGCGGCTCGCTGGGCCACACCTGACGCTGAGACGCGAAAGCGTG +>S_000000091 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCGTGTCACGTCGGATGTGAAAGCCCGGGGCTTAACCCTGGGTCTGCATTCGATACGGGCAGGCTAGAGTTCGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCATG +>S_000000092 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTCACGTCGGATGTGAAAGCCCGGGGCTTAACCCCGGGTCTGCATTCGATACGGGCAGGCTAGAGTGTGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCATTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000093 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGCTTGTCGCGTCGGATGTGAAAGCCCGGGGCTTAACCCCGGGTCTGCATTCGATACGGGCAGGCTAGAGTGTGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCATTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000094 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTCTGTCACGTCTGCCGTGAAAACCCGAGGCTTAACCTCGTGGCTTGCGGTGGATACGGGCAGACTAGAGGTAGGTAGGGGAGAACGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCCTTACCTGACGCTGAGGAGCGAAAGCATG +>S_000000095 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTGTGTCACGTCGGTCGTGAAAACTTGGGGCTTAACCCTGAGCGTGCGGTCGATACGGGCATCACTTGAGTTCGGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTG +>S_000000096 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTGTGTCACGTCGGTCGTGAAAACTTGGGGCTTAACCCTGAGCTTGCGGTCGATACGGGCATCACTTGAGTTCGGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTG +>S_000000097 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTTGCGTCGGCCGTGAAAACTTCACGCTTAACGTGGAGCTTGCGGTCGATACGGGCAGACTTGAGTTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGATACTGACGCTGAGGAGCGAAAGCGTG +>S_000000098 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTTGCGTCGGCTGTGAAATCCCGAGGCTCAACCTCGGGTCTGCAGTCGATACGAGCAAACTAGAGTGTTGCAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCAACAACTGACGCTGAGGAGCGAAAGCGTG +>S_000000099 +AGCGTTGTCCGGAATTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGTTGCGTCTATCGTGAAAACCTGGGGCTCAACCCCGGGCCTGCGGTGGATACGGGCAGACTTGAGTTCGGTAGGGGAGACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGTCTCTGGGCCGAAACTGACGCTGAGGAGCGAAAGCGTG +>S_000000100 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGCAGCTTAAGTCTGGTGTTTAAGCCCGGGGCTCAACCCCGGTTCGCATCGGAAACTGGGCTGCTTGAGTGTAGGAGAGGAAAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGCCTATAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000101 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGCCTTGTAAGTCTAGTGTTTAATCTCGAAGCTCAACTTCGATTCGCACTGGAAACTGCAAAGCTTGAGTACAGAAGAGGAAAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGGCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000102 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGCTTTGTAAGTCTAGCGTTTAAGCTCGGGGCTCAACCCCGATACGCGCCGGAAACTGCAAGGCTTGAGTGCAGAAGAGGAAAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGGCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000103 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGAGGGACTTGAGTACAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000104 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGGACTTGAGTACAGAAGAGAAGAGTGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGACTCTTTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000105 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGGACTTGAGTACAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000106 +AGCGTTGTCCGGAATTATTGGGCGTAAAGCGCGCGCAGGCGGTCCTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAGGGTCATTGGAAACTGGGGGACTTGAGTGCAGAAGAGGAAAGCGGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGCGAAGGCGGCTTTCTGGTCTGTAACTGACGCTGAGGCGCGAAAGCGTG +>S_000000107 +AGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTCCGTTACGTCGGGAGTGAAAACTCGGAGCTTAACTCCGAGCCTGCTTCCGATACGGGCGGACTAGAGGTAGGCAGGGGAGAGCGGAACTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAAGAACACCGGTGGCGAAGGCGGCTCTCTGGGCCTTACCTGACGCTGAGGAGCGAAAGCGTG +>S_000000108 +AGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTCGTCGCGTCGGGAGTGAAAACTCGGAGCTCAACTCCGAGCCTGCTTCCGATACGGGCAGACTAGAGGTAGGCAGGGGAGAGCGGAACTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAAGAACACCGGTGGCGAAGGCGGCTCTCTGGGCCTTACCTGACGCTGAGGAGCGAAAGCGTG +>S_000000109 +AGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTTGTCGCGTCGGGAGTGAAAACCCAGGGCTTAACTCTGGGCTGGCTTTCGATACGGGCAGACTAGAGGCATGCAGGGGAGAACGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCATGTCCTGACGCTGAGGAGCGAAAGTGTG +>S_000000110 +AGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTTGTCGCGTCGGGAGTGAAAACTCAGGGCTCAACCCTGAGCGTGCTTCCGATACGGGCAGACTAGAGGTATGCAGGGGAGAACGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGTTCTCTGGGCATTACCTGACGCTGAGGAGCGAAAGCATG +>S_000000111 +AGCGTTGTCCGGAGTTACTGGGCGTAAAGCGCGCGCAGGCGGCGGTGCTGGCCCGGCGTGAAAGCCCCCGGCTCAACCGGGGAGGGTCGTCGGGGACCGCACCGCTTGAGGGCGGTAGGGGCTGGTGGAATGCCTGGTGTAGTGGTGAAATGCGTAGAGATCAGGCGGAACACCCGTGGCGAAGGCGGCCAGCTGGGCCGTCCCTGACGCTGAGGCGCGAAGGCGTG +>S_000000112 +AGCGTTGTCCGGATTCATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCCGCTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGGCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCATGGCGAAGGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000113 +AGCGTTGTCCGGATTCATTGGGCGTAAAGCGCGCGCAGGCGGCCGCGCAAGTCGGTTGTGAAATCCCGGGGCTCAACCCCGGGACTGCATCCGATACTGCGTGGCTCGAGGCAGGTAGGGGAGAGCGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGGTGGCGAAGGCGGCTCTCTGGGCCTGTCCTGACGCTCAGGCGCGAAAGCTAG +>S_000000114 +AGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGCTGATTAAGTCTGATGTGAAATCTCCCGGCTCAACCGGGAAACTGCATCGGAAACTGATCGGCTTGAAGGTGGGAGAGGGTAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGACTACCTGGCCCATTCTTGACGCTGAGGCGCGAAAGCTAG +>S_000000115 +AGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGTCATGCAAGTCGGTTGTGAAAGCCCCCGGCTCAACTGGGGAGGGACATTCGATACTGCTCGACTCGAAGGCAGGAGAGGGAAGCGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGCCTGTTCTTGACGCTGAGGCGCGAAAGCTAG +>S_000000116 +AGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGTCGTGCAAGTCGCGTGTGAAAGCCCCCGGCTCAACTGGGGAGGGTCACGCGATACTGCTCGACTTGAAGGCAGGAGAGGGAAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGACTTCCTGGCCTGTTCTTGACGCTGAGGCGCGAAAGCTAG +>S_000000117 +AGCGTTGTCCGGATTTACTGGGCGTAAAGAGCGCGCAGGCGGTCGTTCAAGTCGCGTGTGAAAGCCCCCGGCTCAACTGGGGAGGGTCACGCGATACTGATCGACTCGAAGGCAGGAGAGGGTAGTGGAATTCCCGGTGTAGTGGTGAAATGCGTAGATATCGGGAGGAACACCAGTGGCGAAGGCGACTACCTGGCCTGTTCTTGACGCTGAGGCGCGAAAGCTAG +>S_000000118 +AGCGTTGTCCGGATTTACTGGGTGTAAAGCGCGCGCAGGCGGTCTCGAAAGTCCACGGTGAAAGCTCCCGGCCCAACTGGGAGAGGCCCGTGGAAACTTCGGAACTTGAAGGCGGGAGAGGCAAATGGAATTTCCGGTGTAGCGGTAAAATGCGTAGATACCGGAAGGAACACCAGTGGCGAAGGCGATTTGCTGGCCCGCACTTGACGCTCAGGCGCGAAAGCTAG +>S_000000119 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGCGTAGGCGGCTCGGAAAGTCGGACGTGAAAACCCGGGGCTCAACCCCGGGCCTGCGTCCGATACTCCCGGGCTAGAGGCAGGTAGGGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGGTGGCGAAGGCGGCTCTCTGGACCTGTCCTGACGCTCAGGCGCGAAAGCTAG +>S_000000120 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGCGTAGGCGGCTCGGAAAGTCGGTTGTGAAATCCCAGGGCTCAACCCCGGGACTGCGTCCGATACTGCCGAGCTAGAGGCAGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCTGTCCTGACGCTGAGGCGCGAAAGCTAG +>S_000000121 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGCGTAGGCGGTTCGGAAAGTCGGGTGTGAAAACCCGGGGCTCAACCCCGGGCCTGCATCCGATACTGTCGAACTAGAGGCAGACAGGGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCTCTCTGGGTCTGTCCTGACGCTCAGGCGCGAAAGCTAG +>S_000000122 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGACAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGACGGAAACCGTCTGGCTAGAGTCCGGAAGAGGAGTGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCTATGGCGAAGGCAGCACTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000123 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGACAGGTCCGTTGTGAAAACTGGAGGCTCAACCTCCAGCCGTCGATGGAAACCGTCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCCGTGGCGAAAGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000124 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGATAAGTCTGCTGTGAAAACTCGAGGCTCAACCTCGAGCTGTCGGCGGAAACTATTTGGCTAGAGTCCGGAAGAGGAAAGCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTTTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000125 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCCGCTGTGAAAACTCGAGGCTCAACCTCGAGATGTCGGTGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAATATCCGTGGCGAAGGCGGCTCTCTGGTACGGCACTGACGCTGAGACGCGAAAGCGTG +>S_000000126 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCCGGTGTGAAAACTCGAGGCTTAACCTCGAGATGTCATCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCTATGGCGAAAGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000127 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGATGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTAGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000128 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCTGCTGTGAAAACTCGAGGCTTAACCTCGAGATGTCGGCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAATGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCCGTGGCGAAGGCGGTTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000129 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCAGGTAGGTCTGGTGTGAAAACTCGAGGCTCAACCTCGAGATGTCATCGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCATGGCGAAGGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000130 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCGAATAAGTCTGACGTGAAATCTGGAGGCTCAACCTCCAGCTGTCGTTGGAAACTATTCGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCTATGGCGAAGGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000131 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCCGGATAAGTCTGACGTGAAATCTGGAGGCTCAACCTCCAGCTGTCGTTGGAAACTATTCGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAAGAACACCCATGGCGAAGGCAGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000132 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCTAGATAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGATGGAAACCATCTGGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGTACGTGACTGACGCTGAGACGCGAAAGCGTG +>S_000000133 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCTAGGTAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGCCGGTGGAAACCATCTAGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGGACGTGACTGACGCTGAGACGCGAAAGCGTG +>S_000000134 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGCTAGGTAGGTCCGTTGTGAAAACTCGAGGCTCAACCTCGAGACGTCGATGGAAACCATCTAGCTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCCGTGGCGAAGGCGGCTCTCTGGTACGTGACTGACGCTGAGACGCGAAAGCGTG +>S_000000135 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCGTGTAGGCGGTTAGGTAGGTCTGCTGTGAAAACTCCAGGCTCAACCTGGAGACGTCGGTGGAAACCATCTGACTAGAGTCCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAAGAACACCTGTTGCGAAGGCGGCTCTCTGGGACGGTACTGACGCTGAGACGCGAAAGCGTG +>S_000000136 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGGCAAGTCGGGTGTGAAAACTCCGAGCTCAACTCGGAGACGCCACTCGATACTGCCATGACTCGAGTCCGGTAGGGGAGTGCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCACTCTGGGCCGGTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000137 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTTGGCAAGTCGGGTGTGAAAACTCCGGGCTCAACTCGGAGACGCCACTCGATACTGCCATGACTCGAGTCCGGTAGGGGAGTGCGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGCACTCTGGGCCGGTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000138 +AGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGTGGCTGTTCAAGTCGGGTGTGAAATCCCAAGGCTCAACCTTGGGTCTGCATTCGATACTGGGTGGCTTGAGTCTGGTAGGGGGACCTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGGGTCCTGGGCCAGTACTGACGCTGAGGAGCGAAAGCGTG +>S_000000139 +AGCGTTGTCCGGATTTATTGGGCGTAAAGCGCGCGCAGGCGGCCACGTAAGTCGGATGTGAAATCCCGGGGCTCAACCCCGGAACTGCATTCGATACTGCGTGGCTCGAGGTAGGTAGGGGAGATCGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCCTTACCTGACGCTCAGGCGCGAAAGCTAG +>S_000000140 +AGCGTTGTCCGGATTTATTGGGCGTAAAGCGCGCGTAGGCGGCTCGTTAAGTCGGTTGTGAAAACCCGGGGCTCAACCCCGGGCCTGCGTCCGATACTGGCGAGCTGGAGGCAGGTAGGGGAGAGTGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGGTGGCGAAGGCGGCTCTCTGGGCCTGTCCTGACGCTCATGCGCGAAAGCTAG +>S_000000141 +AGCGTTGTCCGGATTTATTGGGCGTAAAGCGCGTGTAGGCGGCCAGACAGGTCTGCTGTGAAAACTCGAGGCTCAACCTCGAGAGGTCGGTAGAAACCGTCTGGCTAGAGTGCGGAAGAGGAGAGTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCCGTGGCTAAGGCGGCTCTCTGGTACGCAACTGACGCTGAGACGCGAAAGCGTG +>S_000000142 +AGCGTTGTCCGGATTTATTGGGCGTAAAGCGCTCGCAGGCGGCTAGGCCAAGTCGTGCGTGAAATCTCTCGGCTCAACTGAGAGTTGTCGTGCGATACTGGTCAGCTCGAGGCCGGTAGGGGGAAGCGGAATTCCGGGTGTAGTGGTGGAATGCGTAGATATCCGGAGGAACACCAGTGGCGAAGGCGGCTTCCTGGACCGGTTCTGACGCTCAGGAGCGAAAGCGTG +>S_000000143 +AGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGCGGCTCGTCGCGTCTGCCGTGAAAGGCTCCGGCTTAACCGGGGTTTGGCGGTGGATACGGGCGGGCTTGAGGCCAGTAGGGGAGATCGGAATTCTACGTGTAGCGGTGAAATGCGCAGATATGTGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGCTGGTGCTGACGCTGAGGAGCGAAAGCGTG +>S_000000144 +AGCGTTGTCCGGATTTATTGGGCGTAAAGGGCTCGTAGGCGGTTGATTGCGTCCGCCGTGAAAGGCCTCGGCTTAACCGGGGTTTTGCGGTGGATACGGGTCGACTTGAGGCAATTAGGGGAGATCGGAATTCTACGTGTAGCGGTGAAATGCGCAGATATGTGGAGGAACACCGGTGGCGAAGGCGGATCTCTGGGATTGTTCTGACGCTGAGGAGCGAAAGCGTG +>S_000000145 +AGCGTTGTTCGGAATCACTGGGCGTAAAGCGCACGTAGGCGGATGTGCCAGTCAGGGGTGAAATCCCGGAGCTCAACTCCGGAACTGCCTCTGATACAGCACGTCTTGAGTTCGAGAGAGGTGGGTGGAATTCCTAGTGTAGAGGTGAAATTCGTAGATATTAGGAAGAACACCGGTGGCGAAGGCGGCCCACTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTG +>S_000000146 +AGCGTTGTTCGGAATCACTGGGCGTAAAGGGCGCGTAGGCGGCTGTGGCAGTCGGGTGTGAAAGCCCGGAGCTCAACTCCGGAACGGCACTCGAGACGCCACGGCTGGAGGCCGGAAGAGGAGGGTGGAATACCCAGTGTAGAGGTGAAATTCGTAGATATTGGGTGGAACACCGGTGGCGAAAGCGGCTCTCTGGTCCGGACCTGACGCTGAGGCGCGAAAGCGTG +>S_000000147 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGAGTGTAGGTGGTTGTCCAAGTTGGATGTGAAAGCCTTGAGCTCAACTCAAGAAATGCATTCAGGACTGGATGGCTAGAGGACCGGAGAGGATAGTGGAATTCCCAGTGTAGTGGTGAAATACGTAGAGATTGGGAAGAACACCAGTGGCGAAGGCGGCTATCTGGACGGTTTCTGACACTAAGACTCGAAAGCGTG +>S_000000148 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGAGTGTAGGTGGTTGTCCAAGTTGGATGTGAAAGCCTTGAGCTCAACTCAAGAAATGCATTCAGGACTGGGCGGCTAGAGGACCGGAGAGGATAGTGGAATTCCCAGTGTAGTGGTGAAATACGTAGAGATTGGGAAGAACACCAGTGGCGAAGGCGGCTATCTGGACGGTTTCTGACACTAAGACTCGAAAGCGTG +>S_000000149 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGGGCTCAACTCCGGAACTGCCTTTAAGACTGCATCGCTTGAATCCAGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGACTGGTATTGACGCTGAGGTGCGAAAGCGTG +>S_000000150 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGGGCTCAACTCCGGAATTGCCTTTAAGACTGCATCGCTAGAACGTCGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGACTCACTGGACGACCGTTGACGCTGAGGTGCGAAAGCGTG +>S_000000151 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGGGCTCAACTCCGGAATTGCCTTTAAGACTGCATCGCTAGAATTGTGGAGAGGTAAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGACTTACTGGACACATATTGACGCTGAGGTGCGAAAGCGTG +>S_000000152 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGGGCTCAACTCCGGAATTGCCTTTAAGACTGCATCGCTAGAATTGTGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGACTCACTGGACACATATTGACGCTGAGGTGCGAAAGCGTG +>S_000000153 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGCTTTGTAAGTTAGAGGTGAAAGCCCGGGGCTCAACTCCGGAATTGCCTTTAAGACTGCATCGCTTGAATCCGGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGACCGGTATTGACGCTGAGGTGCGAAAGCGTG +>S_000000154 +AGCGTTGTTCGGAATTACTGGGCGTAAAGCGCGCGTAGGCGGGCATCTAAGTCAGGGGTGAAATGCCAGGGCTCAACCTTGGAATTGCCTTTGATACTGGATGTCTGGAGTTCGGGAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGAAGCGAAGGCGGCTCACTGGCCCGATACTGACGCTGAGGCGCGAAAGCGTG +>S_000000155 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCGCCTAAGTCAGACGTGAAATCCCTCGGCTCAACCGGGGAACTGCGTCTGAGACTGGGTGGCTTGAATCCGGGAGAGGGATGTGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGAGGCGCGAAAGCCAG +>S_000000156 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCCTGCTAAGTCGAACGTGAAATCCCCGGGCTCAACCCGGGAACTGCGTTCGATACTGGTTGGCTTGAATTCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGAGGCGCGAAAGCCAG +>S_000000157 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGCGACCCAAGTCAGATGTGAAAGTCCTGGGCTTAACCTGGGGACTGCATTTGATACTGGGTTGCTTGAATTCGGGAGAGGATAGCGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCTATCTGGACCGACATTGACGCTGAGGCGCGAAAGCGTG +>S_000000158 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCAGACGTGAAATCCCCAGGCTCAACCTGGGAACTGCGTCTGAGACTGGATGGCTTGAATCCGGGAGAGGGATGCAGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGGCATTGACGCTGAGGAGCGAAAGCCAG +>S_000000159 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCGGACGTGAAATCCCCAGGCTCAACCTGGGAACTGCGTCCGATACTGGATGGCTTGAATTCGGGAGAGGGATGCAGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGACATTGACGCTGAGGAGCGAAAGCTAG +>S_000000160 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCGGACGTGAAATCCCTCAGCTTAACTGGGGAACTGCGTCCGATACTGGATGGCTTGGATTTGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCAATATTGACGCTGAGGAGCGAAAGCCAG +>S_000000161 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGCGGCCAACTAAGTCGGATGTGAAATCCCCAGGCTCAACCTGGGAACTGCATCCGATACTGGATGGCTTGAATTCGGGAGAGGGATGCAGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAATACCGGTGGCGAAGGCGGCATCCTGGACCGACATTGACGCTGAGGAGCGAAAGCTAG +>S_000000162 +AGCGTTGTTCGGAATTACTGGGCGTAAAGGGCTCGTAGGTGGCCTCTTAAGTCAGACGTGAAATCCCTCGGCTCAACCGGGGAACTGCGTCTGAGACTGAAAGGCTTGAATCCGGGAGAGGGATGCGGAATTCCAGGTGTAGCGGTGAAATGCGTAGATATCTGGAGGAACACCGGTGGCGAAGGCGGCATCCTGGACCGGTATTGACACTGAGGAGCGAAAGCCAG +>S_000000163 +AGCGTTGTTCGGAATTATTGGGCGTAAAGGGCGCGTAGGCGGTGCGGTAAGTCACCTGTGAAAACTCTGGGCTCAACTCAGAGCCTGCAGGCGAAACTGCCGTGCTTGAGTGTGGGAGAGGTGCGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACACCTGTGGCGAAAGCGGCGCACTGGACCACAACTGACGCTGAGGCGCGAAAGCTAG +>S_000000164 +AGCGTTGTTCGGAGTTACTGGGCGTAAAGAGTGCGTAGGCGGTTTTCTAAGTTTGGTGTGAAATCTCCCGGCTTAACTGGGAGGGTGCGCCGAAGACTGGAAGGCTTGAGTATGGGAGAGGTAAGCGGAATTCCTGGTGTAGCGGTGAAATGCGTAGATATCAGGAGGAACACCTGCGGTGTAGACGGCTTACTGGACCATAACTGACGCTGAGGCACGAAAGCGTG +>S_000000165 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTACGTAGGTGGCGCCGTAAGTCAGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTTGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCAGTGAAATGCGTAGAGATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGGCACGAAGGCCAG +>S_000000166 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGAGGCAAGTCTGGTGTGAAATCCCGGGGCTCAACCCCGGAACTGCACTGGATACTGCTTTGCTAGAGTACTGGAGAGGGAACTGGAATTTACGGTGTAGCAGTGAAATGCGTAGATATCGTAAGGAAGACCAGCGGCGAAGGCGAGTTCCTGGACAGTTACTGACGCTGAGGCACGAAGGCCAG +>S_000000167 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTCGATACTACCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGCCAG +>S_000000168 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGCGGCGCGGTAAGTCGGGTGTGAAATTTCGAGGCTTAACTTCGAAACTGCATTCGATACTGCCGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCGGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACGCTGAGGCACGAAGGCCAG +>S_000000169 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGTGGCGCCGTAAGTCAGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTTGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCAGTGAAATGCGTAGAGATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGGCACGAAGGCCAG +>S_000000170 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGTGGCGCCGTAAGTCGGGTGTGAAATTTCGGAGCTTAACTCCGAAACTGCATTCGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTCATGGTGTAGCAGTGAAATGCGTAGAGATCATGAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGGCACGAAGGCCAG +>S_000000171 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGCGTAGGTGGCGTCGTAAGTCAGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTTGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCAGTGAAATGCGTAGAGATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGGCACGAAGGCCAG +>S_000000172 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGTGTAGGTGGCGCCGTAAGTCGGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTCGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTCATGGTGTAGCAGTGAAATGCGTAGAGATCATGAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGACACGAAGGCCAG +>S_000000173 +AGCGTTGTTCGGATTCATTGGGCGTAAAGGGTGTGTAGGTGGCGCCGTAAGTCGGGTGTGAAATCTCGGGGCTTAACTCCGAAACTGCATTCGATACTGCGGTGCTTGAGGACTGGAGAGGAGACTGGAATTTACGGTGTAGCAGTGAAATGCGTAGATATCGTAAGGAAGACCAGTGGCGAAGGCGGGTCTCTGGACAGTTCCTGACACTGAGACACGAAGGCCAG +>S_000000174 +AGCGTTGTTCGGATTTACTGGGCGTAAAGCGCACGTAGGCGGATCGTTAAGTCGGGGGTGAAATCCTGGAGCTCAACTCCAGAACTGCCTTCGATACTGGCGATCTTGAGTCCGGAAGAGGTGAGTGGAACTCCTAGTGTAGAGGTGGAAGTCGTAGATATTAGGAAGAACACCAGTGGCGAAGGCGGCTCACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTG +>S_000000175 +AGCGTTGTTCGGATTTACTGGGCGTAAAGCGTGCGTAGGTGGTGAGGTAAGACCTGTGGGAAAGACCTGGGCTTAACCCAGGAAGGTCGCAGGTGACTGCTTTGCTGGAGGACGGGAGAGGAGAGCGGAATTCCCGGTGTAGCGGTGAAATGCGTAGAGATCGGGAAGAAGGCCGGTGGCGAAGGCGGCTCTCTGGAACGTTCCTGACACTGAGGCACGAAAGCGTG +>S_000000176 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCACCGCAAGTCAGTTGTGAAATCTCTGGGCTTAACCCAGAAAGGTCAACTGATACTGCGGGGCTAGAGTGCAGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGACACTGACGCTGAGGCGCGAAAGCTAG +>S_000000177 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCACCGCAAGTCGACTGTGAAATCTCCGGGCTTAACCCGGAAAGGTCAGCCGATACTGCGGGGCTAGAGTGCAGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCTGACACTGACGCTGAGGCGCGAAAGCTAG +>S_000000178 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCAGCGCAAGTCAGTTGTGAAATCTCCGAGCTTAACTCGGAAAGGTCAACTGATACTGCGCGGCTAGAGTGCGGAAGGGGCAACTGGAATTCTTGGTGTAGCGGTGAAATGCGTAGATATCAAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCCGACACTGACGCTGAGGCGCGAAAGCCAG +>S_000000179 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCCTCCTTGTCGCGTGTGAAAGCCCCGGGCTCAACCTGGGAATTGCGCGCGAAACGGGAGGGCTTGAGTTCGGGAGAGGAGCGTGGAATTCCCAGTGTAGAGGTGAAATTCGTAGATATTGGGAAGAACACCGGTGGCGAAGGCGGCGCTCTGGACCGAGACTGACGCTGAGGCGCGAAAGCGTG +>S_000000180 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCGAACAAGTCACTTGTGAAATCTCCGGGCTTAACTCGGAAAGGTCAAGTGATACTGTTTGGCTAGAGTGCGGAAGGGGCAACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCCGACACTGACGCTGAGGCGCGAAAGCTAG +>S_000000181 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCTCCGCAAGTCAATTGTGAAATCTCCGGGCTTAACTCGGAAAGGTCAACTGATACTGCGGGGCTAGAGTGCGGAAGGGGCAACCGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTTGCTGGGCCGACACTGACGCTGAGGCGCGAAAGCTAG +>S_000000182 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCCTGTCAAGTCAACTGTGAAATCTCCGGGCTTAACTCGGAACGGTCAGTTGATACTGTCAGGCTAGAGTGCAGAAGGGGCAATCGGAATTCTTGGTGTAGCGGTGAAATGCGTAGATATCAAGAGGAACACCTGAGGTGAAGACGGGTTGCTGGGCTGACACTGACGCTGAGGCGCGAAAGCCAG +>S_000000183 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCGCAACAAGTCACTTGTGAAATCTCCGGGCTTAACCCGGAGCGGCCAAGTGATACTGTCGTGCTAGAGTGCGGAAGGGGCTACTGGAATTCTCGGTGTAGCGGTGAAATGCGTAGATATCGAGAGGAACACCTGCGGCGAAGGCGGGTAGCTGGGCCGACACTGACGCTGAGGCGCGAAAGCCAG +>S_000000184 +AGCGTTGTTCGGATTTACTGGGCGTAAAGGGCGCGTAGGCGGCGCGGTAAGTCACTTGTGAAATCTCTGAGCTTAACTCAGAACGGCCAAGTGATACTGCAGTGCTAGAGTGTGGAAGGGGCAATCGGAATTCTTGGTGTAGCGGTGAAATGCGTAGATATCAAGAGGAACACCTGAGGTGAAGACGGGTTGCTGGGCCAACACTGACGCTGAGGCGCGAAAGCCAG +>S_000000185 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTACTGCAAGTCTTCCGTTAAATCCACCTGCTCAACAGTTGGGCTGCGGAGGATACTACAGCGCTAGGAGGCGGGAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCACTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000186 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTCATGCAAGTCCTCCGTTAAATCCACCTGCTTAACAGATGGGCTGCGGAGGATACTACAAGGCTAGGAGGCGGAAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCTCTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAATACGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000187 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTCCTGCAAGTCCTCCGTTAAATCCACCCGCTCAACGGTTGGGCCGCGGGGGATACTACAGGGCTAGGAGGCGGGAGAGGCAAGCGGTACTCGATGGGTAGGGGTAAAATCCACTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000188 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTCTTGCAAGTCTTCCGTTAAATCCAGCTGCTTAACAGATGGGCTGCGGAGGATACTACAAGGCTAGGAGGCGGGAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCTCTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000189 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTTTTACAAGTCCTCCGTTAAATCCAACTGCTTAACAGATGGGCTGCGGAGGATACTATAAGACTAGGAGGCAGGAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCGTTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAATGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000190 +AGTGGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCGGTTTTACAAGTCCTCCGTTAAATCCAGCTGCTTAACAGATGGGCTGCGGAGGATACTATAAGACTAGGAGGCAGGAGAGGCAAGCGGTACTCAGTGGGTAGGGGTAAAATCCGTTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAATGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000191 +AGTGGTCGGGACGTTTATTGGGCCTAAAGCATCCGTAGCCGGTTCTACAAGTCTTCCGTTAAATCCACCTGCTTAACAGATGGGCTGCGGAAGATACTATAGAGCTAGGAGGCGGGAGAGGCAAGCGGTACTCGATGGGTAGGGGTAAAATCCGTTGATCCATTGAAGACCACCAGTGGCGAAGGCGGCTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGG +>S_000000192 +AGTGGTGCTCGTTATTATTGGGTCTAAAACGTCCGTAGTCGGTTGAGTAGATGCCCGGGTAAATCGCAGCGCTTAACGTTGCGAATTCCGGGTAGACCGCTCGACTAGGGATTGGGAGAGGTGCATAGTACTCTGAGGGTAGGGGTAAAATCCTGTAATCCTTGGGGGACTACCAGTGGCGAAGGCGATGCACTAGAACAAGTCCGACGATCAGGGACGAAGCCCTG +>S_000000193 +AGTTGTCGGGACGATTATTGGGCCTAAAGCATCCGTAGCCTGTTCTGCAAGTCCTCCGTTAAATCCACCTGCTCAACGGATGGGCTGCGGAGGATACCGCAGAGCTAGGAGGCGGGAGAGGCAAACGGTACTCAGTGGGTAGGGGTAAAATCCATTGATCTACTGAAGACCACCAGTGGCGAAGGCGGTTTGCCAGAACGCGCTCGACGGTGAGGGATGAAAGCTGG +sample seqname count +BAQ3473.1_35_L001 S_000000068 79 +BAQ3473.1_35_L001 S_000000083 15 +BAQ3473.1_35_L001 S_000000080 68 +BAQ3473.1_35_L001 S_000000149 47 +BAQ3473.1_35_L001 S_000000098 15 +BAQ3473.1_35_L001 S_000000095 20 +BAQ3473.1_35_L001 S_000000082 20 +BAQ3473.1_35_L001 S_000000174 17 +BAQ3473.1_35_L001 S_000000109 14 +BAQ3473.1_35_L001 S_000000191 13 +BAQ3473.1_35_L001 S_000000019 12 +BAQ3473.1_35_L001 S_000000049 2 +BAQ3473.3_10_L001 S_000000068 88 +BAQ3473.3_10_L001 S_000000059 30 +BAQ3473.3_10_L001 S_000000083 25 +BAQ3473.3_10_L001 S_000000043 79 +BAQ3473.3_10_L001 S_000000186 13 +BAQ3473.3_10_L001 S_000000077 39 +BAQ3473.3_10_L001 S_000000010 33 +BAQ3473.3_10_L001 S_000000096 32 +BAQ3473.3_10_L001 S_000000155 28 +BAQ3473.3_10_L001 S_000000092 18 +BAQ3473.3_10_L001 S_000000182 18 +BAQ3473.3_10_L001 S_000000153 17 +BAQ3473.3_10_L001 S_000000143 17 +BAQ3473.3_10_L001 S_000000154 16 +BAQ3473.3_10_L001 S_000000146 16 +BAQ3473.3_10_L001 S_000000039 15 +BAQ3473.3_10_L001 S_000000024 12 +BAQ3473.3_10_L001 S_000000145 12 +BAQ3473.3_10_L001 S_000000009 7 +BAQ3473.3_10_L001 S_000000147 4 +BAQ4166.1.1_38_L001 S_000000183 30 +BAQ4166.1.1_38_L001 S_000000084 42 +BAQ4166.1.1_38_L001 S_000000172 69 +BAQ4166.1.1_38_L001 S_000000167 15 +BAQ4166.1.1_38_L001 S_000000011 5 +BAQ4166.1.1_38_L001 S_000000057 23 +BAQ4166.1.1_38_L001 S_000000179 16 +BAQ4166.1.1_38_L001 S_000000136 11 +BAQ4166.1.1_38_L001 S_000000163 10 +BAQ4166.1.1_38_L001 S_000000046 4 +BAQ4166.1.2_39_L001 S_000000068 64 +BAQ4166.1.2_39_L001 S_000000058 33 +BAQ4166.1.2_39_L001 S_000000132 75 +BAQ4166.1.2_39_L001 S_000000061 46 +BAQ4166.1.2_39_L001 S_000000178 50 +BAQ4166.1.2_39_L001 S_000000160 40 +BAQ4166.1.2_39_L001 S_000000028 15 +BAQ4166.1.2_39_L001 S_000000091 34 +BAQ4166.1.2_39_L001 S_000000076 22 +BAQ4166.1.2_39_L001 S_000000035 20 +BAQ4166.1.2_39_L001 S_000000116 18 +BAQ4166.1.2_39_L001 S_000000107 9 +BAQ4166.1.2_39_L001 S_000000030 5 +BAQ4166.1.2_39_L001 S_000000157 4 +BAQ4166.1.3_15_L001 S_000000058 35 +BAQ4166.1.3_15_L001 S_000000168 50 +BAQ4166.1.3_15_L001 S_000000028 12 +BAQ4166.1.3_15_L001 S_000000007 9 +BAQ4166.1.3_15_L001 S_000000078 26 +BAQ4166.1.3_15_L001 S_000000126 22 +BAQ4166.1.3_15_L001 S_000000133 21 +BAQ4166.1.3_15_L001 S_000000187 21 +BAQ4166.1.3_15_L001 S_000000117 18 +BAQ4166.1.3_15_L001 S_000000124 14 +BAQ4166.1.3_15_L001 S_000000055 13 +BAQ4166.1.3_15_L001 S_000000189 12 +BAQ4166.1.3_15_L001 S_000000175 12 +BAQ4166.1.3_15_L001 S_000000140 10 +BAQ4166.1.3_15_L001 S_000000053 3 +BAQ4166.2_21_L001 S_000000058 45 +BAQ4166.2_21_L001 S_000000031 16 +BAQ4166.2_21_L001 S_000000084 24 +BAQ4166.2_21_L001 S_000000083 41 +BAQ4166.2_21_L001 S_000000167 12 +BAQ4166.2_21_L001 S_000000170 32 +BAQ4166.2_21_L001 S_000000075 45 +BAQ4166.2_21_L001 S_000000062 37 +BAQ4166.2_21_L001 S_000000098 19 +BAQ4166.2_21_L001 S_000000111 6 +BAQ4166.2_21_L001 S_000000094 27 +BAQ4166.2_21_L001 S_000000044 27 +BAQ4166.2_21_L001 S_000000185 18 +BAQ4166.2_21_L001 S_000000151 17 +BAQ4166.2_21_L001 S_000000180 15 +BAQ4166.2_21_L001 S_000000029 5 +BAQ4166.2_21_L001 S_000000101 5 +BAQ4166.3_44_L001 S_000000059 61 +BAQ4166.3_44_L001 S_000000132 32 +BAQ4166.3_44_L001 S_000000031 8 +BAQ4166.3_44_L001 S_000000084 20 +BAQ4166.3_44_L001 S_000000167 42 +BAQ4166.3_44_L001 S_000000097 15 +BAQ4166.3_44_L001 S_000000056 38 +BAQ4166.3_44_L001 S_000000028 10 +BAQ4166.3_44_L001 S_000000011 5 +BAQ4166.3_44_L001 S_000000171 30 +BAQ4166.3_44_L001 S_000000064 21 +BAQ4166.3_44_L001 S_000000190 16 +BAQ4166.3_44_L001 S_000000079 14 +BAQ4166.3_44_L001 S_000000040 12 +BAQ4166.3_44_L001 S_000000047 6 +BAQ4166.3_44_L001 S_000000042 5 +BAQ4697.3_22_L001 S_000000068 32 +BAQ4697.3_22_L001 S_000000016 160 +BAQ4697.3_22_L001 S_000000059 8 +BAQ4697.3_22_L001 S_000000134 67 +BAQ4697.3_22_L001 S_000000120 65 +BAQ4697.3_22_L001 S_000000031 21 +BAQ4697.3_22_L001 S_000000131 31 +BAQ4697.3_22_L001 S_000000115 24 +BAQ4697.3_22_L001 S_000000110 20 +BAQ4697.3_22_L001 S_000000122 19 +BAQ4697.3_22_L001 S_000000113 19 +BAQ4697.3_22_L001 S_000000123 17 +BAQ4697.3_22_L001 S_000000121 17 +BAQ4697.3_22_L001 S_000000150 13 +BAQ4697.3_22_L001 S_000000181 13 +BAQ4697.3_22_L001 S_000000118 8 +BAQ4697.3_22_L001 S_000000114 7 +BAQ4697.3_22_L001 S_000000015 5 +BAQ4697.3_22_L001 S_000000034 3 +YUN3259.2_30_L001 S_000000059 23 +YUN3259.2_30_L001 S_000000031 16 +YUN3259.2_30_L001 S_000000089 60 +YUN3259.2_30_L001 S_000000193 12 +YUN3259.2_30_L001 S_000000105 24 +YUN3259.2_30_L001 S_000000164 5 +YUN3259.2_30_L001 S_000000051 5 +YUN3259.2_30_L001 S_000000001 5 +YUN3259.2_30_L001 S_000000166 4 +YUN3259.3_36_L001 S_000000059 26 +YUN3259.3_36_L001 S_000000021 48 +YUN3259.3_36_L001 S_000000026 116 +YUN3259.3_36_L001 S_000000065 64 +YUN3259.3_36_L001 S_000000125 57 +YUN3259.3_36_L001 S_000000158 44 +YUN3259.3_36_L001 S_000000093 11 +YUN3259.3_36_L001 S_000000188 10 +YUN3259.3_36_L001 S_000000142 17 +YUN3259.3_36_L001 S_000000052 10 +YUN3259.3_36_L001 S_000000102 7 +YUN3259.3_36_L001 S_000000002 6 +YUN3428.1_31_L001 S_000000152 29 +YUN3428.1_31_L001 S_000000008 20 +YUN3428.1_31_L001 S_000000017 45 +YUN3428.1_31_L001 S_000000183 37 +YUN3428.1_31_L001 S_000000128 40 +YUN3428.1_31_L001 S_000000061 31 +YUN3428.1_31_L001 S_000000188 10 +YUN3428.1_31_L001 S_000000106 25 +YUN3428.1_31_L001 S_000000013 18 +YUN3428.1_31_L001 S_000000165 14 +YUN3428.1_31_L001 S_000000032 9 +YUN3428.1_31_L001 S_000000072 7 +YUN3428.2_42_L001 S_000000152 31 +YUN3428.2_42_L001 S_000000021 90 +YUN3428.2_42_L001 S_000000104 84 +YUN3428.2_42_L001 S_000000025 20 +YUN3428.2_42_L001 S_000000119 14 +YUN3428.2_42_L001 S_000000071 47 +YUN3428.2_42_L001 S_000000093 25 +YUN3428.2_42_L001 S_000000156 34 +YUN3428.2_42_L001 S_000000011 14 +YUN3428.2_42_L001 S_000000069 24 +YUN3428.2_42_L001 S_000000169 24 +YUN3428.2_42_L001 S_000000127 24 +YUN3428.2_42_L001 S_000000176 23 +YUN3428.2_42_L001 S_000000129 20 +YUN3428.2_42_L001 S_000000022 15 +YUN3428.2_42_L001 S_000000074 14 +YUN3428.2_42_L001 S_000000023 12 +YUN3428.2_42_L001 S_000000112 5 +YUN3428.2_42_L001 S_000000006 3 +YUN3428.3_14_L001 S_000000152 23 +YUN3428.3_14_L001 S_000000031 7 +YUN3428.3_14_L001 S_000000128 39 +YUN3428.3_14_L001 S_000000063 12 +YUN3428.3_14_L001 S_000000088 38 +YUN3428.3_14_L001 S_000000188 14 +YUN3428.3_14_L001 S_000000020 28 +YUN3428.3_14_L001 S_000000004 10 +YUN3428.3_14_L001 S_000000141 9 +YUN3428.3_14_L001 S_000000073 7 +YUN3428.3_14_L001 S_000000012 6 +YUN3533.2_26_L001 S_000000027 348 +YUN3533.2_26_L001 S_000000008 29 +YUN3533.2_26_L001 S_000000017 29 +YUN3533.2_26_L001 S_000000183 22 +YUN3533.2_26_L001 S_000000031 9 +YUN3533.2_26_L001 S_000000119 41 +YUN3533.2_26_L001 S_000000186 7 +YUN3533.2_26_L001 S_000000111 8 +YUN3533.2_26_L001 S_000000060 17 +YUN3533.2_26_L001 S_000000014 11 +YUN3533.2_26_L001 S_000000048 10 +YUN3533.2_26_L001 S_000000148 4 +YUN3533.3_33_L001 S_000000059 25 +YUN3533.3_33_L001 S_000000152 38 +YUN3533.3_33_L001 S_000000008 50 +YUN3533.3_33_L001 S_000000017 24 +YUN3533.3_33_L001 S_000000066 79 +YUN3533.3_33_L001 S_000000025 41 +YUN3533.3_33_L001 S_000000063 19 +YUN3533.3_33_L001 S_000000186 14 +YUN3533.3_33_L001 S_000000161 48 +YUN3533.3_33_L001 S_000000097 27 +YUN3533.3_33_L001 S_000000177 23 +YUN3533.3_33_L001 S_000000036 19 +YUN3533.3_33_L001 S_000000014 5 +YUN3533.3_33_L001 S_000000103 16 +YUN3533.3_33_L001 S_000000108 16 +YUN3533.3_33_L001 S_000000162 16 +YUN3533.3_33_L001 S_000000054 12 +YUN3533.3_33_L001 S_000000045 10 +YUN3533.3_33_L001 S_000000086 9 +YUN3533.3_33_L001 S_000000192 5 +YUN3856.2_6_L001 S_000000059 31 +YUN3856.2_6_L001 S_000000008 47 +YUN3856.2_6_L001 S_000000134 41 +YUN3856.2_6_L001 S_000000149 17 +YUN3856.2_6_L001 S_000000063 10 +YUN3856.2_6_L001 S_000000170 16 +YUN3856.2_6_L001 S_000000193 15 +YUN3856.2_6_L001 S_000000011 6 +YUN3856.2_6_L001 S_000000070 11 +YUN3856.2_6_L001 S_000000085 25 +YUN3856.2_6_L001 S_000000173 25 +YUN3856.2_6_L001 S_000000099 18 +YUN3856.2_6_L001 S_000000018 18 +YUN3856.2_6_L001 S_000000100 17 +YUN3856.2_6_L001 S_000000139 13 +YUN3856.2_6_L001 S_000000038 9 +YUN3856.2_6_L001 S_000000033 9 +YUN3856.2_6_L001 S_000000090 9 +YUN3856.3_4_L001 S_000000016 59 +YUN3856.3_4_L001 S_000000152 31 +YUN3856.3_4_L001 S_000000120 25 +YUN3856.3_4_L001 S_000000031 12 +YUN3856.3_4_L001 S_000000063 14 +YUN3856.3_4_L001 S_000000186 14 +YUN3856.3_4_L001 S_000000159 45 +YUN3856.3_4_L001 S_000000193 10 +YUN3856.3_4_L001 S_000000007 24 +YUN3856.3_4_L001 S_000000087 30 +YUN3856.3_4_L001 S_000000111 15 +YUN3856.3_4_L001 S_000000067 29 +YUN3856.3_4_L001 S_000000070 16 +YUN3856.3_4_L001 S_000000130 23 +YUN3856.3_4_L001 S_000000081 20 +YUN3856.3_4_L001 S_000000135 18 +YUN3856.3_4_L001 S_000000184 13 +YUN3856.3_4_L001 S_000000041 9 +YUN3856.3_4_L001 S_000000137 8 +YUN3856.3_4_L001 S_000000138 8 +YUN3856.3_4_L001 S_000000005 8 +YUN3856.3_4_L001 S_000000037 7 +YUN3856.3_4_L001 S_000000144 7 +YUN3856.3_4_L001 S_000000050 5 +YUN3856.3_4_L001 S_000000003 5 diff --git a/src/R-test/dada2idseq.02.fna b/src/R-test/dada2idseq.02.fna new file mode 100644 index 0000000..e69de29 diff --git a/src/R/dada2idseq.R b/src/R/dada2idseq.R index fe70818..202cc59 100755 --- a/src/R/dada2idseq.R +++ b/src/R/dada2idseq.R @@ -13,7 +13,7 @@ suppressPackageStartupMessages(library(Biostrings)) suppressPackageStartupMessages(library(readr)) suppressPackageStartupMessages(library(dplyr)) -SCRIPT_VERSION = "0.2" +SCRIPT_VERSION = "0.2.1" # Get arguments # For testing: opt <- list(args = 'dada2idseq.00.tsv.gz', options = list(fnafile = 'dada2idseq.01.fna', idlen = 9, prefix = 'S_')) @@ -79,7 +79,11 @@ if ( file.exists(opt$options$fnafile) ) { seqs <- data.frame(seq = readDNAStringSet(opt$options$fnafile)) %>% tibble::rownames_to_column('seqname') %>% mutate(seqnum = sub(opt$options$prefix, '', seqname) %>% as.integer()) - max_seqnum = seqs %>% filter(seqnum == max(seqnum)) %>% pull(seqnum) + max_seqnum = ifelse( + nrow(seqs) > 0, + seqs %>% filter(seqnum == max(seqnum)) %>% pull(seqnum), + 0 + ) } else { seqs <- tibble(seqname = character(), seq = character(), seqnum = integer()) max_seqnum = 0 @@ -99,8 +103,8 @@ seqname_format = sprintf("%%s%%0%dd", opt$options$idlen) seqs <- seqs %>% select(-seqnum) %>% union( seqtab %>% distinct(seq) %>% - anti_join(seqs, by = 'seq') %>% - mutate(seqname = sprintf(seqname_format, opt$options$prefix, max_seqnum + rank(seq))) + anti_join(seqs, by = 'seq') %>% + mutate(seqname = sprintf(seqname_format, opt$options$prefix, max_seqnum + rank(seq))) ) logmsg(sprintf("Writing %d sequences to %s fasta file", nrow(seqs), opt$options$fnafile))