diff --git a/example_files/dengue_metadata.tsv b/example_files/dengue_metadata.tsv new file mode 100644 index 0000000..5839ff0 --- /dev/null +++ b/example_files/dengue_metadata.tsv @@ -0,0 +1,6 @@ +submissionId authors authorAffiliations specimenCollectorSampleId geoLocCountry geoLocAdmin1 geoLocAdmin2 geoLocCity hostNameScientific sampleCollectionDate +AB597980.1 Yamanaka, A.; Konishi, E. BIKEN Endowed Department of Dengue Vaccine Development; 3-1 Yamadaoka, Suita, Osaka 565-0871 SBY6.4Mos, Indonesia Indonesia Aedes aegypti 2009 +AB608786.1 Chu, P. Y.; Ke, G. M.; Chen, P. C.; Liu, L. T.; Tsai, Y. C.; Tsai, J. J. Kaohsiung 80705 NDF30 Taiwan Homo sapiens 2008 +AB873104.1 Moi, M. L.; Kotaki, A.; Takasaki, T. Chigasaki, Kanagawa 253-0087 D1/Cambodia/NRTqs/2013 Cambodia Homo sapiens 2013 +AB915379.1 Kotaki, T.; Yamanaka, A.; Mulyatno, K. C.; Churrotin, S.; Labiqah, A.; Sucipto, T. H.; Soegijanto, S.; Kameoka, M.; Konishi, E. Mahidol University, BIKEN Endowed Department of Dengue Vaccine Development; 420/6 Ratchawithi Road, Ratchathewi, Bangkok 10400 D1/SBY20/13 Indonesia Surabaya Homo sapiens 2013 +EU518605.1 de Thoisy, B.; Lacoste, V.; Germain, A.; Munoz-Jordan, J.; Colon, C.; Mauffrey, J. F.; Delaval, M.; Catzeflis, F.; Kazanji, M.; Matheus, S.; Dussart, P.; Morvan, J.; Setien, A. A.; Deparis, X.; Lavergne, A.; Lacoste, V. L.; Jorge, M.-J.; Jean-Francois, M. Institut Pasteur de la Guyane, Laboratoire des Interactions Virus-Hotes S0108118 French Guiana Homo sapiens 2008-01 diff --git a/example_files/dengue_sequences.fasta b/example_files/dengue_sequences.fasta new file mode 100644 index 0000000..4d2aa87 --- /dev/null +++ b/example_files/dengue_sequences.fasta @@ -0,0 +1,10 @@ +>AB597980.1 +ATGCGGTGCGTAGGAATAGGCAACAGAGACTTCGTGGAAGGACTGTCAGGAGCTACGTGGGTGGATGTGGTACTGGAGCATGGAAGTTGTGTCACTACAATGGCAAAAAACAAACCAACACTGGATATTGAACTCTTAAAGACGGAGGTTACAAACCCAGCCATCCTGCGCAAACTGTGCATTGAAGCCAAAATATCAAATACTACCACCGATTCGAGATGTCCAACACAAGGAGAAGCCACGCTGGTGGAAGAACAAGACACGAACTTCGTGTGTCGACGAACGTTCGTGGACAGAGGCTGGGGCAATGGTTGTGGGCTATTTGGAAAAGGTAGCTTAATAACGTGTGCTAAGTTTAAGTGTGTGACAAAATTGGAAGGAAAGATAGTCCAATATGAAAATTTAAAATATTCAGTGATAGTCACCGTCCACACTGGAGACCAGCACCAAGTTGGGAATGAGACTACAGAACATGGGACAACTGCAATCATAACACCTCAAGCTCCTACGTCGGAAATACAGCTGACAGACTACGGAGCTCTAACACTGGACTGTTCACCTAGAACAGGGCTAGACTTCAATGAGATGGTGTTGTTGACAATGAAAAAAAAATCATGGCTCGTCCACAAACAATGGTTTCTAGACTTACCGCTGCCTTGGACCTCGGGGGCTTCAACATCCCAAGAGACTTGGAATAGACAAGACTTGCTGGTCACATTTAAGACAGCTCATGCAAAGAAGCAGGAAGTAGTTGTACTAGGATCACAAGAGGGAGCGATGCACACTGCGCTGACTGGAGCAACAGAAATCCAAACGTCTGGAACGACAACAATTTTCGCAGGACACCTGAAATGCAGACTGAAAATGGATAAACTAACTTTAAAAGGGGTATCATACGTAATGTGCACAGGCTCATTCAAGCTAGAAAAGGAAGTGGCTGAGACCCAGCATGGAACTGTTCTAGTGCAGGTTAAGTACGAAGGAACAGATGCACCATGTAAGATCCCCTTCTCATCCCAAGATGAGAAGGGAGTAATCCAGAATGGGAGATTGATAACAGCCAACCCCATAGTCACTGACAAAGAAAAACCAGTCAACATTGAGGCGGAGCCACCTTTTGGTGAGAGCTACATCGTGGTAGGAGCAGGTGAGAAAGCTTTGAAACTAAGCTGGTTCAAGAAGGGAAGCAGTATAGGGAAAATGTTTGAAGCAACTGCCCGTGGAGCACGAAGGATGGCCATTCTGGGAGACACTGCATGGGACTTTGGTTCTATAGGAGGAGTGTTCACGTCCGTGGGAAAACTGGTACACCAGATTTTTGGAACTGCGTACGGAGTTTTGTTCAGCGGTGTTTCTTGGACCATGAAAATAGGAATAGGGATTCTGCTGACATGGCTAGGATTAAATTCAAGGAGCACGTCCCTTTCAATGACGTGTATCGCAGTTGGCATGGTCACACTGTACCTAGGAGTCATGGTTCAGGCG +>AB608786.1 +AGTTGTTAGTCTACGTGGACCGACAAGAACAGTTTCGAATCGGAAGCTTGCTTAACGTAGTTCTGACAGTTTTTTATTAGAGAGCAGATCTCTGATGAACAACCAACGGAAAAAGACGGCTCGACCGTCTTTCAATATGCTGAAACGCGCGAGAAACCGCGTGTCAACTGTTTCACAGTTGGCGAAGAGATTCTCAAAAGGATTGCTCTCAGGCCAAGGACCCATGAAATTGGTGATGGCTTTCATAGCATTCCTAAGATTTCTAGCCATACCCCCAACAGCAGGAATTTTGGCTAGATGGGGTTCATTCAAGAAGAGTGGAGCGATCAAAGTGCTACGGGGTTTCAAGAAAGAAATCTCAAACATGTTGAATACAATGAATAGAAGGAAAAGATCTGTGACCATGCTCCTTATGCTGATGCCTACAGCCTTGGCGTTCCATTTGACTACACGAGGGGGAGAGCCGCACATGATAGTCAGCAAGCAGGAAAGAGGAAAATCACTCTTGTTTAAGACCTCAGCAGGTGTCAACATGTGCACCCTTATAGCTATGGATTTGGGAGAGTTATGTGAGGACACAATGACTTACAAATGCCCTCGAATCACTGAAACTGAACCAGATGACGTTGATTGTTGGTGTAATGCCACAGACACATGGGTGACCTATGGAACATGTTCCCAAACTGGCGAGCACCGACGAGACAAACGTTCCGTCGCACTGGCCCCACACGTGGGACTTGGTTTGGAAACAAGAACCGAAACGTGGATGTCCTCTGAAGGCGCTTGGAAACAGATACAAAGAGTGGAGACTTGGGCCCTGAGACACCCAGGATTCACGGTGATAGCCCTTTTTCTAGCACATGTCATAGGAACATCCATCACCCAGAAAGGGATTATTTTCATTTTGTTAATGCTGGTAACACCATCCTTGGCCATGCGATGCGTGGGAATAGGCAGCAGGGACTTCGTGGAAGGACTGTCAGGAGCAACTTGGGTAGATGTGGTACTGGAACATGGAAGTTGCGTCACCACCATGGCAAAAGACAAACCAACATTGGACATTGAACTCTTGAAGACAGAAGTCACAAACCCTGCCGTCCTGCGCAAACTGTGCATTGAAGCTAAAATATCAAACACCACCACCGACTCAAGATGTCCAACACAAGGAGAAGCCACACTAGTGGAAGAACAAGACGCGAACTTTGTGTGTCGACGAACGTTTGTGGACAGAGGCTGGGGCAATGGCTGTGGGCTCTTCGGAAAAGGAAGCCTAATAACGTGTGCTAAGTTCAAGTGTGTGACAAAACTGGAAGGAAAGATAGTTCAATATGAGAACTTGAAATATTCAGTAATAGTCACCGTTCACACCGGAGACCAGCACCAAGTGGGAAATGAAAGCACAGAACATGGGACAACTGCAACTATAACACCTCAAGCTCCTACGACGGAAATACAGCTGACCGACTACGGAGCTCTTACATTGGATTGTTCACCTAGAACAGGACTAGACTTTAATGAAATGGTGTTGTTGACAATGAAAGAAAAATCATGGCTAGTCCACAAACAATGGTTTTTAGACCTACCACTGCCTTGGACCTCGGGAGCTTCAACATCACAAGAGACTTGGAACAGACAAGATTTGCTGGTGACATTTAAGACAGCTCATGCAAAGAAGCAGGAAGTAGTCGTACTAGGATCACAAGAAGGAGCAATGCACACTGCGTTGACCGGAGCGACAGAAATCCAAACGTCTGGAACGACAACAATTTTTGCAGGACACTTGAAGTGCAGACTAAAGATGGACAAACTGACTCTAAAAGGGATGTCATATGTGATGTGCACAGGCTCATTCAAGCTAGAGAAAGAAGTGGCTGAGACCCAGCATGGAACCGTTCTAGTGCAGATTAAATACGAAGGAACAGATGCACCATGCAAGATCCCTTTTTCGACCCAAGATGAAAAAGGAGTAACCCAGAATGGGAGATTGATAACAGCCAACCCCATAGTTACTGACAAAGAAAAACCAGTCAACATTGAGGCAGAACCGCCCTTTGGTGAGAGTTACATCATAATAGGAGCAGGTGAAAAAGCTTTGAAACTAAGCTGGTTCAAGAAAGGAAGCAGCATAGGGAAAATGTTTGAGGCAACTGCCAGAGGAGCACGAAGGATGGCCATACTGGGAGACACCGCATGGGACTTTGGTTCTATAGGAGGAGTGTTCACGTCTGTTGGAAAATTAGTACACCAGATTTTTGGAACTGCATATGGAGTTTTGTTCAGCGGTGTTTCTTGGACCATGAAAATAGGAATAGGGGTTCTGCTGACATGGCTGGGATTAAACTCAAGGAGCACGTCCCTTTCGATGACGTGCATTGCAGTTGGCCTAGTAACACTATACCTAGGAGTCATGGTTCAGGCGGATTCAGGATGTGTAATAAATTGGAAAGGTAGAGAACTCAAATGTGGAAGTGGCATTTTTGTCACCAATGAAGTTCACACTTGGACAGAGCAATACAAATTTCAAGCTGACTCCCCAAAGAGACTATCAGCAGCCATCGGGAAGGCATGGGAGGAGGGTGTGTGTGGAATTCGATCAGCAACTCGTCTCGAGAACATCATGTGGAAGCAAATATCAAATGAACTGAATCACATCTTACTTGAAAATGATATGAAATTCACAGTGGTTGTAGGAGATGTTGCTGGGATCTTGGCTCAAGGAAAGAAAATGATTAGGCCACAACCCATGGAATACAAATACTCGTGGAAAAGCTGGGGAAAGGCTAAAATCATAGGGGCAGATGTACAGAACACCACCTTCATCATCGATGGCCCAAACACCCCAGAATGCCCTGATGACCAAAGAGCATGGAACATTTGGGAAGTTGAGGACTATGGATTTGGAATTTTCACGACAAACATATGGCTGAAATTGCGCGATTCCTACACCCAAGTGTGTGACCACCGGCTAATGTCAGCTGCCATCAAGGACAGCAAGGCAGTTCACGCTGACATGGGGTACTGGATAGAAAGTGAAAAGAACGAGACCTGGAAGCTGGCAAGAGCCTCTTTCATAGAAGTTAAAACATGTATCTGGCCAAAATCCCACACTCTATGGAGCAATGGAGTTCTGGAAAGTGAAATGATAATTCCAAAGATCTATGGAGGACCAATATCTCAGCACAACTACAGACCAGGATATTTCACACAAACAGCAGGGCCGTGGCACCTAGGCAAGTTGGAACTGGATTTTGATTTGTGTGAGGGTACCACAGTTGTTGTGGATGAACATTGTGGAAATCGAGGACCATCTCTTAGGACCACAACAGTCACAGGAAAGATAATTCATGAATGGTGTTGCAGATCTTGCACGCTACCACCCTTACGTTTCAGAGGAGAAGATGGGTGCTGGTACGGTATGGAAATCAGACCAGTCAAGGAAAAGGAAGAAAATCTAGTCAAATCAATGGTCTCTGCAGGGTCAGGGGAAGTGGACAGCTTTTCACTAGGACTGCTATGCATATCAATAATGATCGAGGAGGTGATGAGATCCAGATGGAGTAGAAAAATGCTGATGACTGGAACACTGGCTGTGTTCTTCCTTCTCATAATGGGACAATTGACATGGAACGATCTGATCAGATTATGCATCATGGTTGGAGCCAACGCGTCCGACAGGATGGGGATGGGAACGACGTACCTAGCCCTGATGGCCACTTTTAAAATGAGACCGATGTTTGCTGTAGGGCTATTATTTCGCAGACTAACATCCAGAGAAGTTCTTCTTCTAACAATTGGATTGAGTCTAGTGGCATCTGTGGAGTTACCAAATTCCTTGGAGGAGCTGGGGGATGGACTTGCAATGGGCATTATGATTTTAAAATTATTGACTGACTTTCAATCACATCAGCTGTGGGCTACCTTGCTGTCCTTGACATTTATCAAAACAACGTTTTCCTTGCACTACGCATGGAAGACAATGGCTATGGTACTGTCAATTGTATCTCTCTTCCCTTTATGCCTGTCCACGACCTCCCAAAAAACAACATGGCTTCCGGTGCTATTGGGATCCCTTGGATGCAAACCACTAACCATGTTTCTTATAGCAGAAAACAAAATCTGGGGAAGGAAAAGTTGGCCCCTCAATGAAGGAATCATGGCTGTTGGAATAGTCAGCATCCTACTAAGTTCACTCCTCAAAAATGATGTACCGCTAGCTGGGCCACTAATAGCTGGAGGCATGCTAATAGCATGTTATGTTATATCTGGAAGCTCAGCCGACCTATCACTAGAGAAAGCGGCTGAGGTCTCCTGGGAAGAAGAAGCAGAACACTCTGGTGCCTCACACAACATATTAGTGGAAGTCCAAGATGATGGAACCATGAAGATAAAGGATGAAGAGAGAGATGACACGCTAACCATTCTCCTTAAAGCAACTCTGTTAGCAGTTTCAGGGGTGTACCCATTATCAATACCAGCGACCCTTTTCGTGTGGTACTTTTGGCAGAAAAAGAAACAGAGATCTGGAGTGTTATGGGACACACCCAGCCCTCCAGAAGTGGAAAGAGCAGTTCTTGATGATGGTATCTATAGAATTATGCAGAGAGGACTGTTGGGCAGGTCCCAAGTAGGGGTAGGAGTTTTCCAAGAAAACGTGTTCCACACAATGTGGCATGTCACCAGGGGAGCTGTACTCATGTATCAAGGGAAGAGATTGGAACCGAGCTGGGCCAGTGTCAAAAAAGACCTGATCTCATATGGAGGAGGTTGGAGGCTTCAAGGATCCTGGAACACAGGAGAAGAAGTGCAGGTGATTGCTGTTGAACCAGGGAAAAACCCCAAAAATGTACAAACAGCGCCGGGCACCTTTAAGACCCCTGAAGGTGAAGTTGGAGCCATTGCCCTAGACTTTAAACCTGGCACATCCGGATCTCCCATCGTGAACAGAGAAGGAAAAATAGTAGGTCTTTATGGAAATGGAGTAGTGACAACAAGTGGAACCTACGTCAGTGCCATAGCCCAAGCCAAAGCATCACAAGAAGGGCCCCTACCAGAGATTGAAGACGAGGTGTTTAGGAAAAGAAACTTAACAATAATGGACCTACATCCAGGATCGGGGAAAACAAGAAGATATCTTCCAGCCATAGTCCGTGAGGCCATAAAAAGGAAGCTGCGCACACTAATTCTGGCTCCCACAAGGGTTGTCGCTTCCGAAATGGCAGAGGCGCTCAAGGGAATGCCAATAAGGTACCAAACAACAGCAGTGAAGAGTGAACATACAGGAAAAGAGATAGTTGACCTCATGTGTCACGCCACTTTCACCATGCGCCTCCTGTCTCCCGTAAGAGTTCCCAATTACAACATGATCATCATGGATGAAGCACATTTCACCGATCCATCCAGTATAGCGGCCAGAGGGTACATCTCAACCCGAGTGGGCATGGGTGAAGCAGCTGCAATCTTCATGACAGCCACTCCCCCAGGATCAGTGGAGGCCTTTCCACAGAGCAACGCAGTTATCCAAGATGAGGAAAGAGACATTCCTGAGAGATCATGGAACTCAGGCTATGAGTGGATCACTGACTTCCCAGGTAAAACAGTTTGGTTTGTTCCAAGCATTAAATCAGGAAATGACATTGCCAACTGCTTAAGAAAGAATGGGAAACGGGTGATTCAATTGAGCAGGAAAACCTTTGATACAGAGTACCAAAAAACAAAAAACAACGACTGGGACTACGTCGTCACAACAGACATCTCCGAAATGGGAGCAAATTTCCGAGCCGACAGGGTGATAGACCCAAGACGGTGTCTGAAACCGGTAATACTAAAAGACGGTCCAGAGCGTGTTATTTTAGCAGGACCAATGCCAGTGACTGTGGCCAGTGCCGCCCAGAGGAGAGGAAGAATTGGAAGGAACCACAATAAGGAAGGTGATCAGTACATCTACATGGGACAGCCTTTAAACAACGATGAAGATCACGCTCACTGGACAGAAGCAAAAATGCTCCTTGATAATATAAACACACCAGAAGGGATTATCCCAGCCCTCTTCGAGCCAGAGAGAGAAAAGAGCGCAGCAATAGACGGGGAATACAGACTGCGGGGTGAAGCAAGGAAAACGTTTGTGGAGCTCATGAGAAGAGGAGATCTACCTGTCTGGCTATCCTACAAAGTTGCCTCAGAAGGCTTCCAGTACTCTGACAGAAGATGGTGCTTTGACGGTGAAAGGAACAACCAGGTGTTGGAGGAGAACATGGACGTAGAGATCTGGACAAAAGAAGGAGAAAGAAAGAAACTACGACCCCGCTGGCTGGATGCCAGAACATACTCAGACCCACTAGCCCTGCGCGAGTTTAAAGAGTTTGCAGCAGGGAGAAGAAGCGTCTCAGGTGATTTAATATTAGAAATAGGGAAGCTTCCACAACACTTGACGCAAAGGGCCCAGAATGCCTTGGACAACCTGGTTATGTTGCACAACTCCGAACAAGGAGGAAGAGCCTATAGACATGCAATGGAAGAACTGCCAGACACCATAGAAACGTTGATGCTCCTAGCTCTGATAGCTGTGTTAACTGGTGGAGTGACACTGTTCTTCCTATCAGGAAGGGGCCTAGGGAAAACATCTATTGGCCTACTCTGCGTAATGGCTTCAAGCGTACTGCTATGGATGGCCAGTGTGGAGCCCCATTGGATAGCGGCCTCCATCATACTGGAGTTCTTCCTGATGGTGCTGCTTATTCCGGAGCCAGACAGACAACGCACTCCGCAGGACAACCAGCTGGCATATGTGGTGATAGGTTTGTTATTCATGATACTGACAGTAGCAGCCAATGAGATGGGACTGCTGGAAACCACAAAGAAAGACTTAGGGATTGGCCATGTGGCTGTTGAAAATCACCACCATGCCGCAATGCTGGACGTAGACTTACATCCAGCTTCAGCCTGGACCCTCTATGCAGTGGCCACAACAATTATCACTCCCATGATGAGGCACACAATCGAAAACACAACGGCAAACATTTCCCTGACAGCCATTGCAAACCAGGCAGCTATATTGATGGGACTTGACAAAGGATGGCCAATATCGAAGATGGACATAGGAGTTCCACTTCTCGCCTTGGGGTGCTATTCCCAGGTGAATCCACTGACGCTGACAGCGGCGGTATTGATGCTAGTGGCTCATTACGCCATAATTGGACCTGGACTGCAAGCAAAAGCTACTAGAGAAGCTCAAAAAAGGACAGCGGCCGGAATAATGAAAAATCCAACCGTTGATGGAATTGTTGCAATAGATTTGGACCCTGTGGTTTATGATGCAAAATTTGAAAAACAACTAGGCCAAATAATGTTGTTGATACTATGCACATCACAGATCCTCTTGATGCGGACTACATGGGCCTTGTGCGAGTCCATCACACTGGCCACTGGACCTCTGACCACGCTTTGGGAGGGATCTCCAGGAAAATTTTGGAACACCACGATAGCGGTTTCCATGGCAAACATTTTCAGAGGAAGTTATCTAGCAGGAGCAGGTCTGGCCTTCTCATTAATGAAATCTCTAGGAGGAGGTAGGAGAGGCACGGGAGCCCAAGGGGAAACACTGGGAGAGAAATGGAAAAGACAGCTGAACCAACTGAGCAAGTCAGAATTTAACACCTATAAAGGAAGTGGGATTATGGAAGTGGACAGATCCGAAGCCAAAGAGGGATTGAAAAGAGGAGAAACAACCAAACATGCAGTGTCGAGAGGAACCGCTAAACTGAGGTGGTTTGTGGAAAGGAACCTTGTGAAACCAGAAGGGAAAGTCATAGACCTCGGTTGTGGAAGAGGTGGCTGGTCATACTATTGCGCTGGGCTGAAGAAAGTCACAGAAGTGAAGGGATATACAAAAGGAGGACCTGGACATGAGGAACCAATCCCAATGGCGACCTATGGATGGAACCTAGTAAAGCTGCACTCTGGGAAAGACGTATTCTTTATACCACCTGAGAAATGTGACACCCTTTTGTGTGATATTGGTGAGTCCTCTCCAAACCCAACTATAGAGGAAGGAAGAACGCTACGCGTCCTAAAGATGGTGGAACCATGGCTCAGAGGAAACCAATTTTGCATAAAAATTCTGAATCCCTACATGCCAAGTGTGGTGGAAACTCTGGAGCAAATGCAAAGAAAACATGGAGGAATGCTAGTGCGAAATCCACTTTCAAGAAATTCTACTCATGAAATGTATTGGGTTTCATGTGGAACAGGAAACATTGTGTCAGCAGTAAACATGACATCTAGAATGTTGCTAAATCGATTCACAATGGCTCACAGGAAACCAACATATGAAAGAGACGTGGACCTAGGCGCCGGAACAAGACATGTGGCAGTGGAACCAGAGGTAGCCAACCTAGACATCATTGGCCAGAGGATAGAGAACATAAAACATGAACATAAGTCAACATGGCATTATGATGAGGACAATCCATATAAAACGTGGGCCTATCATGGATCATATGAGGTCAAGCCATCAGGATCAGCCTCATCCATGGTCAATGGCGTGGTGAAACTGCTCACCAAACCATGGGATGTCATCCCTATGGTCACACAAATAGCCATGACTGACACTACACCCTTTGGACAACAGAGGGTGTTTAAAGAGAAAGTTGACACACGCACACCAAAAGCAAAACGGGGCACAGCACAAATCATGGAGGTGACAGCCAAGTGGTTATGGGGTTTTCTTTCTAGAAACAAGAAACCAAGAATTTGCACAAGAGAGGAGTTCACAAGAAAAGTTAGGTCAAACGCAGCCATTGGAGCAGTGTTCGTTGATGAAAATCAATGGAACTCAGCAAAAGAAGCAGTGGAAGATGAGCGGTTCTGGGACCTTGTGCATAGAGAGAGGGAGCTTCACAAACAGGGAAAATGTGCTACGTGTGTTTACAACATGATGGGGAAGAGAGAGAAAAAGCTAGGAGAGTTCGGAAAGGCAAAAGGAAGTCGTGCAATATGGTACATGTGGTTGGGAGCACGCTTTCTAGAGTTCGAAGCTCTTGGTTTCATGAACGAAGATCACTGGTTCAGCAGAGAGAATTCACTCAGCGGAGTGGAAGGAGAAGGACTCCACAAACTTGGATATATACTCAGAGACATATCAAAGATTCCAGGGGGAAACATGTATGCAGATGACACAGCCGGATGGGATACAAGGATAACAGAGGATGACCTTCAGAATGAGGCCAAAATTACTGACATCATGGAACCCGAACATGCCCTACTGGCTAAGTCAATCTTCAAGTTAACCTACCAAAATAAGGTGGTAAGGGTACAGAGACCAGCAAAAAATGGAACCGTGATGGATGTCATATCCAGACGTGACCAGAGAGGAAGTGGTCAGGTCGGAACTTATGGCTTAAACACTTTCACCAACATGGAAGCCCAGCTGATAAGACAAATGGAGTCTGAGGGAATCTTTTCACCCAGCGAATTAGAGACCCCAAATTTAGCCGAGAGAGTTCTCGACTGGCTGGAAAAATATGGCGTCGAAAGGCTGAAAAGAATGGCAATCAGCGGAGATGACTGCGTAGTGAAACCAATTGATGATAGGTTTGCAACAGCCTTGACAGCTCTGAATGATATGGGAAAAGTAAGAAAAGATATACCACAATGGGAACCTTCAAAAGGATGGAATGATTGGCAACAAGTGCCTTTTTGTTCACACCACTTCCACCAGCTGATTATGAAGGATGGGAGGGAAATAGTGGTGCCATGCCGCAACCAAGATGAACTTGTGGGTAGGGCTAGAGTATCACAAGGTGCTGGATGGAGCCTGAGAGAAACTGCATGCCTAGGCAAGTCATATGCACAAATGTGGCAGCTGATGTACTTCCACAGGAGAGACCTGAGACTAGCCGCTAATGCTATCTGTTCAGCCGTTCCAGTTGATTGGGTCCCAACCAGCCGTACCACCTGGTCGATCCATGCCCATCACCAATGGATGACAACAGAAGACATGCTGTCAGTGTGGAATAGGGTTTGGATAGAGGAAAACCCATGGATGGAGGACAAAACCCACATATCCAGTTGGGGAGATGTTCCATATTTAGGAAAAAGGGAAGACCAATGGTGTGGATCCCTGATAGGCTTAACAGCAAGGGCCACCTGGGCCACCAACATACAAGTGGCCATAAACCAAGTGAGAAGACTAATTGGGAATGAGAATTATCTAGATTACATGACATCAATGAAGAGATTCAAGAACGAGAGTGATCCCGAAGGGGCACTCTGGTAAGTCAACACATTCACAAAACAAAGGAAAATAAGAAATCAAACAAGGCAAGAAGTCAGGCCGGATTAAGCCATAGTACGGTAAGAGCTATGCTGCCTGTGAGCCCCGTCTAAGGACGTAAAATGAAGTCAGGCCGGAAGCCACGGTTTGAGCAAACCGTGCTGCCTGTAGCTCCATCGTGGGATGTAAAAACCCGGGAGGCTGCACCCATGGAAGCTGTACGCATGGGGTAGCAGACTAGTGGTTAGAGGAGACCCCTCCCAAAACACAACGCAGCAGCGGGGCCCAACACCAGGGGAAGCTGTACCCTGGTGGTAAGGACTAGAGGTTAGAGGAGACCCCCCGCACAACAATAAACAGCATATTGACGCTGGGAGAGACCAGAGATCCTGCTGTCTCTACAGCATCATTCCAGGCACAGAACGCCAGAAAATGGAATGGTGCTGTTGAATCAACAGGTTCTATCAATGAAGAGATTC +>AB873104.1 +ATGCGATGCGTGGGAATAGGCAACAGGGACTTCGTGGAAGGACTGTCAGGAGCAACCTGGGTAGATGTGGTGCTGGAACATGGAAGTTGCGTCACCACCATGGCAAAAGACAAACCAACATTGGACATTGAACTCTTGAAGACGGAAGTCACAAACCCTGCCATCCTGCGCAAACTGTGCATTGAAGCTAAAATATCAAACACCACCACCGACTCAAGATGTCCAACACAAGGAGAAGCCACACTGGTGGAAGAACAAGACGCGAACTTTGTGTGTCGACGAACGTTTGTGGACAGAGGCTGGGGCAATGGCTGTGGGCTCTTCGGAAAAGGAAGCCTAATAACGTGTGCCAAGTTCAAGTGTGTGACAAAACTGGAAGGAAAGATAGTTCAATATGAAAACTTGAAATATTCAGTAATAGTCACCGTTCACACCGGAGACCAGCACCAGGTGGGAAATGAAAGCACAGAACATGGGACAACTGCAACTATAACACCTCAAGCTCCTACGACGGAAATACAGCTGACTGACTACGGAGCTCTTACATTGGATTGCTCACCTAGAACAGGACTAGACTTTAATGAAATGGTGTTGTTGACAATGAAAGAAAAATCATGGCTAGTCCACAAACAATGGTTTCTAGACCTACCACTGCCTTGGACCTCGGGAGCCTCAACATCACAAGAGACTTGGAACAGACAAGATTTGCTGGTGACATTTAAGACAGCCCATGCAAAGAAGCAGGAAGTAGTCGTACTAGGATCACAAGAAGGAGCAATGCACACTGCGTTGACCGGAGCAACAGAAATCCAAACGTCTGGAACGACAACAATTTTTGCAGGACACTTGAAATGCAGACTAAAGATGGACAAACTGACCCTAAAAGGGGTGTCATATGTGATGTGCACAGGCTCATTCAAGCTAGAGAAAGAAGTGGCTGAGACCCAGCATGGAACCGTTCTAGTGCAGATTAAATATGAAGGAACAGATGCACCATGCAAGATCCCTTTTTCAACCCAAGATGAAAAAGGAGTAACCCAGAATGGGAGATTGATAACAGCCAACCCCATAGTTACTGACAAAGAAAAACCAGTCAACATTGAGGCAGAACCGCCTTTTGGTGAGAGTTACATCGTAATAGGAGCAGGTGAAAAAGCTTTGAAACTAAGCTGGTTTAAGAAAGGAAGCAGCATAGGGAAAATGTTTGAGGCAACTGCCAGAGGAGCACGAAGGATGGCCATACTGGGAGACACCGCATGGGACTTTGGTTCTATAGGAGGAGTGTTCACGTCCGTTGGAAAATTAGTACACCAGATTTTTGGAACTGCATATGGAGTTTTGTTCAGCGGTGTTTCCTGGACCATGAAAATAGGAATAGGGGCTCTGCTGACATGGCTAGGACTAAACTCAAGGAGCACGTCCCTTTCGATGACGTGCATTGCAGTTGGCCTAGTAACACTATACCTAGGAGTCATGGTTCAGGCA +>AB915379.1 +ATGCGATGCGTGGGAATAGGCAGCAGGGACTTCGTGGAAGGACTGTCAGGAGCAACTTGGGTAGATGTGGTGCTGGAACATGGAAGTTGCGTCACTACCATGGCAAAAGACAAACCAACATTGGACATTGAACTCTTGAAGACGGAAGTCACAAACCCTGCCGTCCTGCGCAAATTGTGCATTGAAGCTAAAATATCAAACACCACCACCGACTCAAGATGTCCAACACAAGGTGAAGCCACACTGGTGGAAGAACAAGACGCGAACTTTGTGTGTCGACGAACGTTTGTGGACAGAGGATGGGGCAATGGCTGTGGGCTCTTCGGAAAAGGAAGCCTTATAACGTGTGCTAAATTCAAGTGTGTGACAAAACTGGAAGGAAAAATAGTTCAATATGAAAACTTGAAATATTCAGTAATAGTCACCGTCCACACTGGAGACCAGCATCAGGTGGGAAATGAAAGCACAGAACATGGGACAACTGCAACTATAACACCTCAAGCTCCTACGACAGAAATACAGCTGACCGACTACGGAGCTCTCACATTGGATTGTTCACCTAGAACAGGACTAGACTTTAATGAAATGGTGTTGTTGACAATGAAAGAAAAATCATGGCTAGTCCACAAACAATGGTTTCTAGACCTACCACTGCCTTGGACCTCGGGAGCTTCAACAACACAAGAAACTTGGAACAGACAAGATTTGCTGGTGACATTTAAGACAGCCCATGCAAAGAAGCAGGAAGTAGTCGTACTAGGATCACAAGAAGGAGCAATGCACACTGCGCTGACCGGAGCGACGGAAATCCAAACGTCTGGAACGACAACAATTTTTGCAGGACACTTGAAATGTAGACTAAAAATGGACAAACTGACTCTAAAAGGGATGTCATATGTGATGTGCACAGGCTCATTCAAGCTAGAGAAAGAAGTGGCTGAGACCCAGCATGGAACCGTCCTAGTGCAGATTAAATACGAAGGAACAGATGCACCATGCAAGATCCCTTTTTCGACCCAAGATGAAAAAGGAGTGACCCAGAATGGGAGATTGATAACAGCCAACCCCATAGTCACTGACAAAGAAAAACCAATCAACATTGAGGCAGAACCGCCTTTTGGTGAGAGTTACATCGTGATAGGAGCAGGTGAAAAAGCTTTGAAACTAAGCTGGTTCAAGAAAGGAAGCAGCATAGGGAAAATGTTTGAGGCAACGGCCAGAGGAGCACGAAGGATGGCCATACTGGGAGACACCGCATGGGACTTTGGTTCTATAGGAGGAGTGTTTACGTCTGTTGGAAAATTAGTACACCAGATCTTTGGAACTGCATATGGAGTTTTGTTCAGCGGTGTTTCCTGGACCATGAAGATAGGAATAGGGGTTCTGCTAACATGGCTAGGATTAAACTCAAGGAGCACGTCCCTTTCGATGACGTGCATTGCAGTTGGCTTAGTAACGCTATACTTAGGAGTCATGGTTCAGGCG +>EU518605.1 +GTGTCAACTGGTTCACAGTTGGCGAAGAGATTCTCAAAAGGATTGCTTTCAGGCCAAGGACCCATGAAATTGGTGATGGCTTTCATAGCATTTCTAAGATTTCTAGCCATACCCCCAACAGCAGGAATTTTGGCTAGATGGAGCTCATTCAAGAAGAATGGAGCAATCAAAGTGTTACGGGGTTTCAAAAAAGAGATCTCAAGCATGTTGAACATAATGAACAGGAGGAAAAGATCCGTGACCATGCTCCTCATGCTGCTGCCCACAGCCCTGGCGTTTCATTTGACCACACGAGGGGGAGAGCCACACATGATAGTTAGTAAGCAGGAAAGAGGAAAGTCACTCTTGTTTAAGACCTCTGCGGGCGTCAATATGTGCACCCTCATTGCGATGGACTTGGGAGAGTTATGTGAGGACAC