diff --git a/.gitignore b/.gitignore index a30c9f7be..27573288e 100644 --- a/.gitignore +++ b/.gitignore @@ -5,3 +5,4 @@ \.env \.vscode /docs/tmp/ +\.venv diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/HA/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/HA/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/README.md b/data/community/genspectrum/iav/h5n1/GG1996/HA/README.md new file mode 100644 index 000000000..7341aaff6 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/HA/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment4/ HA) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ---------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/HA | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007362.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. 
+ +## What is a Nextclade dataset + +Read more about Nextclade datasets in the Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/HA/examples.fasta new file mode 100644 index 000000000..7f980491b --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/HA/examples.fasta @@ -0,0 +1,38 @@ +>AB823747.1 +TCCAATCTGTCAAAATGGAGAAAATAGTGCTTCTTTTTGCGATAGTCAGTCTTGTCAAAAGTGACCAGATTTGCATTGGCTACCATGCAAACAACTCGACAGAGAAGGTTGACACGATAATGGAAAAGAACGTTACTGTTACACATGCCCAAGACATACTAGAAAAGACACATAACGGAAAGCTCTGTGACTTAGATGGAGTTAGGCCTCTAATTTTGAGAGATTGTAGTGTAGCTGGATGGCTTCTCGGAAACCCAATGTGTGACGAATTCATCAATGTGCCAGAATGGTCTTATATAGTGGAGAAGGCCAATCCAGTCAATGACCTCTGTTACCCAGGAGTTTTCAATGACTATGAAGAATTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAGAGTTCTTGGCCCAGTCATGAAGCCTCAATGGGGGTGAGCGCAGCATGTCCATACCAGGGACAGTCCTCTTTTTTCCGAAATGTGGTGTGGCTTATCAAAAAGAACAGTACATACCCAACAATAAAGAGGAGTTACAATAATACCAACCAAGAAGATCTTTTAGTAATGTGGGGGATCCACCATCCTAATGATGCAGCAGAACAGACAAAACTCTATCAAAATCCAACCACCTATATCTCCGTTGGGACGTCAACACTAAACCAGAGACTGACACCAAGAATAGCTACTAGATCCAAAATAAACGGACAAAGTGGGAGGATGGAGTTCTTTTGGACAATCTTAAAACCGAATGATGCAATCAACTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAGAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATGGGGGCGATAAACTCTAGTATGCCATTCCACAATATACATCCTCTCACTATTGGAGAATGCCCCAAATATGTGAAATCAACCAGATTAGTCCTTGCGACTGGGCTCAGAAATAGCCCTCAAAGAGAGGAAAGAAGAAAAAAGAGAGGATTATTTGGAGCTATAGCAGGGTTTATAGAAGGAGGATGGCAGGGGATGGTAGATGGTTGGTATGGATACCATCATAGCAATGAGCAGGGAAGCGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCTATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAACAACTTAGAAAGAAGAATAGAGAATTTAAACAAGAAGATGGAAGACGGGTTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAAAGAACTCTAGACTTCCATGACTCAAATGTAAAGAACCTTTACGACAAGGTCCGATTGCAGCTTAGGGATAATGCCAAGGAGCTGGGTAACGGTTGTTTTGAGTTCTATCACAAATGTGATAATGAATGCATGGAAAGTGTGAGAAACGGGACATATGACTAC
CCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAGATAAGTGGAGTGAAATTGGAATCGATAGGAGTTTACCAAATACTGTCAATTTATTCTACAGTGGCGAGTTCCCTAGCACTGGCAATCATGGTAGCTGGTCTATCCTTATGGATGTGCTCCAATGGGTCGTTACAATGCAGAATTTGCATTTAAATTTGTGAG +>GU002704.1 +AAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCAATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCCGGATGGCTCCTCGGGAACCCAATGTGCGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTATCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAATTATTGGTCAGATCATGAAGCCTCAGGAGTGAGCTCAGCATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTACCAAAAAGAACAATGCATACCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTATGGGGGATTCACCATCCAAATGATGCGGAAGAGCAGACAAGGCTTTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAATCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAGACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCCCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATGCCTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGCAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAGTCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>GU002705.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCAACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCTCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCGATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCCCCAATGTGTCGGAATGGTCCTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACAACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCGGTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGCCAGATCATGAAGCCTCATTAGGAGTGAGCTCAGCATGTCCATACCAGGGAGGACCCTCCTTTTATAGAAATGTGGTATGGCTTATCAAAAAGAACAATACATACCCAACAATAAAGGAAAGTTACCATAATACCAATCAAGAAGATCTTTTGGTGCTGTGGGGGATCCACCATCCAAATGATGAGGAAGAGCAGACAAGGATCTATAAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAGATAGCCACTAGATCTAAGGTAAACGGGCAAAGTGGAAGAGTGGAGTTCTTTTGGACAATTTTAAAATCAAATGATACAATAAGCTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAGCACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGGGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCAATCATTGACAAAATGAATACTCAGTTTGAGGCTGTTGGGAGGGAATTTAATAACTTGGAAAAGAGAATAGAAAATTTAAACAAGAAAATGGAAGACGGGTTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTGCGACTACAGCTTAGGGACAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGCGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTATCAATTTATTCAACAGTGGCAAGTTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>GU002684.1 
+AGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCAACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCTCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCGATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCCCCAATGTGTCGGAATGGTCCTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACAACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCGGTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGCCAGATCATGAAGCCTCATTAGGAGTGAGCTCAGCATGTCCATACCAGGGAGGACCCTCCTTTTATAGAAATGTGGTATGGCTTATCAAAAAGAACAATACATACCCAACAATAAAGGAAAGTTACCATAATACCAATCAAGAAGATCTTTTGGTGCTGTGGGGGATCCACCATCCAAATGATGAGGAAGAGCAGACAAGGATCTATAAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAGATAGCCACTAGATCTAAGGTAAACGGGCAAAGTGGAAGAGTGGAGTTCTTTTGGACAATTTTAAAATCAAATGATACAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAGCACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGATGGAAGAAGAAAAAAGAGAGGACTATTTGGAGCCATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCAATCATTGACAAAATGAATACTCAGTTTGAGGCTGTTGGGAGGGAATTTAATAACTTGGAAAAGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGGTTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTGCGACTACAGCTTAGGGACAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGCGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTATCAATTTATTCAACAGTGGCAAGTTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTT +>AM911075.1 
+AGCAAAAGCAGGGGTTCAATCTGTCAAAATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAAAACGTCACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCGATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCAGATCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCAGGGAAGGTCCTCCTTTTTTAGAAATGTGGTATGGCTTATCAAAAAGGACAATGCATATCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTGTGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTCTATCAAAACCCGACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAACCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGGACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGATCGCTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGTTAAAAACACCCTTGTTTCTACT +>FJ602800.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCACAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCGATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCAGATCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCAGGGAAGGTCCTCCTTTTTTAGAAATGTGGTATGGCTTATCAAAAAGGACAATGCATACCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTGTGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACTAGGCTCTATCAAAACCCAACCACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGACTGGTACCAAAAATAGCTACTAGATCCAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAACCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAACGGGACTCAACAATTATGAAAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAGAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCATAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGTTA +>FJ602805.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAGACGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCAGATCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCAGGGAAGGTCCTCCTTATTTAGAAATGTGGTATGGCTTATCAAAAAGAACGATGCATACCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTGTGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTCTATCAAAACCCAACCACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCCAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAACCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATCATGAAAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGCGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAATTTGAGGCCGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGCAATCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGTTAAAAACACCCTTGTTTCTACTA +>CY146700.1 
+ATGGAAAAAATAGTGCTCCTTTTTGCAATAGTCAGCCTTGTTAAAAGCGATCATATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTTACTGTTACACATGCTCAAGACATACTGGAGAAGACGCACAACGGGAAGCTCTGCGATCTAAATGGAGTGAAGCCTCTGATTTTAAAAGATTGTAGTGTAGCAGGATGGCTCCTCGGGAACCCAATGTGTGACGAATTCATCGATGTGCCAGAATGGTCTTACATAGTAGAGAAGACCAATCCAGCCAATGACCTCTGTTACCCAGGGAGTTTCAACGATTATGAAGAATTAAAACACCTATTGAGCAGAATAAACCACTTTGAGAAAATACGAATCATTCCCAAAGATTCTTGGCCAGATCATGAAGCCTCATTGGGGGTGAGCGCAGCATGTTCATACCAGGGAAATTCCTCATTTTTCAGAAATGTGGTATGGCTTCTCAAAAAGGACGATGCATACCCAATAATAACGAAAAGCTACAATAATACCAATAAAGAAGATCTCTTGGTACTGTGGGGGATCCATCATCCTAATGATGAGGCAGAGCAGATAAGGCTCTATAAAAACCCAACCACCTATATTTCCATTGGGACATCAACACTAAACCAGAGATTGGTACCAAGAATAGCTACTAGATCCAAAGTAAACGGGCAACGTGGAAGGATAGATTTCTTCTGGACAATTTTAAAACCGAATGATGCAATCAACTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGAGACTCCACAATTATGAGAAGTGAAGTGGAATATGGTAACTGCAACACCAGGTGTCAGACTCCGATAGGGGCGATAAACTCTAGTATGCCATTCCATAACATACACCCCCTCACCATCGGAGAATGTCCCAAATATGTGAAATCAAACAAATTAGTCCTTGCGACTGGGCTCAGAAATAGTCCTCAAAGAGAGAGAAGAAGAAAAAGAGGACTGTTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCACAGCAATGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCTACTCAAAAGGCAATAGACGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTAGGAAGGGAATTTAATAACTTAGAGAGGAGAATAGAGAATTTGAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTCCATGACTCAAATGTCAGGAACCTTTACGACAAGGTCAGACTACAGCTTAAGGACAATGCAAAAGAGCTGGGTAACGGTTGTTTCGAGTTCTATCACAAATGTAATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAATTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCCCTAGTACTGGCAATCATGATGGCTGGTCTATCTTTATGGATGTGCTCCAACGGGTCGTTACAGTGCAGAATTTGCATTTAA +>FJ602826.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTCAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTTACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAAATGGAGTAAAGCCTCTCATTTTGAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGAAACCCTATGTGTGACGAATTCACCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGGCCAGTCCAGCCAATGACCTCTGTTACCCAGGGGATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCCAATCATGATGCCTCATCACCCGTGAGCTCAGCATGTCCATACCATGGGAGGTCCTCCTTTTTCAGAAATGTGGTATGGCTTATCAAAAAGAACAGTACATACCCAACAATAAAGAGGAGCTACAATAATACCAACCAAGAAGATCTTTTGGTACTGTGGGGGATTCACCATCCTAATGATGCGGCAGAGCAGACAAAGCTCTATCAAAACCCAACCACCTACATTTCCGTTGGAACATCAACACTGAACCAGAGATTGGTTCCAGAAATAGCTACTAGACCCAAAGTAAACGGGCAAAGTGGAAGAATGGAGTTCTTCTGGACAATTTTAAAGCCGAATGATGCCATCAATTTCGAAAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAAGAAAGGGACTCAGCAATTATGAAAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATGGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCCCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGACTCAGAAATACCCCTCAAAGAGAGAGAAGAAGAAAAAAGCGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAATGAGCAGGGGAGCGGATACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTTGGAAGGGAATTTAATAACTTGGAAAGGAGGATAGAGAGTTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTGGGTAATGGTTGTTTCGAGTTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTAAAAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGACTAAACAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATGGGAACTTACCAAATACTGTCAATTTATTCAACAGTGTGCGAGTTCCCTAGCTCTGGCAATCATGGTAGCCTGGTTCTATCTTTATGGATGTGCTCCAATGGATCGTTACAAAGCAGAATTTGCATTTAAAT +>GU002674.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAGAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCAATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCCGGATGGCTCCTCGGGAACCCAATGTGCGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTATCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAATTCTTGGTCAGATCATGAAGCCTCAGGAGTGAGCTCAGCATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTACCAAAAAGGACAATGCATACCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTATGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTTTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGACAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAATCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAGACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAATCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAGTCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>EU195392.1 
+ATGGAGAAAATAGTGCTTTTTCTTGCAATAGTCAGCCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAATGTTACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAGATGGAGTGAAGCCTCTGATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGAAACCCAATGTGTGACGAATTCATCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGGCCAACCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCCGATCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCTTACCAGGGAACGCCCTCCTTTTTCAGAAATGTGGTATGGCTTATCAAAAAGAACAATACATACCCAACAATAAAGAGAAGCTACAATAATACCAACCAGGAAGATCTTTTGATACTGTGGGGGATTCATCATTCTAATGATGCGGCAGAGCAGACAAAGCTCTATCAAAACCCAACCACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTAGTACCAAAAATAGCTACTAGATCCAAAGTAAACGGGCAAAGTGGAAGGATGGATTTCTTCTGGACAATTTTAAAACCGAATGATGCAATCAACTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGGGACTCAGCAATTATGAAAAGTGAAGTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCTCTCACCATCGGGGAATGCCCAAAATATGTGAAATCAAACAAATTAGTCCTTGCGACTGGGCTCAGAAATAGTCCTCTAAGAGAAAGAAGAAGAAAAAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAATGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTTACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAGAATTTAAACAAGAAAATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTCCATGACTCAAATGTCAAGAACCTCTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAACTGGGTAACGGTTGTTTCGAGTTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCTCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGGTCGTTACAATGCAGAATTTGCATTTAA +>GU002675.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCGATTTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGGTGGCTCCTCGGGAACCCAATGTGTGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGTCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCTTCCCCAAAAGTTCTTGGTCAGACCATGAAGCCTCATCAGGGGTGAGCTCGGCATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTGTCAAAAAGGACAATGCATACCCAACAATAAAGAAAAGTTACAATAATACCAACCAAGAAGATCTTTTGATACTGTGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTCTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAAGTAAACGGGCAAAGTGGAAGGATTGAGTTCTTTTGGACAATTTTAAAATCGAATGATGTAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGGGCTATAGCAGGCTTTATAGAAGGAGGATGGCAGGGAATGGTAGACGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTATGCTGCAGATAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGGAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAATAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAAAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAGAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGATGGCTGGTCTATTTTTATGGATGTGCTCCAATGGGTCGTTACAATGCAGAATTTGCATTTAA +>FM177119.1 
+AGCAAAAGCAGGGGTTCAATCTGTCAAAATGGAGAAAATAGTGCTTCTTCTTGCAATAATCAATCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAGACGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTTGGGAATCCAATGTGTGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCAGATCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCAGGGAAGGTCCTCCTTTTTTAGAAATGTGGTATGGCTTATCAAAAAGAACGATGCATACCCAACAATAAAGATAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTGTGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTCTATCAAAACCCAACCACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCCAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAACCGAATGATGCAATAAATTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATCATGAAAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATCCACCCTCTCACCATTGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGTAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAATACTCAGTTTGAGGCCGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAGAATTTAAACAAGAAGATGGAAGACGGATTTCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGGCTACAGCTTAGGGATAATGCAAAAGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAATCAAGATTAAAAAGAGAGGAAATAAATGGAGTAAAGTTGGAGTCAATAGGAACTTATCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGTTAAAAACACCCTTGTTTCTACT +>OP950305.1 
+GCAGGGGTTCATTCTGTCAAAATGGAGAACATAGTACTACTTCTTGCAATAGTTAGCCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAATTCGACAGAGCAAGTTGACACGATAATGGAAAAGAACGTCACTGTTACACATGCCCAAGACATACTGGAAAAAACACACAACGGGAAGCTCTGTGATCTAAATGGGGTGAAGCCTCTGATTTTAAAGGATTGTAGTGTAGCTGGATGGCTCCTCGGAAACCCAATGTGCGACGAATTCATCAGAGTGCCGGAATGGTCCTACATAGTGGAGCGGGCTAACCCAGCTAATGACCTCTGTTACCCAGGGAGCCTCAATGACTATGAAGAACTGAAACACATGTTGAGCAGAATAAATCATTTTGAGAAGATTCTGATCATTCCCAAGAGTTCCTGGCCAAATCATGAAACATCACTAGGGGTGAGCGCAGCTTGTCCATATCAGGGAGCGCCCTCCTTTTTCAGAAATGTGGTGTGGCTTATCAAAAAGAACGATGCATACCCAACAATAAAGATAAGCTACAATAATACCAATCGGGAAGATCTCTTGATACTGTGGGGGATCCATCATTCCAACAATGCAGAAGAGCAGACAAATCTCTACAAAAACCCAACCACCTACATTTCAGTTGGAACATCAACTTTAAACCAGAGGTTGGCACCAAAAATAGCTACTAGATCCCAAGTAAACGGGCAACGTGGAAGAATGGACTTCTTCTGGACAATCTTAAAACCAGATGATGCAATCCATTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGGAGTGGAATATGGCCACTGCAACACCAAATGTCAAACCCCAGTAGGTGCGATAAATTCTAGTATGCCATTCCACAACATACATCCTCTCACCATTGGGGAATGCCCCAAATACGTGAAGTCAAACAAGTTGGTCCTTGCAACTGGGCTCAGAAATAGTCCTCTAAGAGAAAGGAGAAGAAAAAGAGGCCTGTTTGGGGCTATAGCAGGGTTTATAGAGGGAGGATGGCAGGGAATGGTTGATGGTTGGTATGGGTACCATCATAGCAATGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACCCAAAAGGCAATAGATGGAGTCACCAACAAGGTCAACTCAATCATTGACAAAATGAACACTCAATTTGAGGCAGTTGGAAGGGAGTTTAATAACTTAGAAAGGAGGATAGAGAATTTGAACAAGAAAATGGAAGACGGATTCCTAGATGTCTGGACCTATAATGCTGAACTTCTAGTTCTCATGGAAAACGAAAGGACTCTAGATTTCCATGATTCAAATGTCAAGAACCTTTACGACAAAGTCAGATTACAGCTTAGGGATAATGCAAAGGAGCTGGGTAACGGCTGTTTCGAATTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTGAGAAATGGGACGTATGACTACCCTCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAAGAAATAAGCGGAGTGAAATTAGAATCAGTAGGAACTTACCAGATACTGTCAATTTATTCAACAGCGGCAAGTTCCCTAGCACTGGCAATCATGATGGCTGGTCTATCTTTATGGATGTGCTCCAATGGGTCGTTACAGTGCAGAATTTGCATTTAGATTTGTGAGCTCAGATTGTAGTTAAAAACACC +>JN401974.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCAATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGCGTAGCCGGATGGCTCCTCGGGAACCCAATGTGCGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTATCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCAGATCATGAAGCCTCAGGAGTGAGCTCAGTATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTACCAAAAAGGACAATGCATACCCAACAATAAAGAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTATGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTTTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAATCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAGACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTAAGAAATAGCCCTCAAGGAGAGACGCGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCAATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGGCTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAGTCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>KC784944.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGCCTTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACGATAATGGAAAAGAACGTTACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAGATGGAGTGAAGCCTCTGATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGAAACCCAATGTGTGACGAATTCATCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGGCCAACCCAACCAATGACCTCTGTTACCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAGAGTTCTTGGTCCGGCCATGAAGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCAGGGAACGCCCTCCTTTTTCAGAAATGTGGTATGGCTTATCAAAAAGAACAATACATACCCAACAATAAAGAGAAGCTACAATAATACCAACCAGGAAGATCTTTTGATACTGTGGGGGATTCATCATTCTAATGATGCGGCAGAGCAGACAAAGCTCTATCAAAACCCAACCACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCCAAAGTAAACGGGCAAAGTGGAAGGATGGATTTCTTCTGGACAATTTTAAAACCGAATGATGCAATCAACTTCGAGAGTAATGGAAATTTTATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGGGACTCAGCAATTATGAAAAGTGAAGTGGAATATGGTAACTGCAACACCAAGTGTCAAACTCCAATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAAATTAGTCCTTGCGACTGGGCTCAGAAATAGTCCTCTAAGAGAAAGAAGAAGAAAAAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAATGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTTACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAGAATTTAAACAAGAAAATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTCCATGACTCAAATGTCAAGAACCTTTACGACAAGGTCCGACTACAGCTTAGGAATAATGCAAAGGAGCTGGGTAATGGTTGTTTCGAGTTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCACAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCTCTAGCACTGGCAATCATGGTGGCTGGTCTATCTTTATGGATGTGCTCCAATGGGTCGTTACAATGCAGAATTTGCATCTAG +>CY062482.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTATTGTTAAAAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAAGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCAATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGGAACCCAATGTGCGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCATCCAATGACCTCTGTTATCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATTCCCAAAAATTCTTGGTCAGATCATGAAGCCTCAGGAGTGAGCTCAGCATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTACCAAAAAGAACAATGCATACCCAACAATAAAGAAAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTATGGGGGATTCACCATCCAAATGATGAGGCAGAGCAGACAAGGCTTTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGGCAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAATCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAATTGGAATATGGCAACTGCAACACCAAGTGTCAGACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGCGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGGAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTATGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAGTCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>CY041920.1 
+ATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTTAAGAGTGATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTCACTGTTACACACGCCCAAGACATACTGGAAAAGACACACAACGGGAAACTCTGCAATCTAGATGGAGTGAAGCCTCTAATTTTAAGAGATTGTAGTGTAGCCGGATGGCTCCTCGGGAACCCAATGTGCGACGAATTCCTCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGATCAATCCAGCCAATGACCTCTGTTATCCAGGGAATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAATAAACCATTTTGAGAAAATTCAGATCATCCCCAAAAATTCTTGGTCAGATCATGAAGCCTCAGGAGTGAGCTCAGCATGTCCATACCAGGGAAGATCCTCCTTTTTTAGAAATGTGGTATGGCTTACCAAAAAGGACAATGCATACCCAACAATAAAAAGAAGTTACAATAATACCAACCAAGAAGATCTTTTGGTACTATGGGGGATTCACCATCCAAATGATGCGGCAGAGCAGACAAGGCTTTATCAAAACCCAACTACCTATATTTCCGTTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCTACTAGATCTAAGGTAAACGGACAAAGTGGAAGGATGGAGTTCTTTTGGACAATTTTAAAATCGAATGATGCAATAAACTTTGAGAGTAATGGAAATTTCATTGCTCCAGAAAATGCATACAAAATTGTCAAGAAAGGGGACTCAACAATTATGAAAAGTGAGTTGGAATATGGTAACTGCAACACCAAGTGTCAGACTCCAATAGGGGCGATAAACTCCAGTATGCCATTCCACAACATCCACCCTCTCACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCTACTGGGCTCAGAAATAGCCCTCAAGGAGAGAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCATAGCAACGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAAAGTAGAATAGAAAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAAAGAACTCTAGACTTTCATGACTCAAATGTCAAGAATCTTTACGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTTGGTAACGGTTGTTTCGAGTTCTATCACAGATGTGATAATGAATGTATGGAAAGTGTAAGAAACGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAGTCAATAGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGCTCCCTAGCACTGGCAATCATGGTGGCTGGTCTATTTTTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAA +>GQ338084.1 
+GGTCCAATCTGTCAAAATGGAGAAAATAGTGCTTCTTTTTGCAACAATCAGCCTTGTTAAAAGCGATCATATTTGCATTGGTTATCATGCAAATAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTTACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAACGGGAAGCTCTGCGATCTAAATGGAGTGAAGCCTCTGATTTTAAAAGATTGTAGTGTAGCGGGATGGCTCCTCGGAAACCCATTGTGTGACGAATTCATCAATGTGCCAGAATGGTCTTACATAGTAGAGAAGGCCAATCCAGCCAATGACCTCTGTTACCCAGGGAATTTCAACGATTATGAAGAATTGAAACACCTATTGAGCAGGATAAACCATTTTGAGAAAATACAGATCATCCCCAAAGATTCTAGGTCAGATCATGAAGCCTCATTGTGGGTGAGCGCAGCATGTCCATACCAGGGAAAATCCTCCTTCTTCAGAAATGTGGTATGGCTTATCAAAAAGGACAATGCATACCCAACAATAAAGAAAGGCTACAATAATACCAACCAAGAAGATCTCTTGGTACTGTGGGGGATTCACCATCCTAATGATGAGGCAGAGCAGACAAGGCTCTATCAAAACCCAACCACCTATATTTCCATTGGGACATCAACACTAAACCAGAGATTGGTACCAAAAATAGCCACTAGATCCAAAATAAACGGGCAAAGTGGCAGGATAGATTTCTTCTGGACAATTTTAAAACCGAATGATGCAATCCACTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGAGACTCCACAATTATGAAAAGTGAAGTGGAATATGGTAACTGCAACACCAGGTGTCAGACTCCGATAGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCTCTCACCATCGGAGAATGTCCCAAATATGTGAAATCAAACAAATTAGTCCTTGCGACTGGGCTCAGAAATAGTCCTCAAAGAGAGAGAAGAAGAAAAAGAGGACTGTTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTTGGTATGGGTACCACCACAGCAATGAGCAGGGGAGTGGGTACGCTGCAGACAAAGAATCTACTCAAAAGGCAATAGACGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCTGTTGGAAGGGAATTTAATAACTTAGAGAGGAGAATAGAGAATTTAAACAAGAAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTCCATGACTCAAATGTCAAGAACCTTTACGATAAGGTCAGACTACAGCTTAAGGATAATGCAAAAGAGTTGGGTAATGGTTGTTTCGAGTTCTATCACAAATGTAATAATGAATGTATGGAAAGTGTAAGAAACGGAACTTATGACTACCCGCAGTATTCAGAAGAAGCAAGATTAAAAAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATAGGAATCTACCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCCCTAGTGCTGGCAATCATGATGGCTGGTCTATCTTTATGGATGTGTTCCAACGGGTCGTTACAGTGCAGAATTTGCATTTAAGTTTGTGAGTTCAGATTGTAGTTAAAAACACCCTTGTTTCTACTGGTC diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/HA/genome_annotation.gff3 new file mode 100644 index 000000000..648a50357 --- /dev/null +++ 
b/data/community/genspectrum/iav/h5n1/GG1996/HA/genome_annotation.gff3 @@ -0,0 +1 @@ +. . CDS 22 1728 . + . gene="HA" diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/HA/pathogen.json new file mode 100644 index 000000000..7f5494002 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/HA/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 4/HA)", + "reference name": "Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) hemagglutinin (HA) gene, complete cds", + "reference accession": "NC_007362.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/HA/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/HA/reference.fasta new file mode 100644 index 000000000..932c18011 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/HA/reference.fasta @@ -0,0 +1,27 @@ +>NC_007362.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) hemagglutinin (HA) gene, complete cds +GCAGGGGTATAATCTGTCAAAATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTCAAAAGTG +ATCAGATTTGCATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGT +TACTGTTACACATGCCCAAGACATACTGGAAAAGACACACAATGGGAAGCTCTGCGATCTAAATGGAGTG +AAGCCTCTCATTTTGAGAGATTGTAGTGTAGCTGGATGGCTCCTCGGAAACCCTATGTGTGACGAATTCA +TCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGGCCAGTCCAGCCAATGACCTCTGTTACCCAGGGGA +TTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAACAAACCATTTTGAGAAAATTCAGATCATC +CCCAAAAGTTCTTGGTCCAATCATGATGCCTCATCAGGGGTGAGCTCAGCATGTCCATACCATGGGAGGT +CCTCCTTTTTCAGAAATGTGGTATGGCTTATCAAAAAGAACAGTGCATACCCAACAATAAAGAGGAGCTA +CAATAATACCAACCAAGAAGATCTTTTAGTACTGTGGGGGATTCACCATCCTAATGATGCGGCAGAGCAG 
+ACAAAGCTCTATCAAAACCCAACCACTTACATTTCCGTTGGAACATCAACACTGAACCAGAGATTGGTTC +CAGAAATAGCTACTAGACCCAAAGTAAACGGGCAAAGTGGAAGAATGGAGTTCTTCTGGACAATTTTAAA +GCCGAATGATGCCATCAATTTCGAGAGTAATGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTC +AAGAAAGGGGACTCAGCAATTATGAAAAGTGAATTGGAATATGGTAACTGCAACACCAAGTGTCAAACTC +CAATGGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCCCTCACCATCGGGGAATGCCCCAA +ATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGACTCAGAAATACCCCTCAGAGAGAGAGAAGAAGA +AAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTT +GGTATGGGTACCACCATAGCAATGAGCAGGGGAGTGGATACGCTGCAGACAAAGAATCCACTCAAAAGGC +AATAGATGGAGTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTTGGA +AGGGAATTTAATAACTTGGAAAGGAGGATAGAGAATTTAAACAAGCAGATGGAAGACGGATTCCTAGATG +TCTGGACTTATAATGCTGAACTTCTGGTTCTCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAA +TGTCAAGAACCTTTATGACAAGGTCCGACTACAGCTTAGGGATAATGCAAAGGAGCTGGGTAATGGTTGT +TTCGAGTTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTAAAAAACGGAACGTATGACTACCCGC +AGTATTCAGAAGAAGCAAGACTAAACAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAATGGGAACTTA +CCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCCCTAGCACTGGCAATCATGGTAGCTGGTCTATCT +TTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGT +TAAAAACACC diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/M/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/README.md b/data/community/genspectrum/iav/h5n1/GG1996/M/README.md new file mode 100644 index 000000000..ead1605b5 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment7/ M) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | --------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/M | +| reference strain | 
A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007363.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. + +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/M/examples.fasta new file mode 100644 index 000000000..4e879a47b --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/examples.fasta @@ -0,0 +1,38 @@ +>EU195411.1 
+ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATAGCGCAAAAACTTGAAGATGTTTTCGCAGGAAAGAACACTGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAGTGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGAATGGGAACGGTAACTACAGAAGTAGCTTTTGGTTTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACTATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATGGAGATCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGACAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAATATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCATCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGCAGGGGTACCTGAGTCTATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGACGGTCATTTTGTCAACATAGAGTTGGAGTAA +>JX236015.1 +ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATTGTCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTCGAGGCTCTCATGGAATGGTTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTAAATGGGAATGGAGACCCAAACAACATGGACAGAGCAGTCAAACTGTACAGGAAGTTGAAAAGAGAGATAACATTCCATGGAGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGGATGGGAACGGTGACCACAGAAGTGGCTTTTGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCGCAGCATCGGTCCCACAGGCAGATGGTAACTACCACCAACCCACTAATCAGGCATGAAAACAGAATGGTGCTGGCTAGCACCACGGCTAAGGCTATGGAGCAGATGGCTGGGTCAAGTGAGCAGGCAGCGGAAGCCATGGAAGTTGCTAGTCAGGCCAGGCAGATGGTGCAGGCAATGAGGACAATTGGAACTCACCCTAGCTCCAGTGCCGGTCTGAAGGATGATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGGATGGGAGTGCAAATGCAGCGATTCAAGTGATCCTCTCGTTATTGCTGCAAGCATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGTATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTGCCTGAGTCTATGAGGGAAGAGTATCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAA +>OP269958.1 
+AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCGGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAAAACACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCTCTAAATGGAAATGGAGACCCAAACAACATGGACAGGGCAGTCAAGTTGTACAGGAAATTGAAGAGAGAGATAACATTCCATGGGGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATACAACAGGATGGGGACGGTGACCGCAGAAGTGGCATTGGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATAGCTACCACCACCAACCCACTAATCAGACATGAAAACAGAATGGTGTTGGCCAGTACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAAGCAGTGGAGGCCATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCGATGAGGACCATTGGAACTCATCCTAGCTCCAGTGCCGGTCTGAGAGATGATCTCCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAACTGCAGCGATTCAAGTGATCCTCTCGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGCCTTTTCTTCAAATGCGTTTATCGTCGCCTTAAATACGGTTTGAAAGGAGGGCCTTCTACGGAAGGAGTACCTGAGTCCATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>OQ584648.1 
+AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCGGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCTCTAAATGGAAATGGAGACCCAAACAACATGGACAGGGCAGTCAAGTTGTACAGGAAATTGAAGAGAGAGATAACATTCCATGGGGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATACAACAGGATGGGGACGGTGACCGCAGAAGTGGCATTGGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATAGCTACCACCACCAACCCACTAATCAGACATGAAAACAGAATGGTGTTGGCCAGTACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAAGCAGCGGAGGCCATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCGATGAGGACCATTGGAACTCATCCTAGCTCCAGTGCCGGTCTGAGAGATGATCTCCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAACTGCAGCGATTCAAGTGATCCTCTCGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGCCTTTTCTTCAAATGTGTTTATCGTCGCCTTAAATACGGTTTGAAAGGAGGGCCTTCTACGGAAGGAGTACCTGAGTCCATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>CY060148.1 +CCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGGATGGGAACGGTGACTACGGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACCATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGCGAGCAGGCAGCGGAAGCCATGGAAGTCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGGGTACCTGAGTCTATGAGGGAAGA +>OQ584727.1 
+AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCGGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCTCTAAATGGAAATGGAGACCCAAACAACATGGACAGGGCAGTCAAGTTGTACAGGAAATTGAAGAGAGAGATAACATTCCATGGGGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATACAACAGGATGGGGACGGTGACCGCAGAAGTGGCATTGGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATAGCTACCACCACCAACCCACTAATCAGACATGAAAACAGAATGGTGTTGGCCAGTACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAAGCAGCGGAGGCCATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCGATGAGGACCATTGGAACTCATCCTAGCTCCAGTGCCGGTCTGAGAGATGATCTCCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAACTGCAGCGATTCAAGTGATCCTCTCGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGCCTTTTCTTCAAATGTGTTTATCGTCGCCTTAAATACGGTTTGAAAGGAGGGCCTTCTACGGAAGGAGTACCTGAGTCCATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>OQ584719.1 
+AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCGGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCTCTAAATGGAAATGGAGACCCAAACAACATGGACAGGGCAGTCAAGTTGTACAGGAAATTGAAGAGAGAGATAACATTCCATGGGGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATACAACAGGATGGGGACGGTGACCGCAGAAGTGGCATTGGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATAGCTACCACCACCAACCCACTAATCAGACATGAAAACAGAATGGTGTTGGCCAGTACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAAGCAGCGGAGGCCATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCGATGAGGACCATTGGAACTCATCCTAGCTCCAGTGCCGGTCTGAGAGATGATCTCCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAACTGCAGCGATTCAAGTGATCCTCTCGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGCCTTTTCTTCAAATGTGTTTATCGTCGCCTTAAATACGGTTTGAAAGGAGGGCCTTCTACGGAAGGAGTACCTGAGTCCATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>CY060157.1 +CCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCTCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGGATGGGAACGGTGACTACGGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACCATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGCGAGCAGGCAGCGGAAGCCATGGAAGTCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGGATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGGGTACCTGAGTCTATGAGGGAAGA +>CY111124.1 
+AGCAAAAGCAGGTAGATGTTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATTCCGTCCGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGAAAGAACACCGATCTTGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTTTGACTAAAGGGATGTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTAGCCAGTTGCATGGGTCTCATATACAACAGAATGGGCACAGTGACTACGGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACTATTACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTAGCAAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATGGAGGTCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGAACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAAATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTACCTGAGTCTATGAGGGAAGAGTATCGGCAGGAACAGCAGAATGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAATTGGAGTAAAAAACTACCTTGTTTCTACT +>KC436115.1 
+AGCAAAAGCAGGTAGATGTTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGAAAGAACACCGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTTTGACTAAAGGGATGTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTCGCCAGTTGCATGGGTCTCATATACAACAGAATGGGCACAGTGACTACGGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACTATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCAAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATGGAGGTCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGAACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTACCTGAGTCTATGAGGGAAGAGTATCGACAGGAACAGCAGAATGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAATTGGAGTAAAAAACTACCTTGTTTCTACT +>JF758742.1 +ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTGTTTGCAGGGAAGAACACCGACCTTGAGGCACTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAATGGGGATCCAAACAACATGGACAGAGCGGTCAAACTGTACAGGAAACTTAAAAGAGAAATAACATTCCATGGGGCAAAAGAAGTGGCACTCAGTTATTCAACTGGTGCACTTGCCAGCTGCATGGGCCTCATATACAACAGGATGGGGACTGTGACTAGTGAAGTGGCATTTGGCCTGGTGTGCGCCACGTGTGAGCAGATTGCTGATTCCCAGCATCGGTCTCACAGACAAATGGTGACAACAACCAACCCACTAATCAGGCATGAGAACAGAATGGTACTGGCCAGTACCACAGCTAAAGCCATGGAGCAAATGGCAGGGTCAAGTGAGCAGGCAGCAGAGGCCATGGAGGTTGCTAGTCAGGCCAGACAAATGGTGCAGGCAATGAGGACAATTGGGACTCACCCTAGCTCCAGTGCTGGTCTAAAAGATGATCTTCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAGATGCAGCGATTCAAGTGA +>JF758732.1 
+ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTGTTTGCAGGGAAGAACACCGACCTTGAGGCACTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAATGGGGATCCAAACAACATGGACAGAGCGGTCAAACTGTACAGGAAACTTAAAAGAGAAATAACATTCCATGGGGCAAAAGAAGTGGCACTCAGTTATTCAACTGGTGCACTTGCCAGCTGCATGGGCCTCATATACAACAGGATGGGGACTGTGACTAGTGAAGTGGCATTTGGCCTGGTGTGCGCCACGTGTGAGCAGATTGCTGATTCCCAGCATCGGTCTCACAGACAAATGGTGACAACAACCAACCCACTAATCAGGCATGAGAACAGAATGGTACTGGCCAGTACCACAGCTAAAGCCATGGAGCAAATGGCAGGGTCAAGTGAGCAGGCAGCAGAGGCCATGGAGGTTGCTAGTCAGGCCAGACAAATGGTGCAGGCAATGAGGACAATTGGGACTCACCCTAGCTCCAGTGCTGGTCTAAAAGATGATCTTCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAGATGCAGCGATTCAAGTGA +>JF758696.1 +ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTGTTTGCAGGGAAGAACACCGACCTTGAGGCACTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAATGGGGATCCAAACAACATGGACAGAGCGGTCAAACTGTACAGGAAACTTAAAAGAGAAATAACATTCCATGGGGCAAAAGAAGTGGCACTCAGTTATTCAACTGGTGCACTTGCCAGCTGCATGGGCCTCATATACAACAGGATGGGGACTGTGACTAGTGAAGTGGCATTTGGCCTGGTGTGCGCCACGTGTGAGCAGATTGCTGATTCCCAGCATCGGTCTCACAGACAAATGGTGACAACAACCAACCCACTAATCAGGCATGAGAACAGAATGGTACTGGCCAGTACCACAGCTAAAGCCATGGAGCAAATGGCAGGGTCAAGTGAGCAGGCAGCAGAGGCCATGGAGGTTGCTAGTCAGGCCAGACAAATGGTGCAGGCAATGAGGACAATTGGGACTCACCCTAGCTCCAGTGCTGGTCTAAAAGATGATCTTCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAGATGCAGCGATTCAAGTGA +>AB675561.1 
+ATGTTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTTTCTATCATTCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAGGATGTCTTTGCAGGGAAGAACACCGATCTCGAGGCTCTTATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATATTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAACGTAGACGTTTTGTCCAGAATGCCCTAAATGGAAATGGTGATCCAAATAATATGGATAGAGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGCATGGGCCTCATATACAACAGGATGGGAACGGTGACTACGGAAGTGGCTTTTGGCTTAGTGTGTGCCACTTGTGAGCAGATTGCAGACTCACAGCATCGGTCTCACAGACAGATGGCAACCATCACCAACCCACTAATCAGACATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCGGGATCAAGCGAGCAAGCAGCGGAAGCCATGGAGGTCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAATTCCAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTTTTGCCGCAAGTATCATTGGGAT +>OP950300.1 +AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCGGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCTCTAAATGGAAATGGAGACCCAAACAACATGGACAGGGCAGTCAAGTTGTACAGGAAATTGAAGAGAGAGATAACATTCCATGGGGCTAAAGAAGTTGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATACAACAGGATGGGGACGGTGACCGCAGAAGTGGCATTGGGCCTAGTGTGTGCCACCTGTGAGCAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATAGCTACCACCACCAACCCACTAATCAGACATGAAAACAGAATGGTGTTGGCCAGTACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAACAAGCAGTGGAAGCCATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCGATGAGGACCATTGGAACTCATCCTAGCTCCAGTGCCGGTCTGAGAGATGATCTCCTTGAAAATTTGCAGGCCTACCAAAAACGGATGGGAGTGCAACTGCAGCGATTCAAGTGATCCTCTCGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGCCTTTTCTTCAAATGCGTTTATCGTCGCCTTAAATACGGTTTGAAAGGAGGGCCTTCTACGGAAGGAGTACCTGAGTCCATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>KP097989.1 
+ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCATCAGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAGGATGTATTTGCAGGAAAGAACACTGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATCTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGTTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGAGCTAAGGAGGTCGCACTCAGTTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGGATGGGAACGGTGACTACAGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACCATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCCATGGAGCAGATGGCAGGATCAAGCGAGCAGGCAGCAGAAGCCATGGAGGTCGCCAATCAGGCTAGACAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTATTGTTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGGGTACCGGAGTCTATGAGGGAAGAGTACCGGCAGGAACAGCAGAATGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAATTGGAGTAA +>KP097998.1 +ATGAGTCTTCTAACCGAGGTTGAAACGTACGTTCTCTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATAGCGCAAAAACTTGAAGATGTTTTCGCAGGAAAGAACACTGATCTCGAGGCTCTCATGGAGTGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAGTGGAAATGGAGATCCAAATAATATGGATAGGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGCATGGGTCTCATATACAACAGAATGGGAACGGTAACTACGGAAGTAGCTTTTGGTTTGGTGTGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACTATCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCCATGGAGCAGATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATTGAGATCGCTAATCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAACTCTAGTGCTGGTCTAAGGGACAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAATATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCATCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGTAGGGGTACCTGAGTCTATGAGGGAAGAGTACCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGACGGTCATTTTGTCAACATAGAGTTGGAGT +>KU715862.1 
+AGCAAAAGCAGGTAGATGTTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCATCAGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTCGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGAATGTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAAGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCTATGGGGCTAAGGAGGTTGCACTCAGCTACTCAACCGGTGCACTCGCCAGTTGCATGGGTCTCATATATAACAGAATGGGCACAGTGACCACGGAAGTGGCTTTTGGCCTAGTATGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACCACCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATGGAAGTCGCTAGTCAGGCTAGGCAGATGGTGCAGGCAATGAGAACAATTGGGACTCATCCTAACTCTAGTGCCGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATTCATTTATCGCCGCCTCAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTGCCTGAGTCTATGAGGGAAGAATATCGGCAGGAACAGCAGAATGCTGTAGATGTTGACGATGGTCATTTTGTCAACATAGAATTGGAGTAAAAAACTACCTTGTTT +>KU715898.1 
+AGCAAAAACAGGTAGATGTTGAAGTATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCATCAGGCCCCCTCAAAGCCGAGATCGCGCAGAAACTTGAAGATGTCTTTGCAGGAAAGAACACCGATCTCGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGAATGTTGGGATTTGTATTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCCTAAATGGAAATGGAGATCCAAATAATATGGATAAGGCAGTTAAGCTATATAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTTGCACTCAGCTACTCAACCGGTGCACTCGCCAGTTGCATGGGTCTCATATACAACAGAATGGGCACAGTGACCACGGAAGTGGCTTTTGGCCTAGTATGTGCCACTTGTGAGCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACCACCACCAACCCACTAATCAGGCATGAGAACAGAATGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCGGGATCAAGTGAGCAGGCAGCGGAAGCCATGGAAGTCGCTAGTCAGGCTAGGCAGATGGTGCAGGCAATGAGAACAATTGGGACTCATCCTAACTCTAGTGCCGGTCTGAGAGATAATCTTCTTGAAAATTTGCAGGCCTACCAGAAACGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTTGTTATTGCCGCAAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATTCATTTATCGCCGCCTCAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTGCCTGAGTCTATGAGGGAAGAATATCGGCAGGAACAGCAGAATGCTGTAGATGTTGACGATGGTCATTTTGTCAACATAGAATTGGAGTAAAAAACTACCTTGTTT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/M/genome_annotation.gff3 new file mode 100644 index 000000000..89a48f756 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/genome_annotation.gff3 @@ -0,0 +1,3 @@ +. . CDS 26 51 . + . gene=M2;ID=cds-M2 +. . CDS 740 1007 . + . gene=M2;ID=cds-M2 +. . CDS 26 784 . + . 
Name=M1;gene=M1 diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/M/pathogen.json new file mode 100644 index 000000000..4b18a27b9 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 7/M)", + "reference name": "Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 7, complete sequence", + "reference accession": "NC_007363.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/M/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/M/reference.fasta new file mode 100644 index 000000000..de43cc8e7 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/M/reference.fasta @@ -0,0 +1,16 @@ +>NC_007363.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 7, complete sequence +AGCAAAAGCAGGTAGATATTGAAAAATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTC +CCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAGGATGTCTTTGCAGGAAAGAACACCGATC +TCGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTAGGATT +TGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCTTAAAT +GGAAATGGAGATCCAAACAATATGGATAGGGCAGTTAAGCTATACAAGAAGCTGAAAAGAGAAATAACAT +TCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCCAGTTGTATGGGTCTCATATA +CAACAGGATGGGAACGGTGACCACAGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGAGCAGATTGCA +GATTCACAGCATCGGTCTCACAGACAGATGGCAACTACCACCAACCCACTAATCAGGCATGAGAACAGAA +TGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAGGCAGCGGAAGC +CATGGAGGTTGCTAGTCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAGCTCC +AGTGCCGGTCTGAAAGATAATCTTCTTGAAAATTTGCAGGCCTACCAAAAACGAATGGGAGTGCAAATGC 
+AGCGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATCATTGGGATACTGCACTTGATATTGTGGATTC +TTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGA +AGGGGTACCTGAGTCTATGAGGGAAGAGTATCGGCAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGT +CATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/NA/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/README.md b/data/community/genspectrum/iav/h5n1/GG1996/NA/README.md new file mode 100644 index 000000000..2a11ca93e --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment6/ NA) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ---------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/NA | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007361.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. 
+ +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NA/examples.fasta new file mode 100644 index 000000000..f2c8a2f98 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/examples.fasta @@ -0,0 +1,38 @@ +>AB824273.1 +TCAAAATGAATCCAAATCAGAAGATAGTAACCATTGGATCAATCTGTATGGTAATTGGAATAATTAGCTTGATGTTACAGATTGGGAACATAATATCAATATGGGTCAGTCATTCAATTCAAACAGGGAATCAACACCAAACTGAACCAATCAGAAATACTAATTTTCTTACTGAGAACGCTGTAGCTTCAGTAACATTAGCTGGCAATTCATCTCTTTGCCCCATTAAAGGATGGGCTGTACACAGTAAAGACAACAGTATAAGGATTGGGTCCAAGGGGGATGTGTTTGTAATTAGAGAGCCGTTCATATCATGCTCCCATCTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCTTTACTGAATGACAAGCACTCCAACGGGACTGTCAAAGATAGGAGCCCTCACAGAACGCTAATGAGTTGCCCTATAGGAGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTCGCTTGGTCGGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGATAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCGGTATTGAAATACAATGGCATAATAACAGACACTATCAAGAGTTGGAGGAATAACATACTGAGGACCCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTGCTGTTATGACAGATGGACCAAGTAATGGGCAGGCATCATATAAGATTTTCAAAATAGAAAAAGGGAAAGTAGTTAAGTCAGTCGAATTGAATGCCCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATGCTGGCGAAATCATATGTGTGTGCAGGGATAATTGGCATGGCTCAAACAGGCCATGGGTATCTTTCAATCAGAATTTGGAGTATCGAATAGGATATATTTGCAGTGGAGTTTTCGGTGACAATCCACGGCCAAATGACGGTACAGGTAGTTGTGGTCCAGTGTCCTCTAACGGGGCATATGGGGTAAAAGGGTTCTCATTTAAATATGGCAATGGTGTCTGGATCGGGAGGACCAAAAGCACTCATTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAACGGGTGGACTGGAACGGACAGTGAATTTTCGATGAAACAAGATATAGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCACCCAGAACTGACAGGATTAGATTGTATAAGACCTTGCTTCTGGGTTGAGTTGATCAGAGGGCGGCCCAAAGAGAGCACAATTTGGACTAGTGGGAGCAGCATATCATTTTGTGGTGTAAATAGTGACACTGTGAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAGTTTATTC +>FM163442.1 
+AGCAAAAGCAGGAGTTCAAAATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCTGACAAGGAATCAACGCCAAGCTGAACCAATCAGCAATACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGAGCAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTATACAGTAAGGACAACAGTATAAGGATCGGTTCCAGGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCCTTGCTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACCCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAATGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAAGGAAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGCTCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGATCCGGTGTCCCTTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATTGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGACCCAAATGGATGGACTGGAACGGACAGTAGCTTTTCGGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAATTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGGGGGCGGCCTGAAGAGAGCACAATTTGGACCAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAATTGCCATTCACCATTGACAAGTAG +>OQ683500.1 
+GCAAAAGCAGGAGTTCAAAATGAATCCAAATCAAAAGATAACAACCATTGGATCAATCTGTATGGTAATTGGGATAGTCAGCTTGATGCTGCAAATTGGGAACATAATCTCAATATGGGTTAGCCATTCAATCCGAACAGGGAATCAATACCAGCCTGAACCATGCAATCAAAGCATCATTACCTATGAGAACAACACCTGGGTAAATCAGACGTATGTCAACATCAACAATACCAATTTTCTTGCTGAGCAGGCTGTTACTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCTATTAGTGGGTGGGCAATATACAGTAAGGACAACGGTATAAGAATTGGGTCCAAGGGGGATGTGTTTGTTATAAGAGAACCGTTCATCTCATGCTCCCACTTGGAATGCAGAACCTTTTTCCTGACCCAGGGAGCTCTGCTGAATGACAAACATTCTAATGGGACCGTTAAAGATAGAAGCCCTTATAGAACTTTGATGAGTTGCCCCGTGGGTGAGGCTCCTTCTCCGTACAACTCAAGATTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGTCATGATGGCATCAGTTGGTTGACAATCGGTATCTCTGGTCCAGACAATGGAGCTGTGGCTGTATTGAAGTACAATGGCATAATAACGGATACTATCAAGAGTTGGAGAAACAACATTTTGAGAACTCAAGAATCTGAATGTGCGTGCGTAAATGGCTCTTGCTTCACCGTAATGACTGATGGACCAAGCAATGGGCAGGCCTCATCTAAAATCTTCAAGATAGAGAAAGGGAAAGTTGTCAAATCAGTTGAATTGAATGCCCCTAATTACCACTACGAGGAATGCTCCTGTTATCCTGATGCGGGTGATATTATGTGTGTGTGCAGGGACAATTGGCATGGCTCAAACCGGCCGTGGGTATCTTTTAATCAAAATCTGGAGTATCAAATAGGATATATATGCAGTGGGGTTTTCGGGGACAATCCCCGCCCCAATGATGGAACAGGCAGTTGCAGTCCAATGTCCTCTAATGGGGCATATGGGATAAAAGGGTTTTCATTTAAGTACGGTAATGGGGTTTGGATCGGAAGAACAAAAAGCACTAGTTCCAGAAGCGGCTTTGAGATGATTTGGGATCCGAATGGGTGGACTGAGACGGACAGTAGTTTCTCAGTGAAGCAAGACATTGTAGAGATAACTGACTGGTCAGGATATAGTGGGAGCTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATGAGGCCTTGTTTCTGGGTTGAGCTAATTAGAGGGAGGCCCAAAGAGAACACAATTTGGACTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGGGAGGTTCGCTAGATGGTCGGCCGAGTAGTGGTCGCAAAATGGTCGCATGTGGAGGT +>CY146646.1 
+ATGAATCCAAATCAGAAGATAGTAACCATTGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTGATGTTACAGATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAAACAGGGAATCAACACCAAACTGAACCAATCAGAAATACTAATTTTCTTACTGAGAACGCTGTGGCTTCAGTAACATTAGCTGGCAATTCATCTCTTTGCCCCATTAGAGGATGGGCTGTACACAGTAAAGACAACAGTATAAGGATTGGGTCCAAAGGGGATGTGTTTGTAATTAGAGAGCCGTTCATCTCATGCTCACATCTGGAGTGCAGAACTTTCTTCTTGACTCAGGGAGCTTTACTGAATGACAAGCACTCCAACGGGACTGTCAAAGACAGGAGCCCTCACAGAACGCTAATGAGTTGTCCTATAGGTGAGGCTCCCTCCCCATATAACTCGAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCGGTATTGAAATACAATGGCATAATAACAGACACTATCAAGAGTTGGAGGAATAGCATACTGAGAACCCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTGATGACAGATGGACCAAGTAATGGACAGGCATCATATAAGATTTTCAAAATAGAAAAAGGGAAAGTAGTTAAGTCAGTCGAATTGAATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCCGATGCTGGCGAAATCATATGTGTGTGCAGGGATAATTGGCATGGCTCAAACAGGCCATGGGTATCTTTCAATCAGAATTTGGAGTATCAAATAGGATATATTTGCAGTGGAGTTTTCGGAGACAATCCACGACCAAACGATGGGAAAGGTAGTTGTGGTCCAGTGTCCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTCTGGATCGGGAGGACCAAAAGCACTCATTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGAACGGACAGTGAATTTTCGATGAAACAAGATATAGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCACCCAGAACTGACAGGATTAGATTGCATAAGACCTTGCTTCTGGATTGAGTTAATCAGAGGGCGGCCCAAGGAGAGCACAATTTGGACCAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTGAGTTGGTCCTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>OQ584537.1 
+AAAGCAGGAGTTCAAAATGAATCCAAATCAAAAGATAACAACCATTGGATCAATCTGTATGGTAATTGGGATAGTCAGCTTGATGCTGCAAATTGGGAACATAATCTCAATATGGGTTAGCCATTCAATCCAAACAGGGAATCAATACCAGCCTGAACCATGCAATCAAAGCATCATTACCTATGAGAACAACACCTGGGCAAATCATACGTATGTCAACATCAGCAATACCAATTTTCTTGCTGAGCAGGCTGTTACTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCTATTAGTGGGTGGGCAATATACAGTAAGGACAACGGTATAAGAATTGGGTCCAAGGGGGATGTGTTTGTTATAAGAGAACCGTTCATCTCATGCTCCCACTTGGAATGCAGAACCTTTTTCCTGACCCAGGGAGCTCTGCTGAATGACAAACATTCTAATGGGACCGTTAAGGATAGAAGCCCTTATAAAACTTTGATGAGCTGTCCCGTGGGTGAGGCTCCTTCCCCGTACAATTCAAGATTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGTCATGATGGCATCAGTTGGTTGACAATCGGTATTTCTGGTCCAGACAATGGAGCTGTGGCTGTATTGAAGTACAATGGCATAATAACGGATACTATCAAGAGTTGGAGAAACAACATTTTGAGAACTCAAGAATCTGAATGTGCGTGCGTAAATGGCTCTTGCTTCACCGTAATGACTGATGGACCAAGCAATGGGCAGGCCTCATATAAAATCTTCAAGATAGAGAAAGGGAAAGTTGTCAAATCAGTTGAATTGAATGCCCCTAATTACCACTACGAGGAATGCTCCTGTTATCCTGATGCGGGTGATATTATGTGTGTGTGCAGGGACAATTGGCATGGCTCAAACCGGCCGTGGGTATCTTTTAATCAAAATCTGGAGTATCAAATAGGATATATATGCAGTGGGGTTTTCGGGGACAATCCCCGCCCCAATGATGGAACAGGCAGTTGCAGTCCAATGTCCTCTAATGGGGCATATGGGGTAAAAGGGTTTTCATTTAAGTACGGTAATGGGGTTTGGATCGGAAGAACAAAAAGCACTAGTTCCAGAAGCGGCTTTGAGATGATTTGGGATCCGAATGGGTGGACTGAGACGGACAGTAGTTTCTCAGTGAAGCAAGACATTGTAGAAATAACTGACTGGTCAGGATATAGTGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATGAGGCCTTGTTTCTGGGTTGAGCTAATTAGAGGGAGGCCCAAAGAGAACACAATTTGGACTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAGTTTGTTCAAAAAACTCCTTGTTTCTACT +>OQ584792.1 
+AAAGCAGGAGTTCAAAATGAATCCAAATCAAAAGATAACAACCATTGGATCAATCTGTATGGTAATTGGGATAGTCAGCTTGATGCTGCAAATTGGGAACATAATCTCAATATGGGTTAGCCATTTAATCCAAACAGGGAATCAATACCAGCCTGAACCATGCAATCAAAGCATCATTACCTATGAGAACAACACCTGGGTAAATCATACGTATGTCAACATCAGCAATACCAATTTTCTTGCTGAGCAGGCTGTTACTTCGGTAACATTAGCGGGCAATTCATCTCTTTGCCCTATTAGTGGGTGGGCAATATACAGTAAGGACAACGGTATAAGAATTGGGTCCAAGGGGGATGTGTTTGTTATAAGAGAACCGTTCATCTCATGCTCCCACTTGGAATGCAGAACCTTTTTCCTGACCCAGGGAGCTCTGCTGAATGACAAACATTCTAATGGGACCGTTAAGGATAGAAGCCCTTATAGAACTTTGATGAGCTGTCCCGTGGGTGAGGCTCCTTCCCCGTACAATTCAAGATTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGTCATGATGGCATCAGTTGGTTGACAATCGGTATTTCTGGTCCAGACAATGGAGCTGTGGCTGTATTGAAGTACAATGGCATAATAACGGATACTGTCAAGAGTTGGAGAAACAACATTTTGAGAACTCAAGAATCTGAATGTGCGTGCGTAAATGGCTCTTGCTTCACTGTAATGACTGATGGACCAAGCAATGGGCAGGCCTCATATAAAATCTTCAAGATAGAGAAAGGGAAAGTTGTCAAATCAGTTGAATTGAATGCCCCTAATTACCACTACGAGGAATGCTCCTGTTATCCTGATGCGGGTGATATTATGTGTGTGTGTAGGGACAATTGGCATGGCTCAAACCGGCCGTGGGTATCTTTTAATCAAAATCTGGAGTATCAAATAGGATATATATGCAGTGGGGTTTTCGGGGACAATCCCCGCCCCAATGATGGAACAGGCAGTTGCAGTCCAATGTCCTCTAATGGGGCATATGGGGTAAAAGGGTTTTCATTTAAGTACGGTAATGGGGTTTGGATCGGAAGAACAAAAAGCACTAGTTCCAGAAGCGGCTTTGAGATGATTTGGGATCCGAATGGGTGGACTGAGACGGACAGTAGTTTCTCAGTGAAGCAAGACATTGTAGAAATAACTGACTGGTCAGGATATAGTGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATGAGGCCTTGTTTCTGGGTTGAGCTAATTAGAGGGAGGCCCAAAGAGAACACAATTTGGATTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAGTTTGTTCAAAAAACTCCTTGTTTCTACT +>FJ602832.1 
+ATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAACGCCAAGCTGAACCAATCAGCAATACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTATACAGTAAGGACAACAGTATAAGGATCGGTTCCAGGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTATTGACTCAGGGAGCCTTGCTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAATGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAAGGGAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGCTCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTCCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAGATACGGCAATGGTGTCTGGATCGGGAGAACCAAAAGCACTATTTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCGGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAGTTTGTTCAAAA +>CY062435.1 
+AATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTGATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAATGCCAAGCTGAACCAATCAGCAATACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGTCCCATTAGCGGATGGGCTGTATACAGTAAGGACAACAGTATAAGGATCGGTTCCAGGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCCTTGCTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAGTGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAGGGGAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGCTCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTCCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGACCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCGGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGAAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>OQ546776.1 
+ATGAATCCAAATCAGAAGATAGTAACCATTGGATCAATCTGTATGGTAATTGGAATAATTAGCTTGATGTTACAGATTGGGAACATAATATCAATATGGGTCAGTCATTCAATTCAAACAGGGAATCAACACCAAACTGAACCAATCAGAAATACTAATTTTCTTACTGAGAACGCTGTAGCTTCAGTAACATTAGCTGGCAATTCATCTCTTTGCCCCATTAAAGGATGGGCTGTACACAGTAAAGACAACAGTATAAGGATTGGGTCCAAGGGGGATGTGTTTGTAATTAGAGAGCCGTTCATATCATGCTCCCATCTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCTTTACTGAATGACAAGCACTCCAACGGGACTGTCAAAGATAGGAGCCCTCACAGAACGCTAATGAGTTGCCCTATAGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGATAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCGGTATTGAAATACAATGGCATAATAACAGACACTATCAAGAGTTGGAGGAATAACATACTGAGGACCCAAGAATCTGAATGTGCATGTGTAAATGGCTCTTGCTTTGCTGTTATGACAGATGGACCAAGTAATGGGCAGGCATCATATAAGATTTTCAAAATAGAAAAAGGGAAAGTAGTTAAGTCAGTCGAATTGAATGCCCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATGCTGGCGAAATCATATGTGTGTGCAGGGATAATTGGCATGGCTCAAACAGGCCATGGGTATCTTTCAATCAGAATTTGGAGTATCAAATAGGATATATTTGCAGTGGAGTTTTCGGTGACAATCCACGGCCAAATGACGGTACAGGTAGTTGTGGTCCAGTGTCCTCTAACGGGGCATATGGGGTAAAAGGGTTCTCATTTAAATATGGCAATGGTGTCTGGATCGGGAGGACCAAAAGCACTCATTCCAGGAGTGGCTTTGAAATGATTTGGGATCCAAACGGGTGGACTGGAACGGACAGTGAATTTTCGATGAAACAAGATATAGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCACCCAGAACTGACAGGGTTAGATTGCATAAGACCTTGCTTCTGGGTTGAGTTAATCAGAGGGCGGCCCAAAGAGAGCACAATTTGGACTAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTGAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>CY111067.1 
+AGCAAAAGCAGGAGATTAAAATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAGTATGGGTCAGTCATTCAATTCAGACAAGGAATCAACGCCAAGCTGAACCAATCAGCAATACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTATACAGTAAGGACAACAGTATAAGGATCGGTTCCAGGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCCTTGCTGAATGATAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACCCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAATGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAAGGGAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGCTCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTCCCTTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATTGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCGGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAATTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCAGCCTAAAGAGAGCACAATTTGGACTAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAATTGCCATTCACCATTGACAAGTAGTTTGTTCAAAAAAACTCCTTGTTT +>KC590651.1 
+AGCAAAAGCAGGAGTTCAAAATGAATCCAAATCAGAAGATAGTAACCATTGGATCAATCTGTATGGTAATTGGAATAATTAGCTTGATGTTACAGATTGGGAACATAATCTCAATATGGGTCAGTCATTCAATTCAAACAGGGAATCAACACCAAACTGAACCAATCAGAAATACTAATTTTCTTACTGAGAACGCTGTAGCTTCAGTAACATTAGCTGGCAATTCATCTCTTTGCCCCATTAGAGGATGGGCTGTACACAGTAAAGACAACAGTATAAGGATTGGGTCCAAGGGGGATGTGTTTGTAATTAGAGAGCCGTTCATCTCATGCTCCCATCTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCTTTACTGAATGACAAGCACTCCAACGGGACTGTCAAAGATAGGAGCCCTCACAGAACGCTAATGAGTTGTCCTATAGGTGAGGCTCCCTCCCCATATAACTCGAGGTTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGATAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCGGTATTGAAATACAATGGCATAATAACAGACACTATCAAGAGTTGGAGGAATAACATACTGAGGACCCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTGATGACAGATGGACCAAGTAATGGGCAGGCATCATATAAGATTTTCAAAATAGAAAAAGGGAAAGTAGTTAAGTCAGTCGAATTGAATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATGCTGGCGAAATCATATGTGTGTGCAGGGATAATTGGCATGGCTCAAACAGGCCATGGGTATCTTTCAATCAGAATTTGGAGTATCAAATAGGATATATTTGCAGTGGAGTTTTCGGAGACAATCCACGGCCAAATGACGGGACAGGTAGTTGTGGTCCAGTGTCCCCTAACGGGGCATATGGGGTAAAAGGGTTCTCATTTAAATACGGCAATGGTGTCTGGATCGGGAGGACCAAAAGCACTCATTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAACGGGTGGACTGGAACGGACAGTGAATTTTCGATGAAACAAGATATAGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCACCCAGAACTGACAGGATTAGATTGCATAAGACCTTGCTTCTGGGTTGAGTTAATCAGAGGGCGGCCCAAAGAGAGCACAATTTGGACTAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTGAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAGTTTATTCAAAAAACTCCTTGTTTCTACT +>CY062473.1 
+ATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGGATAGCTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAATGCCAAGATGAATCAATCAGCAACACTAAATTTCTTACTGAGAAAGCTGTAGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGTCCCATTAGCGGATGGGCTGTGTACAGTAAGGATAACAGCATAAGGATCGGTTCCAGGGGGGATGTGTTTGTTATAAGAGAGCCATTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTAACCCAGGGAGCCTTACTGAATGACAAGCACTCCAATGGAACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATAATGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAGTGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAGGGAAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGATCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTTCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGACCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCAGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGAAGCAGCATATCTTTTTGTGGGGTAAATGGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAA +>CY062445.1 
+ATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGGATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAATGCCAAGATGAACCAATCAGCAACACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTTATCTCTTTGTCCCGTTAGCGGATGGGCTGTGTACAGTAAGGACAACAGCATAAGGATCGGTTCCAGAGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTAACCCAGGGAGCCTTACTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCCGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAATATAATGAGAACTCAGGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAGTGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAGGGAAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGATCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTTCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGACCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCAGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTTTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGAAGCAGCATATCTTTTTGTGGTGTAAATGGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>CY041931.1 
+ATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGCCATTCAATTCAGACAGGAAATCAATGCCAAGGTGAACCAATCAGCAACACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGTCCTATTAGCGGGTGGGCTGTATACAGTAAGGACAACAGTATAAGGATCGGCTCCAGGGGAGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACCTTCTTTTTGACTCAGGGAGCCTTACTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATCTCTGGTCCAGACAATGGAGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAGTGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAGGGGAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATGCTGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGTTCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCAGTGGTCTCTAATGGGGCATATGGGGTAAAAGGGTTTTCGTTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCTAGGAGCGGCTTTGAAATGATTTGGGACCCCAATGGGTGGACTGGAACGGACAGTAGCTTCTCGGGGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGAAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>KP097951.1 
+ATGAATCCAAATCAGAAGATAATAACAATCGGATCAATCTGTATGGTAACTGGAATAGTTAGCTTATTGTTGCAAGTTGGGAACATGATCTCGATATGGGTTAATCATTCAATTCACACAGGGAATCAACACCAAGCTGAGCCAATCAGAAATACTAATTTTCCTACTGAGAAAACTGTGGCCTCAGCAAAATTAGCGGGCAATTCATCTCTTTGCCCCATTAACGGATGGGCTGTATACAGCAAGGACAACAGCATAAGGATCGGCTCCAAGGGGGATGTGTTTGTTATAAGAGAGCCATTCATCTCATGCTCTCACTTGGAATGCAGAACTTTCTTTTTGACTCAAGGAGCCTTGCTGAATGATAAACACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCGTATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACTATCAAGAGTTGGAGGAACAATATAATGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACAGATGGACCAAGTGATGGTCAGGCATCACATAAGATCTTCAAAATGGAAAAAGGAAAAGTGATTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCAGATGCCGGCGAAATAACATGTGTGTGCAGGGATAATTGGCATGGTTCAAATCGACCATGGGTGTCTTTCAATCAAAACTTGGAGTATCAAATAGGATATATATGCAGTGGGGTTTTCGGAGATAATCCACGCCCCAATGATGGAAAAGGCAGTTGTGGTCCGGTGTCCTCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTCTGGATCGGGAGAACCAAAAGCACCAATTCCAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGAAACAGACAGTAGCTTTTCAGTGAAACAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGACTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTGATCAGAGGGCGACCCAAAGAGGGCACAATTTGGACTAGTGGGAGCAGCATATCTTTCTGTGGTGTAAGTGGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>KJ162127.1 
+GAGATTAAAATGAATCCAAATCAAAAGATAATGGCCATTGGATCAATCTGTATGGTAATTGGAATAGTTAGCTTAATGTTACAGATTGGGAACATAATCTCAATATGGGTCAGCCATTCATTTCAAACAAGGGTTCAACACCAAGCTGAACCAATCAGAAATAATAATTTTCTTGTTGAGAACGCTGTGGCTTCAGTAACATTAGCGGGCAATTCGTCTCTTTGCCCCATCAGGGGATGGGCTGTACACAGTAAAGACAACAGTATAAGAATTGGTTCCAAGGGGGATGTGTTTGTAATTAGAGAGCCGTTCATCTCATGCTCTCATTTGGAATGCAGAACTTTCTTTTTGACCCAGGGAGCCTTACTGAATGACAAGCACTCCAACGGGACTGTCAAAGACAGGAGCCCTCACAGAACATTAATGAGTTGCCCTGTGGGTGAGGTTCCCTCCCCATACAACTCAAGGTTCGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGACCAGACAATGGGGCTGTAGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGTTCTTGCTTTACTGTAATGACTGATGGACCAAGTAATGGACAGGCATCATATAAGATCTTCAAAATGAAAAAAGGGAAAGTAGTTAAATCAGTCGAGTTGAATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATGCGGGAGAAATCATGTGTGTGTGCAGGGATAACTGGCATGGCTCAAATAGGCCATGGGTATCTTTCAATCAGAATTTGGAGTATCAGATAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTAGCCCAATGTCCCCTAACGGGGCATATGGGATAAAAGGGTTTTCATTTAAATACGGCAATGGCGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGAAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGTACGGACAGTGACTTTTTGATGAAACAAGATATAGTAGCAATAACTGACTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTAACAGGATTAGATTGCATAAGACCTTGCTTCTGGGTTGAGTTGATCAGAGGGCGGCCCAAAGAAAGCACAATTTGGACTAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGAAACTGTGAGTTGGTCTTGGCCAGACGGTGCTGAGTTG +>OQ683476.1 
+TCAAAATGAATCCAAATCAAAAGATAACAACCATTGGATCAATCTGTATGGTAATTGGGATAGTCAGCTTGATGCTGCAAATTGGGAACATAATCTCAATATGGGTTAGCCATTCAATCCGAACAGGGAATCAATACCAGCCTGAACCATGCAATCAAAGCATCATTACCTATGAGAACAACACCTGGGTAAATCAGACGTATGTCAACATCAACAATACCAATTTTCTTGCTGAGCAGGCTGTTACTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCTATTAGTGGGTGGGCAATATACAGTAAGGACAACGGTATAAGAATTGGGTCCAAGGGGGATGTGTTTGTTATAAGAGAACCGTTCATCTCATGCTCCCACTTGGAATGCAGAACCTTTTTCCTGACCCAGGGAGCTCTGCTGAATGACAAACATTCTAATGGGACCGTTAAAGATAGAAGCCCTTATAGAACTTTGATGAGTTGCCCCGTGGGTGAGGCTCCTTCTCCGTACAACTCAAGATTTGAGTCTGTTGCTTGGTCGGCAAGTGCTTGTCATGATGGCATCAGTTGGTTGACAATCGGTATCTCTGGTCCAGACAATGGAGCTGTGGCTGTATTGAAGTACAATGGCATAATAACGGATACTATCAAGAGTTGGAGAAACAACATTTTGAGAACTCAAGAATCTGAATGTGCGTGCGTAAATGGCTCTTGCTTCACCGTAATGACTGATGGACCAAGCAATGGGCAGGCCTCATCTAAAATCTTCAAGATAGAGAAAGGGAAAGTTGTCAAATCAGTTGAATTGAATGCCCCTAATTACCACTACGAGGAATGCTCCTGTTATCCTGATGCGGGTGATATTATGTGTGTGTGCAGGGACAATTGGCATGGCTCAAACCGGCCGTGGGTATCTTTTAATCAAAATCTGGAGTATCAAATAGGATATATATGCAGTGGGGTTTTCGGGGACAATCCCCGCCCCAATGATGGAACAGGCAGTTGCAGTCCAATGTCCTCTAATGGGGCATATGGGATAAAAGGGTTTTCATTTAAGTACGGTAATGGGGTTTGGATCGGAAGAACAAAAAGCACTAGTTCCAGAAGCGGCTTTGAGATGATTTGGGATCCGAATGGGTGGACTGAGACGGACAGTAGTTTCTCAGTGAAGCAAGACATTGTAGAGATAACTGACTGGTCAGGATATAGTGGGAGCTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATGAGGCCTTGTTTCTGGGTTGAGCTAATTAGAGGGAGGCCCAAAGAGAACACAATTTGGACTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGGTGAGTGGCCATTCACCATTGACAAGTAGATGGTCGTGGAGGTCGCTAGATGGTCG +>CY041939.1 
+ATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTATGGTAATTGGGATAGTTAGCTTAATGTTACAAATTGGGAACATGATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAATGCCAAGATGAACCAATCAGCAACACTAAATTTCTTACTGAGAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGTCCCATTAGCGGATGGGCTGTGTACAGTAAGGACAACAGCATAAGGATCGGTTCCAGGGGGGACGTGTTTGTTATAAGAGAGCCATTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTAACCCAGGGAGCCTTACTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAACATTAATGAGTTGTCCTGTAGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGTCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACCATCAAGAGTTGGAGGAACAACATAATGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAGTGGGCAGGCATCATATAAGATCTTCAAAATGGAAAAGGGAAAAGTGGTTAAATCAGTCGAATTGGATGCTCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCCGGCGAAATCACATGTGTGTGCAGGGATAATTGGCATGGATCAAATAGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGAGTCTTCGGAGACAATCCACGCCCCAATGATGGAACAGGTAGTTGTGGTCCGGTGTTCCCTAACGGGGCATATGGGGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGGAGCGGCTTTGAAATGATTTGGGACCCAAATGGGTGGACTGGAACGGACAGTAGCTTTTCAGTGAAGCAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCTAAAGAGAGCACAATTTGGACCAGTGGAAGCAGCATATCTTTTTGTGGTGTAAATGGTGACACTGTTAGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTCACCATTGACAAGTAG +>MF116322.1 
+AGCAAAAGCAGGAGTTTAAAATGAATCCAAATCAGAAGATAATAACCATCGGATCAATCTGTGTGGGAATTGGAATAGTTAGCTTAATGTTGCAAATTGGGAACATGGTCTCAATATGGGTCAGTCATTCAATTCAGACAGAGAATCAGTGCCAAGCTGAATCAATCAGCAATACTAAATTTCTCACTGAGAAGGCTATGGCTCCAGTAACATTAATGGGTAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTACACAGTAAGGACAATAGCATAAGGATCGGTTCCAAGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTTTGACTCAGGGAGCCCTGCTGAATGACAAGCACTCCAATGGGACTGTCAAAGACAGAAGCCCTCACAGAGCATTAATGAGTTGTCCTGTGGGTGAGGCTCCCTCTCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCAGCAAGTGCCTGCCATGATGGCACCGGTTGGTTAACAATTGGAATTTCTGGCCCAGACAATGGGGCTGTGGCTGTATTGAAATACAATGGCATAATAACAGACACTATCAAAAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGATGGACCAAGTAATGGGCAGGCATCATATAAAATCTTCAAATTGGAAAAAGGGAAAGTGGTTAAATCAGTTGAATTGGATGCTCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATTCCGGCGAAATCACTTGTGTGTGCAGGGATAATTGGCATGGTTCAAATAGACCATGGGTATCTTTCAACCAAAATTTAGAGTACCAAATAGGATATATATGCAGTGGAGTTTTCGGAGATAATCCACGGCCCAATGATGGAACAGGGAGCTGTGGTCCGGTGTCCCCTAATGGGGCATATGGGGTGAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTCCAGGAGTGGCTTTGAAATGATTTGGGATCCGAATGGGTGGACTGAAACGGACAGCAGCTTCTCGGTGAAGCAAGATATCGTGGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGTTAATCAGAGGGCGGCCCAAAGAGAACACAATCTGGACTAGTGGGAGCAGCATATCCTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGCTGAGGTGCCATTCACCATTGACAAGTAGTTTGTTCAAAAAACTCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/NA/genome_annotation.gff3 new file mode 100644 index 000000000..0206383bf --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/genome_annotation.gff3 @@ -0,0 +1 @@ +. . CDS 21 1430 . + . 
gene="NA" diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/NA/pathogen.json new file mode 100644 index 000000000..547b05c3a --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 6/NA)", + "reference name": "Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) neuraminidase (NA) gene, complete cds", + "reference accession": "NC_007361.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NA/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NA/reference.fasta new file mode 100644 index 000000000..fb6108ee9 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NA/reference.fasta @@ -0,0 +1,22 @@ +>NC_007361.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) neuraminidase (NA) gene, complete cds +AGCAAAAGCAGGAGATTAAAATGAATCCAAATCAGAAGATAATAACCATTGGATCAATCTGTATGGTAGT +TGGGATAATTAGCTTGATGTTACAAATTGGGAACATAATCTCAATATGGGTCAGTCATTCAATTCAGACA +GGGAATCAACACCAAGCTGAACCATGCAATCAAAGCATTATTACTTATGAAAACAACACCTGGGTAAATC +AAACATATGTCAACATCAGCAATACCAATTTTCTTACTGAAAAAGCTGTGGCTTCAGTAACATTAGCGGG +CAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTACACAGTAAGGACAACGGTATAAGAATCGGTTCC +AAGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTTGGAATGCAGAACTTTCTTTT +TGACTCAGGGAGCCTTGCTGAATGACAAGCACTCCAATGGGACCGTCAAAGACAGAAGCCCTCACAGAAC +ATTGATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCG +GCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGCCCAGACAATGGGGCTGTGG +CTGTATTGAAATACAACGGCATAATAACAGACACTATCAAGAGTTGGAGGAACAACATACTGAGAACTCA +AGAGTCTGAATGTGCATGTGTAAATGGCTCTTGCTTTACTGTAATGACTGACGGACCAAGTAATGGGCAG 
+GCCTCATATAAGATCTTCAAAATGGAAAAAGGGAAAGTAGTTAAATCAGTCGAATTGAATGCCCCTAATT +ATCACTATGAGGAGTGCTCCTGTTATCCTGATGCTGGCGAAATCACATGTGTGTGCAGGGATAATTGGCA +TGGCTCAAATCGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAATAGGATATATATGCAGTGGA +GTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGCAGTTGTGGTCCGGTGTCCCCTAACGGGGCAT +ATGGAGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTC +CAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGAACGGACAGTAGCTTCTCGGTGAAA +CAAGATATCGTAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAG +GATTAGATTGCATAAGACCTTGTTTCTGGGTTGAGCTAATCAGAGGGCGGCCCAAAGAGAGCACAATTTG +GACTAGTGGGAGCAGCATATCTTTTTGTGGTGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGAT +GCCGAGTTGCCATTCACCATTGACAAGTAGTTTGTTCAAAAAACTCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/NP/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/README.md b/data/community/genspectrum/iav/h5n1/GG1996/NP/README.md new file mode 100644 index 000000000..239f4bdf0 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment5/ NP) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ---------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/NP | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007360.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical 
H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. + +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NP/examples.fasta new file mode 100644 index 000000000..7b155de66 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/examples.fasta @@ -0,0 +1,38 @@ +>CY047476.1 +ATGGCGTCTCAAGGCACCAAACGATCTCATGAACAGATGGAAACTGGTGGAGAACGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGATTAGTGGCATCGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGGCTTATCCAGAACAGCATAACAATAGAGAGAATGGTACTCTCTGCATTTGATGAACGAAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGTCCAATTTATAGGAGGAGAGACGGGAAATGGGTGAGAGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTCACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGAGCTCTCGTACGTACTGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGGTCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGGACAATGGTGATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATCGCATACGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAGGTGCGAGAGAGCAGAAATCCCGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCCTGCTTGCCTGCTTGTGTGTACGGACTTGCTGTGGCCAGTGGATATGACTTTGAGAGAGAAGGGTACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGAAGCGGAGGAAACACCAGCCAGCAGAGGGCATCTGCAGGACAGATAAGCATTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTCACAGGAAATACTGAGGGCAGAACGTCTGACATGAGAACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTT
CGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>CY146645.1 +ATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCGGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGGAGAAACAGGTACCTAGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGTCCAATTTATCGAAGGAGAGACGGAAAATGGGTGAGGGAGCTGATTCTGTATGACAAAGAGGAGATCCGGAGGATTTGGCGCCAAGCTAACAATGGAGAGGACGCAACTGCTGGTCTTACCCATCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGAGCTCTCGTGCGTACCGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGATAGGAACAATGGTGATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCTTGCCTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCCTTCCGTCTACTTCAAAACAGCCAGGTCTTCAGTCTCATTAGGCCAAATGAAAATCCAGCACATAAGAGCCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTCGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGATCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAATCAACAGAGGGCATCTGCAGGACAGATCAGCGTTCAGCCTACCTTCTCGGTGCAGAGAAACCTCCCATTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGCAGGACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAAGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAGGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>JF758694.1 
+ATGGCGTCTCAAGGCACCAAACGATCCTATGAGCAGATGGAGACTGGTGGAGAACGCCAGAACGCCACTGAAATCAGAGCATCTGTTGGGAGAATGGTTGGTGGAATCGGGAGATTCTACATACAGATGTGCACTGAACTCAAACTCAGTGACTATGAAGGAAGACTAATCCAAAACAGCATCACAATAGAGAGAATGGTTCTCTCAGCATTTGATGAGAGGAGGAACAGATATCTCGAAGAGCATCCCAGTGCTGGTAAAGACCCTAAGAAGACTGGAGGTCCAATCTACAGGAGGAGAGATGGGAAATGGATGAGAGAATTGATCCTATATGACAAAGAGGAGATCAGAAGGATTTGGCGTCAAGCGAATAATGGAGAAGACGCAACTGCTGGTCTCACCCATTTGATGATCTGGCACTCCAATCTGAATGATGCCACCTACCAGAGAACGAGGGCACTTGTGCGTACTGGGATGGATCCCAGGATGTGTTCTCTGATGCAAGGCTCAACTCTTCCGAGGAGGTCTGGAGCTGCTGGAGCAGCAGTGAAGGGGGTTGGAACAATGGTGATGGAATTGATCCGAATGATCAAGCGAGGGATCAATGATCGGAATTTCTGGAGAGGTGAAAATGGGCGGAGGACAAGAATTGCTTATGAAAGAATGTGCAACATCCTCAAGGGGAAGTTCCAAACAGCAGCACAACGAGCAATGATGGACCAGGTGAGGGAAAGCCGGAATCCTGGGAATGCTGAAATTGAGGATCTCATCTTTCTTGCACGGTCTGCTCTCATTCTGAGGGGATCAGTAGCTCATAAGTCTTGCCTGCCTGCTTGTGTGTATGGACTTGCTGTGGCCAGTGGATATGACTTTGAAAGGGAGGGGTATTCCCTAGTCGGAATTGATCCTTTCCGTCTGCTCCAAAACAGTCAAGTCTTCAGTCTTATCAGACCAAACGAAAATCCAGCACATAAAAGTCAGCTGGTATGGATGGCATGCCACTCTGCAGCTTTTGAAGATCTGAGAGTGTCAAGCTTCATTAGAGGAACAAGAATAGTCCCAAGAGGACAACTGTCCACCAGAGGAGTTCAGATAGCTTCAAATGAGAACATGGAGACAATGGACTCCAGTACTCTTGAACTGAGGAGCAGATACTGGGCTATAAGGACCAGAAGCGGAGGAAACACTAACCAGCAGAGAGCATCTGCAGGGCAAATCAGCGTACAGCCCACGTTCTCTGTACAGAGAAACCTCCCATTCGAGAGAGCAACCATTATGGCAGCTTTTGCAGGAAATACTGAAGGCAGAACTTCAGACATGAGAACAGAAATCATAAGGATGATGGAAAATGCCAGACCTGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAACGAAGGATCTTATTTCTTCGGAGACAATCAGGAGGAGTAG +>OP269982.1 
+AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCCACATCATGGCGTCTCAAGGCACCAAACGATCCTATGAACAAATGGAAACTGGTGGGGAACGCCAGAATGCCACTGAAATCAGAGCATCTGTTGGAAGAATGGTTGGCGGAATCGGGAGATTCTACATACAGATGTGCACTGAGCTCAAACTCAGTGATTACGAAGGGAGGCTGATCCAAAACAGCATAACCATAGAAAGGATGGTTCTCTCGGCATTTGATGAGAGGAGGAACAAGTATCTGGAGGAACATCCCAGTGCTGGGAAGGATCCCAAGAAGACCGGAGGTCCAATCTACAGGAGGAGAGATGGCAAATGGATGAGAGAGTTGATCCTCTACGACAAAGAAGAGATCAGAAGAATTTGGCGTCAAGCTAATAATGGAGAGGATGCAACTGCTGGTCTCACTCATTTGATGATTTGGCATTCCAATCTGAATGATGCCACATACCAGAGAACAAGGGCACTTGTGCGTACTGGAATGGACCCTAGGATGTGCTCTCTGATGCAAGGCTCAACCCTCCCTAGGAGATCCGGGGCTGCTGGAGCAGCAGTGAAAGGAGTTGGAACAATGGTGATGGAATTGATTCGGATGATCAAACGAGGGATCAATGATCGTAATTTCTGGAGAGGCGAAAATGGACGGAGAACCAGGATTGCCTACGAGAGAATGTGCAACATTCTCAAGGGAAAGTTCCAAACAGCAGCACAACGAGCAATGATGGACCAAGTGAGGGAAAGCCGGAATCCTGGGAATGCTGAGATTGAAGATCTCATCTTTCTCGCACGATCTGCTCTCATTCTGAGGGGATCAGTGGCTCACAAGTCCTGTCTGCCTGCTTGCGTGTATGGACTTGCTGTAGCCAGTGGATATGACTTTGAAAGAGAAGGATACTCTCTAGTCGGGATTGATCCTTTCCGTCTACTCCAAAACAGTCAAGTCTTCAGTCTCATCAGACCGAACGAAAATCCCGCTCATAAAAGTCAGCTGGTATGGATGGCATGCCACTCTGCGGCATTCGAGGATCTGAGAGTGTCAAGCTTCATCAGAGGGACAAGAGTAGTCCCAAGAGGACAACTGTCCACCAGAGGAGTTCAGATTGCTTCAAATGAAAACATGGAGACGATGGACTCCAGTACTCTTGAACTGAGGAGCAGATACTGGGCTATAAGAACAAGAAGTGGAGGAAACACTAACCAACAGAGAGCATCTGCAGGACAAATCAGCGTACAGCCCACATTCTCTGTGCAGAGAAACCTCCCATTCGAGAGAGCAACCATCATGGCAGCATTTACGGGAAACACTGAAGGCAGAACTTCAGACATGAGAACTGAGATCATAAGGATGATGGAAAATGCCAGACCTGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGCAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>JF758810.1 
+ATGGCGTCTCAAGGCACCAAACGATCTTATGAGCAAATGGAAACTGGTGGAGAACGCCAGAATGCTACTGAAATCAGAGCATCTGTTGGGAGAATGGTCGGTGGAATTGGGAGATTCTACATACAGATGTGCACTGAGCTCAAACTCAGCGACTATGAAGGGAGGCTAATCCAAAACAGCATAACAATAGAGAGAATGGTTCTCTCTGCATTTGATGAAAGGAGGAACAAATATCTGGAAGAACATCCCAGTGCGGGGAAGGATCCGAAGAAAACCGGAGGTCCAATCTACAGAAGGAGAGACGGAAAGTGGATGAGAGAGCTAATTCTGTATGACAAAGAGGAGATCAGGAGGGTTTGGCGTCAAGCGAACAATGGAGAAGACGCAACTGCTGGTCTCACTCATCTGATGATCTGGCATTCCAACCTGAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACTGGGATGGACCCTAGAATGTGCTCCCTGATGCAGGGATCAACCCTCCCAAGAAGATCTGGAGCTGCTGGTGCAGCAGTAAAGGGAGTTGGGACAATGGTGATGGAACTGATTCGGATGATAAAGCGGGGGATCAATGACCGGAATTTCTGGAGAGGCGAGAATGGACGGAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAACGAGCAATGATGGACCAGGTGCGAGAAAGCAGAAATCCTGGGAATGCTGAAATTGAAGACCTTATCTTCCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCTCATAAGTCCTGCTTGCCTGCTTGTGTATATGGACTTGCTGTGGCCAGTGGATATGATTTTGAGAGAGAGGGATACTCTCTGGTCGGAATTGATCCTTTCCGTCTGCTTCAGAACAGCCAGGTGTTCAGCCTCATTAGACCAAATGAGAATCCGGCACATAAGAGTCAGCTGGTATGGATGGCATGTCATTCTGCAGCATTTGAAGACCTGAGAGTATCAAGCTTCATCAGAGGAACAAGGGTGGTCCCAAGAGGACAACTGTCCACCAGAGGAGTTCAAATAGCTTCAAATGAAAACATGGAAACAATGGACTCCAGCACTCTTGAACTGAGAAGCAGATACTGGGCTATAAGGACCAGAAGTGGAGGAAACACCAACCAACAGAGAGCATCTGCAGGACAAATCAGTGTACAGCCTACTTTCTCGGTACAGAGAAATCTTCCTTTTGAGAGAGCGACCATCATGGCGGCATTCACAGGGAACACTGAAGGCAGGACATCCGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAACGAGGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>GQ386144.1 
+GTAGATAATCACTCACCGAGTGACATCAACATTATGGCGTCCCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCCGTTGGAAGAATGATTAGTGGCATTGGGAGATTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGAAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGGAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAGACTGGAGGTCCAATTTATCGGAGGAGAGACGGAAAATGGGTGAGGGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCGGGTCTTACCCACCTTATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGAGCTCTCGTGCGTACTGGAATGGATCCCAGGATGTGCTCTCTGATGCAAGGATCAACCCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGGATGATAAAACGGGGAATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCCTATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAACCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCCTGTGTGTACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGGTACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAATATGGAAGCAATGGATTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGAAGCGGAGGAACCACCAACCAGCAGAGGGCATCTGCAGGGCAGATCAGCGTTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAGGGCAGAACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAAATGC +>OP269986.1 
+AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCCACATCATGGCGTCTCAAGGCACCAAACGATCCTATGAACAAATGGAAACTGGTGGGGAACGCCAGAATGCCACTGAAATCAGAGCATCTGTTGGAAGAATGGTTGGCGGAATCGGGAGATTCTACATACAGATGTGCACTGAGCTCAAACTCAGTGATTACGAAGGGAGGCTGATCCAAAACAGCATAACCATAGAAAGGATGGTTCTCTCGGCATTTGATGAGAGGAGGAACAAGTATCTGGAGGAACATCCCAGTGCTGGGAAGGATCCCAAGAAGACTGGAGGTCCAATCTACAGGAGGAGAGATGGCAAATGGATGAGAGAGTTGATCCTCTACGACAAAGAAGAGATCAGAAGAATTTGGCGTCAAGCTAATAATGGAGAGGATGCAACTGCTGGTCTCACTCATTTGATGATTTGGCATTCCAATTTGAATGATGCCACATACCAGAGAACAAGGGCACTTGTGCGTACTGGAATGGACCCTAGGATGTGCTCTCTGATGCAAGGCTCAACCCTCCCTAGGAGATCCGGGGCTGCTGGAGCAGCAGTGAAAGGAGTTGGAACAATGGTGATGGAATTGATTCGGATGATCAAACGAGGGATCAATGATCGGAATTTCTGGAGAGGCGAAAATGGACGGAGAACCAGGATTGCCTACGAGAGAATGTGCAACATTCTCAAGGGAAAGTTCCAAACAGCAGCACAACGAGCAATGATGGACCAAGTGAGGGAAAGCCGGAATCCTGGGAATGCTGAGATTGAAGATCTCATCTTTCTCGCACGATCTGCTCTCATTCTGAGGGGATCAGTGGCTCACAAGTCCTGTCTGCCTGCTTGCGTGTATGGACTTGCTGTAGCCAGTGGATATGACTTTGAAAGAGAAGGATACTCTCTAGTCGGGATTGATCCTTTCCGTCTACTCCAAAACAGTCAAGTCTTCAGTCTCATCAGACCAAACGAAAATCCAGCTCATAAAAGTCAGCTGGTATGGATGGCATGCCACTCTGCGGCATTCGAGGATCTGAGAGTGTCAAGCTTCATCAGAGGGACAAGAGTAGTCCCAAGAGGACAACTGTCCACCAGAGGAGTTCAGATTGCTTCAAATGAAAACATGGAGACGATGGACTCCAATACTCTTGAACTGAGGAGCAGATACTGGGCTATAAGAACAAGAAGTGGAGGAAACACTAACCAACAGAGAGCATCTGCAGGACAAATCAGCGTACAGCCCACATTCTCTGTGCAGAGAAACCTCCCATTCGAGAGAACAACCATCATGGCAGCATTTACGGGAAACACTGAAGGCAGAACTTCAGACATGAGAACTGAGATCATAAGGATGATGGAAAATGCCAGACCTGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGCAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>KU042776.1 
+ATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTGAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACCATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGAAGGAACAGGTACCTGGAAGAGCACCCCAGTGCGGGGAAGGACCCTAAGAAAACTGGAGGTCCAATTTATCGGAGGAGAGACGGGAAATGGGTGAGAGAGCTGATTCTGTACGACAAAGAAGAGATCAGGAGGATTTGGCGCCAAGCGAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTGAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACCGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGATTAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCCGCTTGTGTATACGGACTTGCAGTGGCCAGTGGGTATGACTTCGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAAAACCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTTATCAGAGGGGCAAGAGTGGTCCCAAGAGGGCAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAACACCCTTGAACTGAGAAGTAGATATTGGGCCATAAGAACCAGGAGCGGAGGGAACACCAACCAGCAGAGGGCATCTGCAGGGCAAATCAGCGTTCAACCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGGGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGTAGAACGTCCGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAAACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>OQ067783.1 
+GTAGATAATCACTCACTGAGTGACATCAACATCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAGACTGGTGGAGAACGCCAGAATGCCACTGAAATCAGAGCATCTGTTGGAAGAATGGTTGGTGGAATTGGGAGGTTTTACGTACAGATGTGCACTGAACTCCAACTCAGTGACTATGAAGGGAGGCTGATTCAGAACAGCATAACAATAGAGAGAATGGTTCTCTCTGCATTTGATGAAAGGAGGAACAAATACCTGGAAGAACATCCCAGTCCTGGGAAGGATCCGAAGAAAACTGGAGGCCCAATTTATCGAAGGAGGGACGGGAAATGGATGAGAGAGCTGATTCTGTATGACAAAGAAGAGATCAGGAGAATCTGGCGTCAAGCGAATAATGGAGAAGACGCAACTGCTGGTCTCACTCACCTGATGATTTGGCATTCCAATCTAAATGATGCCACATACCAGAGAACCAGAGCCCTCGTGCGCACTGGGATGGACCCCAGAATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCTGGAGCAGCAATAAAGGGAGTCGGAACGATGGTGATGGAACTAATTCGGATGATTAAACGAGGGATTAATGATCGTAATTTCTGGAGAGGTGAAAATGGACGGAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAGGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGACCAGGTGCGAGAAAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATCTTCCTGGCGCGGTCTGCGCTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCCTTCCTGCTTGTGTGTACGGGCTTGCTGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTAGTTGGAATAGATCCTTTCCGTCTGCTCCAAAACAGCCAGGTTTTCAGTCTCATTAGACCAAATGAGAACCCAGCACACAAGAGTCAATTGGTGTGGATGGCATGCCATTCTGCAGCGTTTGAGGACCTGAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAACTATCCACCAGAGGAGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAGCACTCTTGAACTGAGGAGCAGGTATTGGGCTATAAGGACCAGGAGTGGAGGAAACACCAACCAACAGAGAGCATCTGCAGGACAGATCAGTGTACAGCCTACTTTCTCGGTACAGAGAAATCTTCCCTTTGAGAGAGCGACCATTATGGCGGCGTTCACAGGAAATACTGAAGGCAGGACATCTGATATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCCTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATAC +>KP097936.1 
+ATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACCATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGAAGGAACAGGTACCTGGAAGAGCACCCCAGTGCGGGGAAGGACCCTAAGAAAACTGGAGGTCCAATTTATCGGAGGAGAGACGGGAAATGGGTGAGAGAGCTGATTCTTTACGACAAAGAAGAGATCAGGAGGATTTGGCGCCAAGCGAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTGAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACCGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGATTAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAACCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGGTATGACTTCGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGGCCAAATGAAAACCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTCAGAGTCTCAAGTTTCATCAGAGGGGCAAGAGTGGTCCCAAGAGGGCAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAACACCCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAACCAGCAGAGGGCATCTGCAGGGCAGATCAGCGTTCAACCCACTTTTTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGTAGAACGTCCGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAAACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>KP097941.1 
+ATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAGACTAGTGGAGAACGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGGCTAATCCAGAACAGCATAACAATAGAGAGAATGGTACTATCTGCCTTTGATGAAAGAAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGAAAGGATCCAAAAAAGACTGGAGGTCCAATTTATCGGAGGAGAGATGGGAAGTGGGTGAGAGAACTAATTCTGTACGACAAAGAGGAGATCAGGAGGATCTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGGGCTCTCGTGCGTACTGGAATGGACCCAAGGATGTGCTCTCTGATGCAAGGGTCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTAAAGGGAATAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGGTCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGACCTCATTTTTCTGGCACGGTCTGCACTCATCTTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTATACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGCCTACTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCGCATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAGGCTATGGACTCCAACACTCTTGAACTGAGAAGCAGATATTGGGCTATAAGAACCAGAAGCGGAGGAAACACCAACCACCAGAGGGCATCTGCAGGACAGATCAGTGTTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAGGGTAGAACATCTGACATGAGAACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAA +>CY063482.1 
+AGCAAAAGCAGGGTAGATAATCACTCACCGAGTGACATCAACATCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTAGTGGTGAACGCCAGAATGCTACTGAGATCAGGGCATCAGTTGGAAGAATGGTTAGTGGCATCGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGGCTTATCCAGAACAGCATAACAATAGAGAGAATGGTACTCTCTGCATTTGATGAACGAAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGAAAGGACCCGAAGAAAACTGGAGGTCCAATTTATAGGAGGAGAGAAGGGAAATGGGTGAGAGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTCACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGAGCTCTCGTACGTACTGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGGTCAACTCTTCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGGACAATGGTAATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATACGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAGGTGCGAGAGAGCAGAAATCCCGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCCTGCTTGCCTGCTTGTGTGTACGGACTTGCCGTAGCCAGTGGATATGACTTTGAGAGAGAAGGGTACTCCCTGGTTGGAATAGATCCTTTCCGTCTGCTACAAAACAGTCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCACACAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAATATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGAAGCGGAGGAAACACCAACCAGCAGAGGGCATCTGCAGGACAGATAAGCATTCAGCCCACTTTTTCGGTACAGAGAAACCTTCCCTTCGAGAGAGCAACCATTATGGCAGCATTCACAGGAAATACTGAGGGCAGAACGTCTGACATGAGAACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCGTTCCAGGGGCGGGGAGTCTTCGAGCTATCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAATACGACAATTAAGGAAAAATACCCTTGTTTCTACT +>KX215267.1 
+AGCAAAAGCAGGGTAGATAATCACTCACCGAGTGACATCAACATTATGGCGTCTCAAGGCACCAAACGATCTTATGAACAAATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAAAGGATGGTACTTTCTGCATTTGATGAAAGAAGGAACAGGTACCTGGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGCCCAATTTATCGGAGGAGAGACGGAAAGTGGGTGAGGGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGAGCTCTAGTGCGTACTGGGATGGACCCCAGGATGTGCTCTCTGATGCAAGGGTCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGGACAATGGTGATGGAGCTGATTAGGATGATAAAACGAGGGGTCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACTAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTATACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGGTACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGGCCAAACGAGAATCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGTCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGCTTCATTAGAGGAACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAGTAATGGACTCCAACACTCTTGAACTGAGGAGTAGATATTGGGCTATAAGAACCAGAAGCGGGGGAAACACCAACCAGCAGAGGGCATCTGCAGGGCAGATCAGCGTTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATGCTGAGGGCAGAACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513272.1 
+AGCGAAAGCAGGGTAGATAATCACTCATCGAGTGACATCAACACCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCGGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGGAGAAACAAGTACCTAGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGTCCAATTTATCGAAGGAGAGACGGAAAATGGGCAAGGGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGCCAAGCTAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGCACCGGAATGGATCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCGGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGTAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCTTGCCTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCCTTCCGTCTGCTTCAAAACAGCCAGGTCTTCAGCCTCATTAGGCCAAATGAAAATCCAGCACATAAGAGCCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTCGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAATATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAATCAACAGAGGGCATCTGCAGGACAGATCAGCGTTCAGCCCACTTTCTCGGTGCAGAGAAACCTCCCATTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGCAGGACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAAGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAGGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513316.1 
+AGCGAAAGCAGGGTAGATAATCACTCACCGAGTGACATCAACATTATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACCATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGAAGGAACAGGTACCTGGAAGAGCACCCCAGTGCGGGGAAGGACCCTAAGAAAACTGGAGGTCCAATTTATCGGAGGAGAGACGGAAAATGGGTGAGAGAGCTGATTCTGTACGACAAAGAAGAGATCAGGAGGATTTGGCGCCAAGCGAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTGAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACCGGAATGGACCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGATTAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGGTATGACTTCGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGGCCAAATGAAAACCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTCAGAGTCTCAAGTTTCATCAGAGGGGCAAGAGTGGTCCCAAGAGGGCAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAACACCCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAACCAGCAGAGGGCATCTGCAGGGCAGATCAGCATTCAACCCACTTTTTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTCTGGCAGCATTTACAGGAAATACTGAAGGTAGAACGTCCGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAAACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513360.1 
+AGCGAAAGCAGGGTAGATAATCACTCACCGAGTGACATCAACACCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAGACTAGTGGGGAACGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGGCTAATCCAGAACAGCATAACAATAGAGAGAATGGTACTATCTGCATTTGATGAAAGAAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGAAAGGATCCAAAAAAGACTGGAGGTCCAATTTATCGGAGGAGAGATGGGAAGTGGATGAGAGAGCTAATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGGGCTCTCGTGCGTACTGGAATGGACCCAAGGATGTGCTCTCTGATGCAAGGGTCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTAAAGGGAATAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGGTCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGTAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCTTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTATACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGCCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGGGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAGGCTATGGACTCCAACACTCTTGAACTGAGAAGCAGATATTGGGCTATAAGAACCAGAAGCGGAGGAAACACCAACCACCAGAGGGCATCTGCAGGACAGATCAGTGTTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAGGGTAGAACATCTGACATGAGAACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513394.1 
+AGCGAAAGCAGGGTAGATAATCACTCATCGAGTGACATCAACACCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCGGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGGAGAAACAAGTACCTAGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGTCCAATTTATCGAAGGAGAGACGGAAAATGGGTGAGGGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGCCAAGCTAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACCGGAATGGATCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCTTGCCTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCCTTCCGTCTGCTTCAAAACAGCCAGGTCTTCAGCCTCATTAGGCCAAATGAAAATCCAGCACATAAGAGCCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTCGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAATATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAATCAACAGAGGGCATCTGCAGGACAGATCAGCGTTCAGCCCACTTTCTCGGTGCAGAGAAACCTCCCATTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGCAGGACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAAGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAGGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513406.1 
+AGCGAAAGCAGGGTAGATAATCACTCACCGAGTGACATCAACACCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAGACTAGTGGGGAACGCCAGAATGCTACTGAGATCAGGGCATCTGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGGCTAATCCAGAACAGCATAACAATAGAGAGAATGGTACTATCTGCATTTGATGAAAGAAGGAACAGATACCTGGAAGAACACCCCAGTGCGGGAAAGGATCCAAAAAAGACTGGAGGTCCAATTTATCGGAGGAGAGATGGGAAGTGGATGAGAGAGCTAATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGTCAAGCGAACAATGGAGAGGACGCAACTGCTGGTCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACGAGGGCTCTCGTGCGTACTGGAATGGACCCAAGGATGTGCTCTCTGATGCAAGGGTCAACTCTCCCGAGGAGATCTGGAGCTGCTGGTGCAGCAGTAAAGGGAATAGGAACAATGGTGATGGAGCTGATTCGAATGATAAAACGAGGGGTCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGTAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCTTGAGAGGATCAGTGGCCCATAAGTCCTGCTTGCCTGCTTGTGTATACGGACTTGCAGTGGCCGGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCTTTCCGCCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAGAATCCAGCACATAAGAGTCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTTGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGGGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAGGCTATGGACTCCAACACTCTTGAACTGAGAAGCAGATATTGGGCTATAAGAACCAGAAGCGGAGGAAACACCAACCACCAGAGGGCATCTGCAGGACAGATCAGTGTTCAGCCCACTTTCTCGGTACAGAGAAACCTTCCCTTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAGGGTAGAACATCTGACATGAGAACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT +>KX513320.1 
+AGCGAAAGCAGGGTAGATAATCACTCATCGAGTGACATCAACACCATGGCGTCTCAAGGCACCAAACGATCTTATGAACAGATGGAAACTGGTGGAGAGCGCCAGAATGCTACTGAGATCAGGGCATCGGTTGGAAGAATGGTTAGTGGCATTGGGAGGTTCTACATACAGATGTGCACAGAACTCAAACTCAGTGACTATGAAGGGAGACTGATCCAGAACAGCATAACAATAGAGAGAATGGTACTTTCTGCATTTGATGAAAGGAGGAACAAGTACCTAGAAGAACACCCCAGTGCGGGGAAGGACCCGAAGAAAACTGGAGGTCCAATTTATCGAAGGAGAGACGGAAAATGGGTGAGGGAGCTGATTCTGTACGACAAAGAGGAGATCAGGAGGATTTGGCGCCAAGCTAACAATGGAGAGGACGCAACTGCTGGCCTTACCCACCTGATGATATGGCATTCCAATCTAAATGATGCCACATATCAGAGAACAAGAGCTCTCGTGCGTACCGGAATGGATCCCAGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCCGGTGCAGCAGTGAAGGGGGTAGGAACAATGGTGATGGAGCTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCTGCACAAAGAGCAATGATGGATCAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATTGAAGATCTCATTTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTAGCCCATAAGTCTTGCCTGCCTGCTTGTGTGTACGGACTTGCAGTGGCCAGTGGATATGACTTTGAGAGAGAAGGATACTCTCTGGTTGGAATAGATCCCTTCCGTCTGCTTCAAAACAGCCAGGTCTTCAGCCTCATTAGGCCAAATGAAAATCCAGCACATAAGAGCCAATTAGTGTGGATGGCATGCCACTCTGCAGCATTCGAGGACCTTAGAGTCTCAAGTTTCATCAGAGGGACAAGAGTGGTCCCAAGAGGACAGCTATCCACCAGAGGGGTTCAAATTGCTTCAAATGAGAATATGGAAGCAATGGACTCCAACACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGGAGCGGAGGGAACACCAATCAACAGAGGGCATCTGCAGGACAGATCAGCGTTCAGCCCACTTTCTCGGTGCAGAGAAACCTCCCATTCGAAAGAGCGACCATTATGGCAGCATTTACAGGAAATACTGAAGGCAGGACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAGAAGATGTGTCATTCCAAGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAATAATGAGGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTAAAGAAAAATACCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/NP/genome_annotation.gff3 new file mode 100644 index 000000000..d6e753049 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/genome_annotation.gff3 @@ -0,0 +1 @@ +. . CDS 46 1542 . + . 
gene="NP" diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/NP/pathogen.json new file mode 100644 index 000000000..0eef36c08 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 5/NP)", + "reference name": "Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) nucleocapsid protein (NP) gene, complete cds", + "reference accession": "NC_007360.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NP/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NP/reference.fasta new file mode 100644 index 000000000..a5d66e768 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NP/reference.fasta @@ -0,0 +1,24 @@ +>NC_007360.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) nucleocapsid protein (NP) gene, complete cds +AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCAACATCATGGCGTCTCAGGGCACCAAACGAT +CTTATGAACAGATGGAAACTGGTGGAGAACGCCAGAATGCTACTGAGATCAGAGCATCTGTTGGAAGAAT +GGTTGGTGGAATTGGGAGGTTTTATATACAGATGTGCACTGAACTCAAACTCAGCGACTATGAAGGAAGG +CTGATTCAGAACAGCATAACAATAGAGAGAATGGTTCTCTCTGCATTTGATGAAAGGAGGAACAAATACC +TGGAAGAACATCCCAGTGCGGGGAAGGACCCAAAGAAAACTGGAGGTCCAATCTACCGAAGAAGAGACGG +AAAATGGGTGAGAGAGCTGATTCTGTATGACAAAGAGGAGATCAGGAGAATTTGGCGTCAAGCGAACAAT +GGAGAAGATGCAACTGCTGGTCTCACTCACATGATGATCTGGCATTCCAATCTAAATGATGCCACATACC +AGAGAACAAGAGCTCTCGTGCGTACTGGGATGGACCCTAGAATGTGCTCTCTGATGCAAGGATCAACTCT +CCCGAGGAGATCTGGAGCTGCTGGTGCGGCAGTAAAGGGAGTCGGAACGATGGTGATGGAACTAATTCGG +ATGATAAAGCGAGGGATTAACGATCGGAATTTCTGGAGAGGTGAAAATGGGCGAAGAACAAGAATTGCAT 
+ATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAGGT +ACGGGAAAGCAGAAATCCTGGGAATGCTGAGATTGAAGATCTCATATTTCTGGCACGGTCTGCACTCATC +CTGAGAGGATCAGTGGCCCACAAGTCCTGCTTGCCTGCTTGTGTGTACGGGCTTGCCGTGGCCAGTGGAT +ATGACTTTGAGAGAGAAGGGTACTCTCTGGTCGGGATTGATCCTTTCCGTCTGCTGCAAAACAGCCAGGT +CTTTAGTCTAATTAGACCAAATGAGAATCCAGCACATAAAAGTCAATTGGTGTGGATGGCATGCCATTCT +GCAGCATTTGAAGATCTGAGAGTCTCAAGCTTCATCAGAGGGACAAGAGTGGCCCCAAGGGGACAACTAT +CTACTAGAGGAGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAGCACTCTTGAACTGAG +AAGCAGATATTGGGCTATAAGGACCAGGAGTGGAGGAAACACCAACCAGCAGAGAGCATCTGCAGGACAA +ATCAGTGTGCAGCCTACTTTCTCGGTACAGAGAAATCTTCCCTTCGAAAGAGCGACCATTATGGCGGCAT +TCACAGGGAATACAGAGGGCAGAACATCTGACATGAGGACTGAAATCATAAGGATGATGGAAAGCTCCAG +ACCAGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATC +GTGCCTTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAATATGACAATT +GAAGAAAAATACCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/NS/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NS/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/README.md b/data/community/genspectrum/iav/h5n1/GG1996/NS/README.md new file mode 100644 index 000000000..743e9c774 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NS/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment8/ NS) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ---------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/NS | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007364.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + 
+This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. + +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NS/examples.fasta new file mode 100644 index 000000000..b40b827b6 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NS/examples.fasta @@ -0,0 +1,38 @@ +>AB523779.1 +ACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGAACATCGAAACAGCTACTCGTGCGGGGAAACAGATAGTGGAGCGGATTCTGGATGAGGAATCTGATGAGGCACTTAAAATGCCGACTTCACGCTACCTAACTGACATGACTCTCGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATGATGGATAAAACCGTCATATTGAAAGCAAACTTCAGTGTGATTTTTGACCGATTAGAAACCCTAATACTGCTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTAGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAA +>OP950309.1 
+AGCAAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACAATTTGCAGACCAAGAACTGAGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGGGGAAGAGGCAGCACTCTTGGTCTGGACATCGAAACGGCCACTCGCGCTGGAAAGCAGATAGTGGAGAGGATTCTGGAGGAAGAATCCGACGAGGCACTCAAAATGACCATTGCCTCTGTACCTGCTTCACGCTACCTAACTGACATGACTCTTGAAGAGATGTCAAGAGACTGGTTCATGCTCATGCCCAAACGAAAAGTGGCAGGCTCCCTCTGTATCAGAATGGACCAGGCGATTATGGATAAGAACATCACATTGAAAGCAAACTTCAGTGTGATCTTCGATAGGCTGGAGACATTAATACTACTCAGAGCTTTCACTGAAGAGGGAGCAATTGTCGGCGAAATTTCACCACTGCCTTCTCTTCCAGGACATACTGATGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTTTACAGAGATTCACTTGGAGAAGCGGTAATGAGGATGGGAGACCTCCACTCCCTCCAAAGCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTAATTGAAGAAGTGCGACATAGACTAAAGATCACAGAAAATAGTTTTGAACAAATAACATTTATGCAAGCCTTACAACTATTGCTTGAAGTGGAGCAAGAGATAAGAACTTTCTCGTTTCAGCTTATTTAATAATAAAAAACACCCTTGTTTCTACT +>AM911070.1 +AGCAAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGTCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAGCAGATATTGGAGCGAATTCTGGAGGAGGAGTCTGATGAGGCACTTAAAATGCCAGCTTCACGCTACCTAACTGATATGACTCTCGAGGAAATGTCAAGGGACTGGTTTATGCTCATGCCCAAGCAGAAAGTGACAGGTTCCCTTTGCATCAAAATGGACCAGGCGATAATGGATAAAACCATCATATTGAAAGCAAACTTCAGTGTGATTTATGACCGGTTAGAGACCCTAATACTACTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACGGTTCGAGTCTCTGAAATTATACAGAGATTCGCTTGGAGAAGCATTGATGAGGATGGGAGACTTCCACTCCCTCCAGATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAAAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>EU420050.1 
+AGCAAAAGCAGGGTGACAAAAACATAATGGATCCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAGCAGATAGTGGAGCGGATTCTGGAGGAGGAGTCTGATGAGGCACTTAAAATGCCGGCTTCACGCTACCTAACTGACATGACTCTCGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGCAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATATTGAAAGCAAACTTCAGTGTGATTTTTGATAGATTGGAAACCCTAATACTACTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTATACAGAGATTCGCTTGGGGAAACAGTGATGAGGATGGGAGACTTCCACTCCCTCCAAATCAGAAACGAAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACATTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>FM165534.1 +AAAAAGACAGGGTGACAAAGACATAATGGATTCCAACACAGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAGCAGATAGTGGAGCGAATTCTGGAGGAGGAGTCTGATGAGGCACTTAAAATGCCAGCTTCACGCTACTTAGCTGATATGACTCTCGAGGAAATGTCAAGGGACTGGTTCATGCTAATGCCTAAGCAGAAAGTGACAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATATTGAAAGCAAACTTCAGTGTGATTTATGACCGGTTAGAGACCCTAATACTACTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAATTATACAGAGATTCGCTTGGAGAAGCATTGGTGAGGATGGGAGACTTCCACTCCCTCCAGACCAGAAACGGAAAATGGCGAGAACAATTGAGTCAAAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACCTTCTCGTTTCAGCTTATTTAGTGATAAAAACACCTTGTTCTACT +>EU147297.1 
+GTGACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAGCAGATAGTGGAGCGAATTCTGGAGGAGGAGTCTGATGAGGCACTTAAAATGCCAGCTTCACGCTACCTAACTGATATGACTCTCGAGGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGACAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATATTGAAAGCAAACTTCAGTGTGATTTATGACCGGTTAGAGACCCTAATACTACTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAATTATACAGAGATTCGCTTGGAGAAGCATTGATGAGGATGGGAGACTTCCACTCCCTCCAGATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAAAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACCTTCTCGTTTCAGCTTATTTAATGATAAAAAACAC +>JN558596.1 +AGCAAAAGCAGGGGGACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGGAAACAGATAGTGGAGCGGATTCTGGATGAGGAATCTGATGAGGCACTTAAAATGCCGACTTCACGCTACCTAACTGACATGACTCTCGATGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATGATGGATAAAACCGTCATATTGAAAGCAAACTTCAGTGTGATTTTTGACCGATTAGAAACCCTAATACTGCTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTAGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>JF758749.1 
+ATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAATCTCTAAGAGGAAGAGGCAGCACTCTTGGTCTGGACATCGAAACAGCCACTCGTGCTGGAAAGCAGATAGTGGAGAGGATTCTGGAGGAGGAATCCGACGAGGCACTCAAAATGACTATTGCTTCTGTGCCTGCTTCACGCTACCTAACTGACATGACTCTTGAAGAGATGTCAAGAGACTGGTTCATGCTCATGCCCAAGCAAAAAGTAGCAGGCTCCCTCTGTATCAGAATGGACCAGGCTATTATGGATAAGAACATCATACTGAAAGCAAATTTCAGTGTGATCTTTGATCGGCTGGAGACACTAATACTACTCAGAGCTTTCACTGAAGAAGGAGCAATTGTCGGCGAAATTTCACCATTGCCTTCTCTTCCAGGACATACTGATGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCGCTTGGAGAAGCAGTAATGAGGATGGGAGACCTCCACTCCCTCCAAAGCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGA +>EU871815.1 +GATCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAGCAGATAGTGGAGCGAATTCTGGAGGAGGAGTCTGATGAGGCACTTAAAATGCCAGCTTCACGCTACTTAACTGATATGACTCTCGAGGAAATGTCAAGGGACTGGTTCATGCTCATGCCTAAGCAGAAAGTGACAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATATTGAAAGCAAACTTCAGTGTGATTTATGACCGGTTAGAGACCCTAATACTACTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAATTATACAGAGATTCGCTTGGAGAAGCGTTGATGAGGATGGGAGACTTCCACTCCCTCCAGACCAGAAACGGAAAATGGCGAGAACAATTGAGTCAAAAGTTTGAAGAAATAAGGTGGATGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAAC +>MH588130.1 
+ATGGATTCCAACACTGTGTCAAGCTTCCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGATCGGCTTCGTAGAGATCAGAAATCCCTAAAAGGAAGAGGCAGCACTCTTGGTCTGGACATCAAAACAGCTACTCGTGCGGGAAAGCAGATAGTGGAGCGAATTCTGGAGAAGGAGTCTGATGAGGCACTTAAAATGCCAGCTTCACGCTACCTAACAGATATGACTCTCGAGGAAATGTCAAGGGACTGGTTTATGCTCATGCCCAAGCAGAAAGTGACAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATAATATTGAAAGCAAACTTCAGTGTGATTTATGACCGATTAGAGACCCTAATACTGCTTAGAGCTTTCACAGAAGAAGGAACAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACGGTTCGAGTCTCTGAAATTGTACAGAGATTCGCTTGGAGAAGCATTGATGAGGATGGGAGACTTCCACTCCCTTCAGATCAGAAACGGAAAATGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGATGGTTGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTTGAACAGATAACATTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACCTTCTCGTTTCAGCTTATTTAATG +>KU143438.1 +AGCGAAAGCAGGGTGACAAATACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGGGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTACGGGGAAGCAGATAGTGGAGCGGATTCTGGACGAGGAATCTGATGAGGCAATTAAAATGCCGACTCCACGTTACCTAACTGACATGACTCTCGAAGAAATGTCAAGGAACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATGATGGATAAAACCGTCATATTGAAAGCAAACTTCAGTGTGATTTTTGACAGATTGGAAACCCTAATACTGCTTAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTAGTGAGGATGTCAAGAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTAGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>KP098018.1 
+ATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGGGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTTGCGCAGGGAAACAGATAGTGGAGCGGATTCTGGAAGAGGAGTCTGATAAGGCACTTAAAATGCCGGTTTCACGCTACCTAACTGACATGACTCTCGAGGAGATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGCAGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAGCCATCATATTGAAAGCAAACTTCAGCGTGACTTTTGGCCGGTTGGAAAACTTAATACTACTTAGAGCGTTCACAGAAGAGGGAACAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGGGAGGATGTCAAAAATGCAATTGGCATCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCAAATCACTGAAACTATACAGAGATTCGCTTGGGGAAGCAGTGATGAGGTTGGGAGACCTCCACTCCCTCCAAAACAGAACCGGAAAGTGGCGGGAACAATTGAGTCAGAAGTTTGAAGAGATAAGGTGGCTGATTGAAGAAGTAAGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACCTTCTCGTTTCAGCTTATTTAA +>KU971312.1 +ATGGATCCCAACACTGTGTCAAGTTTTCAGGTAGACTGCTTTCTCTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAACAGATAGTGGAGCGGATTCTTGATGAGGAACCTGATGAGGCACTTAAAATGCCGACTTCACGCTACCTAACTGAAATGACTCTCGAAGAGATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATACTGAAAGCAAACTTCAGTGTGATTTTTGACCGGTTAGAGACCCTAATACTACTCAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTGTACAGAGATTCGCTTGGAGAAACAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAACTGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATCACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCTTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCATTTCAGCTTATTTAA +>KX215361.1 
+AGCAAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTCCGCCGAGATCAGAAATCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGTGGGGAAACAGATAGTGGAGCGGATTCTTGATGAGGAATCTGATGAGGCATTTAAAATGCCGACTTCACGCTACCTAACTGACATGACTCTCGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATGATGGATAAAACCGTCATATTGAAAGCAAACTTCAGTGTGATTTTTGACCGATTAGAAACCCTAATACTGCTTAGAGCTTTCACAGAAGAAGGAGCAATTGTGGGAGAAATCTCACCATTACCTTCCCTTCCAGGACATACTAGCGAGGATGTCAAAAATGCAATTGGAGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTAGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCACATCAGAAACGGAAAATGGCGAGAACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAATACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>KX513148.1 +AGCGAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGTTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAACAGATAGTGGAGCGGATTCTTGATGAGGAACCTGATGAAGCACTTAAAATGCCGACTTCACGCTACCTAACTGAAATGACTCTCGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATACTGAAAGCAAACTTCAGTGTGATTTTCGACCGGTTAGAGACCCTAATACTACTCAGAGCTTTCACAGAAAAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAACTGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>KX513209.1 
+AGCGAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGTTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAACAGATAGTGGAGCGGATTCTTGATGAGGAACCTGATGAGGCACTTAAAATGCCGACTTCACGCTACCTAACTGAAATGACTCTCGAAGAGATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAGAGTGATGGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATACTGAAAGCAAACTTCAGTGTGATTTTTGACCGGTTAGAGACCCTAATACTACTCAGAGCTTTCACAGAAGAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAACAGTGATGAGGGTGGGAGACTTTCACTCCCTCCAAATCAGAAACGGAAACTGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCTTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>KX513399.1 +AGCGAAAGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGTTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGAAAACAGATAGTGGAGCGGATTCTTGATGAGGAACCTGATGAAGCACTTAAAATGCCGACTTCACGCTACCTAACTGAAATGACTCTCGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGTGGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATACTGAAAGCAAACTTCAGTGTGATTTTCGACCGGTTAGAGACCCTAATACTACTCAGAGCTTTCACAGAAAAAGGAGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAGCAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAAATCAGAAACGGAAACTGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTACGACATAGATTGAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT +>LC167570.1 
+AGCAGGGTGACAAAAACATAATGGATTCCAACACTGTGTCAAGTTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAAATGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGGAAGAGGCAACACTCTTGGTCTGGACATCGAAACAGCTACTCGTGCGGGGAAACAGATAGTGGAACGGATTCTTGATGAGGAACCTGATGAGGCACTTAAATTGCCGACTTCACGCTACCTAACTGAAATGACTCTCGAAGAGATGTCAAAGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGATGGGTTCCCTTTGCATCAAAATGGACCAGGCAATAATGGATAAAACCATCATACTGAAAGCAAACTTCAGTGTGATTTTTGACCGATTAGAGACCCTAATACTACTCAGAGCTTTCACAGAAGAAGGGGCAATCGTGGGAGAAATCTCACCATTACCTTCTCTTCCAGGACATACTGGTGAGGATGTCAAAAATGCAATTGGCGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGGGTCTCTGAAACTATACAGAGATTCGCTTGGAGAAACAGTGATGAGGGTGGGAGACTTCCACTCCCTCCAACTCAGAAACGGAAACTGGCGAGAGCAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTAATTGAAGAAATACGACATAGATTAAAAATTACAGAAAACAGCTTCGAACAGATAACGTTTATGCAAGCTTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAGCCTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGT +>PP854504.1 +ATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTCCGCCGAGACCAGAAGTCTCTAAGAGGAAGAGGCAGCACTCTTGGTCTGGACATCGAGACAGCCACTCGTGCTGGAAAGCAGATGGTGGAGAGGATTCTGGAGGAAGAATCCAACGAGGCACTCAAAATGACTATTGCCTCTGTGCCTGCTCCACGCTACCTAACTGACATGACTCTTGAAGAGATGTCAAGAGACTGGTTCATGCTCATGCCCAAGCAAAAAGTGGCAGGCTCCCTCAGTATCAGAATGGACCAGGCGATTATGGATAAGAACATCATACTGAAGGCAAACTTCAGCGTGATCTTCAATCGGCTGGAGACACTAATACTACTCAGAGCTTTCACTGAAGAGGGAGCAATTGTCGGCGAAATTTCACCATTGCCTTCTCTTCCAGGACATACTGATGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTTTACAGAGATTCGCTTGGAGAAGCAGTAATGAGGATGGGAGACCTCCACTCCCTCCAAAGCAGAAACGAAAAATGGAGAGGACAATTGAGTCAGAAGTTTGAAGAAATAAGGTGGCTGATTGAAGAAGTGCGACACAGACTAAAGATCACAGAAAATAGTTTTGAACAAATAACATTTATGCAAGCCTTACAACTACTGCTTGAAGTGGAGCAAGAGATAAGAACTTTCTCGTTTCAGCTTATTTAATAATAAAAAACACCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/NS/genome_annotation.gff3 new file mode 100644 index 000000000..463256b56 --- /dev/null +++ 
b/data/community/genspectrum/iav/h5n1/GG1996/NS/genome_annotation.gff3 @@ -0,0 +1,4 @@ +. . CDS 15 707 . + . gene="NS1" +. . gene 15 852 . + . gene=NS2;ID=gene-NS2 +. . CDS 15 44 . + . gene=NS2;ID=cds-NS2;Parent=gene-NS2 +. . CDS 517 852 . + . gene=NS2;ID=cds-NS2;Parent=gene-NS2 diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/NS/pathogen.json new file mode 100644 index 000000000..d49531247 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NS/pathogen.json @@ -0,0 +1,21 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.005, + "kmerLength":7, + "allowedMismatches": 12 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 8/NS)", + "reference name": "Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 8, complete sequence", + "reference accession": "NC_007364.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/NS/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/NS/reference.fasta new file mode 100644 index 000000000..004416e62 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/NS/reference.fasta @@ -0,0 +1,14 @@ +>NC_007364.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 8, complete sequence +GTGACAAAGACATAATGGATTCCAACACGATAACCTCGTTTCAGGTAGATTGTTATCTATGGCACATAAG +AAAGCTACTCAGTATGAGAGACATGTGTGATGCCCCCTTTGATGACAGGCTCCGAAGAGACCAAAAGGCA +TTAAAGGGAAGAGGCAGCACACTTGGACTCGATTTAAGAGTGGCTACAATGGAGGGGAAAAAGATCGTTG +AGGACATCCTGAAGAGTGAGACAAATGAAAACCTCAAAATAGCCATTGCTTCCAGTCCTGCTCCTCGGTA +TATCACCGATATGAGCATAGAGGAGATGAGCCGAGAATGGTACATGCTGATGCCTAGGCAGAAAATAACT +GGAGGCCTTATGGTGAAAATGGACCAAGCCATAATGGATAAAAGAATTATCCTTAAAGCAAATTTCTCAG 
+TTCTATTTGATCAACTAGAGACATTAGTCTCTCTGAGGGCATTCACAGAAAGTGGTGCTATTGTGGCTGA +AATATTTCCCATTCCCTCCGTACCAGGACATTTTACAGAGGATGTCAAAAATGCAATTGGAATCCTCATC +GGTGGACTTGAATGGAATGATAACTCAATTCGAGCGTCTGAAAATATACAGAGATTCGCTTGGGGAATCC +ATGATGAGAATGGGGGACCTTCACTCCCTCCAAAACAGAAACGCTACATGGCGAAACGAGTTGAGTCAGA +AGTTTGAAGAGATCAGATGGCTCATTGCTGAATGTAGAAATATACTGACAAAGACTGAAAATAGCTTTGA +ACAGATAACATTTTTGCAAGCATTGCAACTCTTACTTGAAGTTGAGAGTGAGATAAGGACCTTCTCTTTT +CAGCTTATTTAATACTAAAAAACAC diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/PA/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/README.md b/data/community/genspectrum/iav/h5n1/GG1996/PA/README.md new file mode 100644 index 000000000..ad57cb8d1 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment3/ PA) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ---------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/PA | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007359.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. 
+ +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PA/examples.fasta new file mode 100644 index 000000000..0e5d96801 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/examples.fasta @@ -0,0 +1,38 @@ +>OP950296.1 +AGCAAAAGCAGGTACTGATTCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAAGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACTTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACAAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAACACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGAGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCTAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAAATCACAGGAACCATGCGCAGGCTTGCCGATCAAAGTCTTCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCATGAAGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCATTAGCAAGCTGGATCCAGAGTGAATTCAACAAGGCATGTGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGAAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGG
ATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGCCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATACATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>FM177118.1 +AGCGAAAGCAGGTACTGATTCAAAATGGAAGATTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCTGAAAATCGAAACGAACAAATTTGCTGCAATATGCACACACTTGGAGGTCTGCTTCATGTATTCGGATTTTCACTTTATTGATGAACGGAGTGAATCAATAATTGTAGAATCTGGAGATCCGAACGCATTATTAAAACACCGATTTGAAATAATTGAAGGAAGAGACCGAACGATGGCCTGGACTGTGGTGAATAGTATTTGCAACACCACAGGGGTCGAGAAACCTAAATTTCTCCCAGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGAGGGAAGTTCATACATACTATCTGGAGAAGGCCAACAAGATAAAATCCGAGAAGACACATATTCACATATTCTCATTCACAGGGGAGGAAATGGCAACCAAAGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATTAAAACCAGGCTGTTCACCATAAGACAGGAAATGGCCAGTAGGGGTTTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAGACAATTGAAGAAAAATTTGAAATCACTGGAACCATGCGCAGACTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAAGAAGTGAATGCTAGAATTGAGCCATTTTTGAAGACAACGCCACGCCCTCTCAGATTACCTGATGGGCCTCCTTGCTCTCAGCGGTCGAAATTCCTGCTGATGGATGCCCTTAAATTAAGTATTGAAGACCCGAGTCATGAGGGGGAGGGGATACCACTATACGATGCAATCAAATGCATGAAGACATTTTTCGGGTGGAAGGAGCCCAACATCGTGAAACCACATGAAAAGGGTATAAACCCCAATTACCTCCTGACTTGGAAGCAAGTGCTGGCAGAACTCCAAGATATTGAAAATGAGGAGAAAATCCCAAAAACAAAGAACATGAAAAAAACAAGCCAGTTGAGGTGGGCACTCGGTGAGAACATGGCACCAGAGAAAGTAGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTATGACAGTGATGAACCAGAATCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGTGAATTGACAGAC
TCGAGTTGGATTGAACTTGATGAAATAGGAGAGGATGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGGAACTACTTTACAGCGGAAGTATCCCATTGCAGAGCCACTGAATACATAATGAAGGGAGTGTACATAAACACAGCCCTGTTGAATGCATCCTGTGCAGCCATGGATGACTTTCAACTGATTCCAATGATAAGCAAATGCAGAACCAAAGAAGGAAGACGGAAAACTAATCTGTATGGATTCATTATAAAAGGAAGATCCCACTTGAGGAATGATACCGATGTGGTAAATTTTGTGAGCATGGAATTCTCTCTCACTGATCCGAGGTTGGAGCCACACAAGTGGGAAAAGTACTGTGTCCTCGAGATAGGAGACATGCTCCTCCGGACTGCAGTAGGTCAAGTTTCAAGGCCCATGTTCCTGTATGTGAGAACCAACGGAACCTCCAAGATCAAAATGAAATGGGGCATGGAAATGAGACGATGCCTTCTTCAATCCCTTCAACAAATTGAAAGCATAATTGAAGCCGAATCTTCTGTCAAAGAAAAGGACATGACCAAAGAATTCTTTGAAAACAAATCAGAAACATGGCCGATCGGAGAATCCCCCAAAGGAGTGGAGGAAGGCTCCATCGGAAAGGTGTGCAGAACCTTGCTGGCGAAGTCTGTGTTCAACAGTTTATATGCATCTTCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGGACCTTCGATCTTGGAGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCGCACATGCACTGAAATAGTTGGGGCAATGCTACTACTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>OQ584517.1 +AGCAAAAGCAGGTACTGATTCGAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACCTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAATACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAACTCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCACGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGG
CTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGCGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGTCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>OQ584643.1 
+AGCGAAAGCAGGTACTGATCCGAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAAGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACTTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAACACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGGATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAAATCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCATTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCATGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCACATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGCGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGCCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTT
CAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>OQ584691.1 +AAAGCAGGTACTGATTCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACCTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAATACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAACTCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCACGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGCGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGATATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGTCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGG
GGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>OQ584722.1 +AGCGAAAGCAGGTACTGATCCGAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACCTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAATACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAACTCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCACGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGCGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAA
GACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGTCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>OQ595413.1 +AGCGAAAGCAGGTACTGATTCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAAGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACTTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAACACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAAATCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAATGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCACGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGTGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAA
CAAGGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGCCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACAAATTGAGAGCATGATCGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTA +>AB807879.1 +TGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAGTCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCAATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGCGGGAAGTTCACATATACTACCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAAGAGAGCAGAGCAAGAATCAAAACCAGGCTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCTGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCAAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTGCCTGAGGGGCCTCCCTGCTCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAGGGGGAAGGCATACCACTATATGATGCAATCAAATGCATGAAGACTTTTTTCGGCTGGAAAGAGCCCAACATCGTAAAACCACATGAAAAGGGCATAAATCCCAATTACCT
CCTGGCTTGGAAGCAGGTGCTGTCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAACCTAGGTCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTCGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAGTTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAAACAAATCTGTACGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAAGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTATCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTAATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAA +>KU143482.1 
+ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATAATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGACCCGAAAATTGAGACAAACAAATTTGCTGCAATATGCACACACTTAGAAGTCTGTTTCATGTACTCAGACTTCCACTTTATTGACGAACGAGGGGAATCAATAATTGTAGAATCTGGCGATCCGAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCCTGGACAGTGGTGAATAGCATAAGCAACACCACAGGAGTCGGTAAGCCTAAATTCCTCCCAGATTTGTATGACTACAAAGAAAACCGGTTCATTGAAATTGGAGTGACAAGAAGGGAAGTTCACATATACTATCTAGAAAAAGCCAACAAGATAAAATCAGAGAAGACACACATTCACATATTCTCATTCACTGGGGAGGAAATGGCCACCAAAGCGGACTACACCCTCGATGAAGAGAGCAGAGCAAGAATAAAGACCAGGCTGTTCACTATAAGACAAGAAATGGCAAGCAGGGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAAATTTGAAATCACAGGAACAATGCGCAGGCTTGCCGATCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGTCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTAAATGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAAATTACCTGATGGGCCTCCCTGCTCTCAGCGATCGAAGTTCTTGCTGATGGATGCTCTTAAGTTAAGCATCGAAGACCCGAGCCATGAAGGGGAAGGTATACCGCTATATGACGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAGGAGCCCAATATCGTAAAACCACATGAGAAAGGCATAAACTCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGACAGAACTCCAAGATCTTGAAAATGAAGAGAGAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTCAGTGATCTAAGACAGTATGACAGTGATGAACCAGAGTCTAGATCGCTAGCAAGCTGGATCCAGAGTGAATTCAACAAGGCATGCGAATTGACAGATTCGGGTTGGATTGAACTTGATGAAATAGGGGAAGACGTTGCCCCGATTGAGCACATTGCGAGTACGAGGAGGAATTATTTCACAGCGGAAGTATCCCATTGTAGGGCTACTGAGTACATAATGAAGGGAGTGTACATAAACACAGCCCTGTTGAATGCATCCTGTGCAGCTATGGATGACTTCCAACTGATTCCAATGATAAGCAAATGCAGAACAAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGAAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTCACTGACCCGAGATTGGAATCACACAAATGGGAGAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCAAGGCCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGTCTTCTTCAGTCCCTCCAACAAATTGAGAGCATGATTGAGGCTGAGTCTTCTGTTAAAGAGAAGGACATGACCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGGGAATCACCCAAAGGAATGGAGGAAGGCTCCATTGGGAAGGTGTGCAGAACATTACTAGCAAAATCTGTGTTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCGAGAAAATTGCTCC
TCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCCTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTGCTATCCATACGTCCCAA +>OQ584675.1 +AGCGAAAGCAGGTACTGATTCGAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAAGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAGACAAACAAATTTGCCGCAATATGCACACACCTAGAAGTCTGTTTCATGTATTCGGATTTCCATTTTATTGATGAACGAGGCGAATCAATGATTGTAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATCGAAGGGAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGGGTCGAAAAGCCCAAATTCCTCCCTGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTAACGCGAAGGGAAGTTCACATATACTATTTAGAAAAAGCCAACAAGATAAAATCAGAGAAAACACATATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAGGCGGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTGTTCACTATAAGACAAGAAATGGCCAGTAGAGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAACTCACAGGAACCATGCGCAGGCTTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAACTTTCTCAAATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTCAGATTACCTGATGGGCCTCCCTGTTCTCAGCGGTCGAAGTTCTTGCTGATGGATGCCCTTAAGTTGAGCATCGAAGACCCTAGCCACGAGGGGGAGGGCATACCGCTGTATGATGCAATCAAATGCATGAAGACATTTTTTGGCTGGAAAGAGCCCAACATCGTAAAGCCGCATGAGAAAGGCATAAACCCTAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTTCAAGACATTGAAAATGAGGAGAAAATTCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTGAAGTGGGCACTTGGTGAGAACATGGCTCCAGAAAAAGTGGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTACGACAGTGACGAACCAGAGTCTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAGGCATGCGAACTGACAGATTCGAGTTGGATTGAACTTGATGAGATAGGGGAAGACGTTGCTCCAATCGAACACATTGCGAGTGTGAGGAGGAACTATTTCACAGCGGAGGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTATACATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGTAAGTGCAGAACTAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGATCCCATTTGAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTAACTGACCCGAGGCTAGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAGATAGGAGACATGCTCCTACGGACTGCAATAGGCCAAGTGTCGAGGTCCATGTTCCTGTATGTGAGAACCAATGGGACTTCCAAGATCAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAGTCCCTTCAACA
AATTGAGAGCATGATTGAGGCCGAATCTTCTGTCAAAGAGAAGGACATGTCCAAGGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAAGGGGTGGAGGAAGGCTCTATTGGGAAAGTATGCAGAACATTGCTAGCAAAGTCTGTGTTCAACAGCCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>KP097880.1 +ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAGTCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCAATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGCGGGAAGTTCACCTATACTACCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAAGAGAGCAGAGCAAGAATCAAAACCAGGCTGTTCACCATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCTGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCAAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTACCTGAGGGGCCTCCCTGCTCCCAGCGGTCGAAGTTCTTACTGATGGATGGCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAGGGGGAAGGCATACCACTATATGATGCAATCAAATGCATGAAGACTTTTTTCGGCTGGAAAGAGCCCAACATCGTAAAACCACATGAAAAGGGCATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGTCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAACCTAGGTCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTCGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAGTTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAAACAAATCTGTACGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGAT
GTGGTAAACTTTGTGAGCATGGAATTCTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAAGAAAGCCCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTAATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAG +>KP097878.1 +ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAGTCCAAAAATCGAGACGAACAAGTTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAACGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCGATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGCGGGAAGTTCACATATACTATCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAGGAGAGCAGAGCAAGAATTAAAACCAGGCTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTACCTGAGGGGCCTCCCTGCTCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAGGGGGAAGGTATACCCCTATATGATGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAAGAGCCCAACATCGCAAAACCACATGAAAAGGGCATAAATTCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGTCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTTGGCGATCTAAAACAGTATGACAGTGATGAACCAGAGCCTAGATCATTATCAAGCTGGATTCAGAACGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAA
GGGAGTGTATATAAACACAGCCCTACTGAATGCATCCTGTGCAGCCATGGATGACTTCCAGTTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAGACAAATCTGTACGGATTCATCATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAGATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCTCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTTAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAAGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAG +>KP097872.1 +ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCAGAAAAGGCAATGAAAGAATATGGGGAAGATCCAAAAATCGAAACGAACAAGTTTGCTGCGATATGCACACACTTGGAGGTTTGTTTCATGTATTCGGATTTTCACTTTATTGATGAACGGAGTGAATCAATAATTGTAGAATCTGGAGACCCAAATGCACTATTGAAACACCGATTTGAAATAATTGAAGGGAGAGACCGAACAATGGCCTGGACTGTGGTGAATAGTATTTGCAACACCACAGGAGTTGTGAAACCTAAATTTCTCCCAGATTTGTATGACTACAAAGAGAATCGATTCATTGAAATTGGAGTGACACGGAGGGAAGTTCATACATACTATCTGGAGAAAGCCAACAAGATAAAGTCCGAGAGGACACATATTCACATATTTTCATTCACAGGGGAGGAAATGGCCACCAAAGCGGACTACACCCTTGATGAAGAGAGCAGAGCAAGAATTAAAACCAGGCTGTTCACCATAAGGCAGGAAATGGCCAGTAGGGGCCTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAGACAATTGAAGAAAAATTTGAAATCACTGGAACCATGCGCAGACTTGCAGACCAAAGTCTCCCTCCGAACTTCCCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCAAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAAGAAGTGAATGCTAGAATTGAGCCATTTTTAAAGACAACACCACGCCCTCTCAGACTACCTGATGGGCCGTCTTGCTCTCAGCGGTCGAAGTTCCTGCTGATGGATGCCCTTAAATTAAGTATCGAAGACCCGAGTCATGAGGGAGAGGGGATACCACTATACGATGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAAGAACCCAACATCGTGAAACCGCATGAAAAAGGTATAAACCCCAATTACCTCCTGGCTTGGAAGCAAGTTCTGGCAGAACTCCAAGATATTGAAAATGGGGAGAAAATCCCGAAAACAAAAAACATGAAAAAAACAAGCCAGTTGAAGTGGGCACTCGGTGAAAACATGGCACCAGAGAAAGTAGACTTTGAGGACTGCAAAGATATTAGCGATCTAAGACAGTATGACAGTGATGAACCAGAGTCTAGATCACTAGCAAGCT
GGATTCAGAGTGAATTCAACAAGGCATGTGAATTGACAGATTCGAGTTGGATTGAATTTGATGAGATAGGAGAAGACGTAGCTCCAATCGAGCACATTGCAAGTATGAGAAGGAACTATTTTACAGCGGAAGTATCCCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTACATAAACACGGCCCTATTGAATGCTTCCTGTGCAGCCATGGATGACTTTCAACTGATTCCAATGATAAGCAAATGCAGGACCAAAGAAGGAAGGCGGAAGACTAATCTGTATGGATTCATTATAAAAGGGAGATCCCACTTGAGGAATGATACCGATGTGGTAAATTTTGTGAGTATGGAATTCTCTCTTACTGATCCGAGGCTGGAGCCACACAAGTGGGAAAAGTACTGTGTCCTCGAGATCGGAGACATGCTCCTCCGGACTGCAGTAGGCCAAGTTTCAAGGCCCATGTTCCTGTATATAAGAACCAATGGAACCTCCAAGATCAAAATGAAATGGGGCATGGAAATGAGGCGGTGCCTTCTTCAATCCCTTCAACAAATTGAAAGCATGATTGAGGCTGAGTCTTCTGTCAAAGAGAAGGACATGACCAAAGACTTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAGTCCCCCAAGGGAGTGGAGGAAGGCTCCATCGGGAAGGTATGCAGAACCTTGCTAGCGAGGTCTGTGTTCAATAGTTTATATGCATCTCCACAACTCGAGGGGTTCTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGGACCTTTGATCTTGGAGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAACGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTCGCACATGCACTGAAATAG +>MH681420.1 +CGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATTGAAACGAACAAATTTGCTGCAATATGCACACACTTGGAGGTCTGTTTCATGTATTCGGATTTTCACTTTATTGATGAACGGAGTGAATCAATAATTGTAGAATCTGGAGATCCGAACGCATTATTGAAACACCGATTTGAAATAATTGAAGGAAGAGACCGAACGATGGCCTGGACTGTGGTAAATAGTGTTTGCAACACCACAGGAGTCGAGAAACCTAAATTTCTCCCAGATTTGTATGACTACAAAGAGAACCGATTTATTGAAATTGGAGTGACACGGAGGGAAGTTCACACATATTATCTAGAGAAGGCCAACAAGATAAAGTCCGAGAAGACACATATTCACATATTCTCATTCACAGGAGAAGAGATGGCAACCAAAGCGGACTACACCCTTGATGAAGAGAGTAGGGCAAGAATCAAAACCAGGCTGTTCACAATAAGACAGGAAATGGCCAATAGGGGTCTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAAACAATTGAAGAAAAATTTGAAATCACTGGAACCATGCGCAGACTTGCTGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAAGAAGTGAATGCTAGAATTGAGCCATTTTTGAAANCAACGCCACGTCCTCTCAAATTACCAGATGGGCCTCCTTGCTCTCAGCGATCGAAATTCCTGCTGATGGATTCCCTTAAATTAAGTATCGAAGACCCGAGTCATGAGGGAGAAGGGATACCACTATACGATGCAATCAAATGCATGAAGACATTTTTCGGGTGGAAAGAGCCCGGCATCGTGAAACCACATGAGAAGGGTATAAACCCCAATTACCTCCTGACCTGGAAGCAAGTGATGGCAGAGCTCCAAGACATTGAAAATGATGAGAAAATCCCA
AAAACAAAAAACATGAAAAAAACGAGCCAGTTGAGATGGGCACTCGGTGAGAACATGGCACCAGAGAAAGTAGATTTTGAGGACTGCAAAGATGTTAGAGATCTGAAACAATATGACAGTGATGAACCAGAAACTAGATCACTAGCAAGCTGGATTCAGAGTGAATTCAACAAAGCATGTGAATTGACAGACTCTAGTTGGATTGAACTTGATGAAATAGGAGAGGATGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGGAACTATTTCACAGAGGAAGTATCCCATTGCAGAGCCACTGAATACATAATGAAGGGAGTGTACATAAACACAGCCCTGTTGAATGCATCCTGTGCAGCCATGGATGACTTTCAACTGATTCCAATGATAAGCAAATGCAGAACCAAAGAAGGGAGACGGAAAACTAATCTGTATGGGTTTATTATAAAAGGAAGATCCCACTTGAGGAATGATACCGATGTGGTAAATTTTGTGAGTATGGAATTCTCTCTTACTGATCCGAGGTTGGAGCCACACAAATGGGAAAAGTACTGTGTCCTCGAGATAGGAGACATGCTCCTCCGGACTGCAGTAGGTCAAGTTTCAAGGCCCATGTTCCTGTACGTAAGAACCAACGGAACCTCCAAGATCAAAATGAAATGGGGCATGGAAATGAGACGATGCCTTCTTCAATCCCTTCAACAAATTGAAAGCATGATTGAAGCTGAATCTTCTGTCAAGGAGAAGGACATGACCAAAGAATTCTTTGAAAACAGATCAGAAACATGGCCGATCGGAGAATCCCCCAGGGGAGTGGAGGAAGGCTCCATCGGAAAGGTATGCAGAACCTTGCTGGCGAAGTCTGTTTTCAACAGTTTATATGCATCTTCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAACTGCTTCTCATTGCTCAGGCACTTAGGGACAACCTGGAACCTGGGACCTTCGATCTTGGAGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCGTCTTGGCTCAACTCCTTCCTCGCACATGCACTGAAT +>KU971348.1 
+ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCAGAAAAGACAATGAAAGAATATGGGGAAAATCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATCGCAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGGGACCGAACAATGGCTTGGACAGTAGTAAATAGTATCTGCAACACCACAGGAGTCAATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGCGGGAAGTTCATATATACTACCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATCCACATATTCTCATTCACTGGAGAGGAAATGGCCACCAAAGCTGACTATACTCTTGATGAGGAGAGCAGAGCAAGAATTAAAACCAGGCTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCTGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGGAAATTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAGGACAACACCACGCCCTCTCAGACTACCTGAGGGGCCTCCCTGCCCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAAGGGGAAGGTATACCACTATATGATGCAATCAAATGCATGAAGACGTTTTTCGGCTGGAAAGATCCCAACATCGTAAAACCACATGAAAAGGGCATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTATCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGTACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGATTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAACCTAGGTCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTCGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCCCTATTGAATGCATCCAGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAAACAAATCTATACGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTTTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAGATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAAGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTTTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAAGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCCGAATCAAGAAAATTGCTTC
TCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGGACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAG +>KU971420.1 +ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAATCCAAAAATCGAAACGAACAAATTCGCTGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGACTTCCACTTTATAGATGAACGAGGTGAGTCAATAATCGCAGAATCTGGCGATCCAAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTAGTAAATAGTATCTGCAACACCACAGGAGTCAATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGGACCGATTCATTGAAATTGGAGTGACACGGCGGGAAGTTCACATATACTACCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATCCACATATTCTCGTTCACTGGAGAGGAAATGGCCACCAAAGCTGACTATACTCTTGATGAGGAGAGCAGAGCAAGAATTAAAACCAGGCTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCTGAGAGAGGCGAAGAGACACTTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGGAAATTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAGGACAACACCACGCCCTCTCAGACTACCTGAGGGGCCTCCCTGCCCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAGGGGGAAGGCATACCACTATATGATGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAAGATCCCAACATCGTAAAGCCACATGAAAAGGGCATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTATCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGTACTTGGTGAGAATAGGGCACCAGAAAAAGTAGACTTTGAGGATTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAACCTAGGTCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTCGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCTCTATTGAATGCATCCAGTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAAACAAATCTATACGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTTTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATATGAGAACCAATGGGACGTCCAAGATTAAGATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAAGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTT
TTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTGAAGGGGTGGAAGAAAGCCCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCCGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGGACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAG +>KX513198.1 +AGCGAAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAGTCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCAATAAGCCTAAATTCCTCCCAGACTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGGGTGACACGGCGGGAAGTTCACATATACTACCTAGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAAGAGAGCAGAGCAAGAATCAAAACCAGGCTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCTGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCAAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTACCTGATGGGCCTCCCTGCTCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAGTTAAGCATTGAAGATCCAAGCCATGAGGGGGAAGGCATACCACTATATGATGCAATCAAATGCATGAAGACTTTTTTCGGATGGAAAGAGCCCAACATCGTAAAACCACATGAAAAGGGCATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGTCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAACCTAGGTCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCCTGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTCGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCAGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAGTTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAAACAAATCTGTACGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTCTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACAT
GCTATTACGAACTGCAATAGGCCAGGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAAATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAAGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTAATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAAGTACCTTGTTTCTACT +>KX215333.1 +AGCGAAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGAGAAAGTCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCAGATTTCCACTTTATAGATGAACAAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAATGCATTATTAAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCGATAAGCCTAAATTCCTCCCAGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGAGGGAAGTTCACATATACTACCTGGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAGGAGAGCAGAGCAAGAATTAAAACCAGGCTGTTCACTATAAGGCAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAGACAATTGAAGAGAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCGAACCGAATGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTACCTGAGGGCCCTCCCTGCTCCCAGCGGTCGAAATTCTTACTGATGGATGCCCTCAAATTAAGCATCGAAGATCCAAGCCATGAGGGGGAAGGTATACCACTATATGATGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAAGAGCCCAACATCGTAAAACCACATGAAAAGGGTATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAGGACTGCAAAGATGTTAGCGATCTAAGACAGTATGACAGTGATGAACCAGACCCTAGATCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGTCAGATTCGATCTGGATTGAGCTTGATGAAATAGGAGAAGATGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAATTACTTCACGGCGGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATAT
AAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAGTTGATTCCAATGATAAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTGAGCATGGAATTTTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAGACATGCTATTACGAACCGCTATAGGCCAAGTGTCAAGACCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAGATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGAGTGGAGGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTAGCAAAATCTGTATTCAACAGCCTATATGCATCCCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>KX513246.1 +AGCGAAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGACAATGAAAGAATATGGGGAAAGTCCAAAAATCGAAACGAACAAATTCGCCGCAATATGCACACACTTAGAAGTCTGCTTCATGTATTCGGATTTCCACTTTATAGATGAACGAGGCGAGTCAATAATTGCAGAATCTGGCGATCCGAATGCATTATTGAAACACCGATTTGAGATAATTGAAGGGAGAGACCGAACAATGGCTTGGACAGTGGTAAATAGTATCTGCAACACCACAGGAGTCGATAAGCCTAAATTCCTCCCAGATTTGTATGACTACAAAGAGAACCGATTCATTGAAATTGGAGTGACACGGAGGGAAGTTCACATATACTACCTGGAAAAAGCAAACAAGATAAAATCAGAGAGGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGGCCACTAAAGCTGACTATACTCTTGATGAGGAGAGCAGAGCAAGAATTAAAACCAGACTGTTCACTATAAGACAAGAGATGGCCAGTAGGGGTCTATGGGATTCCTTTCGTCAATCCGAGAGAGGCGAAGAGACAATTGAAGAAAGGTTTGAAATCACAGGAACCATGCGCAGGCTTGCTGACCAAAGCCTCCCACCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCAAAGGAAGTGAACGCCAGAATTGAGCCATTTATGAAGACAACACCACGCCCTCTCAGACTACCTGAGGGGCCTCCCTGCTCCCAGCGGTCGAAGTTCTTACTGATGGATGCCCTTAAATTAAGTATCGAAGATCCAAGCCATGAGGGGGAAGGTATACCACTATATGATGCAATCAAATGCATGAAGACATTTTTCGGCTGGAAAGAGCCCAACATCATAAAACCACATGAAAAGGGCATAAATCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTGGCAGAACTCCAAGACATTGAAAATGAAGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTTGGTGAGAATATGGCACCAGAAAAAGTAGACTTTGAG
GACTGCAAAGATGTTAGCGATCTAAAACAGTATGACAGTGATGAACCAGAGCCTAGATCATTATCAAGCTGGATTCAGAGCGAATTCAACAAAGCATGCGAATTGACAGATTCGAGTTGGATTGAACTTGATGAAATAGGAGAAGATGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGAAACTATTTCACAGCAGAAGTGTCTCATTGCAGGGCCACTGAATACATAATGAAGGGAGTGTATATAAACACAGCCCTATTGAATGCATCCTGTGCAGCCATGGATGACTTCCAATTGATTCCAATGATCAGCAAGTGCAGAACCAAAGAAGGAAGACGGAAGACAAATCTGTATGGATTCATTATAAAAGGAAGGTCCCATTTGAGGAACGACACCGATGTGGTAAACTTTGTTAGCATGGAATTCTCTCTTACTGACCCGAGGCTGGAACCACACAAGTGGGAAAAGTACTGTGTTCTTGAAATAGGAAACATGCTATTACGAACTGCAATAGGCCAAGTGTCAAGGCCCATGTTCCTGTATGTGAGAACCAATGGGACGTCCAAGATTAAGATGAAATGGGGCATGGAGATGAGGCGATGCCTTCTTCAATCCCTTCAACAAATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAAGAATTCTTTGAAACCAAATCAGAAACGTGGCCAATTGGGGAATCACCTAAAGGGGTGGAGGAAAGCTCCATTGGAAAGGTGTGCAGAACATTACTCGCAAAATCTGTATTCAACTGCTTATATGCATCTCCACAACTTGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCATCACACATGCACTGAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/PA/genome_annotation.gff3 new file mode 100644 index 000000000..83be4d2c2 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/genome_annotation.gff3 @@ -0,0 +1,3 @@ +. . CDS 25 2175 . + . gene="PA" +. . CDS 25 594 . + . gene=PAX;ID=cds-PAX +. . CDS 596 784 . + . 
gene=PAX;ID=cds-PAX diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/PA/pathogen.json new file mode 100644 index 000000000..b8caec64e --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 3/PA)", + "reference name": "Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PA) and PA-X protein (PA-X) genes, complete cds", + "reference accession": "NC_007359.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PA/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PA/reference.fasta new file mode 100644 index 000000000..abfb2f7d6 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PA/reference.fasta @@ -0,0 +1,33 @@ +>NC_007359.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PA) and PA-X protein (PA-X) genes, complete cds +AGCAAAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGC +TTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAAACGAACAAATTTGCCGCAATATG +CACGCACTTAGAAGTCTGTTTCATGTATTCAGATTTCCACTTTATTGATGAACGGGGCGAATCAACAATT +ATAGAATCTGGCGATCCCAATGCATTATTGAAACACCGGTTTGAAATAATCGAAGGGAGGGACCGAACAA +TGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGAGTTGAGAAGCCTAAATTTCTCCCAGATTT +GTATGACTACAAGGAGAACCGATTTATTGAAATTGGAGTGACACGGAGGGAAGTTCACACATACTATCTA +GAAAAAGCCAACAAGATAAAATCTGAGAAGACACACATTCACATATTCTCATTCACTGGAGAGGAAATGG +CCACCAAAGCGGACTACACCCTTGATGAAGAAAGCAGGGCCCGAATCAAAACCAGGCTGTTCACTATAAG +GCAGGAAATGGCCAGTAGGGGTTTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAGTTGAA +GAAAGATTTGAAATCACAGGGACTATGTGCAGGCTTGCCGACCAAAGTCTCCCACCTAATTTCTCCAGCC 
+TTGAAAAATTTAGAGCCTATGTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAAT +GTCGAAAGAAGTAAACGCCAGAATTGAGCCATTTCTGAAGACAACACCACGCCCTCTTAGATTACCTGAT +GGGCCTCCCTGCTCTCAGCGGTCGAAGTTTTTGCTGATGGATGCCCTTAAATTAAGCATCGAAGACCCGA +GTCATGAGGGGGAGGGGATACCGCTATATGATGCAATCAAATGCATGAAAACATTTTTCGGCTGGAAAGA +GCCCAACATTGTAAAACCACATGAAAAAGGCATAAACCCCAATTACCTCCTGGCTTGGAAGCAGGTGCTG +GCAGAGCTCCAAGATATTGAAAACGAGGAGAAAATTCCAAAGACAAAGAACATGAGGAAAACAAGCCAAT +TGAAGTGGGCACTTGGTGAGAATATGGCACCAGAGAAAGTAGACTTTGAGGATTGCAAAGATGTTAGCGA +TCTAAGGCAGTATGACAGTGATGAACCAAAGCCTAGATCACTAGCAAGCTGGATCCAGAGTGAATTCAAC +AAGGCATGCGAATTGACAGATTCAAGTTGGATTGAACTTGATGAAATAGGGGAAGACGTTGCTCCAATTG +AGCACATTGCAAGTATGAGAAGGAACTATTTCACAGCGGAAGTATCCCATTGCAGGGCTACTGAATACAT +AATGAAGGGAGTGTACATAAACACAGCTTTGTTGAATGCATCCTGTGCAGCCATGGATGACTTCCAACTG +ATCCCAATGATAAGCAAATGCAGAACCAAAGAAGGAAGACGGAAAACTAACCTGTATGGATTCCTTATAA +AAGGAAGATCCCATTTGAGAAATGACACCGATGTGGTAAACTTTGTGAGTATGGAATTCTCTCTTACTGA +TCCGAGGCTGGAGCCACACAGATGGGAAAAGTACTGCGTTCTTCGGATAGGAGACATGCTCTTACGGACT +GAAATAGGCCAAGTGTCAAGGCCCATGTTTCTTTATGTGAGAACCAATGGAACCTCCAAGATCAAGATGA +AATGGGGCATGGAAATGAGGCGATGCCCTTTTCAATCCCTTCAACAGATTGAGAGCATGATTGAGGCCGA +GTCTTCTGTCAAAGAAAAAGACATGACTAAAGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGA +GAATCACCCAAGGGAGTGGAGGAAGGCTCCATCGGGAAGGTGTGCAGAACCTTACTGGCTAAATCTGTTT +TCAACAGTCTATATGCATCTCCACAACTCGAGGGGTTTTCAGCTGAATCAAGAAAATTGCTTCTCATTGT +TCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATTGAGGAG +TGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTAA +GATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/PB1/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/README.md 
b/data/community/genspectrum/iav/h5n1/GG1996/PB1/README.md new file mode 100644 index 000000000..f63fb0eb3 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment2/ PB1) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ----------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/PB1 | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007358.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. 
+ +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PB1/examples.fasta new file mode 100644 index 000000000..83abfc17a --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/examples.fasta @@ -0,0 +1,38 @@ +>OP950303.1 +GCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCAGCGCAAAATGCCATAAGTACCACATTCCCTTATACTGGAGATCCCCCATACAGCCATGGAACAGGGACAGGATACACAATGGACACAGTCAACAGGACACATCAATACTCAGAGAAGGGAAAATGGACAACAAACACAGAAACCGGAGCACCTCAACTCAACCCAATTGATGGACCACTACCTGAGGACAACGAACCGAGCGGATATGCACAAACAGATTGCGTGTTGGAAGCAATGGCTTTCCTTGAAGAGTCCCACCCAGGGATCTTTGGAAACTCTTGTCTTGAAACGATGGAAGTCGTTCAGCAAACAAGAGTGGACAAACTAACTCAAGGTCGCCAGACTTATGACTGGACACTGAANNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGGGAATAAAAGCAGGAGTGGATAGGTTCTATAGGACCTGCAAACTGGTCGGGATCAATATGAGCAAAAAGAAGTCTTACATAAACCGGACTGGAACATTTGAGTTCACAAGCTTTTTCTATCGCTATGGATTT
GTGGCTAACTTCAGTATGGAGCTGCCCAGCTTTGGAGTTTCTGGGATCAATGAATCAGCTGATATGAGCATTGGCGTCACAGTGATAAAGAACAACATGATAAACAATGACCTTGGTCCAGCAACAGCTCAAATGGCCCTTCAACTATTCATCAAAGATTACAGGTACACGTACCGATGCCACAGAGGTGACACACAAATTCAAACGAGGAGATCATTCGAGCTGAAGAAGCTGTGGGAACAGACCCGTTCAAAGGCAGGACTGTTGGTGTCAGATGGAGGACCAAATTTATACAACATTCGGAATCTCCATATCCCAGAGGTCTGCATGAAGTGGGAGCTGATGGACGAAGATTACCAGGGCAGGTTGTGTAATCCTCTGAACCCATTTGTCAGTCATAAAGAAATTGAGTCCGTAAACAATGCTGTGGTGATGCCAGCACACGGTCCGGCCAAAAGCATGGAATATGATGCCATTGCGACTACACACTCATGGATTCCTAAAAGGAATCGTTCCATTCTCAATACCAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAGAAATGCTGCAGTTTATTCGAAAAATTTTTTCCCAGTAGTTCATACAGGAGACCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATCGATGCACGCATTGATTTCGAATCTGGAAGGATCAAGAAGGGAGAGTTTTCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATGAAAAAATGCCTTGTTTCTAC +>AB847563.1 +AACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCTATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCGATTGATGGACCATTACCTGAGGATAACGAGCCCAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTTGACAAACTGACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAATGAATCGGGACGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAGGATGCAGAAAGGGGCAAGTTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGGCTCCCAGTCGGAGGAAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAACTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACAAAATGGAATGAGAATCAAAATCCTAGGATGTTTCTGGCAATGATAACGTACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAAATGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAAATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAGGA
AAATTGAGAGGATAAGACCCCTATTAATAGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTGGGAGTTTCGATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTACAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGGCTTGTAAGCTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTAGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAATCGGCCGACATGAGCATTGGTGTTACAGTGATAAGAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCAAACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTAGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTCCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTGTGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACGAGTCAAAGGGGAATTCTTGAAGATGAACAGATGTACCAAAAGTGCTGCAATCTATTCGAGAAATTCTTCCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTGGCTTGTCCTTCGTGAAA +>ON759335.1 
+AAGCAGGAGTGGATAGGTTCTATAGGACCTGCAAACTGGTCGGGATCAATATGAGCAAAAAGAAGTCTTACATAAACCGGACTGGAACATTTGAGTTCACAAGCTTTTTCTATCGCTATGGATTTGTGGCTAACTTCAGTATGGAGCTGCCCAGCTTTGGAGTTTCTGGGATCAATGAATCAGCTGACATGAGCATTGGCGTCACAGTGATAAAGAACAACATGATAAACAATGACCTTGGTCCAGCAACAGCTCAAATGGCCCTTCAACTATTCATCAAAGATTACAGGTACACGTACCGATGCCACAGAGGTGACACACAAATTCAAACGAGGAGATCATTCGAGCTGAAGAAGCTGTGGGAACAGACCCGTTCAAAGGCAGGACTGTTGGTGTCAGATGGAGGACCAAATCTATACAACATTCGGAATCTCCATATCCCAGAGGTCTGCCTGAAGTGGGAGCTGATGGACGAAGATTACCAGAGCAGGTTGTGTAATCCTCTGAACCCATTTGTCAGTCATAAAGAAATTGAGTCCGTAAACAATGCTGTGGTGATGCCAGCACACGGTCCAGCCAAAAGCATGGAATATGATGCCATTGCGACTACACACTCATGGATTCCTAAAAGGAATCGTTCCATTCTCAATACCAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAGAAATGCTGCAGTCTATTCGAAAAATTTTTTCCCAGTAGTTCATACAGGAGACCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATCGATGCACGCATTGATTTCGAATCTGGAAGGATCAAGAAGGGAGAGTTTTCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAG +>MF116343.1 +AGCGAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTACCAGTGCAAAATGCTATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGGACAGGGACAGGGTATACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGAAATGGACAACAAACACAGAGACTGGAGCACTCCAACTCAACCCGATTGATGGACCACTACCTGAGGATAATGAGCCCAGCGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAACTCGTGTCTTGAAACGATGGAAATTATTCAACAAACAAGAGTGGATAAACTAACCCAAGGCCGCCAGACCTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATATTCAGATTGAACGGTCTAACAGCCAGTGAATCGGGACGGCTAATAGATTTCCTCAAGGATGTGATGGAGTCAATGGATAAGGAGGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTGAGGGACAACATGACCAAGAAAATGATCACACAAAGAACAATAGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGTTACCTGATAAGAGCACTGACATTGAACACAATGACGAAAGATGCAGAAAGAGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGGTTCGTGTACTTTGTTGAAACACTAGCGAGGAGTATCTGTGAGAAGCTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAGGCTAAATTGGCAAACGTCGTGAGGAAGATGATGACTAACTCACAAGATACTGAACTCTCCTTTACAATTACTGGAGACAATACCAAGTGGAATGAGAATCAGAATCCTAGGATGTTTCTAGCAATGATAACGTACATCACAAGGAACCAGCCAGAATGGTTTCGGAATGTCCTAAGCATTGCCCCTATAATGTTCTCAAACAAAATGGCGAGATTAGGGAAAGGATA
CATGTTTGAGAGTAAGAGCATGAAGCTACGAACACAAATACCAGCAGAAATGCTCGCAACCATTGATCTTAAATACTTCAATGAATTAACAAAAAAGAAAATTGAGAAAATAAGACCTCTATTAATTGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCTTGGGAGTGTCAATTCTGAACCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGACTCCAATCCTCTGATGATTTCGCCCTCATAGTAAATGCACCAAATCATGAGGGAATACAAGCAGGAGTGGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATCAATATGAGCAAGAAGAAGTCTTACATAAATCGAACAGGGACATTCGAATTCACGAGTTTTTTCTACCGCTATGGATTTGTAGCCAATTTCAGTATGGAGTTGCCCAGTTTTGGAGTGTCTGGAATTAATGAATCGGCCGACATGAGCATTGGTGTTACGGTCATAAAAAACAATATGATAAACAATGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGGTGCCACAGAGGGGATACGCAAATCCAAACGAGGAGATCATTTGAGCTGAGGAAGCTGTGGGAGCAAACCCGTTCAAAGGCAGGACTGTTGGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTCCATATTCCTGAAGTCTGCTTGAAATGGGAATTGATGGATGAAGATTACCAGGGCAGATTGTGTAATCCTCTGAATCCGTTCGTCAGCCATAAAGAAATTGAATCTGTCAACAATGCTGTAGTAATGCCAGCCCATGGCCCAGCCAAGAGTATGGAATATGATGCCGTCGCTACCACACATTCATGGATTCCTAAAAGGAATCGTTCTGTCCTCAATACGAGTCAAAGGGGGATTCTTGAGGATGAACAGATGTACCAGAAGTGTTGCAATCTATTCGAGAAATTCTTCCCCAGCAGTTCATATCGGAGGCCAGTTGGAATTTCCAGCATGGTGGAGGCCATGATGTCTAGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATGAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATGAAAAAATGCCTTGTTTCTACT +>KP097852.1 
+ATGGATGTCAATCCGACTTTACTTTTCTTGAAGGTACCAGTGCAAAATGCTATAAGTACCACATTTCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGATACACCATGGACACGGTCAACAGAACACACCAATACTCAGAAAAGGGGAAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCTATTGATGGACCACTACCTGAAGATAATGAGCCCAGTGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAGTCCCACCCAGGGATCTTTGAAAACTCATGTCTTGAAACGATGGAAATTGTTCAACAAACAAGAGTGGACAAACTGACCCAAGGTCGCCAGACCTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATCTTCAGATCGAACGGTCTAACAGCCAATGAGTCGGGACGGCTAATAGATTTCCTCAAAGATGTGATGGAATCAATGGACAAGGAGGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGGGTGAGGGATAACATGACCAAGAAAATGGTCACACAAAGAACAATAGGGAAGAAAAAACAAAGGCTGAGCAAAAAGAGCTATCTGATAAGAGCATTGACACTGAACACAATGACAAAAGATGCAGAAAGGGGTAAATTGAAGAGGCGAGCGATTGCGACACCCGGAATGCAAATCAGAGGATTTGTCTACTTTGTTGAAACACTAGCGAGGTGTATCTGTGAAAAGCTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAGGCTAAATTGGCAAACGTCGTAAGGAAGATGATGACTAACTCACAAGATACTGAACTCTCCTTTACAATTACTGGGGACAATACCAAATGGAATGAGAATCAGAATCCTAGGATGTTTCTGGCAATGATAACGTACATCACAAGGAACCAGCCCGAATGGTTTCGGAATGTCTTGAGCATTGCTCCTATAATGTTCTCAAACAAAATGGCAAGACTAGGAAAAGGATATATGTTCGAAAGTAAGAGCATGAAGTTGCGAACGCAAATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAAGAAAATTGAGAAAATAAGGCCTCTATTAATAGATGGTACAGCCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTTCTAGGAGTTTCAATTCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTCATCGTAAATGCACCGAATCATGAGGGAATACAAGCAGGAGTGGATAGGTTTTATAGGACTTGTAAACTAGTTGGAATCAATATGAGCAAAAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACAAGCTTTTTCTACCGATATGGATTTGTAGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAATCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGATCTTGGCCCAGCAACAGCTCAGATGGCTCTTCAGTTATTCATCAAAGACTACAGATACACATACCGATGTCACAGAGGAGATACGCAAATCCAAACAAGGAGATCATTCGAGCTGAGGAAGCTGTGGGAGCAAACCCGTTCAAAAGCAGGACTGTTGGTTTCAGATGGAGGACCAAATCTGTACAACATCCGAAATCTCCATATTCCTGAAGTCTGCTTAAAATGGGAATTGATGGATGTAGATTATCAGGGCAGACTGTGTAATCCTCTGAACCCGTTCGTCAGCCATAAGGAAATTGAATCTGTAAACAATGCTATAGTAATGCCAGCTCATGGCCCAGCCAAAAGTATGGAGTATGATGCTGTTGCAACTACACATTCATGGA
TTCCTAAAAGGAACCGTTCCATTCTCAATACTAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAGAAGTGCTGCAATCTATTCGAGAAATTCTTCCCCAGCAGTTCATATCGGAGGCCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATCAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAACTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCGTGAAA +>KP097868.1 +ATGGATGTCAACCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCTATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCGATTGATGGACCACTACCTGAGGATAACGAGCCCAGTGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTTCAACAAACAAGAGTGGACAAACTGACTCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAATGAATCGGGACGGCTGATAGATTTCCTCAAGGACGTGATGGAATCAATGGATAAGGAAGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGGGACAACATGACAAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAGGACGCAGAAAGAGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTTGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAACTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAATACAAAATGGAATGAGAATCAAAATCCTAGGATGTTTCTGGCAATGATAACGTACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTCTTAAGCATTGCCCCTATAATGTTCTCAAACAAGATGGCGAGATTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAAATACCAGCAGAAATGCTTGCAAACATTGACCTCAAATACTTCAATGAAATAACGAAAAAGAAAATTGAGAAGATAAGACCTCTATTAATAGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACGGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTCATTGTAAATGCACCGAATCATGAAGGAATACAAGCAGGGGTGGATAGATTTTATAGGACTTGTAAACTAGTTGGGATCAACATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTAGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGGATTAATGAATCGGCCGACATGAGCGTTGGTGTTACAGTGATAAAGAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCA
CAGAGGAGATGCGCAAATCCAAACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTGTTGGTTTCAGACGGAGGACCAAATCTATACAATATCCGAAATCTCCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGAAGACTACCAGGGCAGGCTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCAGTCAACAATGCTATAGTAATGCCAGCTCATGGCCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCATGGATTCCTAAAAGGAATCGTTCCATTCTCAACACGAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAGTGCTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGGCCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCTCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTGGCTTGTCCTTCGTGAAA +>KR271013.1 +ATGGATGTCAATCCGACTCTACTTTTCTTGAAAGTTCCAGCGCAAAATGCCATAAGCACCACATTCCCGTATACTGGAGACCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACGGTTAACAGAACACATCAATATTCAGAAAAGGGGAAGTGGACAACAAACTCAGAAACTGGAGCACCCCAACTTAACCCAATTGATGGACCACTGCCTGAGGACAATGAGCCGAGTGGATATGCACAAACGGACTGTGTCCTTGAAGCAATGGCTTTCCTTGAAGAGTCCCACCCAGGAATCTTTGAAAACTCGTGTCTTGAAACGATGGAAGTTGTTCAACAAACAAGAGTGGACAAATTGACCCAAGGCCGTCAAACCTATGATTGGACATTGAACAGGAATCAACCGGCTGCAACTGCATTAGCTAATACAATAGAGGTTTTCAGATCGAACGGTCTGACAGCTAATGAATCAGGAAGGCTAATAGATTTTCTCAAGGATGTAATGGAATCAATGGATAAAGATGAAATGGAAATAACAACACATTTCCAAAGAAAAAGAAGAGTGAGAGACAACATGACCAAGAAAATGGTCACACAAAGAACAATAGGAAAGAAGAAGCAGAGGTTAAACAAAAGGAGCTATCTAATAAGAGCATTGACATTAAACACAATGACAAAAGACGCCGAAAGAGGCAAATTAAAGAGAAGAGCAATTGCAACACCCGGAATGCAGATAAGAGGGTTTGTATACTTTGTTGAAACATTAGCAAGGAGCATTTGTGAGAAGCTTGAACAATCTGGACTCCCAGTTGGAGGCAATGAAAAGAAGGCTAAACTGGCAAATGTTGTGAGAAAAATGATGACTAATTCACAAGACACAGAACTCTCTTTCACGATCACTGGAGACAACACCAAATGGAATGAAAATCAGAATCCTAGGATGTTTCTGGCAATGATAACATATATAACAAGGAACCAACCTGAATGGTTTAGGAACGTCTTGAGCATTGCACCTATAATGTTCTCAAACAAAATGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGCTTCGAACACAAATACCGGCAGAAATGCTAGCAAGTATTGATCTGAAATATTTCAATGAGTCAACAAGAAAGAAGATAGAGAAGATAAGGCCTCTTCTAATAGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTAAGTACAGTTTTGGGAGTTTCGATTCTAAATCTAGGGCAAAAGAGGTACACCAAAACAACATACTGGTGGGACGGACTCCAATCTTCTGATGACTTTGCTCTCATAGTGAATGCTCCGAATCATGAG
GGAATACAGGCAGGAGTAGACAGATTCTATAGAACTTGCAAGCTGGTCGGAATCAACATGAGCAAAAAGAAGTCCTACATAAATAGAACAGGAACATTTGAATTCACAAGTTTTTTCTACCGCTATGGATTTGTAGCCAACTTCAGCATGGAATTGCCCAGCTTTGGGGTGTCTGGGATTAATGAATCTGCAGACATGAGCATTGGAGTGACAGTAATAAAGAACAACATGATAAACAATGACCTTGGACCAGCAACAGCCCAAATGGCTCTTCAGCTTTTCATCAAAGATTACAGATACACATATCGGTGTCACAGAGGAGACACACAAATCCAGACAAGAAGGTCATTCGAGCTGAGGAAGTTGTGGGAACAAACCCGCTCAAGAGCAGGACTGCTGGTCTCAGATGGAGGACCAAATCTATACAATATCCGGAATCTCCACATCCCGGAAGTCTGCTTGAAATGGGAGCTAATGGACGAAGACTATCAGGGAAGGCTTTGTAACCCCCTGAATCCGTTTGTCAGCCACAAAGAGATAGAGTCTGTAAACAATGCTGTGGTGATGCCAGCTCATGGCCCAGCCAAGAGCATGGAATATGATGCTGTTGCTACCACGCACTCCTGGATCCCTAAAAGGAACCGCTCCATCCTCAATACAAGCCAAAGGGGAATCCTTGAAGATGAACAGATGTATCAAAAATGCTGCAATCTGTTCGAGAAATTCTTCCCTAGCAGTTCATACAGGAGACCGGTTGGGATTTCCAGCATGGTGGAGGCCATGGTTTCTAGGGCCCGAATTGATGCGCGAATTGACTTCGAATCTGGACGGATTAAGAAGGAGGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAGAAGTAGTGAATTT +>KP097857.1 +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCTATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGATACACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCGATCGATGGACCATTACCTGAGGATAACGAGCCCAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAACTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAATGAATCGGGACGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACGCTGAACACAATGACCAAGGATGCAGAAAGAGGCAAACTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTTGTGAGGAAGATGATGACCAACTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACAAAATGGAATGAGAATCAAAATCCTAGGATGTTTCTGGCAATGATAACGTACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTCTAAGCATTGCCCCTATAATGTTTTCAAACAAAATGGCGAGACTAGGGAAAGGATACATGTTCGAAA
GTAAGAGCATGAAGTTACGAACACAAATACCAGCAGAAATGCTTGCAAACATTGACCTTAAATACTTCAATGAATTAACGAAAAGGAAAATTGAGAAGATAAGACCTCTATTAATAGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTCATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTAGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAATCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCAAACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTCCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATAGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACGAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAGTGTTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCTATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCCGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTGGCTTGTCCTTCGTGAAA +>KX215269.1 
+AGCGAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTGAAAATTCCAGCACAAAATGCTATAAGCATTACATTCCCTTATACTGGAGATCCTCCCTACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAATAGAACACATCAATACTCAGAGAAGGGGAGATGGACAACAAATACAGAGACTGGAGCACCTCAACTTAATCCAATTGATGGGCCACTACCTGAGGATAATGAGCCAAGTGGATATGCACAAACAGATTGTGTGTTGGAAGCGATGGCTTTCCTTGAAGAATCCCACCCAGGGATCTTTGAAAACTCATGTCTCGAAACTATGGAAATTGTTCAGCAAACAAGAGTGGACAAACTAACCCAAGGTCGCCAGACCTATGACTGGACATTGAATAGAAATCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAGGTTTTCAGATTGAACGGTCTAACAGCCAGTGAATCAGGGAGACTAATAGATTTCCTCAAGGATGTAATGGAATCAATGGATAAAGAAGAGATGGAAATAACAACACATTTCCAAAGAAAGAGAAGAATAAGGGACAACATGACCAAGAAAATGGTAACACAAAGAACAATAGGGAAGAAGAAACAAAGGTTGAACAAGAAGAGCTACTTAATAAGAGCACTGACACTAAACACAATGACAAAAGATGCAGAAAGAGGCAAATTGAAGAGGAGGGCAATTGCAACACCCGGAATGCAGATCAGAGGATTCGTGTACTTTGTCGAAACATTAGCACGGACGATCTGTGAGAAACTTGAGCAATCTGGACTTCCTGTCGGAGGGAATGAGAAGAAGGCTAAATTGGCAAATGTCGTAAGAAAGATGATGACTAACTCACAAGACACAGAGCTCTCCTTTACGATTACTGGAGACAATACTAAATGGAATGAGAATCAGAATCCCCGAATGTTTCTTGCAATGATAACATACATCACAAGAAACCAACCTGAATGGTTTAGAAATGTCTTGAGCATTGCCCCTATAATGTTCTCAAACAAAATGGCGAGATTGGGAAAAGGTTACATGTTCGAGAGTAAGAGCATGAGGCTAAGGACACAAATACCAGCAGAAATGCTTGCAAACATTGATCTAAAGTACTTCAATGAAACAACAAGAAAGAAAATCGAGAAAATAAGACCTCTCCTAATAAGTGGTACAGCCTCGCTGAGCCCGGGAATGATGATGGGCATGTTCAACATGCTGAGCACGGTCTTAGGAGTCTCAGTCCTGAATCTTGGACAGAGGAGATACACCAAAACCACATACTGGTGGGATGGGCTCCAATCCTCTGATGATTTCGCTCTAATAGTGAATGCACCGAATCATGAGGGAATACAAGCAGGAGTGGACAGATTCTATAGGACTTGCAAGCTGGTTGGAATCAATATGAGCAAAAAGAAGTCTTACATAAATCGGACAGGGACATTTGAGTTCACAAGCTTTTTCTATCGATATGGATTTGTAGCCAATTTTAGCATGGAACTGCCCAGCTTTGGAGTATCTGGGATTAACGAGTCAGCTGACATGAGCATTGGAGTTACAGTTATAAAGAATAATATGATAAATAATGATCTTGGGCCAGCAACAGCACAAATGGCTCTTCAGCTATTCATTAAGGACTACAGGTACACATATCGTTGTCACAGAGGTGACACACAAATTCAGACGAGGAGATCATTTGAGCTGAAAAAGTTATGGGAGCAGACCCGCTCCAAAGCAGGACTGTTGGTATCCGATGGAGGACCGAATCTATACAACATCCGGAACCTCCACATTCCAGAGGTCTGCTTGAAATGGGAACTAATGGATGAAGACTACCGAGGTAGGCTGTGTAATCCTCTCAATCCATTTGTTAGTCATAAGGAAATTGAGTCCGTAAATAATGCTGTGGTAATGCCGGCCCATGGTCCAGCCAAGAGCATGGAGTATGATG
CTGTTGCTACTACACATTCATGGATCCCTAAGAGGAACCGCTCCATTCTCAATACCAGCCAAAGGGGAATTCTTGAAGATGAGCAGATGTATCAGAAATGCTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCATACAGGAGACCAGTTGGAATCTCCAGCATGGTAGAGGCCATGGTATCTAGGGCCCGAATTGATGCACGAATTGACTTCGAATCTGGAAGGATTAAAAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAACTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATGAAAAAATGCCTTGTTTCTACT +>LC167772.1 +GCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTTTTGAAAGTGCCGGTGCAGAATGCTATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACAGTCAACAGAACACACCAATACTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCAATTGATGGACCATTACCTGAGGATAACGAGCCCAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTTGACAAACTGACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAATGAATCGGGACGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAGGAAATGGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAGAGAACAATCGGGAAGAGAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAGGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTATACTTCGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGGCTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAATGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGTGACAACACAAAATGGAATGAGAATCAAAATCCTAGGATGTTTCTGGCAATGATAACGTACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAAATGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAAATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAGGAAAATTGAGAGGATAAGACCCCTATTAATAGATGGTACAGCCTCATTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCGATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTTCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCAAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGAACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTAGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAATCGGCCGACATGAGCATTGGTATTACAGTGATAAAGAACAATATGATAAACAACGACCTTGGGCCAGCA
ACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTAGTGTCAGATGGAGGACCAAATCTGTACAATATCCGAAATCTCCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTTGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACTAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAGTGCTGTAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGACCGGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTCCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTGGCTTGTCCTTCGTGAAAAAATGCCTTGT +>PP854470.1 +ATGTCAACCCGACCTTACTCTTCTTGAAAGTTCCAGCGCAAAATGCCATAAGCACCACATTCCCGTATACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATATACCATGGACACAGTTAACAGAACACATCAATATTCAGAAAAAGGGAAATGGACAACAAACTCAGAAACCGGGGCACCTCAACTCAATCCAATTGATGGACCATTGCCTGATGACAATGAGCCAAGTGGATATGCACAAACGGACTGCGTCCTTGAAGCAATGGCTTTCCTTGAAGAATCCCATCCAGGAATCTTTGAAAACTCGTGTCTTGAAACGATGGAAGTTGTTCAACAAACAAGAGTGGACAAGTTGACCCAAGGCCGTCAGACTTATGATTGGACATTAAACAGAAATCAGCCGGCTGCAACTGCATTAGCTAATACTATAGAGGTCTTCAGATCGAACGGTCTTACAGCTAATGAATCAGGAAGGCTAATAGATTTTCTCAAGGATGTGGTGGAATCAATGGATAAAGAGGAAATAGAAATAACAACGCATTTCCAAAGGAAAAGAAGAGTGAGAGACAACATGACCAAGAAAATGGTCACACAACGGACGATAGGAAAGAAGAAACAAAGGTTAAACAAAAGGAGCTATCTGATAAGAGCATTGACATTGAACACAATGACAAAAGACGCCGAAAGAGGCAAATTAAAGAGAAGGGCAATTGCAACACCCGGAATGCAAATCAGAGGGTTTGTGTACTTTGTTGAAACATTAGCAAGGAGCATTTGTGAGAAACTTGAACAATCTGGACTCCCAGTTGGAGGCAATGAAAAGAAGGCCAAACTAGCAAATGTTGTGAGAAAGATGATGACTAATTCGCAAGACACAGAGCTCTCTTTCACAATCACGGGAGACAACACTAAATGGAATGAGAATCAGAATCCTAGGATGTTTCTGGCAATGATAACATATATAACAAGGAACCAACCTGAATGGTTCAGGAATGTATTGAGCATTGCACCTATAATGTTCTCAAACAAAATGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGCTTCGAACACAGATACCGGCAGAAATGCTAGCGAGCATTGATCTGAAATACTTCAATGAGTTAACCAGGAAGAAAATAGAGAAGATAAGACCTCTTCTAATAGATGGTACGGCCTCATTAAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTTCTGGGAGTTTCGATTCTAAATCTAGGGCAAAAGAAGTACACCAAAACAACA
TACTGGTGGGATGGGCTGCAATCTTCTGATGACTTTGCTCTCATCGTGAATGCTCCAAATCATGAGGGAATACAAGCAGGAGTAGACAGATTCTATAGAACCTGCAAGCTGGTAGGAATCAATATGAGCAAAAAGAAGTCATACATAAACAGGACAGGAACATTTGAATTCACAAGTTTTTTCTATCGCTATGGATTTGTAGCCAATTTCAGCATGGAGTTGCCCAGCTTTGGAGTTTCTGGGATCAATGAATCTGCAGACATGAGCATTGGAGTAACAGTGATAAAGAACAACATGATCAACAATGATCTTGGACCAGCAACAGCCCAAATGGCTCTACAGCTATTCATCAAGGATTACAGATACACATATCGATGTCACAGAGGAGACACACAAATTCAAACAAGGAGGTCATTCGAGCTGAAAAAGTTATGGGAACAAACCCGCTCAAAACCAGGACTGCTGGTCTCAGATGGAGGGCCAAATCTATACAATATCCGAAATCTCCACATTCCGGAAGTCTGCTTAAAATGGGAGCTAATGGACGAAGACTATCAGGGAAGGCTTTGTAATCCCCTGAATCCGTTTGTAAGCCACAAAGAAATAGAGTCTGTGAACAATGCTGTGGTGATGCCAGCTCATGGCCCAGCTAAGAGTATGGAATATGATGCTGTTGCCACCACTCACTCCTGGATCCCCAAGAGGAACCGCTCTATTCTTAATACAAGCCAAAGGGGAATCCTTGAAGACGAACAGATGTATCAAAAGTGCTGCAATCTATTTGAAAAATTCTTCCCTAGCAGTTCATACAGGAGGCCGGTTGGAATTTCCAGCATGGTGGAGGCCATGGTTTCTAGGGCCCGAATTGATGCACGAATTGACTTCGAATCTGGACGGATTAAGAAGGAGGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAGAAATAGTGAATTTAGCTTGTCCTTCATGAAAAAATGCCTTGTTTCTACT +>PP390164.1 
+CAGACCTATGATTGGACGTTAAACAGGAATCAGCCGGCTGCAACTGCATTAGCTAATACTATAGAGGTCTTCAGATCTAACGGTCTCACAGCCAATGAATCAGGAAGGCTAATAGATTTTCTCAAGGATGTGATGGAATCAATGGATAAGGAGGAAATGGAAATAACAACGCATTTCCAAAGGAAAAGAAGAGTGAGAGACAACATGACCAAGAAAATGGTCACACAAAGGACAATAGGAAAGAAGAAACAGAGGCTAAATAAAAAGAGCTATCTGATAAGAGCATTGACACTGAACACGATGACAAAAGACGCCGAAAGAGGCAAATTAAAAAGAAGGGCAATTGCGACACCTGGAATGCAAATCAGAGGGTTTGTGTACTTTGTTGAAACATTAGCGAGGAGCATTTGTGATAAGCTTGAACAATCTGGACTCCCAGTTGGGGGCAATGAAAAGAAGGCTAAACTGGCAAATGTTGTGAGAAAAATGATGACTAATTCGCAGGACACAGAGCTCTCTTTCACAATCACTGGAGACAACACCAAATGGAATGAAAATCAGAACCCTAGGATGTTTCTGGCAATGATAACATATATAACAAGGAACCAACCTGAATGGTTCAGGAATGTCTTAAGCATTGCACCTATAATGTTCTCAAATAAAATGGCAAGACTAGGGAAAGGGTACATGTTCGAAAGTAAGAGCATGAAGCTCCGAACACAAATACCAGCAGAAATGCTAGCAAGCATTGATATGAAGTACTTCAATGAGTCAACAAGGAAGAAAATAGAGAAGATAAGATCTCTTCTAATAGATGATACAGCCTCATTAAGCCCAGGAATGATGATGGGCATGTTCAATATGCTGAGTACAGTTTTGGGAGTTTCGATTCTAAATCTGGGACAAAGGAGGTACACCAAAACAACATACTGGTGGGACGGACTCCAATCCTCTGATGACTTTGCTCTCATAGTGAATGCTCCGAATCATGAGGGAATACAAGCAGGGGTAGACAGATTCTATAGAACCTGCAAGCTGGTCGGAATCAACATGAGCAAAAAGAAGTCCTACATAAACAGAACAGGAACATTTGAATTCACAAGTTTTTTCTACCGCTATGGATTTGTAGCCAATTTCAGTATGGAGTTGCCCAGCTTTGGAGTGTCTGGGATCAATGAATCTGCAGACATGAGCATTGGAGTAACAGTGATAAAGAACAACATGATCAACAATGATCTTGGACCAGCAACAGCTCAAATGGCTCTTCAGCTATTCATCAAGGATTACAGATACACATACCGATGTCACAGAGGAGACACACAAATTCAGACAAGGAGGTCGTTCGAGCTGAAGAAATTGTGGGAACAGACCCGCTCAAAAGCAGGGCTGCTGGTCTCAGATGGAGGACCAAATCTATACAATATTCGGAATCTTCACATTCCAGAAGTCTGC +>MN209244.1 
+ATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCGGCGCAGAATGCTATAAGCACTACATTCCCTTACACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAACAGAACACATCAATACTCAGAAAAGGGAAAATGGACAACAAACACAGAAACCGGAGCACCCCAACTCAATCCAATTGATGGACCATTGCCAGAGGACAACGAGCCAAGCGGATATGCACAAACGGATTGTGTGTTGGAAGCAATGGCTTTCCTTGAGGAATCCCATCCAGGGATCTTTGAAAACTCTTGTCTTGAAACGATGGAAATCGTTCAGCAAACAAGAGTGGACAAACTAACCCAAGGTCGCCAGACTTATGACTGGACACTGAACAGAAACCAACCAGCTGCAACTGCTTTGGCAAACACTATAGAGGTGTTCAGATCGAACGGTCTGACAGCCAATGAGTCGGGGAGACTAATAGATTTCCTCAAAGATGTAATGGAATCAATGGATAAAGAAGAAATGGAAATAACAACACATTTCCAAAGAAAGAGAAGAGTGAAGGACAACATGACCAAGAAGATGGTCACACAAAGAACAATAGGAAAGAAGAAACAGAGGCTGAATAAAAGGAGTTACTTAATAAGAGCACTGACATTGAACACAATGACCAAAGATGCAGAAAGAGGTAAATTGAAGAGACGGGCAATTGCAACACCCGGGATGCAGATTAGAGGATTCGTATACTTTGTCGAAACACTAGCGAGGAGCATCTGTGAGAAACTCGAGCAATCTGGACTGCCTGTTGGAGGGAATGAGAAGAAGGCTAAATTGGCAAATGTCGTGAGGAAAATGATGACTAACTCACAAGATACAGAGCTTTCCTTTACAATTACTGGAGACAACACCAAATGGAATGAGAATCAAAATCCTCGAATGTTTTTGGCAATGATAACATACATCACAAGAAAACAACCTAAATGGTTCAGAAATGTTTTGAGCATTGCCCCTATAATGTTCTCAAACAAAATGGCGAGATTGGGGAAAGGATACATGTTTGAAAGTAAGAGCATGAAACTAAGGACACAAATACCGGCAGAGATGCTTGCAAACATTGATTTGAAGTATTTCAACGAATCAACGAGGAAGAAAATCGAGAAAATAAGACCTCTGCTGATTGATGGCACAGCCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAATATGCTGAGCACAGTATTAGGGGTCTCAATCCTGAATCTTGGGCAAAAGAGGTACACCAAAACCATATACTGGTGGGATGGACTCCAATCTTCTGATGATTTCGCTCTCATAGTGAATGCACCAAGCCATGAGGGGATACAAGCAGGAGTTGATAGGTTTTATAGGACCTGCAAATTGGTTGGGATCAACATGAGCAAAAAGAAGTCTTACATAAACCGAACAGGAACATTTGAGTTTACAAGCTTCTTCTACCGCTATGGATTTGTAGCTAACTTCAGTATGGAGTTGCCCAGTTTTGGAGTGTCTGGAATCAATGAATCGGCTGACATGAGCATTGGAGTCACAGTGATAAAGAACAATATGATAAACAATGACCTTGGACCAGCAACAGCTCAAATGGCTCTCCAGCTATTCATCAAGGACTATAGGTACACGTACCGATGCCACAGGGGTGATACTCAAATTCAAACGAGGAGATCATTTGAACTGAAGAAGCTGTGGGAGCAGACCCGCTCAAAGGCAGGGCTATTGGTATCAGATGGAGGACCAAACCTATACAACATTCGAAATCTCCACATCCCAGAGGTCTGCTTAAAGTGGGAACTGATGGATGAAGACTACCAAGGCAGGCTGTGTAATCCTCTGAATCCGTTTGTCAGCCATAAGGAAATCGAGTCCGTGAACAATGCTGTGGTAATGCCAGCCCATGGTCCAGCCAAGAGCATGGAGTATGATGCTGTAGCGACTACACACTCGTGGA
TTCCTAAAAGGAACCGTTCCATTCTCAATACAAGCCAGAGGGGAATTCTTGAAGATGAGCAAATGTACCAGAAGTGCTGTAGTCTATTTGAGAAATTCTTCCCCAGCAGTTCATACAAGAGGCCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATTGATGCACGCATTGATTTCGAATCTGGAAGGATTAATAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAGTAGTGAATTTAGCTTGTC +>KR010409.1 +ATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCAGCGCAAAATGCTATAAGTACTACATTCCCTTACACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACCGTCAACAGAACACATCAATACTCAGAAAAGGGAAAATGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCAATTGATGGACCATTACCAGAGGACAATGAGCCAAGCGGATATGCACAAACGGATTGCGTGTTGGAAGCAATGGCTTTCCTTGAGGAATCCCACCCAGGGATCTTTGAAAACTCTTGTCTTGAAACGATGGAAGTCGTTCAGCAAACAAGAGTGGACAAACTAACCCAAGGTCGCCAGACTTATGACTGGACACTGAACAGAAACCAACCAGCTGCAACTGCTTTGGCCAACACTATAGAGGTGTTCAGATCGAACGGTCTGACAGCCAATGAATCGGGGAGACTAATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAAGAAGAAATGGAAATAACAACACATTTCCAGAGAAAGAGAAGAGTGAGGGACAACATGACCAAGAAGATGGTCACACAAAGAACAATAGGAAAGAAGAAGCAGAGGCTGAATAAAAAGAGTTACTTAATAAGAGCACTGACATTGAACACAATGACCAAAGATGCAGAAAGAGGTAAATTGAAGAGACGAGCAATTGCAACACCCGGGATGCAAATTAGAGGATTCGTGTACTTTGTCGAAACACTAGCGAGGAGCATCTGTGAGAAACTCGAGCAATCTGGACTCCCTGTTGGAGGGAATGAGAAGAAGGCTAAATTGGCAAATGTCGTGAGGAAAATGATGACTAACTCACAAGATACAGAGCTTTCCTTTACAATTACTGGAGACAACACCAAATGGAATGAGAATCAAAATCCTCGGATGTTTTTGGCAATGATAACATACATCACAAGAAACCAACCTGAATGGTTCAGAAATGTTTTGAGCATTGCCCCTATAATGTTCTCAAACAAAATGGCGAGATTGGGGAAAGGATACATGTTTGAAAGTAAGAGCATGAAACTAAGGACACAAATACCGGCAGAGATGCTTGCAAACATTGATCTGAAATATTTCAACGAATCAACGAGAAAGAAAATCGAGAAAATAAGACCTCTGCTGATTGATGGCACAGCCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAATATGCTGAGCACAGTATTAGGGGTCTCAATCCTGAATCTTGGGCAAAAGAGGTACACCAAAACCACATACTGGTGGGATGGACTCCAATCCTCTGATGATTTCGCTCTCATAGTGAATGCACCGAATCATGAGGGGATACAAGCAGGGGTTGATAGGTTCTATAGGACCTGCAAATTGGTTGGGATCAACATGAGCAAAAAGAAGTCTTACATAAACCGAACAGGAACATTTGAGTTTACAAGCTTTTTCTACCGCTATGGATTTGTAGCTAACTTCAGTATGGAGTTACCCAGTTTTGGAGTGTCTGGAATCAATGAATCGGCTGACATGAGCATTGGAGTTACAGTGATAAAGAACAATATGATAAACAATGACCTTGGACCAGCAACAGCTCAAATGGCTCTTCAGCTATTCATCAAGGACTATAGGTACACGTACCGATGCCACAGGGGTGAT
ACACAAATTCAAACGAGGAGATCATTCGAGCTGAAGAAGCTGTGGGAGCAGACCCGTTCAAAGGCAGGGCTGTTGGTATCAGATGGAGGACCAAACCTATACAACATTCGAAATCTCCACATCCCAGAGGTCTGCTTAAAGTGGGAACTGATGGATGAAGACTACCAAGGCAGGCTGTGTAATCCTCTGAATCCGTTTGTCAGCCATAAGGAAATTGAGTCCGTGAACAATGCTGTGGTAATGCCAGCCCATGGCCCAGCCAAGAGCATGGAGTATGATGCTGTTGCGACTACACACTCATGGATTCCTAAGAGGAACCGTTCCATTCTCAATACCAGCCAAAGGGGAATTCTTGAAGATGAGCAAATGTACCAGAAGTGCTGTAGTCTATTTGAGAAATTCTTCCCCAGCAGTTCATACAGGAGGCCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATTGATGCACGCATTGATTTCGAATCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAG +>MF112364.1 +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCCATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACCGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACGGAGACCGGAGCACCCCAACTCAACCCAATTGATGGACCATTACCAGAGGACAACGAGCCAAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAATTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAGTGAATCGGGAAGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATAGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGAAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAAGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGAAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACGAAATGGAATGAGAATCAAAATCCTAGAGTGTTTCTGGCAATGATAACATACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAATTGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAGATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAGGAAAATTGAAAAGATAAGACCCCTTTTAATAGATGGTACAGCCTCCTTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTT
TTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTGGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAGTCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTTCATATTCCTGAGGTCTGCTTGAAATGGGAACTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACAAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAATGCTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTTAGACGGCAAAAATAG +>MF112405.1 +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCCATAAGCACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAGCTCAACCCAATTGATGGACCATTACCGGAGGACAACGAGCCAAGTGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAATTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAGTGAATCGGGAAGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATAGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAGGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACGAAATGGAATGAGAATCAAAATCCTAGAGTGTTTCTGGCAATGATAACATACATCACAAGGAACCAGCCTGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAATTGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAGATACCAG
CAGAAATGCTTGCAAACATTGATCTCAAATACTTCAATGAATCAACGAAAAGGAAAATTGAGAAGATAAGACCCCTTTTAATAGATGGTACAGCCTCCTTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGTTTTTTCTACCGCTATGGATTCGTGGCCAATTTCAGTATGGAGCTACCCAGTTTTGGAGTGTCTGGAATTAATGAGTCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATTTATACAATATCCGAAACCTTCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGGAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACAAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAGTGCTGCAATCTATTCGAGAAATTCTTCCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATAAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAG +>MF112390.1 
+ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCCATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACCGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCAATTGATGGACCATTACCAGAGGACAACGAGCCAAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAATTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAGTGAATCGGGAAGGCTGATAGATTTCCTCAAGGATGTGATGGAATCGATGGATAAGGAAGAAATAGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGAAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAAGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAGACACTAGCGAGAAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACGAAATGGAATGAGAATCAAAATCCTAGAGTGTTTCTGGCAATGATAACATACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAATTGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAGATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAGGAAAATTGAAAAGATAAGACCCCTTTTAATAGATGGTACAGCCTCCTTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTGGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAGTCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTTCATATTCCTGAGGTCTGCTTGAAATGGGAACTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGA
TTCCTAAAAGGAATCGTTCCATTCTCAACACAAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAATGCTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAG +>MF112389.1 +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCCATAAGTACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACCGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCAATTGATGGACCATTACCAGAGGACAACGAGCCAAGTGGGTATGCACAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAATTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAGTGAATCGGGAAGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATAGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGAAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAAGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGAAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACGAAATGGAATGAGAATCAAAATCCTAGAGTGTTTCTGGCAATGATAACATACATCACAAGGAACCAGCCAGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAATTGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAGATACCAGCAGAAATGCTTGCAAACATTGATCTTAAATACTTCAATGAATTAACGAAAAGGAAAATTGAAAAGATAAGACCCCTTTTAATAGATGGTACAGCCTCCTTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAATCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGAGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGGGATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGCTTTTTCTACCGCTATGGATTCGTGGCCAATTTCAGTATGGAGCTGCCCAGTTTTGGAGTGTCTGGAATTAATGAGTCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACG
AGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATCTATACAATATCCGAAATCTTCATATTCCTGAGGTCTGCTTGAAATGGGAACTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACAAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAATGCTGCAATCTATTCGAGAAATTCTTTCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAG +>MF112409.1 +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCCATAAGCACCACATTCCCTTATACTGGAGACCCTCCATACAGCCATGGAACAGGGACAGGGTACACCATGGACACAGTCAACAGAACACACCAATATTCAGAAAAGGGGGAGTGGACAACAAACATAGAGACCGGAGCACCCCAGCTCAACCCAATTGATGGACCATTACCGGAGGACAACGAGCCAAGTGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAATTGTCCAACAAACAAGAGTGGACAAATTAACCCAAGGTCGCCAGACTTATGACTGGACATTGAATAGAAACCAACCGGCTGCAACTGCTTTGGCCAACACTATAGAAATTTTCAGATCAAACGGTCTGACAGCAAGTGAATCGGGAAGGCTGATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAGGAAGAAATAGAGATAACAACACATTTCCAGAGAAAGAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTAACGCAAAGAACAATCGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTGATAAGAGCGCTGACACTGAACACAATGACCAAGGATGCAGAAAGGGGCAAATTGAAGAGGCGAGCAATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGTACTTCGTTGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCAGTCGGAGGGAATGAGAAGAAAGCTAAACTGGCAAACGTCGTGAGGAAGATGATGACCAATTCACAGGATACTGAACTCTCCTTTACAATTACTGGGGACAACACGAAATGGAATGAGAATCAAAATCCTAGAGTGTTTCTGGCAATGATAACATACATCACAAGGAACCAGCCTGAATGGTTTCGAAATGTTTTAAGCATTGCCCCTATAATGTTTTCAAACAAATTGGCAAGACTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGTTACGAACACAGATACCAGCAGAAATGCTTGCAAACATTGATCTCAAATACTTCAATGAATCAACGAAAAGGAAAATTGAGAAGATAAGACCCCTTTTGATAGATGGTACAGCCTCCTTGAGCCCTGGAATGATGATGGGCATGTTCAACATGCTGAGTACAGTCCTAGGAGTTTCAATCCTGAACCTTGGACAGAAAAGGTACACCAAAACCACATATTGGTGGGACGGGCTCCAATCCTCTGATGATTTCGCTCTTATTGTAAATGCCCCGAATCATGAAGGAATACAAGCAGGGGTAGATAGGTTTTATAGGACTTGTAAACTAGTTGG
GATAAATATGAGCAAGAAGAAGTCTTACATAAATCGGACAGGGACATTTGAATTCACGAGTTTTTTCTACCGCTATGGATTCGTGGCCAATTTCAGTATGGAGCTACCCAGTTTTGGAGTGTCTGGAATTAATGAGTCGGCCGACATGAGCATTGGTGTTACAGTGATAAAAAACAATATGATAAACAACGACCTTGGGCCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATCAAGGACTACAGATACACATACCGATGCCACAGAGGAGACACGCAAATCCACACGAGGAGATCATTCGAGCTGAAGAAGCTATGGGAACAAACCCGTTCAAAGGCAGGACTATTGGTTTCAGATGGAGGACCAAATTTATACAATATCCGAAACCTTCATATTCCTGAGGTCTGCTTGAAATGGGAATTGATGGATGAAGACTACCAGGGTAGACTGTGCAATCCTCTGAATCCATTCGTCAGCCATAGGGAAATTGAATCTGTCAACAATGCTATGGTAATGCCAGCTCATGGTCCGGCCAAGAGTATGGAATATGATGCCGTTGCAACCACACATTCTTGGATTCCTAAAAGGAATCGTTCCATTCTCAACACAAGTCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAAAAGTGCTGCAATCTATTCGAGAAATTCTTCCCCAGTAGTTCGTATCGGAGACCAGTTGGAATTTCCAGTATGGTGGAGGCCATGGTGTCTCGGGCCCGAATTGACGCACGAATTGATTTCGAGTCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATAAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAG diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/PB1/genome_annotation.gff3 new file mode 100644 index 000000000..c220b4ed9 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/genome_annotation.gff3 @@ -0,0 +1 @@ +. . CDS 25 2298 . + . 
gene="PB1" diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/PB1/pathogen.json new file mode 100644 index 000000000..1df395aa8 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 2/PB1)", + "reference name": "Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PB1) and PB1-F2 protein (PB1-F2) genes, complete cds", + "reference accession": "NC_007358.1" + }, + "files": { + "reference": "reference.fasta", + "pathogenJson": "pathogen.json", + "changelog": "CHANGELOG.md", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB1/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PB1/reference.fasta new file mode 100644 index 000000000..8053671a4 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB1/reference.fasta @@ -0,0 +1,35 @@ +>NC_007358.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PB1) and PB1-F2 protein (PB1-F2) genes, complete cds +AGCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCAGCGCAAA +ATGCTATAAGTACCACATTCCCTTATACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACAC +CATGGACACAGTCAACAGAACACATCAATATTCAGAAAAGGGGAAATGGACAACGAACACAGAGACTGGA +GCACCCCAACTCAATCCGATTGATGGACCACTACCTGAGGATAATGAGCCGAGTGGGTATGCACAAACAG +ATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCACCCAGGGATCTTTGAAAACTCGTGTCTTGA +AACGATGGAAGTTGTTCAGCAAACAAGAGTGGATAAGCTGACCCAAGGTCGCCAAACCTATGACTGGACA +TTGAAAAGAAACCAGCCGGCTGCAACCGCTTTGGCCAACACTATAGAGGTCTTCAGATCGAATGGTCTAA +CAGCCAATGAATCGGGAAGGCTAATAGATTTCCTCAAAGACGTGATGGAATCAATGGATAAGGGAGAAAT +GGAAATAATAACACATTTCCAGAGAAAGAGAAGAGTGAGGGACAACATGACCAAGAAAATGGTCACACAA +AGAACAATAGGGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTAATAAGAGCACTGACACTGAACA 
+CAATGACAAAAGACGCAGAAAGAGGCAAATTGAAGAGGCGGGCAATTGCAACACCCGGGATGCAAATCAG +AGGATTCGTGTACTTTGTCGAAACACTAGCGAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCC +GTCGGAGGGAATGAAAAGAAGGCTAAATTGGCAAATGTCGTGAGGAAGATGATGACTAACTCACAAGATA +CAGAGCTCTCTTTTACAATTACTGGAGACAACACCAAATGGAATGAGAATCAGAACCCTCGGATGTTTCT +AGCAATGATAACATACATCACAAGGAACCAACCTGAATGGTTTAGAAATGTCTTAAGCATTGCTCCTATA +ATGTTCTCAAACAAGATGGCAAGATTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGCTACGGA +CACAAATACCAGCAGAAATGCTTGCAAGCATTGACTTGAAATACTTCAACGAATCAACGAGAAAGAAAAT +CGAGAAAATAAGACCTCTACTAATAGATGGCACAGCCTCATTGAGTCCTGGAATGATGATGGGCATGTTC +AATATGCTGAGTACAGTCTTAGGAGTTTCAATCCTGAATCTTGGGCAGAAGAGGTACACCAAAACCACAT +ACTGGTGGGACGGACTCCAATCCTCTGATGATTTCGCTCTCATAGTGAATGCACCAAATCATGAGGGAAT +AGAAGCAGGGGTGGATAGGTTCTATAGGACTTGCAAACTAGTTGGAATCAATATGACCAAGAAGAAGTCT +TACATAAATCGGACAGGAACATGTGAATTCACAAGCTTCTTCTACCGCTATGGGTTCGTAGCCAACTTCA +GTATGGAGCTGCCCAGCTTTGGAGTGTCTGGGATTAATGAATCGGCTGACATGAGCATTGGTGTTACAGT +GATAAAGAACAATATGATGGACAACGACCTTGGACCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATT +AAGGACTACAGATACCCATACCGATGCCACAGGGGGGATACACAAATCCAAACGAGGAGATCATTCGAGC +TGAAGAAGCTGTGGGAGCAGACCCGCTCAAAGGCAGGACTGTTGGTTTCAGATGGAGGACCAAACCCATA +CAATATCCGGAATCTCCACATTCCGGAGGCTGGCTTGAAGTGGGAATTGATGGATGAAGACTACCAGGGC +AGACTGTGTAATCCTCTGAACCCGTTTGTTAGTCATAAGGAAATTGAGTCTGTCAACAATGCTGTGGTAA +TGCCAGCTCATGGCCCAGCCAAGAGCATGGAATATGATGCAGTTGCGACTACACATTCATGGATTCCCAA +GAGGAATCGTTCCATTCTCAACACCAGCCAAAGGGGGATTCTTGAGGATGAACAGATGTATCAGAAGTGC +TGCAATCTATTCGAGAAATTCTTCCCTAGCAGTTCATATCGGAGGCCAGTTGGAATTTCCAGCATGGTGG +AGGCCATGGTGTCTAGGGCCCGAATTGATGCACGAATTGACTTCGAGTCTGGAAGGATTAAGAAAGAAGA +GTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCGGACGGCAAAAATAGTGAATTTAGCTT +GTCCTTCATGAAAAAATGCCTTGTTTCTACT diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/CHANGELOG.md b/data/community/genspectrum/iav/h5n1/GG1996/PB2/CHANGELOG.md new file mode 100644 index 000000000..81199b7df --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/CHANGELOG.md @@ -0,0 +1,3 @@ +## Unreleased + +Initial 
release diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/README.md b/data/community/genspectrum/iav/h5n1/GG1996/PB2/README.md new file mode 100644 index 000000000..4cb925408 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/README.md @@ -0,0 +1,26 @@ +# H5N1 (segment1/ PB2) - dataset with A/Goose/Guangdong/1/96 reference + +| attribute | value | +| ------------------- | ----------------------------------------- | +| dataset name | community/genspectrum/iav/h5n1/GG1996/PB2 | +| reference strain | A/Goose/Guangdong/1/96(H5N1) | +| reference accession | NC_007357.1 | +| assembly accession | GCF_000864105.1 | + +## Authors and contacts + +Maintained by Genspectrum, Chaoran Chen and Anna Parker + +With the help of: Cornelius Roemer and Richard Neher + +## Scope of this dataset + +This dataset uses the first highly-pathogenic avian influenza (HPAI) isolate (A/Goose/Guangdong/1/96) as a reference and is suitable for the analysis of circulating and historical H5 sequences, including low-pathogenicity avian influenza (LPAI) isolates. + +## Features + +This simple dataset only supports alignment. 
+ +## What is Nextclade dataset + +Read more about Nextclade datasets in Nextclade documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/examples.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PB2/examples.fasta new file mode 100644 index 000000000..d2cb03a43 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/examples.fasta @@ -0,0 +1,38 @@ +>FJ868022.1 +TAGCAAAAGCAGGTCAATTATATTCAATATGGAGAGAATAAAAGAATTACGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTCTCAGGATGAAATGGATGATGGCAATGAAATATCCAATCACAGCGGACAAGAGAATAATAGAGATGATTCCTGAAAGGAATGAAAAAGGGCAGACGCTCTGGAGCAAAACAAGTGATGCTGGATCGGACAGGGTGATGGTGTCTCCCCTAGCTGTGACTTGGTGGAATAGAAATGGGCCGGCGACAAGTGCAGTTCATTATCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGTCCCGTTCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATATAAATCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGACATCAGAGTCGCAATTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAGAGGGAACTGGTCCGCAAAACCAGATTCCTACCGGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGGACCTGCTGGGAACAGATGTACACTCCAGGCGGAGAAGTGAGAAATGACGATGTCGACCAGAGTTTGGTCATCGCTGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAAGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATCAGTTCTTCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAGTGGATCGTCCGTCAAAAAGGAAGAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAGGAATTCACAATGGTTGGGCGGAGGGCAACAGCTATCCTGAGGAAAGCAACCAGAAGACTGATTCAGTTGATAGTAAGTGGAAGAGACGAACAATCAATCACTGAGGCAATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAGGCAGTCCGAGGTGATCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCTTGAGACATTTTCAAAAGGATGCAAGAGTGCTATTTCAGAATTGGGGAATTGAACCCATTGATAATGTCATGGGGATGATCGGAATATTACCTGACATGACTCCCAGCACAGAAATGTCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTGGATGAATATTCTAGCACTGAGAGAGTAGTTGTAAGTATTGACC
GTTTCTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCACCCGAAGAGGTCAGCGAAACCCAGGGAACAGAGAAATTGACAATAACATATTCATCATCAATGATGTGGGAAATCAACGGTCCTGAATCAGTGCTTGTTAACACTTATCAGTGGATCATCAGAAACTGGGAGACTGTGAAGATTCAATGGTCTCAAGACCCCACGATGCTGTACAATAAGATGGAGTTTGAACCGTTCCAATCCTTGGTACCCAAGGCTGCCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGTCCAGGTAATAAAGCTGCTACCATTTGCAGCAGCCCCACCGGAGCAGAGCAAGATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGATCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTGTTCAACTATAATAAGGCAACCAAAAGGCTTACTGTTCTTGGAAAGGACGCAGGTGCCTTAACAGAGGATCCAGATGAAGGAACAGCCGGAGTGGAATCTGCAGTACTGAGGGGATTCTTAATTCTAGGCCAGGAGGACAAAAGGTATGGACCAGCATTAAGCATCAATGAACTGAGCAATCTTGCGAAGGGGGAGAAAGCTAACGTGCTGATAGGGCAAGGAGACGTGGTGTTAGTAATGAAACGAAAACGGGACTCTAGCATACTTACTGATAGCCAGACAGCGACCAAAAGGATTCGGATGGCCGTCAATTAG +>CY146689.1 +ATGGAGCGAATAAAAGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAATCCTGCGCTCAGAATGAAATGGATGATGGCAATGAAATATCCGATCACAGCGGACAAGAGAATAATAGACATGATTCCTGAAAGGAATGAACAAGGGCAGACGCTCTGGAGCAAGACAAATGATGCTGGGTCGGACAGGGTAATGGTGTCCCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAGTACAGTTCATTATCCAAAAGTTTACAAAACATACTTCGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGTCCCGTTCATTTCAGAAACCAAGTTAAAATACGCCGCCGGGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAAGTTGTTTTCCCAAATGAAGTGGGAGCTAGAATACTGACTTCAGAGTCGCAGTTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTACTCCCTTAATGGTTGCATACATGTTGGAGAGGGAACTGGTCCGAAAAACCAGATTCCTACCGGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTACTGCATTTGACTCAAGGAACCTGCTGGGAACAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCTGCCAGAAGCATTGTTAGGAGAGCAACGGTATCAGCGGATCCATTGGCATCACTACTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGACAGAATCCAACTGAGGAGCAAGCAGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGTCACGAAGGAAGAAGAAGTGCTTACGGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCTTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGCGGACGAAATGAACAATCAATCGCTGAGGCAATTATTGTAGCG
ATGGTGTTCTCACAGGAGGATTGCATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAGGTGCTATTTCAGAATTGGGGAATTGAACCCATTGATAATGTCATGGGGATGATCGGGATATTACCTGACATGACTCCCAGCACCGAACTGTCGTTGAGAGGAGTAAGAGTTAGTAAAATGGGGGTAGATGAATACTCCAGCACTGAAAGAGTAGTTGTAAGCATTGACCGCTTCTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGTGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAGATCAACGGTCCTGAGTCAGTGCTTGTCAACACCTATCAATGGATCATCAAAAACTGGGAAACCGTGAAGATTCAATGGTCTCAGGACCCCACGATGCTGTACAATAAGATGGAGTTCGAACCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGGTTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGAACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCTCCACCTGAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTTTTCAACTACAATAAGGCAACCAAAAGGCTTACCGTTCTTGGAAAGGATGCAGGTGCACTAACAGAGGATCCAAACGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGATTCCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGACAGGGAGATGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>CY047466.1 
+ATGGAGAGAATAAAGGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAGACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTCTCAGAATGAAATGGATAATGGCAATGAAATATCCAATCACAGCGGACAAGAGAATAATGGAGATGATTCCTGAAAGGAATGAACAAGGACAGACACTCTGGAGCAAGACAAATGATGCTGGATCGGACAGGGTGATGGTGTCTCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAGTACAGTTCATTATCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAGACATGGAACCTTCGGTCCCGTTCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAATCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGACTTCAGAGTCACAATTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCAGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGAACCTGCTGGGAACAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCCGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATTAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAGTGGATCATCCATCACGAAGGAAGAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAATAAGAGTACATGAAGGGTATGAGGAATTCACAATGGTTGGACAGAGGGCAACAGCTATCCTGAGGAAAGCAACTCGAAGGCTGATTCAGTTGATAGTGAGTGGAAGAAACGAACAATCAATCGCTGAGGCAATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAAGCAGTCCGAGGCGATCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCCTGAGACACTTTCAAAAGGACGCAAAAGTGCTATTTCAGAATTGGGGAACTGAACCCATTGATAATGTCATGGGGATGATCGGAATATTACCTGACATGACTCCCAGCACAGAAATGTCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTAGATGAGTATTCCAGCACTGAGAGAGTAGTTGTAAGCATTGACCGCTTCTTAAGGGTTCGAGACCAGCGGGGGAACGTACTCTTATCTCCCGAAGAGGTCAGCGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCATCATCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTACCAATGGATCATCAGAAACTGGGAGACCGTGAAAATTCAGTGGTCTCAGGACCCCACGATGTTGTACAATAAAATGGAGTTTGAACCGTTCCAATCCTTGGTACCTAAAGCTGCCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCCCCACCGAAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCATAAGGGGCAATTCCCCTGTATTCAACTACAATAAGGCAACCAAAAGACTTACCG
TTCTTGGAAAAGACGCAGGTGCATTAACAGAGGATCCAGATGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGGTTCCTAATTTTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>FM177116.1 +ATGGAGAGAATAAAGGAATTAAGAGATCTAATGTCCCAGTCCCGCACTCGCGAGATACTAACAAAGACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTCTCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCGGACAAGAGAATAATAGAGATGATTCCTGAAAGGAATGAACAAGGACAGACACTCTGGAGCAAGACAAATGATGCTGGATCGGACAGGGTGATGGTGTCTCCCCTAGCTGTAACCTGGTGGAATAGGAATGGGCCGACGACAAGTACAGTTCATTATCCAAAAGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGTCCCGTTCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAATCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGACTTCAGAGTCACAATTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCAGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGAACCTGCTGGGAACAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCTGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATTAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAGTGGATCATCCGTCACGAAGGAGGAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAGTAAGAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCCTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGTGGAAGAGACGAACAATCAATCGCTGAGGCAATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAAGCAGTCCGAGGCGATCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAAGTGCTATTTCAGAAGTGGGGAACTGAGCCCATTGATAATGTCATGGGGATGATCGGAATATTACCTGACATGACTCCCAGCACAGAAACATCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTAGATGAGTATTCCAGCACTGAGAGAGTAGTTGTAAGCATTGACCGTTTCTTACGGGTTCGAGACCAGCGGGGGAACGTACTCTTATCTCCCGAAGAGGTCAGCGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCATCATCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTACCAATGGATCATCAGAAACTGGGAAACCGTGAAAATTCAGTGGTCTCAGGACCCC
ACGATGTTGTACAATAAGATGGAGTTTGAACCGTTCCAATCCTTGGTACCTAAAGCTGCCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCCCCACCGAAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCATAAGGGGCAATTCTCCTGTGTTCAACTACAATAAGGCAACCAAAAGACTTACTGTTCTTGGAAAGGACGCAGGTGCATTGACAGAGGATCCAGATGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGGTTCCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>AB827988.1 +AAATATATTCAATATGGAGAGAATAAAAGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGATCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAAAAGAACCCTGCTATCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAGAGAATAATGGAGATGATTCCTGAAAGGAATGAACAAGGGCAGACGCTTTGGAGCAAGACAAATGATGCTGGATCGGACAGGGTGATGGTGTCTCCCCTGGCCGTAACTTGGTGGAACAGAAATGGACCGACAACAAGTACAGTTCATTATCCAAAGGTTTACAAGACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGTCCCGTTCACTTCCGAAATCAGGTTAAGATACGCCGTCGAGTTGATACAAATCCAGGCCATGCAGATCTTAGTGCTAAAGAGGCACAGGATGTCATTATGGAGGTTGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGACATCAGAGTCGCAGTTGACCATAACTAGAGAGAAGAAAGAAGAGCTCCAGGATTGTAAGATTGCTCCTTTAATGGTGGCATACATGTTGGAAAGGGAGCTAGTCCGCAAAACCAGATTCCTACCGGTGGCAGGCGGAACAAGCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGAACCTGCTGGGAACAGATGTACACTCCAGGTGGAGAGGTTAGAAATGACGATGTTGACCAGAGTTTGATCATCGCTGCCAGAAACATTGTTAGGAGAGCAATGGTATCTGCTGATCCACTGGCATCACTATTGGAGATGTGCCACAGCACACAAATTGGTGGGATAAAGATGGTGGACATCCTTAGGCAAAATCCAACCGAAGAACAAGCTGTTGATATATGTAAAGCAGCAATGGGTTTGAGGATCAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAGTGGATCATCCGTCAAGAAGGAAGAGGAAGTGCTTACAGGCAATCTCCAAACGTTGAAAATAAGAGTACATGAGGGCTATGAGGAATTCACAATGGTTGGGCGGAGAGCGACAGCTATCCTGAGGAAAGCAACCAGAAGACTGATTCAGTTGATAGTAAGTGGAAAAGACGAACAATCAATCGCTGAAGCAATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAAGCAGTCCGAGGCGACCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCTTGAGACACTTCCAAAAAGATGCAAAGGTGCTGTTTCAGAATTGGGGAATTGAACCTATTGATAATGTCATGGGGATGATCGGAATATTGCCTG
ATATGACTCCCAGCACAGAGATGTCACTGAGAGGAGTGAGAGTTAGTAAAATGGGAGTGGATGAATATTCCAGCACTGAGAGAGTGGTTGTAAGTATTGACCGTTTCTTAAGGGTTCGAGATCAACGGGGAAACGTACTCTTATCCCCCGAAGAGGTCAGCGAAACCCAGGGAACAGAGAAATTGACAATAACATATTCATCATCAATGATGTGGGAAATCAACGGTCCTGAATCAGTGCTTGTTAACACCTATCAATGGATCATCAGAAATTGGGAGACTGTGAAGACTCAATGGTCTCAAGACCCCACGATGCTGTACAATAAGATGGAGTTTGAACCGTTCCAATCCTTGGTACCCAAAGCTGTCAGAGGTCAATACAGTGGGTTTGTGAGAACCCTATTCCAACAAATGCGTGACGTACTAGGGACATTTGATACTGTTCAGATAATAAAGCTGCTACCATTTGCAGCAGCCCCACCAGAGCAGAGCAGAATGCAGTTTTCTTCTCTGACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTAAGGGGCAACTCCCCTGTGTTCAACTACAATAAGGTAACCAAAAGGCTTACCATTCTTGGAAAGGACGCAGGTGCATTAACAGAGGATCCAGATGAGGGAACAGCTGGAGTGGAATCTGCAGTACTAAGGGGATTCCTAATTCTAGGCAAGGAAGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCGAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTCGAATTGTTTAA +>OQ546748.1 +ATGGAAAGAATAAAAGAACTAAGAGATTTGATGTCACAGTCTCGCACTCGCGAGATACTGACAAAAACAACTGTGGACCATATGGCCATAATCAAGAAATACACATCGGGAAGACAGGAGAAAAATCCTGCCCTTAGGATGAAGTGGATGATGGCGATGAAATATCCAATTACAGCAGACAAAAGAATAATGGAGATGATCCCAGAAAGGAATGAGCAAGGTCAGACCCTTTGGAGCAAGACAAATGATGCTGGATCAGACAGAGTGATGGTGTCACCTCTGGCTGTGACGTGGTGGAACAGGAATGGACCAACGACAAGCACAGTCCATTATCCAAAGGTCTATAAAACCTATTTTGAAAAGGTCGAAAGACTAAAACATGGGACCTTCGGCCCCGTTCACTTCCGAAACCAGGTTAAAATACGCCGCAGGGTCGACATAAACCCAGGCCATGCAGATCTTAGTGCTAAGGAAGCACAGGATGTCATCATGGAGGTCGTATTCCCAAACGAAGTTGGGGCCAGAATATTAACATCGGAGTCACAGTTAACGATAACCAAGGAAAAGAAGGAGGAGCTTCAGGACTGCAAAATTGCCCCTTTAATGGTGGCTTATATGTTGGAGAGGGAACTGGTCCGCAAAACAAGATTTCTACCAGTAGCTGGAGGGACAAGCAGCGTGTATATCGAAGTATTACATTTGACCCAAGGGACCTGCTGGGAGCAAATGTACACACCGGGAGGTGAAGTGAGAAATGATGATGTTGATCAGAGTTTAATTATTGCTGCTAGAAATATTGTTAGAAGAGCAATAGTGTCAGCAGACCCGTTGGCTTCGCTTTTGGAGATGTGCCATAGTACACAGATTGGCGGGGTTAGGATGGTTGACATCCTTAGACAAAACCCAACAGAAGAACAGGCTGTGGATATATGTAAGGCAGCAATGGGCCTAAGGATCAGTTCATCCTTCAGTTTTGGAGGTTTCACTTTCAAAAGGACAAGTGGGTCATCTGTCTTTAGGGAAGAAGAGGTTCTCACAGGAAATCTCCAAACATTGAAAATAAGAGTACATGAAGGATATGAGGAA
TTCACAATGGTTGGGCGAAGAGCAACAGCCATTCTAAGGAAAGCAACCAGAAGATTGATCCAACTGATAGTGAGTGGGAAAGACGAGCAATCAATTGCCGAGGCAATCATAGTGGCAATGGTATTCTCACAAGAGGATTGTATGATAAAGGCAGTGAGAGGTGACTTGAACTTTGTCAACAGAGCAAACCAGCGGCTAAATCCCATGCATCAACTCCTGAGGCATTTCCAAAAAGATGCAAAAGTTCTGTTTCAAAACTGGGGAATTGAACCCATTGACAATGTAATGGGGATGATCGGAATATTGCCTGACATGACCCCCAGTACAGAGATGTCATTGAGAGGAGTGAGAGTTAGTAAAATGGGAGTAGATGAATATTCCAGTACTGAGAGAGTGGTCGTGAGTATTGATCGTTTCTTGAGGGTCCGAGACCAGAGGGGAAACGTACTCCTGTCTCCTGAAGAGGTTAGTGAAACACAGGGAACAGAAAAGCTGACTATAACATATTCATCGTCCATGATGTGGGAGATCAATGGCCCGGAATCAGTGCTAGTTAACACATATCAATGGATCATTAGAAATTGGGAAACTGTAAAGATTCAATGGTCCCAAGATCCTACAATGCTATACAATAAGATGGAATTTGAACCCTTTCAATCCCTAGTGCCTAAAGCTGTCAGAGGCCAATATAGTGGATTCGTAAGGGTTCTATTCCAACAAATGCGTGACGTACTGGGGACATTTGACACTGTCCAAATAATAAAGCTATTGCCATTTGCAGCAGCCCCGCCAGAGCAGAGCAGGATGCAGTTCTCTTCTCTAACTGTGAATGTGAGGGGTTCAGGAATGAGAATAGTTGTGAGAGGCAATTCTCCTGTGTTCAACTACAACAAGGCAACCAAGAGGCTTACGGTACTTGGGAAGGATGCAGGTGCATTGATGGAAGACCCAGATGAGGGAACAGCAGGAGTGGAATCTGCAGTATTGAGGGGATTTCTGATTCTGGGCAAAGAAGACAAGAGATATGGGCAAGCATTGAGCATCAACGAATTGAGCAATCTTGCGAAAGGAGAGAAGGCTAATGTGTTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGTCAGACAGCGACCAAAAGGATTCGAATGGCCATCAATTAA +>OQ683455.1 
+AGCGAAAGCAGGTCAAATATATTCAATATGGAGAGAATAAAAGAACTAAGAGATCTAATGTCACAGTCTCGCACTCGCGAGATACTGACCAAAACCACTGTTGACCACATGGCCATAATCAAAAAGTACACATCGGGAAGGCAAGAGAAGAACCCCGCACTCAGAATGAAATGGATGATGGCAATGAAATATCCAATTACAGCAGATAAGCGAATAATGGAAATGATCCCTGAGAGGAATGAACAAGGGCAAACTCTCTGGAGCAAAACAAACGATGCCGGATCAGACCGAGTGATGGTATCACCCCTGGCTGTGACATGGTGGAACAGGAACGGACCAACAACAAGTACAGTCCACTACCCAAAGGTATATAAAACTTATTTCGAAAAAGTTGAAAGGTTGAAACACGGGACCTTTGGCCCTGTGCACTTCAGAAACCAAGTTAAGATAAGACGGAGGGTCGATATAAACCCGGGCCATGCTGACCTCAGTGCCAAAGAGGCGCAGGATGTAATCATGGAAGTCGTCTTCCCAAATGAAGTGGGAGCAAGGATATTGACGTCTGAGTCACAACTGACGATAACAAAGGAGAAAAAGGAAGAACTCCAGGACTGCAAAATCGCTCCTCTGATGGTTGCATACATGCTAGAAAGAGAGTTGGTTCGCAAGACGAGGTTTCTCCCAGTTGCTGGTGGGACAAGCAGTGTCTACATTGAGGTGCTGCATTTGACCCAGGGGACATGCTGGGAGCAGATGTACACTCCGGGAGGAGAAGTGAGGAACGATGATGTAGACCAAAGCTTAATCATTGCTGCCAGGAATATAGTAAGAAGAGCAACAGTATCAGCAGATCCATTAGCATCTCTATTGGAGATGTGTCACAGCACACAAATTGGGGGAATAAGGATGGTAGACATCCTTCGGCAAAATCCAACAGAGGAACAAGCCGTGGATATATGCAAGGCAGCAATGGGCTTGAGGATTAGCTCATCTTTCAGCTTTGGTGGATTCACTTTTAAAAGAACAAGTGGATCGTCAGTCAAAAAAGAAGAAGAAGTGCTAACAGGCAACCTTCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAGTTCACAATGGTTGGGAGAAGAGCAACGGCCATTCTCAGGAAAGCAACCAGAAGGCTGATCCAGCTAATAGTAAGTGGGAGAGACGAGCAGTCAATTGCTGAAGCAATAATTGTGGCCATGGTATTCTCACAAGAGGACTGCATGATTAAAGCAGTTAGAGGTGACCTGAATTTTGTCAATAGGGCGAACCAGCGACTAAACCCAATGCATCAACTCTTGAGGCATTTCCAAAAGGATGCAAAGGTGCTTTTCCAAAATTGGGGAATTGAACCCATTGACAATGTGATGGGAATGATCGGGGTAATGCCCGACATGACCCCAAGTACTGAGATGTCGCTGAGGGGAATAAGAGTCAGTAAGATGGGAGTAGATGAATACTCAAGTACAGAGCGAGTAGTAGTAAGCATCGACCGGTTTTTAAGAGTTCGAGACCAACGGGGGAACGTACTATTATCACCCGAAGAGGTCAGTGAGACACAAGGAACGGAGAAACTGACAATCACTTATTCGTCATCAATGATGTGGGAGATCAATGGTCCTGAGTCGGTGTTGGTCAATACTTACCAGTGGATAATTAGAAACTGGGAAACTGTAAAAATTCAATGGTCACAGGATCCCACAATGTTGTATAATAAGATGGAATTCGAGCCATTCCAGTCTCTAGTCCCTAAAGCAGCCAGAGGTCAATACAGTGGGTTTGTGAGAACACTATTCCAGCAAATGAGAGATGTGCTTGGAACGTTTGACACTGTTCAAATAGTAAAACTCCTCCCCTTTGCTGCCGCCCCACCGGAACAAAGTAGGATGCAATTCTCCTCCCTGACTGTGAATGTAAGAGGATCAGGAATGAGGATACTGGTAAGAGGCAATTCACCAGTCTTCAATT
ACAACAAGGCCACCAAGAGGCTCACAGTTCTCGGGAAAGATGCAGGTGCATTGACCGAAGATCCAGATGAAGGCACAGCTGGAGTGGAGTCTGCTGTTTTAAGAGGATTCCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTGAGCATCAATGAGCTGAGCAATCTTGCAAAGGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGAGACGTAGTGTTGGTGATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTCGAATTATTTAAAAACGACCTTGTAAGTGGAGGTCGCTAGATGGTC +>OQ584693.1 +AGCGAAAGCAGGTCAATTATATTCAATATGGAGAGAATAAGAGAACTAAGAGATCTAATGTCACAGTCTCGCACTCGCGAGATACTCACCAAAACTACTGTGGACCACATGGCCATAATCAAAAAATACACATCGGGAAGGCAAGAGAAGAACCCCGCGCTCAGGATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAGAGAATAATGGAAATGATTCCTGAAAGAAATGAACAAGGACAAACCCTTTGGAGCAAAACGAACGATGCCGGGTCTGACCGAGTGATGGTATCACCTCTGGCCGTGACATGGTGGAATAGGAACGGACCAACAACAAGTACGGTCCACTACCCAAAGGTATACAAAACGTATTTCGAAAAAGTTGAAAGATTGAAACATGGGACCTTTGGTCCTGTTCACTTCAGAAATCAAGTTAAGATAAGACGGAGAGTCGACATAAACCCAGGCCATGCAGACCTCAGTGCAAAAGAGGCGCAGGATGTAATCATGGAAGTTGTCTTCCCAAATGAAGTGGGAGCGAGAATAATAACATCGGAGTCACAACTGACGATAACAAAGGAGAAGAAGGAAGAACTCCAGGACTGCAAAATTGCACCTTTGATGGTCGCATACATGCTAGAAAGAGAGTTAGTCCGCAAGACGAGGTTCCTCCCAGTGGCTGGTGGAACAAGCAGTGTCTATATTGAGGTGCTGCATTTAACCCAGGGGACATGCTGGGAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTAGACCAGAGTTTGATTATCGCCGCCAGGAACATAGTAAGAAGAGCAACAGTATCAGCAGATCCACTAGCATCTCTATTGGAGATGTGCCACAGCACACAGATTGGGGGAATAAGGATGGTAGACATTCTTCGACAAAATCCAACAGAGGAACAAGCCGTGGATATATGCAAGGCAGCAATGGGCTTGAGGATTAGCTCATCTTTCAGCTTTGGTGGATTCACTTTCAAAAGAACAAGTGGATCATCAGTCAAAAGAGAAGAAGAAGTGCTTACGGGCAACCTTCAAACACTGAAAATAAGAGTACATGAGGGGTATGAAGAGTTCACGATGGTTGGAAGAAGAGCAACGGCTATTCTCAGGAAGGCAACCAGAAGGTTAATCCAGCTAATAGTAAGTGGAAGAGACGAGCAGTCAATTGCTGAAGCAATAATTGTGGCCATGGTATTCTCACAGGAAGACTGCATGATCAAGGCAGTTCGAGGTGATCTGAATTTTGTCAATAGGGCGAACCAGCGGCTGAATCCAATGCATCAACTCTTGAGACACTTCCAAAAGGATGCTAAAGTGCTTTTCCAAAACTGGGGAATTGAATCCATTGACAACGTGATGGGGATGATTGGGATATTGCCCGACATGACCCCAAGCACTGAGATGTCACTGAGGGGAATAAGAGTCAGCAAGATGGGAGTAGATGAATACTCCAGTACAGAGAGGGTGGTGGTGAGCATCGATCGATTTTTAAGAGTCCGGGACCAACGAGGGAACGTACTATTGTCACCAGAAGAAGTCAGCGAGACACACGGAACAGAGAAATTGACAATCACTTATTCATCATC
AATGATGTGGGAGATTAATGGACCCGAATCGGTGTTGGTCAACACTTATCAATGGATCATCAGGAACTGGGAAACTGTGAAAATTCAATGGTCACAGGATCCCACAATGTTATATAATAAGATGGAATTCGAGCCATTCCAGTCTCTGATACCTAAAGCAGCCAGAGGTCAATACAGTGGATTCGTGAGGACACTATTCCAGCAGATGCGAGATGTGCTCGGAACATTTGACACTGTCCAAATAATAAAACTCCTCCCCTTTGCTGCTGCCCCACCAGAACAAAGTAGAATGCAATTCTCCTCCCTGACTGTAAATGTGAGAGGATCAGGAATGAGAATACTGGTTAGAGGCAATTCCCCAGTGTTCAATTACAACAAGGCTACCAAGAGGCTCACAGTTCTCGGGAAAGATGCAGGTGCATTGACCGAAGATCCAGATGAAGGCACAGCTGGAGTAGAGTCTGCTGTTCTAAGAGGATTCCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTGAGCATCAATGAGCTGAGCAATCTTGCAAAGGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGGGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGGATTCGGATGGCCATCAATTAGTGTCGAATTGTTTAAAAACGACCTTGTTTCTACT +>OQ546779.1 +ATGGAACGAATAAAAGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAATCCTGCCCTCAGAATGAAATGGATGATGGCAATGAAGTATCCGATTACAGCGGACAAGAGAATAATAGATATGATTCCTGAAAGGAATGAACAAGGGCAGACACTCTGGAGCAAGACAAATGATGCTGGGTCGGACAGGGTGATGGTGTCCCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAATACAGTTCATTATCCAAAAGTTTACAAAACATACTTCGAGAAAGTTGAAAGGTTAAAACATGGAACATTCGGCCCCGTCCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAAGTTGTTTTCCCAAATGAGGTGGGAGCTAGAATATTGACTTCGGAGTCGCAATTGACAATAACAAAAGAGAAAAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCGGTAGCAGGCGGCACAAGCAGTGTGTACATTGAGGTACTGCATCTGACTCAAGGAACCTGCTGGGAGCAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATTATTGCTGCCAGAAACATTGTTAGGAGGGCAACGGTATCAGCGGATCCATTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAGAGCAGCAATGGGTTTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGCCACGAAGGAAGAGGAAGTGCTTACGGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCCTGAGGAAAGCAACTAGGAGGCTGATTCAGTTGATAGTAAGCGGAAGAAACGAGCAGTCAATCGCCGAGGCAATCATTGTAGCGATGGTGTTCTCACAGGAGGATTGTATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGAGCA
AACCAAAGATTAAATCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAGGTGCTATTTCAAAATTGGGGAATTGAACCCATTGATGATGTCATGGGGATGATCGGGATACTACCCGACATGACTCCAAGCACAGAACTGTCACTGAGAGGGGTGAGAGTTAGTAAAATGGGAGTGGATGAATATTCCAGCACTGAAAGAGTAGTTGTAAACATTGACCGCTTTTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGCGAAACCCAGGGGACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAAATCAACGGTCCTGAATCAGTGCTTGTCAACACCTACCAATGGATCATCAGAAATTGGGAAACTGTGAAGATTCAATGGTCTCAGGATCCCACGATGCTGTACAATAAGATGGAGTTCGAGCCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTTCAACAAATGCGTGATGTACTAGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCACCACCTGAGCAGAGCAGAATGCAATTTTCTTCTCTAACTGTGAATGTGAGGGGCTCAGGAATGAGAATACCCGTAAGGGGCAATTCCCCTGTGTTCAACTACAATAAGGCAACCAAAAGGCTTGCCGTTCTTGGAAAGGACGCAGGTGCATTAACAGAGGATCCAGACGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGATTTCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGTCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>AB807877.1 
+AAATATATTCAATATGGAACGAATAAAAGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAATCCTGCCCTCAGAATGAAATGGATGATGGCAATGAAGTATCCGATTACAGCGGACAAGAGAATAATAGATATGATTCCTGAAAGGAATGAACAAGGGCAGACACTCTGGAGCAAGACAAATGATGCTGGGTCGGACAGGGTGATGGTGTCCCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAATACAGTTCATTATCCAAAAGTTTACAAAACATACTTCGAGAAAGTTGAAAGATTAAAACATGGAACATTCGGCCCCGTCCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAAGTTGTTTTCCCAAATGAGGTGGGAGCTAGAATATTGACTTCGGAGTCGCAATTGACAATAACAAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCGGTAGCAGGCGGCACAAGCAGTGTGTACATTGAGGTACTGCATCTGACTCAAGGAACCTGCTGGGAGCAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCTGCCAGAAACATTGTTAGGAGGGCAACGGTATCAGCGGATCCATTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAGAGCAGCAATGGGTTTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGTCACGAAGGAAGAGGAAGTGCTTACGGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTACGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCCTAAGGAAAGCAACTAGGAGGCTGATTCAGTTGATAGTAAGCGGAAGAAACGAACAGTCAATCGCCGAGGCAATCATTGTAGCGATGGTGTTCTCACAAGAGGATTGTATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGAGCAAACCAAAGATTAAATCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAGGTGCTATTTCAAAATTGGGGAATTGAACCCATTGATAATGTCATGGGGATGATCGGGATACTACCCGACATGACTCCAAGCACAGAACTGTCACTGAGAGGAGTGAGAGTTAGTAAAATGGGAGTGGATGAATATTCCAGCACTGAAAGAGTAGTTGTAAACATTGACCGCTTTTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGCGAAACCCAGGGGACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAAATCAACGGTCCTGAATCAGTGCTTGTCAACACCTACCAATGGATCATCAGAAATTGGGAAACTGTGAAGATTCAATGGTCTCAGGATCCCACGATGCTGTACAATAAGATGGAGTTCGAGCCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTTCAACAAATGCGTGATGTACTAGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCACCACCTGAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGGGGCTCAGGAATGAGAATACCCGTAAGGGGCAATTCCCCTGTGTTCAACTACAATAAGGCAACC
AAAAGGCTTGCCGTTCTTGGAAAGGACGCAGGTGCATTAACAGAGGATCCAGACGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGATTTCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGTCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTCGAATTGTTTAA +>CY111054.1 +AGCAAAAGCAGGTCAAATATATTCAATATGGAGAGAATAAAGGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAGACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTCTCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCGGACAAGAGAATAATAGAGATGATTCCTGAAAGGAATGAACAAGGACAGACACTCTGGAGCAAGACAAATGATGCTGGATCGGACAGGGTAATGGTGTCTCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAGTACAGTTCATTATCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGTCCCGTTCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAATCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGACTTCAGAGTCACAATTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCACGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCAGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGAACCTGCTGGGAACAGATGTACACTCCAGGCGGAGAGGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCTGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATTAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAGTGGATCATCCGTCACGAAGGAAGAGGAAGTTCTTACAGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAATTTACAATGGTTGGGCAGAGGGCAACAGCTATCCTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGTGGAAGAAACGAACAATCAATCGCTGAGGCAATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAAGCAGTCCGAGGCGATCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAAGTGCTATTTCAGAATTGGGGAACTGAGCCCATTGATAATGTCATGGGGATGATCGGAATATTGCCTGACATGACTCCCAGCACAGAAACATCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTAGATGAGTATTCCAGCACTGAGAGAGTAGTTGTAAGCATTGACCGCTTCTTAAGGGTTCGAGACCAGCGGGGGAACGTACTCTTATCTCCTGAAGAGGTCAGCGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCATCATCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTA
CCAATGGATCATCAGAAACTGGGAGACCGTGAAAATTCAGTGGTCTCAGGACCCCACTATGTTGTACAATAAGATGGAGTTCGAACCGTTCCAATCCTTGGTACCTAAAGCTGCCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCTCCACCGAAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCATAAGGGGCAATTCCCCTGTGTTCAACTACAATAAGGCAACCAAAAGACTTACTGTTCTTGGAAAGGACGCAGGTGCATTGACAGAGGATCCAGATGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGGTTCCTAATTATAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTAATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCCTACTTACTGACAGCCAGACAGCGACCAAAAGAATT +>OQ584503.1 +AAAGCAGGTCAATTATATTCAATATGGAGAGAATAAGAGAACTAAGAGATCTAATGTCACAGTCTCGCACTCGCGAGATACTCACCAAAACTACTGTGGACCACATGGCCATAATCAAAAAATACACATCGGGAAGGCAAGAGAAGAACCCCGCGCTCAGGATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAGAGAATAATGGAAATGATTCCTGAAAGAAATGAACAAGGACAAACCCTTTGGAGCAAAACGAACGATGCCGGGTCTGACCGAGTGATGGTATCACCTCTGGCCGTGACATGGTGGAATAGGAACGGACCAACAACAAGTACGGTCCACTACCCAAAGGTATACAAAACGTATTTCGAAAAAGTTGAAAGATTGAAACATGGGACCTTTGGTCCTGTTCACTTCAGAAATCAAGTTAAGATAAGACGGAGAGTCGACATAAACCCAGGCCATGCAGACCTCAGTGCAAAAGAGGCGCAGGATGTAATCATGGAAGTTGTCTTCCCAAATGAAGTGGGAGCGAGAATAATAACATCGGAGTCACAACTGACGATAACAAAGGAGAAGAAGGAAGAACTCCAGGACTGCAAAATTGCACCTTTGATGGTCGCATACATGCTAGAAAGAGAGTTAGTCCGCAAGACGAGGTTCCTCCCAGTGGCTGGTGGAACAAGCAGTGTCTATATTGAGGTGCTGCATTTAACCCAGGGGACATGCTGGGAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTAGACCAGAGTTTGATTATCGCCGCCAGGAACATAGTAAGAAGAGCAACAGTATCAGCAGATCCACTAGCATCTCTATTGGAGATGTGCCACAGCACACAGATTGGGGGAATAAGGATGGTAGACATTCTTCGACAAAATCCAACAGAGGAACAAGCCGTGGATATATGCAAGGCAGCAATGGGCTTGAGGATTAGCTCATCTTTCAGCTTTGGTGGATTCACTTTCAAAAGAACAAGTGGATCATCAGTCAAAAGAGAAGAAGAAGTGCTTACGGGCAACCTTCAAACACTGAAAATAAGAGTACATGAGGGGTATGAAGAGTTCACGATGGTTGGAAGAAGAGCAACGGCTATTCTCAGGAAGGCAACCAGAAGGTTAATCCAGCTAATAGTAAGTGGAAGAGACGAGCAGTCAATTGCTGAAGCAATAATTGTGGCCATGGTATTCTCACAGGAAGACTGCATGATCAAGGCAGTTCGAGGTGATCTGAATTTTGTCAATAGGGCGAACCAGCGGCTGAATCCAATGCATCAACTCTTGAGACACTTCCAAAAGGATGCTAAAGTGCTTTTCCAAAACTGGGG
AATTGAATCCATTGACAACGTGATGGGGATGATTGGGATATTGCCCGACATGACCCCAAGCACTGAGATGTCACTGAGGGGAATAAGAGTCAGCAAGATGGGAGTAGATGAATACTCCAGTACAGAGAGGGTGGTGGTGAGCATCGATCGATTTTTAAGAGTCCGGGACCAACGAGGGAACGTACTATTGTCACCAGAAGAAGTCAGCGAGACACACGGAACAGAGAAATTGACAATCACTTATTCATCATCAATGATGTGGGAGATTAATGGACCCGAATCGGTGTTGGTCAACACTTATCAATGGATCATCAGGAACTGGGAAACTGTGAAAATTCAATGGTCACAGGATCCCACAATGTTATATAATAAGATGGAATTCGAGCCATTCCAGTCTCTGATACCTAAAGCAGCCAGAGGTCAATACAGTGGATTCGTGAGGACACTATTCCAGCAGATGCGAGATGTGCTCGGAACATTTGACACTGTCCAAATAATAAAACTCCTCCCCTTTGCTGCTGCCCCACCAGAACAAAGTAGAATGCAATTCTCCTCCCTGACTGTAAATGTGAGAGGATCAGGAATGAGAATACTGGTTAGAGGCAATTCCCCAGTGTTCAATTACAACAAGGCTACCAAGAGGCTCACAGTTCTCGGGAAAGATGCAGGTGCATTGACCGAAGATCCAGATGAAGGCACAGCTGGAGTAGAGTCTGCTGTTCTAAGAGGATTCCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTGAGCATCAATGAGCTGAGCAATCTTGCAAAGGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGGATTCGGATGGCCATCAATTAGTGTCGAATTGTTTAAAAACGACCTTGTTTCTACT +>OQ683471.1 +AGCGAAAGCAGGTCAAATATATTCAATATGGAGAGAATAAAAGAACTAAGAGATCTAATGTCACAGTCTCGCACTCGCGAGATACTCACCAAAACCACTGTGGACCACATGGCTATAATCAAAAAATACACATCAGGAAGGCAAGAGAAGAACCCCGCACTCAGGATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAGAGAATAATGGAAATGATTCCTGAAAGAAATGAACAAGGACAAACCCTCTGGAGCAAAACGAACGATGCTGGGTCAGATCGAGTGATGGTATCACCTCTGGCTGTGACATGGTGGAATAGGAATGGGCCAACAACAAGTACGGTCCACTACCCAAAAGTATACAAAACTTATTTCGAAAAAGTTGAAAGGTTGAAACACGGGACCTTTGGCCCTGTCCACTTCAGAAATCAAGTTAAGATAAGACGGAGGGTCGACATAAACCCAGGCCATGCAGACCTCAGTGCCAAAGAGGCGCAGGATGTCATCATGGAAGTTGTCTTCCCAAATGAAGTGGGAGCGAGAATACTAACATCGGAGTCACAACTGACGATAACAAAGGAGAAGAAGGAAGAACTCCAGGACTGCAAAATCGCCCCTCTGATGGTCGCATACATGCTAGAAAGGGAGTTAGTCCGCAAGACGAGGTTCCTCCCAGTGGCTGGTGGAACAAGCAGTGTCTATATTGAGGTGCTGCATTTAACCCAGGGGACATGCTGGGAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTAGACCAGAGTTTGATTATTGCTGCCAGGAACATAGTAAGAAGAGCAACAGTATCAGCAGACCCACTAGCATCCCTACTGGAGATGTGCCACAGCACACAAATTGGGGGAATTAGGATGGTCGACATCCTTCGGCAAAATCCAACAGAGGAACAAGCCGTGGACATATGCAAGGCAGCAATGGGCTTGAGGATTAGCTCATCTTTCAGCTTTGGTGGATTCACTTTTAAA
AGAACAAGTGGATCATCAGTCAAAAGAGAAGAAGAAGTGCTAACGGGCAACCTTCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAGTTCACAATGGTTGGAAGAAGAGCAACGGCTATTCTCAGGAAGGCAACCAGAAGGTTGATCCAGCTAATAGTAAGTGGGAGAGACGAGCAGTCAATTGCAGAAGCAATAATTGTGGCCATGGTATTCTCACAAGAAGACTGCATGATCAAGGCAGTTCGAGGTGATCTGAATTTTGTCAATAGGGCGAACCAGCGGCTGAATCCAATGCATCAACTCTTGAGACACTTCCAAAAGGATGCTAAAGTGCTTTTCCAAAACTGGGGAATTGAACCCATTGACAATGTAATGGGGATGATCGGGATATTGCCCGACATGACCCCAAGCACTGATGTGTCACTGAGGGGGATAAGAGTCAGTAAAATGGGGGTAGATGAATACTCCAGTACAGAGAGGGTGGTGGTAAGCATCGACCGATTTTTACGAGTTAGGGACCAACGAGGGAACGTACTATTGTCACCTGAAGAAGTCAGCGAGACACAAGGAACAGAGAAATTGACAATCACTTATTCGTCGTCAATGATGTGGGAGGTCAATGGACCTGAGTCGGTGTTGGTCAACACTTATCAGTGGATCATCAGAAACTGGGAAAATGTGAAAATTCAATGGTCACAGGATCCCACAATGTTATATAATAAGATGGAATTCGAGCCATTCCAGTCTCTGGTGCCTAAAGCAACCAGAGGTCAATACAGTGGATTCGTGAGGACACTATTCCAGCAGATGCGAGATGTGCTCGGAACATTTGACACCGTTCAAATAATAAAACTCCTCCCCTTTGCTGCTGCCCCACCAGAACAAAGTAGAATGCAATTCTCATCCCTGACTGTAAATGTGAGAGGATCAGGAATGAGAATACTGGTAAGAGGCAATTCCCCAGTGTTCAATTACAACAAGGCCACTAAGAGGCTCACAGTTCTCGGGAAAGATGCAGGTGCATTGACCGAAGATCCAGATGAAGGCACAGCTGGAGTAGAGTCTGCTGTTTTACGAGGATTCCTCATTTTGGGCAAAGAAGACAAGAGGTATGGACCAGCATTGAGCATCAATGAGCTGAGCAATCTTGCAAAGGGAGAGAAGGCTAACGTGTTAATTGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACCGACAGCCAGACAGCGACCAAAAGGATTCGGATGGCCATCAATTAGTGTCGAATTGTTTAAAAACGACCTTGTTTCTACT +>OQ565625.1 
+AAAAGCARGTCAARTATATTCAATATGGAGAGAAKAAAAGARCTAAGAAATCCAATGTCACAGWCTCRCACTCGCGAGATNCWGACCAAAACCACTGTTGACCACATGGCCATAATCAAAAAGTACACATCRGGAAGGCAAGAGAAGAACCCCGCACTCAGAATGAAATGGATGATGGCAATGAAATATCCAATTACAGCAGATAAGCGAATAATGGAAATGATCCCTGAGAGGAATGAACAAGGGCAAACTCTCTGGAGCAAAACAAACGATGCCGGATCAGACCGAGTGATGGTATCACCCCTGGCTGTGACATGGTGGAACAGGAACGGACCAACAACAAGTACAGTTCACTACCCAAAGGTATATAAAACTTATTTCGAAAAAGTTGAAAGGTTGAAACACGGGACCTTTGGCCCTGTGCACTTCAGAAACCAAGTTAAGATAAGACGGAGGGTCGATATAAACCCRGGCCATGCTGACCTCAGTGCCAAAGAGGCGCAGGATGTAATCATGGAAGTCGTCTTCCCAAATGAAGTGGGAGCAAGGATATTGACGTCGGAGTCACAACTGACGATAACAAAGGAGAAAAAGGAAGAACTCCAGGACTGCAAAATCGCTCCTCTGATGGTTGCATACATGCTAGAAAGAGAGTTGGTTCGCAAGACGAGGTTTCTCCCAGTTGCTGGTGGGACAAGCAGTGTCTACATTGAGGTGCTGCATTTGACCCAGGGGACATGCTGGGAGCAGATGTACACTCCGGGAGGAGAAGTGAGGAACGATGATGTAGACCAAAGCTTGATCATTGCTGCCAGGAATATAGTAAGAAGAGCAACAGTATCAGCAGATCCATTAGCATCTCTATTGGAGATGTGTCACAGCACACAAATTGGGGGAATAAGGATGGTAGACATYCTTCGGCAAAATCCAACAGAGGAACAAGCCGTGGATATATGCAAGGCAGCAATGGGCTTGAGGATTAGCTCATCTTTCAGCTTTGGTGGATTCACTTTTAAAAGAACAAGTGGATCRTCAGTCAAAAAAGAAGAAGAAGTGCTAACAGGCAACCTTCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAGTTCACAATGGTTGGGAGAAGAGCAACGGCCATTCTCAGGAAAGCAACCAGAAGGCTGATCCAGCTAATTGTAAGTGGGAGAGACGAGCAGTCAATTGCTGAAGCAATAATTGTGGCCATGGTATTCTCACAAGAGGACTGCATGATTAAAGCAGTTAGAGGTGACCTGAATTTTGTCAATAGGGCGAACCAGCGACTAAACCCAATGCATCAACTCTTGAGGCATTTCCAAAAGGATGCAAAGGTGCTTTTCCAAAATTGGGGAATTGAACCCATTGACAATGTGATGGGAATGATCGGGGTAATGCCCGACATGACCCCAAGTACTGAGATGTCGCTGAGGGGAATAAGAGTCAGTAAGATGGGAGTAGATGAATACTCAAGTACAGAGCGAGTAGTAGTAAGCATCGACCGGTTTTTAAGAGTTCGAGACCAACGGGGGAACGTACTATTATCACCCGAAGAGGTCAGTGAGACACAAGGAACGGAGAAACTGACAATCACTTATTCGTCATCAATGATGTGGGAGATCAATGGTCCTGAGTCGGTGTTGGTCAATACTTATCAGTGGATAATTAGAAACTGGGAAACTGTAAAAATTCAATGGTCACAGGATCCCACAATGTTGTATAATAAGATGGAATTCGAGCCATTCCAGTCTCTAGTCCCTAAGGCAGCCAGAGGTCAATACAGTGGGTTTGTGAGAACACTATTCCAGCAAATGCGAGATGTGCTTGGAACATTTGACACTGTTCAGATAGTAAAACTCCTCCCCTTTGCTGCCGCCCCACCGGAACAAAGTAGGATGCAGTTCTCCTCCCTGACTGTGAATGTAAGAGGATCAGGAATGAGGATACTGGTAAGAGGCAATTCACCAGTGTTCAATTACA
ACAAGGCCACCAAGAGGCTCACAGTTCTCGGGAAAGATGCAGGTGCATTGACCGAAGATCCAGATGAAGGCACAGCTGGAGTGGAGTCTGCTGTTTTAAGAGGATTCCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTGAGCATCAACGAGCTGAGCAATCTTGCAAAGGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGAGACGTAGTGTTGGTGATGAAACGGAAACRGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGGATTCGGATGGCCATCAATTAGTGTCRRATTATTTAAAAACGACCTKGTTTCTACT +>JF758718.1 +ATGGAGAGAATAAAAGAACTAAGAGATCTAATGTCACAGTCCCGCACCCGCGAGATACTCACCAAGACCACTGTGGACCATATGGCCATAATCAAAAAATACACATCAGGAAGACAAGAGAAGAACCCCGCACTCAGAATGAAGTGGATGATGGCAATGAAATATCCAATCACAGCTGACAAGAGAATAATGGAAATGATTCCTGAGAGGAATGAGCAAGGACAAACCCTCTGGAGCAAAACAAATGATGCCGGCTCAGACCGAGTGATGGTATCACCTCTGGCCGTGACATGGTGGAATAGGAATGGACCAACAACAAGCACAGTTCACTACCCGAAGGTATATAAAACTTATTTCGAAAAAGTCGAAAGGTTAAAGCATGGAACCTTTGGCCCCGTCCACTTCAGGAACCAAGTTAAGATAAGAAGGAGAGTTGACATAAACCCTGGCCATGCAGATCTCAGTGCTAAGGAAGCGCAGGATGTAATCATGGAAGTTGTCTTCCCAAATGAAGTAGGAGCTAGAATACTAACGTCGGAGTCACAGCTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAGGATTGTAAAATCGCCCCTTTGATGGTGGCATATATGCTAGAAAGAGAGTTGGTCCGCAAAACAAGATTCCTCCCAGTGGCTGGTGGAACAAGCAGTGTCTATATTGAGGTGTTGCATTTAACCCAGGGAACATGCTGGGAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTCGACCAAAGTCTGATTATCGCTGCCAGGAACATAGTAAGAAGAGCAACGGTATCGGCAGACCCATTAGCATCTTTGTTGGAAATGTGCCACAGCACACAGATTGGAGGAATAAGGATGGTGGACATCCTTAGGCAAAATCCAACAGAGGAACAAGCCGTGGACATATGCAAGGCAGCAATGGGACTAAGGATTAGCTCATCTTTCAGCTTCGGCGGATTCACTTTCAAAAGGACAAGTGGATCGTCAGTCAAGAAAGAAGAAGAAGTGCTTACGGGCAACCTTCAAACACTGAAAATAAGAGTGCATGAGGGGTATGAAGAATTCACAATGGTTGGAAGAAGAGCAACGGCTATTCTCAGAAAAGCAACCAGGAGATTGATCCAGCTAATAGTAAGTGGGAGGGATGAGCAGTCAATTGCTGAGGCAATAATCGTAGCCATGGTATTTTCGCAAGAGGATTGCATGATCAAAGCAGTTCGAGGCGATCTAAACTTTGTCAATAGGGCAAACCAGCGACTGAATCCCATGCATCAACTTTTGAGGCATTTCCAAAAAGATGCAAAGATGCTTTTCCAGAACTGGGGAATTGAACCCATTGACAATGTAATGGGAATGATCGGAATATTACCTGACATGACCCCAAGTACTGAGATATCGCTGAGGGGAATAAGAGTTAGCAAAATGGGAGTAGATGAGTACTCCAGCACGGAGAGAGTGGTGGTGAGCATTGACCGATTTTTGAGGGTTCGGGACCAACGGGGAAACGTATTATTGTCTCCCGAAGAAGTCAGTGAGACACAAGGAACAGAGAAGTTGACAATAACTTACTCGTCATCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTGGTCAATAC
TTATCAGTGGATCATTAGAAACTGGGAAACTGTGAAAATCCAATGGTCACAAGATCCCACGATGTTATACAATAAGATGGAATTCGAACCATTTCAGTCTCTTGTCCCTAAAGCTGCCAGAAGTCAATACAGCGGATTCGTGAGAACACTGTTCCAACAGATGCGAGATGTGCTTGGAACATTTGACACTGTTCAAATAATAAAACTTCTCCCTTTTGCTGCTGCTCCACCAGAGCAGAGTAGGATGCAATTCTCCTCACTGACTGTGAATGTAAGAGGATCAGGAATGAGGATACTGGTAAGAGGCAATTCTCCAGTGTTCAACTACAACAGGGCTACCAAGAGGCTTACGGTTCTTGGGAAGGATGCTGGTGCGTTGACCGAAGATCCTGATGAAGGCACAGCTGGAGTGGAGTCTGCCGTTCTGAGAGGATTCCTCATTTTAGGCAAAGAAGACAAAAGATATGGCCCAGCATTAAGCATCAATGAACTGAGCAATCTTGCAAAAGGAGAAAAGGCTAATGTGCTAATTGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>AB675582.1 +GGATGGTGGACATCCTTAGACAGAACCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGTTACGAAGGAAGAAGAAGTGCTTACGGGCAACCTCCAAACACTGAAAATAAGAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCTTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGCGGACGAAATGAACAATCAATCGCTGAGGCAATTATTGTAGCGATGGTGTTCTCACAAGAGGATTGCATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGGGCAAACCAAAGACTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAAGTGCTATTTCAAAATTGGGGAACTGAACCCATTGATAATGTCATGGGGATGATCGGGATATTACCTGACATGACTCCCAGCACAGAACTGTCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTAGATGAATATTCCAGCACTGAAAGAGTAGTTGTAAGCATTGACCGCTTCTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGTGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAGATCAACGGTCCTGAGTCAGTGCTTGTCAACACCTATCAATGGATCATCAGAAACTGGGAAACCGTGAAGATACAATGGTCTCAGGATCCCACGATGCTATACAATAAGATGGAGTTCGAACCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGATTTGTGAGAACGTTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGCCCAGATAATAAAGCTGCTACCATTTGCAGCAGCACCACCTGAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTTTTCAACTACAATAAGGCAACCAAAAGGCTTACCGTTCTTGGAAAGGATGCAGGTGCATTAACAGAGGATCCAGACGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGATTCCTAATTC +>KP097829.1 
+ATGGAACGGATAAAAGAATTAAGAGATCTAATGTCACAGTCCCGCACTCGCGAGATACTAACAAAAACCACTGTGGACCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAATCCTGCCCTCAGAATGAAATGGATGATGGCAATGAAGTATCCGATTACAGCGGACAAGAGAATAATAGATATGATTCCTGAAAGGAATGAACAAGGGCAGACACTCTGGAGCAAGACAAATGATGCTGGGTCGGACAGGGTGATGGTGTCCCCCCTAGCTGTAACTTGGTGGAATAGGAATGGGCCGACGACAAATACAGTTCATTATCCAAAAGTTTACAAAACATACTTCGAGAAGGTTGAAAGGTTAAAACATGGAACATTTGGCCCCGTCCATTTCCGAAACCAAGTTAAAATACGCCGCCGAGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCTAAAGAAGCACAAGATGTCATCATGGAAGTTGTTTTCCCAAATGAGGTGGGAGCTAGAATATTGACTTCGGAGTCACAATTGACAATAACAAAAGAGAAGAAAGAAGAGCTCCAAGATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAGAGGGAACTGGTCCGCAAAACCAGATTCCTACCGGTAGCAGGCGGCACAAGCAGTGTGTACATTGAGGTACTGCATTTGACTCAAGGAACCTGCTGGGAGCAGATGTACACTCCAGGCGGAGAAGTAAGAAATGACGATGTTGACCAGAGTTTGATCATTGCTGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCACTGCTGGAGATGTGTCACAGCACACAAATTGGTGGGATAAGGATGGTGGACATCCTTAGGCAAAATCCAACTGAGGAACAAGCTGTGGACATATGCAGAGCAGCAATGGGTTTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGTCACGAAGGAAGAGGAAGTGCTTACGGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCCTGAGGAAAGCAACTAGGAGGCTGATTCAGTTGATAGTAAGCGGAAGAAACGAACAATCAATCGCTGAGGCAATCATTGTAGCGATGGTGTTCTCACAGGAGGATTGTATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGAGCAAACCAAAGATTAAATCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACACAAAGGTACTATTTCAGAATTGGGGAATTGAACCCATTGATAATGTCATGGGGATGATCGGGATACTACCCGACATGACTCCCAGCACAGAACTGTCACTGAGAGGAGTGAGAGTTAGTAAAATGGGAGTGGATGAATATTCCAGTACTGAAAGAGTAGTTGTAAACATTGACCGCTTTTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGCGAAACCCAGGGGACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAAATCAACGGTCCTGAATCAGTGCTCGTCAACACCTACCAATGGATCATCAGAAATTGGGAAACTGTGAAGATTCAATGGTCTCAGGATCCCACGATGCTGTACAATAAGATGGAGTTCGAGCCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGATTTGTGAGAACATTATTTCAACAAATGCGTGATGTACTAGGGACATTTGATACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCACCACCTGAGCAGAGCAGAATGCAGTTTTTTTCTCTAACTGTGAATGTGAGGGGCTCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTGTTCAACTACAATAAGGCAACCAAAAGGCTTACCG
TTCTTGGAAAGGACGCAGGTGCATTAACAGAGGATCCAGACGAGGGGACAGCCGGAGTGGAATCCGCAGTACTGAGGGGATTCCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAATGAACTGAGCAATCTTGCAAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGAGACGTGGTGTTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>KP097844.1 +ATGGAGAGAATAAAAGAATTAAAAGAGCTAATGTCAGAGTCCCGCACTCGCGAGATACTAACAAAAAGCACTGTGGACCCCCTTTTAATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTCTCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCGGACAAGAGAATAATAGAGATGGTTCCTGAAAGGAATGAACAAGGGCAAACGCTCTGGAGCAAGACAAATGACGCTGGATCGGACAGGGTGATGGTGTCTCCCCTAGCTGTGACTTGGTGGAATAGGAATGGGCCGACTTCAAACGCAGTCCATTACCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTACGGTCCCGTTCATTTTCGGAACCAAGTTAAAATACGCCGCCGAGTTGATATAAATCCTGGCCATGCACATCTCACTTTTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCGAATGAAGTAGGAGCTAAAATATTGACATCAGAGTCGCAATTGACAATAACGAAAGAGAAGAAAGAAGAGCTCCAAAATTGTAAGATTGCTCCCTTAATGGTTGCATACATGTTGGAAAGGGAACTGGTCCGCAAAACCAGATTCCTACCGGTAGCAGGCGGGACAAGCAGCGTGTACATTGAGGTATTGCATTTGACTCAAGGGACCTGCTGGGAACAGATGTACACTCCAGGCGGAAAAGTGAGAAATGACGATGTTGACCAGAGTTTGATCATCGCTGCCAGAAACATTGTTAGGAGAGCAACGGTATCAGCGGATCCACTGGCATCATTGCTGGAGATGTGTCACAGCACACAGATCGGTGGGATAAGGATGGTGGACATTCTTAGACAAAATCCAACTGAGGAACAAGCTGTGGATATATGCAGAGCAGCAATGGGTCTGAGGATCAGTTCATCCTTTAGCTTTGGAGGCTTCACCTTCAAAAGAACAAGTGGATCATCTGTCACAAAGGAAGAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAATAAGAGTACATGAGGGGTATGAGGAATTCACAATGGTTGGGCGGAGGGCAACAGCTATCCTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGTGGAAGGGACGAACAATCAATCGCTGAGGCAATCATTGTAGCAATGGTGCTCTCCCAGGAGGATTGCATGATAAAGGCAGTCCGAGGCGATCTGAATTTCGTAAACAGAGCAAACCAAAGATTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAAGTGCTATTTCAGAATTGGGGAATTGAACCCATTGATAATATCATGGGGATGATCGGAATATTACCTGACATGACTCCCAGCACAGAAATGTCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTGGATGAATATTCCAGCACTGAGAGAGTAGTTGCAAGTATTGACCGTTTCTTAAGGGTTCGAGATCAGCGGGGGAACATACTCTTATCTCCCGAAGAGGTCAGCGAGACCCAGGGAACAGAGAAATTGACAATAACATATTCATCGTCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTATCAATGGATCATCAGAAACTGGGAGACTGTGAAGATTCAATGGTCTCAAGACCCC
ACGATGCTGTACAATAAGATGGAGTTTGAACCGTTCCAATCCTTGGTACCTAAAGCTTCCAGATGCCAATACAGTGGATTTGTGAGAACATTATTCCAACAAATGCGTGACGTACTGGGGACATTTGACACTGTCCAGATAATAAAGCTGCTACCATTTGCAGCAGCCCCACCGGAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTGTTCAACTACAATAAGGCAACCAAAAGGCTTACCATTCTTGGAAAGGACGCAGGTGCATTAACAGAGGATCCAGATGAGGGGACAGCCGGAGTAGAATCTGCAGTACTGAGGGGATTCCTAATTCTAGGCAAGGAGGACAAAAGATATGGACCAGCATTGAGCATCAGTGAACTGAGCAATCTTGCGAAAGGGGAGAAAGCTAATGTGCTGATAGGGCAAGGGGACGTGGTGCTGGTAATGAAACGGAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATTAATTAG +>AB675549.1 +TGGTGGGATAAGGATGGTGGACATCCTTAGACAGAACCCAACTGAGGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGTCTGAGGATCAGCTCATCCTTTAGTTTTGGAGGTTTCACTTTCAAAAGAACAAGTGGGTCATCCGTTACGAAGGAAGAAGAAGTGCTTACGGGCAACCTCCAAACACTGAAAATAAAAGTACATGAGGGGTATGAAGAATTCACAATGGTTGGGCAGAGGGCAACAGCTATCTTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGCGGACGAAATGAACAATCAATCGCTGAGGCAATTATTGTAGCGATGGTGTTCTCACAAGAGGATTGCATGATAAAGGCAGTCCGAGGCGATCTAAATTTCGTAAACAGGGCAAACCAAAGACTAAACCCCATGCATCAACTCCTGAGACATTTTCAAAAGGACGCAAAAGTGCTATTTCAAAATTGGGGAACTGAACCCATTGATAATGTCATGGGGATGATCGGGATATTACCTGACATGACTCCCAGCACAGAACTGTCACTGAGAGGAGTAAGAGTTAGTAAAATGGGAGTAGATGAATATTCCAGCACTGAAAGAGTAGTTGTAAGCATTGACCGCTTCTTAAGGGTTCGAGATCAGCGGGGGAATGTACTCTTATCTCCCGAAGAGGTCAGTGAAACCCAGGGAACAGAGAAGTTGACAATAACATATTCGTCATCAATGATGTGGGAGATCAACGGTCCTGAGTCAGTGCTTGTCAACACCTATCAATGGATCATCAGAAACTGGGAAACCGTGAAGATACAATGGTCTCAGGATCCCACGATGCTATACAATAAGATGGAGTTCGAACCGTTCCAATCCTTGGTACCTAAAGCTACCAGAGGTCAATACAGTGGATTTGTGAGAACGTTATTCCAACAAATGCGTGACGTACTGGGGACATTTGATACTGCCCAGATAATAAAGCTGCTACCATTTGCAGCAGCACCACCTGAGCAGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTAAGGGGCAATTCCCCTGTTTTCAACTACAATAAGGCAACCAAAAGGCTTACCGTTCTTGGAAAGGATGCAGGTGCATTAACAGAGGATCCAGACGAGGGGACAGCCGGAGTGGAATCTGCAGTACTGAGGGGA diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/genome_annotation.gff3 b/data/community/genspectrum/iav/h5n1/GG1996/PB2/genome_annotation.gff3 new file mode 100644 index 
000000000..90d9b4aa4 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/genome_annotation.gff3 @@ -0,0 +1 @@ +. . CDS 28 2307 . + . gene="PB2" diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/pathogen.json b/data/community/genspectrum/iav/h5n1/GG1996/PB2/pathogen.json new file mode 100644 index 000000000..f0cee110b --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/pathogen.json @@ -0,0 +1,19 @@ +{ + "schemaVersion": "3.0.0", + "alignmentParams": { + "minSeedCover": 0.01 + }, + "attributes": { + "name": "Influenza A/H5N1 (segment 1/PB2)", + "reference name": "Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) polymerase (PB2) gene, complete cds", + "reference accession": "NC_007357.1" + }, + "files": { + "reference": "reference.fasta", + "changelog": "CHANGELOG.md", + "pathogenJson": "pathogen.json", + "genomeAnnotation": "genome_annotation.gff3", + "readme": "README.md", + "examples": "examples.fasta" + } +} diff --git a/data/community/genspectrum/iav/h5n1/GG1996/PB2/reference.fasta b/data/community/genspectrum/iav/h5n1/GG1996/PB2/reference.fasta new file mode 100644 index 000000000..765e6c938 --- /dev/null +++ b/data/community/genspectrum/iav/h5n1/GG1996/PB2/reference.fasta @@ -0,0 +1,35 @@ +>NC_007357.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) polymerase (PB2) gene, complete cds +AGCAAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAACTAAGAGATCTAATGTCGCAGTCCC +GCACTCGCGAGATACTAACAAAAACCACTGTGGATCATATGGCCATAATCAAGAAATACACATCAGGAAG +ACAAGAGAAGAACCCTGCTCTCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAG +AGAATAATGGAGATGATTCCTGAAAGGAATGAGCAAGGACAAACGCTTTGGAGCAAGACAAATGATGCTG +GGTCGGACAGAGTGATGGTGTCTCCCCTAGCTGTAACTTGGTGGAACAGGAATGGGCCGACAACAAGTAC +AGTCCATTATCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGTTAAAACATGGAACCTTCGGT +CCCGTTCATTTCCGAAACCAAGTTAAAATACGTCGCCGGGTGGATATAAACCCGGGCCATGCAGATCTCA +GTGCTAAAGAAGCACAAGATGTTATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGAC +ATCAGAGTCGCAATTGACAATAACAAAAGAGAAGAAAGAAGAGCTCCAGGATTGTAAAATTGCTCCTTTA 
+ATGGTGGCATACATGTTGGAAAGAGAACTGGTCCGCAAAACCAGATTTCTACCGGTAGCAGGCGGAACAA +GCAGTGTGTACATTGAGGTATTGCATTTGACTCAAGGGACCTGTTGGGAACAGATGTACACTCCCGGCGG +AGAAGTAAGAAATGATGATGTTGACCAGAGTTTGATCATCGCTGCCAGAAACATTGTTAGGAGAGCAACA +GTATCAGCGGACCCACTGGCATCACTCTTGGAGATGTGTCACAGCACACAAATTGGGGGAATAAGGATGG +TGGACATCCTTAGGCAAAACCCAACTGAGGAGCAAGCTGTGGATATATGCAAAGCAGCAATGGGTTTGAG +GATCAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAATGGATCATCCGTCAAGAAGGAA +GAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAATAAAAGTACATGAGGGGTATGAAGAATTCACAA +TGGTTGGGCGGAGAGCAACAGCTATCCTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGTGG +AAGAGATGAACAATCAATCGCTGAAGCGATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATA +AAGGCAGTCCGAGGCGATCTGAATTTCGTGAACAGAGCAAACCAAAGATTGAACCCCATGCATCAACTCC +TGAGGCACTTCCAAAAAGATGCAAAAGTGCTGTTTCAGAACTGGGGAATTGAACCTATTGACAATGTCAT +GGGGATGATCGGAATATTACCTGACATGACTCCAAGCGCAGAGATGTCACTGAGAGGAGTGAGAGTTAGT +AAGATGGGAGTAGATGAATATTCCAGCACGGAGAGAGTGGTGGTGAGTATTGACCGTTTCTTGAGGGTCC +GAGATCAGCAGGGGAACGTACTCTTATCTCCTGAAGAGGTTAGTGAAACACAGGGAACAGAGAAGTTGAC +AATAACATATTCATCCTCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTATCAA +TGGATCATCAGGAATTGGGAGACTGTAAAGATTCAATGGTCTCAAGATCCCACAATGCTGTACAATAAGA +TGGAGTTTGAATCGTTCCAATCCTTGGTGCCAAAGGCTGCCAGAAGCCAATATAGTGGATTTGTGAGAAC +ACTATTCCAACAGATGCGTGATGTTTTGGGGACATTTGATACTGTCCAAATAATCAAGCTGCTACCATTT +GCAGCAGCCCCACCGGAGCCGAGCAGAATGCAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAA +TGAGAATACTCGTGAGGGGTAACTCCCCCGTGTTCAACTACAACAAGGCAACCAAAAGGCTTACAGTCCT +CGGAAAGGACGCAGGTGCATTAACAGAAGATCCAGACGAGGGAACAGCCGGGGTGGAATCTGCAGTATTG +AGGGGATTCCTAATTCTAGGCAGAGAGGACAAAAGATATGGACCCGCATTGAGCATCAATGAACTGAGCA +ATCTTGCAAAAGGGGAGAAGGCTAATGTATTGATAATGCAAGGAGACGTGGTGTTGGTAATGAAACGGAA +ACGGGACTTTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGT +TGAATAGTTTAAAAACGACCTTGTTTCTACT