From 812571340fc00e0fe3d419ec6a5fea13c970f9a6 Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Mon, 11 Feb 2019 03:42:42 +0900 Subject: [PATCH 01/12] tests --- alignmentrs_imports.py | 9 + test_alignment.txt | 132 +++++++++++++ test_alignment_0_8.py | 413 +++++++++++++++++++++++++++++++++++++++++ 3 files changed, 554 insertions(+) create mode 100644 alignmentrs_imports.py create mode 100644 test_alignment.txt create mode 100644 test_alignment_0_8.py diff --git a/alignmentrs_imports.py b/alignmentrs_imports.py new file mode 100644 index 0000000..1b82b75 --- /dev/null +++ b/alignmentrs_imports.py @@ -0,0 +1,9 @@ +import sys +sys.path.append('../') +from os import getcwd +from numpy import matrix, array, array_equal +import nose +import random +from classes import * +from funcs import * +from alignmentrs_test_funcs import * \ No newline at end of file diff --git a/test_alignment.txt b/test_alignment.txt new file mode 100644 index 0000000..e26dc19 --- /dev/null +++ b/test_alignment.txt @@ -0,0 +1,132 @@ +>marker_0 |91 sp| 
+CCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
CCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCNNNNNNNNN +>Dmel_528_2597 |10 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCTAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTTACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACAAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG2 |47 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTCCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGCAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG3 |22 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG4N |15 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAACAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCNCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- +>Dmel_RG5 |45 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTNACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGACGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG7 |32 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAACAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- +>Dmel_RG9 |108 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCTGTCGGTCAATTGGTTACAGCCTTCTGCATTTTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAACCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG18N |8 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAGGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGNGTNTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGAAAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG19 |54 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG22 |6 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGANGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG24 |43 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCATCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG25 |71 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTAGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGAAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGACCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG28 |74 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTCCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGCAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG32N |56 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGTCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTAAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG33 |64 sp| 
+ATGAAGAGCAAGGTAGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTNAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGNCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGNGGNGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGANNNNTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTNCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTNCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAACTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGNCACCGCTTTGATTCCGCANCTTGAGCACGGTAACCTAGAACNGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTNAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAGGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTNNNNNTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCNTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG34 |58 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGNCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGACGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_RG36 |128 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTAGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATTGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- +>Dmel_RG38N |27 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGGAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTAGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGGCAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dmel_FBtr0070119 |30 sp| 
+ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCTAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTTACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACAAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- +>Dsim_ref2 |106 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGATGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGGAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCCCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD03 |0 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTACCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD06 |87 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD105 |108 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGTCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTATAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD106 |118 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCGGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD146 |57 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD15 |77 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTGACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTATCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACCTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD197 |86 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD199 |87 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTATCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD201 |47 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGAGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD221 |76 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD224 |103 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCTCCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD225 |0 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGACAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD233 |45 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCGGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD235 |4 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGACCAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD238 |83 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD243 |100 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACAGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAAATGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD251 |39 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD255 |95 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD63 |81 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD72 |130 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCGGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_MD73 |112 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS05 |55 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS11 |6 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTACTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS111 |107 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS113 |129 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS116 |73 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGAGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS137 |2 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS19 |95 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS33 |50 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTATGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS37 |115 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS39 |121 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS40 |2 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCAAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS49 |45 sp| 
+ATGAAAAGCAAGGGGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS50 |95 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGTGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS63 |23 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS64 |20 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS67 |16 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS78 |93 sp| 
+ATGAAAAGCAAGGGGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS79 |52 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS89 |128 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS95 |25 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGNNNNNNNNNATGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTAGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dsim_NS96 |98 sp| 
+ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- +>Dyak_528_2597 |32 sp| 
+ATGAAGAGCAAAGTGGACAAACCCATAACCAATGGTGCACCCGCCAAGACAAAGACC------AAGGAGGAGCGCAAACGGACGAAATCCCTGAAATCCGACGCGGACACCGAGATACCGGCCAAGATTTCCAAGGTGTCCAAGACCAAGAAGGAGAAGCCGAAGCCATCGGAGGCCGAGGAAAAGGAGAACACCGCAAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAAGCCGTGTTTGTGGTTTTCAAGAAGTTGCAGGGCAGCCAGCTGACCAAGAAGATGATCAATTCCCTTATAACGCTGCTGCGCGACGACACAAATGCGGAGCAGCGCGCTGCGACCATCTGCTACGTGCTCAAACGCTTGATCCGCTCCACAGGCGCAGATGACATGAAGGCGGTGGGCCTGGCCGCCAGTTATATACACTGCATCCTAGCCGCCGTGCCCGCCATTGACGCACTTGAGGTTCTGGACACTCTAAAGCGCGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGATAACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTTCGGCGGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGCGGCGATATCCTAGCGGACTCCTTCAAACAGCTGCCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGCTGAGTGGCTTGAAAGTCAACACCTGCGATGTCTTGCTGGCCGTGCACCTGACCTATTCGTCCGTGCTGGGACGGGAGAACATTCTGGCCAGCTTGTGGCCCAAGAAACCGGTGTACACGCAGCTTTTCGATCTGTACTTCGCCGGCTCCACCATTCACAGTGATGGCGTGTACGCCAGATTGGCTATTTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGCAGCAGTACATCGCTTCCAAGCAGCCACTGAAACTAAACGCAGCCAAGGCGTGTGCGATCCAAGTGCTGAGTCACATACTCCTCAACTTTAAGCCAGCGGACGAAGAACTCATCCTGGATATTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGCTCTGCTGTAAAATGGGACAAAGCTGAGGCCAAGAAGCCGTCCCAAAAGAAGCTGAGGGAGATTTGCTTCAAGTTCGAGGCCTCCTTGGTGCTATGTTTCGAAAAGCAGTTCCAAAACGATGAAAGCAAGCTTCAGCTGCTGCTCAAACTGCTGGACCACACACTGCAGTTGGACTCGGTGATTTGCTTGCCGCGCTTCTGCCAGCAACTGATAGGTCAGTTGAGCGTCGAGAGCCTCCAGAAGCTGTACGACTTCTACAACAACAAGCTGTACTCGTTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTCAACCAGATGCAGGTTATACTGCACCACCCAACGCTCAGCCAGGCAACCAAATGGCGTCAGAAGCAGCTGAACTACTTGCTGCTCGCTGGCCTTTTCCACGTAGATGCCAGTAAGAAGCCGTGCGAGGCCTCCAAAGCCAGCGCGTTCAGTCGCCAGTGCTCGGCGCGTTGCGAGGAGATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACACTGAGTTACCTTAACAAGGAGTTGGGACAACCGGATGCAGAAAACAAGCTGCGTTCGCCGAGGGATGAGTCACTGCAGAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGAAGCCCAGCGAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTGTCGTTGGCTTTGTGCACGAAGATTCCCCTGTCCGTCACCGTGCTGGACGATCTGATTATCTGCCGCAAGAACGCACTGCAAAAGAGCAAGAAACAGGTCAACGAAG
AGCTCCAATGGCAGGATGTGCTCACGGATGCCCTGCTCCAGTTACTCCTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCATCTGGTGGCCACCGCTCTGATTCCCCACCTCGAGCATGGTAACCTCGAACAGGTCCTCGAAGTGCTCAATATGAACAGGAATCCCCTGAGCAAGAAGGACGAGGGCGAGGAGGAGGAGGAGAGCGACGAGGAAGTCGAGGGGGAAGAATCGCCGAAAGATTCGAGCGACGACTCA---GACGGCGATGAAGATGAAGACGAAGATGGAGAGGACGAGGACGATGAGGAGTCCCATTTGGCCCAGATCCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGACGATGATGGCGCCAGCAGCGTGGACTGGAACGATGTTGGCGAGGAGCAGGGTGAACGCCTGAATGCTGCTCTGGAGCGATCCTTCCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAGCGCATTGACAACACCAACCTGCTGCACTTCCGCATTCGCGCCTTGGATTTGTTGGAGCTGTTCATAAGCAAGAAACCAACTCAGTCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCACTGTAGCGGCGACAGCAAGCTGCAATCCCTGCGAGAAGCCAGCTTGAAGTTGCTTAAGAAGATACTCGCCAAGAATATTGAACTCAACGAGCAGCAGAGTAACGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCACCAACCGACAGGCCAAAGGAGACATCATTGTTTGGCGAGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAATAGCACCGTGTGGCCTCTGCTGGTCGAGTTCCTGGAGCTGTGGGTAGCCAAGCGTCGCAGTCGCCTCTCCCTGGCGAGTTTCGAAGCCCTCTTTCAGTCTGCCCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGTCCTGGCCTCCCATTTGGACGTGAAGAAAACACGCAGTTTTCGGCGAGCCCAGATATTGAAGCTTCTCAGTGAGCAGTGCCGCCGACTCGAGTCCGCTTTCAAGGACAACAGCTCGTCTGCCAAGGAGTTTGAGAAGCAGATAGCACGATATGTGAACCAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAGGCCAGAAGCGGCAGAAACTGCGCGAAAAGATCCAACTCGTCGCTAAGAACCTTCAGCCCACCAAGAAGGCGACGAAGCAGAAGGAGCAGGCAGCCGCCGAACCCACAGAACCCATGGATGTGGAAGATGAGGAGCAGGCCACA +>Dyak_FBgn0234128 |108 sp| 
+ATGAAGAGCAAAGTGGACAAACCCATAACCAATGGTGCACCCGCCAAGACAAAGACC------AAGGAGGAGCGCAAACGGACGAAATCCCTGAAATCCGACGCGGACACCGAGATACCGGCCAAGATTTCCAAGGTGTCCAAGACCAAGAAGGAGAAGCCGAAGCCATCGGAGGCCGAGGAAAAGGAGAACACCGCAAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAAGCCGTGTTTGTGGTTTTCAAGAAGTTGCAGGGCAGCCAGCTGACCAAGAAGATGATCAATTCCCTTATAACGCTGCTGCGCGACGACACAAATGCGGAGCAGCGCGCTGCGACCATCTGCTACGTGCTCAAACGCTTGATCCGCTCCACAGGCGCAGATGACATGAAGGCGGTGGGCCTGGCCGCCAGTTATATACACTGCATCCTAGCCGCCGTGCCCGCCATTGACGCACTTGAGGTTCTGGACACTCTAAAGCGCGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGATAACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTTCGGCGGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGCGGCGATATCCTAGCGGACTCCTTCAAACAGCTGCCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGCTGAGTGGCTTGAAAGTCAACACCTGCGATGTCTTGCTGGCCGTGCACCTGACCTATTCGTCCGTGCTGGGACGGGAGAACATTCTGGCCAGCTTGTGGCCCAAGAAACCGGTGTACACGCAGCTTTTCGATCTGTACTTCGCCGGCTCCACCATTCACAGTGATGGCGTGTACGCCAGATTGGCTATTTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGCAGCAGTACATCGCTTCCAAGCAGCCACTGAAACTAAACGCAGCCAAGGCGTGTGCGATCCAAGTGCTGAGTCACATACTCCTCAACTTTAAGCCAGCGGACGAAGAACTCATCCTGGATATTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGCTCTGCTGTAAAATGGGACAAAGCTGAGGCCAAGAAGCCGTCCCAAAAGAAGCTGAGGGAGATTTGCTTCAAGTTCGAGGCCTCCTTGGTGCTATGTTTCGAAAAGCAGTTCCAAAACGATGAAAGCAAGCTTCAGCTGCTGCTCAAACTGCTGGACCACACACTGCAGTTGGACTCGGTGATTTGCTTGCCGCGCTTCTGCCAGCAACTGATAGGTCAGTTGAGCGTCGAGAGCCTCCAGAAGCTGTACGACTTCTACAACAACAAGCTGTACTCGTTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTCAACCAGATGCAGGTTATACTGCACCACCCAACGCTCAGCCAGGCAACCAAATGGCGTCAGAAGCAGCTGAACTACTTGCTGCTCGCTGGCCTTTTCCACGTAGATGCCAGTAAGAAGCCGTGCGAGGCCTCCAAAGCCAGCGCGTTCAGTCGCCAGTGCTCGGCGCGTTGCGAGGAGATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACACTGAGTTACCTTAACAAGGAGTTGGGACAACCGGATGCAGAAAACAAGCTGCGTTCGCCGAGGGATGAGTCACTGCAGAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGAAGCCCAGCGAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTGTCGTTGGCTTTGTGCACGAAGATTCCCCTGTCCGTCACCGTGCTGGACGATCTGATTATCTGCCGCAAGAACGCACTGCAAAAGAGCAAGAAACAGGTCAACGAAG
AGCTCCAATGGCAGGATGTGCTCACGGATGCCCTGCTCCAGTTACTCCTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCATCTGGTGGCCACCGCTCTGATTCCCCACCTCGAGCATGGTAACCTCGAACAGGTCCTCGAAGTGCTCAATATGAACAGGAATCCCCTGAGCAAGAAGGACGAGGGCGAGGAGGAGGAGGAGAGCGACGAGGAAGTCGAGGGGGAAGAATCGCCGAAAGATTCGAGCGACGACTCA---GACGGCGATGAAGATGAAGACGAAGATGGAGAGGACGAGGACGATGAGGAGTCCCATTTGGCCCAGATCCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGACGATGATGGCGCCAGCAGCGTGGACTGGAACGATGTTGGCGAGGAGCAGGGTGAACGCCTGAATGCTGCTCTGGAGCGATCCTTCCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAGCGCATTGACAACACCAACCTGCTGCACTTCCGCATTCGCGCCTTGGATTTGTTGGAGCTGTTCATAAGCAAGAAACCAACTCAGTCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCACTGTAGCGGCGACAGCAAGCTGCAATCCCTGCGAGAAGCCAGCTTGAAGTTGCTTAAGAAGATACTCGCCAAGAATATTGAACTCAACGAGCAGCAGAGTAACGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCACCAACCGACAGGCCAAAGGAGACATCATTGTTTGGCGAGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAATAGCACCGTGTGGCCTCTGCTGGTCGAGTTCCTGGAGCTGTGGGTAGCCAAGCGTCGCAGTCGCCTCTCCCTGGCGAGTTTCGAAGCCCTCTTTCAGTCTGCCCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGTCCTGGCCTCCCATTTGGACGTGAAGAAAACACGCAGTTTTCGGCGAGCCCAGATATTGAAGCTTCTCAGTGAGCAGTGCCGCCGACTCGAGTCCGCTTTCAAGGACAACAGCTCGTCTGCCAAGGAGTTTGAGAAGCAGATAGCACGATATGTGAACCAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAGGCCAGAAGCGGCAGAAACTGCGCGAAAAGATCCAACTCGTCGCTAAGAACCTTCAGCCCACCAAGAAGGCGACGAAGCAGAAGGAGCAGGCAGCCGCCGAACCCACAGAACCCATGGATGTGGAAGATGAGGAGCAGGCCACA +>Dere_528_2597 |50 sp| 
+ATGAAGAGCAAAGTGGACAAAGCCATGACCAATGGTGCACCCGCCATGACAAAAACC------AAGGAGGACCGCAAACGGACAAAATCCCTGAAATCGAATGCGGACACGGGGGGACCGGCCAAGATTGCGCGGGTGTCCAAG------CAGGAGAAGCCAAAGCCATCGGAAACCGATGAGAAGGAAAACACGGCGAGCAACGGGAACCTGAAGATGTCGCAAATCAACAAAGCCGTGTTTGTGGTCTTCAAGAAGATGCAGGGCAGTCAACTAACCAAGAAGATGATCAATTCCCTCGTAACGCTGCTACGCGACGACACAAATGCTGAACAGCGTACTGCGACCACTTGTTACGTGCTCAAGCGCTTGATCCGCTCCACAGGTGCAGATGACATGAATGCGGTCGTCCTGGCCGCCAGTTATATACACTGCATCCTAACCGCCGTGCCCGCCATTGACGCATTTGAGGTTCTGGAGACGCTAAAGCGAGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGGTTACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCGGAGCCCAAGCTGGTAACGGCAGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGTGGCGATATCCTAGCAGACTCCTTCAAACAGCTACCTGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGTTAAACAAGCCCCTGAGTGGCTTGAAAGTAAACACCTGCGATGTTTTGCTGGCCGTGCACTTGACCTATTCGTCCGTACTGGGACGGGCGGACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTCTTCGATCTGTATTTCTCCGGCTCCACCATTCACAGTGATGGCGTATACACTAGATTGGCTATCTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGGAGCAGTACATCGCTTCCAAGCAGCCACTAAAAGTAAATGCAGCCAAGGCGTGTGCGATCCAAGTACTGAGCCACGTTCTCCTCAACTTTAAGCCAACGGAAGAGCAGCTCATCCTGGATGTTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGTTCATCTGTAAAATGGGATAAAGGTGAGGCCAAGAAACCCTCCCAAAAGAAGCTGAGGGAGATTTGCTTTAAGTTCGAGGCATCCTTGGTTTTATGTTTCGAAAATCAGTTCCAAAACGATTATATCAAGCTTCAGCTGCTGCTCAAATTACTGGACCACACATTGCAGTTGGACTCGGTGATTAGCTTGCCGCGCTTCTGCCAGCAGCTAATAAATCAATTGAGCGTCGAGAGTCTCCAGAAGCTGTACGATTTCTACAACAATAAATTGTACTCATTGGAGGATGAGGATAGAGTCAGCCGAGTGCACTGCCTGAACCAGATGCAGTTGATACTGCACCATTCAGCGCTTAGCCAGGCAACCAAATGGCGTCAGAAGCAATTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGCGAAGCCTCAAAAGCCAGCGCTTTCAGTCGCCAGTGTTCGGCGCGTTGTGAGGAAATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTACTGCAGAAGACGTTGAGTTATCTTAACAAAGAGTTGGCACAGGCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCTCTGCAGAAAGCATGGAAACAGGTCGAGAAACTGCTGGCAAAGCCCAGCCAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTTTCTTTGGCTTTGTGCGCAAAGATTCCCCTATCCGTCACCGTGTTGGATGATCTGATTATCTGCCGTAAAAACGCACTGCAAAAGAGCAAGAAACAGGATAACGAAG
AGCTCCAATGGCAGGATGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGTGAGTTTGTCCATCTGGTGGCCACCGCTTTGATTCCCCACCTCGAGCACGGTAACCTCGAACAGGTCCTCGAAGTGCTCAACATGAACAGAAATCCTTTGAGCAAGAAGGATGAGGGC------GAGGAGGAGAGCGACGAGGAAATCGAGGAGGAGGAATCGTTGAAAGATTCGAGCGATGACTCG---GACGGCGATGAAGATGAAGAGGAG------GAGGACGAGAACGATGAGGAGTCCCATTTGGCCCAGATTCGAGAAAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGATGACGACGGCGCCAGCAGCGTGGACTGGAACGATGTTGACGAGGAGCAGGGTGAACGCCTAAATGCTGCTTTGGAGCGCTCTTTTCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTGTTCATAACCAAGAAACCAACTCAGTCGGTTATCCTGGACGTGCTGCATTGCGTTTTCCAGGTGTACCGCCATTGCAGCGGAGATAGCAAACTGCAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTTAAAAAGATACTCGCCAGAAACATTGAACTCCAGGAAAATCAGAGTAACGCACCCATTCTGGGAGCCATTGAGCAGTTGATGTCGTCTGGCGAGGAGCATTCAGAAGAAGACCAGGAGAATAGCAAGCAACCCGCCAACCGACAGGCCAAAGCAGACATCATAGTTTGGCGAGATAAGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGGTGGCGAGCCCAAGAATAGCACCGTATGGCCTCTTCTGGTGGAATTCCTGGAGCTGTGGGTAGCCAAACGTCGTAGTCGCCTATCTCTGGCTAGTTTCGAGGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGCCCTGGCCTCCCATTTGGACGTGAAAAAAACACGCAGTTTTCGGCGGGCACAGATATTGAAGCTTCTCAGTGAGCAATGTCGCCGACTCGAATCCGCCTTTAAGGACAACAGCTCGTCTTCCAAGGAGTTTGAGAAACAGATAGCCAGATATGTGAATGAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAAACCAGAAGAGGCAGAAACTGCGTGAAAAGATCCAAATCGTCGCTAAAAGTCTTCAGCCCACCAAGAAGGCGATGAAG---------CAGGCAGCCGCT---------GAACCCATGGTTGTGGAAGATGAGGAGCACGTCACA \ No newline at end of file diff --git a/test_alignment_0_8.py b/test_alignment_0_8.py new file mode 100644 index 0000000..991494d --- /dev/null +++ b/test_alignment_0_8.py @@ -0,0 +1,413 @@ +#! /usr/env/bin/ Python3 +from alignmentrs_imports import * +# TODO - check valid ids, check invalid ids, + # check mixed type input (list, int, str) + # check invalid type + # check invalid optional arg. 
input +#---------------------------------------------------- +class TestAlignment: + """This is a TestClass for alignmentrs v0.8 library + + test type: nosetests + input file name: test_alignment.txt This is an + alignment text file + + strategy + -------- + - created dictionary from test file + dict.keys = sample ids, dict.values = [sample_description, sample_sequence] + this enables comparisons between dict items + (expected outputs) and alignentrs output + + tests applied + ------------- + tests for expected output for valid input #(EVI) + tests for output type (EOT) + tests for expected errors (EE)""" + + # basic test for expected outputs + def setup(self): + # initiates alignment object for tests + self.aln_file = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') + self.test_aln_file = fasta_to_dict('test_alignment.txt') # for test_dict + #for methods that exclude marker sequence + self.test_aln_file_wo_marker = fasta_to_dict('test_alignment.txt') + del self.test_aln_file_wo_marker['marker_0'] + + def teardown(self): + pass +#---------------------------------------------------- + def test_nrows(self): + """checks if algn_obj.nrow returns expected type + and number of rows in alignment. + compares number of keys in test_dict(sample_ids) + against algn_obj.nrow output. + + pass if: + algn_obj.nrow returns int and matches + len(dict.keys)""" + + nrows = self.aln_file.nrows + test_nrows = len(list(row for row in self.test_aln_file.keys())) #checks number of ids in dict.keys + + assert isinstance(nrows,int) #(EOT) + assert nrows == test_nrows +#---------------------------------------------------- + def test_nsamples(self): + """checks if algn_obj.nsamples returns expected type + and number of samples in alignment. + compares algn_obj.nsamples against len(dict.items). 
+ + pass if: + algn_obj.nrow returns int and matches + len(dict.items)""" + + nsamples = self.aln_file.nsamples + test_nsamples = len(list(sample for sample in \ + self.test_aln_file_wo_marker.items())) + + assert isinstance(nsamples,int) #(EOT) + assert nsamples == test_nsamples +#---------------------------------------------------- + def test_nmarkers(self): + """checks if algn_obj.nmarkers returns expected + output type and number of markers in alignment. + compares number of markers in algn_obj. against + number of test_dict keys with 'marker' keyword + + pass if: + output is int + number of markers in aln.obj == number of markers + in test_dict""" + + nmarkers = self.aln_file.nmarkers + test_nmarkers = len(list(sample for sample in self.test_aln_file.items() \ + if 'marker' in sample[0])) + + assert isinstance(nmarkers, int) + assert nmarkers == test_nmarkers +#---------------------------------------------------- + def test_nsites(self): + """checks if algn_obj.nsites returns expected + output type and number of sites in alignment. + compares number of sites in algn_obj. against + sequence length of a random key in test_dict. + *note: assumes all samples have same len + + pass if: + output is int + number of sites in aln.obj == sequence length + of any test_dict.key()""" + + nsites = self.aln_file.nsites + # extracts random test_dict id to use for seq len + random_seq_id = random.choice(list(self.test_aln_file.keys())) + random_seq_len = self.test_aln_file[random_seq_id][1] + test_nsites = len(random_seq_len) + + assert isinstance(nsites, int) + assert nsites == test_nsites +#---------------------------------------------------- + def test_sample_ids(self): + """checks if all sample ids in align.obj matches + ids in test_dictr. 
checks if method returns + expected type: (list) + pass if: + sample_ids in align.obj matches keys in test_dict""" + sample_ids = self.aln_file.sample_ids + test_sample_ids = list(sample_id for sample_id in \ + self.test_aln_file.keys() if not 'marker' in sample_id) + + assert isinstance(sample_ids,list) + assert sample_ids == test_sample_ids +#---------------------------------------------------- + def test_sample_descriptions(self): + """checks if descriptions in align.obj match descriptions + in test_dict. checks if expected type is returned + pass if: + expected type : list + descriptions in align.obj matches descriptions + in test_dict.""" + + sample_descriptions = self.aln_file.sample_descriptions + # description is first index pos in test_dict.values + test_descriptions = list(self.test_aln_file[desc][0] for desc in \ + self.test_aln_file.keys() if 'marker' not in desc) + + assert isinstance(sample_descriptions,list) + assert sample_descriptions == test_descriptions +#---------------------------------------------------- + def test_sample_sequences(self): + """checks if sequences in align.obj match sequences + in test_dict. checks if expected type is returned + pass if: + expected type : list + sequences in align.obj matches sequences + in test_dict.""" + + sample_sequences = self.aln_file.sample_sequences + # sequence is second index pos in test_dict.values + test_sample_sequences = list(self.test_aln_file[sample_id][1] for sample_id in \ + self.test_aln_file.keys() if not 'marker' in sample_id) + + assert isinstance(sample_sequences,list) + assert sample_sequences == test_sample_sequences +#---------------------------------------------------- + def test_marker_ids(self): + """checks if marker_ids in align.obj match marker_ids + in test_dict. 
checks if expected type is returned + pass if: + expected type : list + marker_ids in align.obj matches marker_ids + in test_dict.""" + + marker_ids = self.aln_file.marker_ids + # marker ids are considered as any key that has 'marker keyword in test_dict' + test_marker_ids = list(marker_id for marker_id in \ + self.test_aln_file.keys() \ + if 'marker' in marker_id) + + assert isinstance(marker_ids,list) + assert marker_ids == test_marker_ids +#---------------------------------------------------- + def test_marker_descriptions(self): + """checks if marker_descriptions in align.obj and + test_dict match. checks if expected type is returned + pass if: + expected type : list + marker_descriptions in align.obj matches marker_descriptions + in test_dict.""" + + marker_descriptions = self.aln_file.marker_descriptions + test_marker_descriptions = list(self.test_aln_file[marker_desc][0] \ + for marker_desc in self.test_aln_file.keys() \ + if 'marker' in marker_desc) + + assert isinstance(marker_descriptions,list) + assert marker_descriptions == test_marker_descriptions +#---------------------------------------------------- + def test_marker_sequences(self): + """checks if marker_sequences in align.obj and + test_dict match. 
checks if expected type is returned + pass if: + expected type : list + marker_sequences in align.obj matches marker_sequences + in test_dict.""" + + marker_sequences = self.aln_file.marker_sequences + test_marker_sequences = list(self.test_aln_file[marker_id][1] \ + for marker_id in self.test_aln_file.keys() \ + if 'marker' in marker_id) + + assert isinstance(marker_sequences,list) + assert marker_sequences == test_marker_sequences +#---------------------------------------------------- + # class methods + + # Does not work properly + + #def test_subset(cls): + # """Returns a subset of the alignment by samples, markers and sites.""" + # sample_ids = [1,2,3] + # marker_ids = ['marker_0'] + # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') + + # subset = (aln_obj,sample_ids, marker_ids) + # test_subset = +#---------------------------------------------------- + def test_get_samples(self): + # TODO - check valid ids, check invalid ids, + # check mixed type input (list, int, str) + # check invalid type + # check invalid optional arg. 
input + + """Returns a list of sequence strings containing only the samples + specified by the index.""" + test_names = ['Dmel_RG4N', 'Dmel_RG7'] + get_samples = self.aln_file.get_samples(test_names) + + test_list = [] + #extracts expected sequences from test dictionary + for index in range(len(self.test_aln_file['Dmel_RG4N'][1])): + nuc1 = self.test_aln_file['Dmel_RG4N'][1][index] + nuc2 = self.test_aln_file['Dmel_RG7'][1][index] + test_list = test_list + [[nuc1,nuc2]] + + assert [sample for sample in get_samples] == test_list +#---------------------------------------------------- + # can't test yet becausse returns an object + #def test_get_markers(self, i, match_prefix=False, match_suffix=False): + #"""Returns a list of sequence strings containing only the markers + #specified by the index.""" + + # error with row and column posisiton + #def test_get_sites(self): + #"""Returns a new alignment containing only the sites specified + #by the given list of column numbers.""" +#---------------------------------------------------- + # Setter/Replacer + def test_replace_samples(self): + """Replaces the sequence for a given row in the alignment matrix.""" + new_sample = 'A' * 3432 + replace_sample = self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) + sample_sequences = self.aln_file.sample_sequences + + assert new_sample in sample_sequences +#---------------------------------------------------- + def test_insert_samples_from_lists(self): + """Inserts new sequences in the alignment matrix at the specifiedrow position inplace.""" + + new_sample_id = 'Dsim99201' + new_sample_desc = '|CH2912|' + new_sample_sequence = 'GCCGATGT' * 429 + self.aln_file.insert_samples_from_lists(1, [new_sample_id], [new_sample_desc], [new_sample_sequence]) + #assert self.aln_file.sample_sequences[1:2] == new_sample_sequence # error here + assert self.aln_file.sample_ids[1] == new_sample_id + assert self.aln_file.sample_descriptions[1] == new_sample_desc 
+#---------------------------------------------------- + def test_append_sample_from_lists(self): + """Inserts new sequences after the last row of the alignment matrix + inplace. This increases the total number of samples.""" + + new_sample_id = 'Dere_lastind' + new_sample_desc = '|last_ind|' + new_sample_sequence = 'GCCGAAAA' * 429 + self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) + assert self.aln_file.sample_sequences[-1] == new_sample_sequence + assert self.aln_file.sample_ids[-1] == new_sample_id + assert self.aln_file.sample_descriptions[-1] == new_sample_desc +#---------------------------------------------------- + def test_remove_samples(self): + """Removes sample sequences based on the given index.""" + index_to_remove = 1 + sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] + self.aln_file.remove_samples(index_to_remove) + assert sequence_to_remove != self.aln_file.sample_sequences[1] + + + def test_retain_samples(self): + """Keeps sample sequences based on the given index.""" + + self.aln_file.retain_samples([1,2,3,4,5]) + assert self.aln_file.nsamples == 5 + assert len(self.aln_file.sample_ids) == 5 + assert len(self.aln_file.sample_descriptions) == 5 + assert len(self.aln_file.sample_sequences) == 5 + assert self.aln_file.nmarkers == 1 + assert len(self.aln_file.marker_ids) == 1 + assert len(self.aln_file.marker_descriptions) == 1 + assert len(self.aln_file.marker_sequences) == 1 +#---------------------------------------------------- + def test_remove_sites(self): + """Removes sites based on the given list of column numbers.""" + self.aln_file.remove_sites([0,1,2]) + + assert self.aln_file.nsites == (3432-3) + #TODO- should assert to that the positions are not ATG once + # get samples sequences is fixes +#---------------------------------------------------- + def test_retain_sites(self): + """Keeps sites based on the given list of column numbers.""" + 
self.aln_file.retain_sites([0,1,2]) + assert self.aln_file.nsites == 3 + #TODO- should assert to that the positions are not ATG once + # get samples sequences is fixes +#---------------------------------------------------- + def test_from_fasta(cls): + """Create an Alignment object from a FASTA-formatted file.""" + aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') + assert aln_obj.nsites == 3432 + assert aln_obj.nsamples == 65 + assert aln_obj.nmarkers == 1 +#---------------------------------------------------- + # Format converters + # tested, remove hashtag when done + #def test_to_fasta(self): + """Saves the alignment as a FASTA-formatted text file.""" + #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file + #TODO- check if len(currentdir) increases by one, + #check if test_aln_file in dir + #use from_fasta to create new alingment object +#---------------------------------------------------- + def test_to_sample_matrix(self): + """Converts sequences into a numpy matrix.""" # is this matrix or array? 
+ seq_matrix = self.aln_file.to_sample_matrix() + test_seq_matrix = array([list(key[1]) for key in self.test_aln_file.values() if 'A' in key[1]]) # use key names + assert array_equal(seq_matrix, test_seq_matrix) +#---------------------------------------------------- + def test_to_marker_matrix(self, size=1): + """Converts sequences into a numpy matrix.""" + mseq_matrix = self.aln_file.to_marker_matrix() + test_mseq_matrix = array([list(self.test_aln_file[marker][1]) for marker in \ + self.test_aln_file.keys() if 'marker' in marker]) + assert array_equal(mseq_matrix, test_mseq_matrix) +#---------------------------------------------------- + # Iterators + def test_iter_sites(self): + """Iterates column-wise over the alignment""" + iter_seq = list(self.aln_file.iter_sites(0,1)) + + test_cols = [] + seqs = [] + for num in range(0,1): + for value in self.test_aln_file.values(): + seq = value[1] + #if not 'A' in seq: + #continue + seqs.append(seq[num]) + + test_cols.append(sorted(seqs)) + seqs = [] + + print(test_cols, iter_seq) + assert test_cols == iter_seq +#---------------------------------------------------- + def test_iter_sample_sites(self, start=0, stop=None, size=1): + """Iterates column-wise over the sample alignment. Excludes markers. """ + iter_seq = list(self.aln_file.iter_sample_sites(0,10)) + + test_cols = [] + seqs = [] + for num in range(0,10): + for value in self.test_aln_file_wo_marker.values(): + seq = value[1] + seqs.append(seq[num]) + + test_cols.append(seqs) + seqs = [] + + assert test_cols == iter_seq +#---------------------------------------------------- + def test_iter_marker_sites(self): + """Iterates column-wise over the marker alignment. Excludes samples. 
""" + iter_seq = list(self.aln_file.iter_marker_sites(0,10)) + + test_cols = [] + seqs = [] + for num in range(0,10): + for value in self.test_aln_file.values(): + + seq = value[1] + if set(seq) != {'C', 'N'}: + continue + seqs.append(seq[num]) + + test_cols.append(seqs) + seqs = [] + + assert test_cols == iter_seq +#---------------------------------------------------- + # How does this work? + + # Block-related methods + + #def test_set_blocklists(self, ref_seq, description_encoder=None): +# """Creates new block information for the sequences given a reference. """ +#---------------------------------------------------- + # def test_parse_description_as_blocks(self, description_decoder=None): +# """Parses sample description into block data.""" +#---------------------------------------------------- + # def test_write_blocks_to_description(self, description_encoder): +# """Writes each sample's block data as a string, replacing its + # description.""" +#---------------------------------------------------- \ No newline at end of file From fa4ce3e6d13130d619a1805cec4177d1d2ea78fb Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Tue, 12 Feb 2019 03:28:02 +0900 Subject: [PATCH 02/12] Add files via upload --- test_alignment_0_8_b.py | 330 ++++++++++++++++++++++++++++++++++++++++ test_alignment_b.txt | 8 + 2 files changed, 338 insertions(+) create mode 100644 test_alignment_0_8_b.py create mode 100644 test_alignment_b.txt diff --git a/test_alignment_0_8_b.py b/test_alignment_0_8_b.py new file mode 100644 index 0000000..da3baa6 --- /dev/null +++ b/test_alignment_0_8_b.py @@ -0,0 +1,330 @@ +#! 
/usr/env/bin/ Python3 +from alignmentrs_imports import * +#---------------------------------------------------- +class TestAlignment: + + # basic test for expected outputs + def setup(self): + # initiates alignment object for tests + self.aln_file = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') + + def teardown(self): + pass +#---------------------------------------------------- + def test_nrows(self): + """checks if aln.obj.nrows output matches expected rows + of alignment""" + nrows = self.aln_file.nrows + expected_nrows = 4 + + assert isinstance(nrows,int) + assert nrows == expected_nrows +#---------------------------------------------------- + def test_nsamples(self): + """checks if aln.obj.nsamples output matches + number of samples being tested""" + + nsamples = self.aln_file.nsamples + expected_nsamples = 3 + + assert isinstance(nsamples,int) + assert nsamples == expected_nsamples +#---------------------------------------------------- + def test_nmarkers(self): + """checks if aln.obj.nmarkers matches + expected number of markers in the sample""" + + nmarkers = self.aln_file.nmarkers + expected_nmarkers = 1 + + assert isinstance(nmarkers, int) + assert nmarkers == expected_nmarkers +#---------------------------------------------------- + def test_nsites(self): + """checks if aln.obj.nsites output matches expected number + of sites in alignment(i.e sequence length) file""" + + nsites = self.aln_file.nsites + expected_nsites = 26 + + assert isinstance(nsites, int) + assert nsites == expected_nsites +#---------------------------------------------------- + def test_sample_ids(self): + """checks if all aln.obj.sample_ids match output + ids in alignment file""" + + sample_ids = self.aln_file.sample_ids + expected_sample_ids = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] + + assert isinstance(sample_ids,list) + assert sample_ids == expected_sample_ids +#---------------------------------------------------- + def test_sample_descriptions(self): + 
"""checks if aln.obj.sample_descriptions output matches sample + descriptions in alignment file""" + + sample_descriptions = self.aln_file.sample_descriptions + expected_descriptions = ['|10 sp|', '|47 sp|', '|15 sp|'] + + assert isinstance(sample_descriptions,list) + assert sample_descriptions == expected_descriptions +#---------------------------------------------------- + def test_sample_sequences(self): + """checks if aln.obj.sample_sequences output match sequences + in alignment file""" + + sample_sequences = self.aln_file.sample_sequences + expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', + 'ATGAAGAGCAAGGTGGACCCCCCCCC', + 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] + + assert isinstance(sample_sequences,list) + assert sample_sequences == expected_sample_sequences +#---------------------------------------------------- + def test_marker_ids(self): + """checks if aln.obj.marker_ids matches output marker ids in + alignment file""" + + marker_ids = self.aln_file.marker_ids + expected_marker_ids = ['marker_0'] + + assert isinstance(marker_ids, list) + assert marker_ids == expected_marker_ids +#---------------------------------------------------- + def test_marker_descriptions(self): + """checks if aln.obj.marker_descriptions output + matches descriptions in alignment file""" + + marker_descriptions = self.aln_file.marker_descriptions + expected_marker_descriptions = ['|91 sp|'] + + assert isinstance(marker_descriptions,list) + assert marker_descriptions == expected_marker_descriptions +#---------------------------------------------------- + def test_marker_sequences(self): + """checks if align.obj.marker_sequences output + matches marker sequences alignment file""" + + marker_sequences = self.aln_file.marker_sequences + expected_marker_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + + assert isinstance(marker_sequences,list) + assert marker_sequences == expected_marker_sequences +#---------------------------------------------------- + # class methods + + # Does not work 
properly + + #def test_subset(cls): + # """Returns a subset of the alignment by samples, markers and sites.""" + # sample_ids = [1,2,3] + # marker_ids = ['marker_0'] + # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') + + # subset = (aln_obj,sample_ids, marker_ids) + # test_subset = +#---------------------------------------------------- + def test_get_samples(self): + """tests aln.object.get_samples returns expected + sequences sample of an alignment file + tests: + valid input + invalid sample id + invalid types""" + # valid input + get_sample_str = self.aln_file.get_samples('Dmel_528_2597') + get_sample_index = self.aln_file.get_samples(0) + expected_sites = 26 + expected_samples = 1 + expected_markers = 0 + expected_sequence = ['ATGAAGAGCAAGGTGGGGGGGGGGGG'] + test_sample_list = [get_sample_str,get_sample_index] + + for test in test_sample_list: + assert isinstance(test, object) + assert test.nsites == expected_sites + assert test.nsamples == expected_samples + assert test.nmarkers == expected_markers + assert test.sample_sequences == expected_sequence + + # invalid sample_id + try: + invalid_sample_name_str = self.aln_file.get_samples('Dmel_528_259700') + invalid_sample_name_lst = self.aln_file.get_samples(['Dmel_528_259700']) + invalid_sample_id_int = self.aln_file.get_samples(-1) + invalid_sample_id_lst = self.aln_file.get_samples([-1]) + + except: + assert ValueError + + # invalid type + test_invalid_types = [{'Dmel_528_2597':0 },('Dmel_528_2597')] + try: + + for invalid_input in test_invalid_types: + invalid_id = self.aln_file.get_samples(invalid_input) + except: + assert ValueError + + try: + test_invalid_list_items = [[],[{'Dmel_528_2597':0 }]] + + for invalid_input in test_invalid_list_items: + invalid_id = self.aln_file.get_samples(invalid_input) + except: + assert ValueError +#---------------------------------------------------- + def test_get_markers(self): + """tests if aln.object.get_markers returns expected + marker 
sequences of an alignment file + tests: + valid input + invalid sample id + invalid types""" + + # VI + get_markers_str = self.aln_file.get_markers('marker_0') + get_markers_int = self.aln_file.get_markers(0) + get_markers_list_str = self.aln_file.get_markers(['marker_0']) + get_markers_list_int = self.aln_file.get_markers([0]) + expected_marker_sequence = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + tests = [get_markers_str, get_markers_int, get_markers_list_str, get_markers_list_int] + for test in tests: + assert isinstance(test,object) + assert test.sequences == ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + assert test.nsites == 26 + #assert test.nsamples == 1 # attribute error + + # IVI + try: + inv_markers_str = self.aln_file.get_markers('marker_01') + inv_markers_int = self.aln_file.get_markers(1) + inv_markers_list_str = self.aln_file.get_markers(['marker_01']) + inv_markers_list_int = self.aln_file.get_markers([1]) + tests = [inv_markers_str, inv_markers_int, inv_markers_list_str, inv_markers_list_int] + + except ValueError: + pass + + # IVT + try: + test_invalid_types = [{'marker_0':0 },('marker_0')] + except ValueError: + pass + +#---------------------------------------------------- + #def test_get_sites(self): # row error + # """Returns a new alignment containing only the sites specified + # #by the given list of column numbers.""" +#---------------------------------------------------- + # Setter/Replacer + def test_replace_samples(self): # + """tests if aln.object.replace_samples replaces the sequence + of one or more sample in the aln.object""" + + new_sample = 'AT' * 13 + prev_sample_sequence = self.aln_file.sample_sequences[0] + self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) + curr_sequence = self.aln_file.sample_sequences[0] + + assert not prev_sample_sequence == curr_sequence + assert curr_sequence == new_sample +#---------------------------------------------------- + def test_insert_samples_from_lists(self): + """tests if 
aln.object.insert_samples_from_lists adds one or + more sequences in the aln.object""" + + new_sample_id = 'Dsim99201' + new_sample_desc = '|CH2912|' + new_sample_sequence = 'G' * 26 + self.aln_file.insert_samples_from_lists(1, [new_sample_id], + [new_sample_desc], + [new_sample_sequence]) + + assert self.aln_file.sample_ids[1] == new_sample_id + assert self.aln_file.sample_descriptions[1] == new_sample_desc + # error here, returns does not insert expected sequence value + #assert self.aln_file.sample_sequences[1] == new_sample_sequence +#---------------------------------------------------- + def test_append_sample_from_lists(self): + """tests if append_sample_from_lists adds one or + more sequences in the last index of aln.object""" + + new_sample_id = 'Dere_lastind' + new_sample_desc = '|last_ind|' + new_sample_sequence = 'G' * 26 + self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) + assert self.aln_file.sample_sequences[-1] == new_sample_sequence + assert self.aln_file.sample_ids[-1] == new_sample_id + assert self.aln_file.sample_descriptions[-1] == new_sample_desc +#---------------------------------------------------- + def test_remove_samples(self): + """tests if aln.obj.remove_samples removes all sample + information of one or more indices from the alignment object""" + + index_to_remove = 1 + sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] + self.aln_file.remove_samples(index_to_remove) + assert sequence_to_remove != self.aln_file.sample_sequences[1] +#---------------------------------------------------- + def test_retain_samples(self): + """tests if aln.obj.retain_samples removes all sample + information apart from specified indices in + alignment object""" + + self.aln_file.retain_samples([1]) + assert self.aln_file.nsamples == 1 + assert len(self.aln_file.sample_ids) == 1 + assert len(self.aln_file.sample_descriptions) == 1 + assert len(self.aln_file.sample_sequences) == 1 + assert 
self.aln_file.nmarkers == 1 + assert len(self.aln_file.marker_ids) == 1 + assert len(self.aln_file.marker_descriptions) == 1 + assert len(self.aln_file.marker_sequences) == 1 +#---------------------------------------------------- + def test_remove_sites(self): + """tests if aln.obj.remove_sites removes all one or more + sequences from the alignment sequences""" + + self.aln_file.remove_sites([2]) + assert self.aln_file.nsites == (25) +#---------------------------------------------------- + def test_retain_sites(self): + """tests if aln.obj.retain_sites all sequences + apart from specified sequences in alignment sequences""" + self.aln_file.retain_sites([0,1,2]) + assert self.aln_file.nsites == 3 + #TODO- should assert to that the positions are not ATG once + # get samples sequences is fixes +#---------------------------------------------------- + def test_from_fasta(cls): + """Create an Alignment object from a FASTA-formatted file.""" + aln_obj = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') + assert aln_obj.nsites == 26 + assert aln_obj.nsamples == 3 + assert aln_obj.nmarkers == 1 +#---------------------------------------------------- + # Format converters + # tested, remove hashtag when done + #def test_to_fasta(self): + """Saves the alignment as a FASTA-formatted text file.""" + #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file + #TODO- check if len(currentdir) increases by one, + #check if test_aln_file in dir + #use from_fasta to create new alingment object + + # How does this work? + + # Block-related methods + + #def test_set_blocklists(self, ref_seq, description_encoder=None): +# """Creates new block information for the sequences given a reference. 
""" +#---------------------------------------------------- + # def test_parse_description_as_blocks(self, description_decoder=None): +# """Parses sample description into block data.""" +#---------------------------------------------------- + # def test_write_blocks_to_description(self, description_encoder): +# """Writes each sample's block data as a string, replacing its + # description.""" +#---------------------------------------------------- \ No newline at end of file diff --git a/test_alignment_b.txt b/test_alignment_b.txt new file mode 100644 index 0000000..4811f60 --- /dev/null +++ b/test_alignment_b.txt @@ -0,0 +1,8 @@ +>marker_0 |91 sp| +CCCCCCCCCCCCCCCCCCCCCCCCCC +>Dmel_528_2597 |10 sp| +ATGAAGAGCAAGGTGGGGGGGGGGGG +>Dmel_RG2 |47 sp| +ATGAAGAGCAAGGTGGACCCCCCCCC +>Dmel_RG4N |15 sp| +ATGAAGAGCAAGGTGGAAAAAAAAAA \ No newline at end of file From 9a57de9139fd1bc7e8fa62471bba3d39a1cbc519 Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Tue, 12 Feb 2019 03:40:39 +0900 Subject: [PATCH 03/12] tests - alignmntrs 0.8 includes tests for classes .py incomplete - so will be updated frequently. --- alignmentrs/aln/test_alignment_0_8_b.py | 330 ++++++++++++++++++++++++ alignmentrs/aln/test_alignment_b.txt | 8 + 2 files changed, 338 insertions(+) create mode 100644 alignmentrs/aln/test_alignment_0_8_b.py create mode 100644 alignmentrs/aln/test_alignment_b.txt diff --git a/alignmentrs/aln/test_alignment_0_8_b.py b/alignmentrs/aln/test_alignment_0_8_b.py new file mode 100644 index 0000000..da3baa6 --- /dev/null +++ b/alignmentrs/aln/test_alignment_0_8_b.py @@ -0,0 +1,330 @@ +#! 
/usr/env/bin/ Python3 +from alignmentrs_imports import * +#---------------------------------------------------- +class TestAlignment: + + # basic test for expected outputs + def setup(self): + # initiates alignment object for tests + self.aln_file = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') + + def teardown(self): + pass +#---------------------------------------------------- + def test_nrows(self): + """checks if aln.obj.nrows output matches expected rows + of alignment""" + nrows = self.aln_file.nrows + expected_nrows = 4 + + assert isinstance(nrows,int) + assert nrows == expected_nrows +#---------------------------------------------------- + def test_nsamples(self): + """checks if aln.obj.nsamples output matches + number of samples being tested""" + + nsamples = self.aln_file.nsamples + expected_nsamples = 3 + + assert isinstance(nsamples,int) + assert nsamples == expected_nsamples +#---------------------------------------------------- + def test_nmarkers(self): + """checks if aln.obj.nmarkers matches + expected number of markers in the sample""" + + nmarkers = self.aln_file.nmarkers + expected_nmarkers = 1 + + assert isinstance(nmarkers, int) + assert nmarkers == expected_nmarkers +#---------------------------------------------------- + def test_nsites(self): + """checks if aln.obj.nsites output matches expected number + of sites in alignment(i.e sequence length) file""" + + nsites = self.aln_file.nsites + expected_nsites = 26 + + assert isinstance(nsites, int) + assert nsites == expected_nsites +#---------------------------------------------------- + def test_sample_ids(self): + """checks if all aln.obj.sample_ids match output + ids in alignment file""" + + sample_ids = self.aln_file.sample_ids + expected_sample_ids = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] + + assert isinstance(sample_ids,list) + assert sample_ids == expected_sample_ids +#---------------------------------------------------- + def test_sample_descriptions(self): + 
"""checks if aln.obj.sample_descriptions output matches sample + descriptions in alignment file""" + + sample_descriptions = self.aln_file.sample_descriptions + expected_descriptions = ['|10 sp|', '|47 sp|', '|15 sp|'] + + assert isinstance(sample_descriptions,list) + assert sample_descriptions == expected_descriptions +#---------------------------------------------------- + def test_sample_sequences(self): + """checks if aln.obj.sample_sequences output match sequences + in alignment file""" + + sample_sequences = self.aln_file.sample_sequences + expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', + 'ATGAAGAGCAAGGTGGACCCCCCCCC', + 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] + + assert isinstance(sample_sequences,list) + assert sample_sequences == expected_sample_sequences +#---------------------------------------------------- + def test_marker_ids(self): + """checks if aln.obj.marker_ids matches output marker ids in + alignment file""" + + marker_ids = self.aln_file.marker_ids + expected_marker_ids = ['marker_0'] + + assert isinstance(marker_ids, list) + assert marker_ids == expected_marker_ids +#---------------------------------------------------- + def test_marker_descriptions(self): + """checks if aln.obj.marker_descriptions output + matches descriptions in alignment file""" + + marker_descriptions = self.aln_file.marker_descriptions + expected_marker_descriptions = ['|91 sp|'] + + assert isinstance(marker_descriptions,list) + assert marker_descriptions == expected_marker_descriptions +#---------------------------------------------------- + def test_marker_sequences(self): + """checks if align.obj.marker_sequences output + matches marker sequences alignment file""" + + marker_sequences = self.aln_file.marker_sequences + expected_marker_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + + assert isinstance(marker_sequences,list) + assert marker_sequences == expected_marker_sequences +#---------------------------------------------------- + # class methods + + # Does not work 
properly + + #def test_subset(cls): + # """Returns a subset of the alignment by samples, markers and sites.""" + # sample_ids = [1,2,3] + # marker_ids = ['marker_0'] + # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') + + # subset = (aln_obj,sample_ids, marker_ids) + # test_subset = +#---------------------------------------------------- + def test_get_samples(self): + """tests aln.object.get_samples returns expected + sequences sample of an alignment file + tests: + valid input + invalid sample id + invalid types""" + # valid input + get_sample_str = self.aln_file.get_samples('Dmel_528_2597') + get_sample_index = self.aln_file.get_samples(0) + expected_sites = 26 + expected_samples = 1 + expected_markers = 0 + expected_sequence = ['ATGAAGAGCAAGGTGGGGGGGGGGGG'] + test_sample_list = [get_sample_str,get_sample_index] + + for test in test_sample_list: + assert isinstance(test, object) + assert test.nsites == expected_sites + assert test.nsamples == expected_samples + assert test.nmarkers == expected_markers + assert test.sample_sequences == expected_sequence + + # invalid sample_id + try: + invalid_sample_name_str = self.aln_file.get_samples('Dmel_528_259700') + invalid_sample_name_lst = self.aln_file.get_samples(['Dmel_528_259700']) + invalid_sample_id_int = self.aln_file.get_samples(-1) + invalid_sample_id_lst = self.aln_file.get_samples([-1]) + + except: + assert ValueError + + # invalid type + test_invalid_types = [{'Dmel_528_2597':0 },('Dmel_528_2597')] + try: + + for invalid_input in test_invalid_types: + invalid_id = self.aln_file.get_samples(invalid_input) + except: + assert ValueError + + try: + test_invalid_list_items = [[],[{'Dmel_528_2597':0 }]] + + for invalid_input in test_invalid_list_items: + invalid_id = self.aln_file.get_samples(invalid_input) + except: + assert ValueError +#---------------------------------------------------- + def test_get_markers(self): + """tests if aln.object.get_markers returns expected + marker 
sequences of an alignment file + tests: + valid input + invalid sample id + invalid types""" + + # VI + get_markers_str = self.aln_file.get_markers('marker_0') + get_markers_int = self.aln_file.get_markers(0) + get_markers_list_str = self.aln_file.get_markers(['marker_0']) + get_markers_list_int = self.aln_file.get_markers([0]) + expected_marker_sequence = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + tests = [get_markers_str, get_markers_int, get_markers_list_str, get_markers_list_int] + for test in tests: + assert isinstance(test,object) + assert test.sequences == ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + assert test.nsites == 26 + #assert test.nsamples == 1 # attribute error + + # IVI + try: + inv_markers_str = self.aln_file.get_markers('marker_01') + inv_markers_int = self.aln_file.get_markers(1) + inv_markers_list_str = self.aln_file.get_markers(['marker_01']) + inv_markers_list_int = self.aln_file.get_markers([1]) + tests = [inv_markers_str, inv_markers_int, inv_markers_list_str, inv_markers_list_int] + + except ValueError: + pass + + # IVT + try: + test_invalid_types = [{'marker_0':0 },('marker_0')] + except ValueError: + pass + +#---------------------------------------------------- + #def test_get_sites(self): # row error + # """Returns a new alignment containing only the sites specified + # #by the given list of column numbers.""" +#---------------------------------------------------- + # Setter/Replacer + def test_replace_samples(self): # + """tests if aln.object.replace_samples replaces the sequence + of one or more sample in the aln.object""" + + new_sample = 'AT' * 13 + prev_sample_sequence = self.aln_file.sample_sequences[0] + self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) + curr_sequence = self.aln_file.sample_sequences[0] + + assert not prev_sample_sequence == curr_sequence + assert curr_sequence == new_sample +#---------------------------------------------------- + def test_insert_samples_from_lists(self): + """tests if 
aln.object.insert_samples_from_lists adds one or + more sequences in the aln.object""" + + new_sample_id = 'Dsim99201' + new_sample_desc = '|CH2912|' + new_sample_sequence = 'G' * 26 + self.aln_file.insert_samples_from_lists(1, [new_sample_id], + [new_sample_desc], + [new_sample_sequence]) + + assert self.aln_file.sample_ids[1] == new_sample_id + assert self.aln_file.sample_descriptions[1] == new_sample_desc + # error here, returns does not insert expected sequence value + #assert self.aln_file.sample_sequences[1] == new_sample_sequence +#---------------------------------------------------- + def test_append_sample_from_lists(self): + """tests if append_sample_from_lists adds one or + more sequences in the last index of aln.object""" + + new_sample_id = 'Dere_lastind' + new_sample_desc = '|last_ind|' + new_sample_sequence = 'G' * 26 + self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) + assert self.aln_file.sample_sequences[-1] == new_sample_sequence + assert self.aln_file.sample_ids[-1] == new_sample_id + assert self.aln_file.sample_descriptions[-1] == new_sample_desc +#---------------------------------------------------- + def test_remove_samples(self): + """tests if aln.obj.remove_samples removes all sample + information of one or more indices from the alignment object""" + + index_to_remove = 1 + sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] + self.aln_file.remove_samples(index_to_remove) + assert sequence_to_remove != self.aln_file.sample_sequences[1] +#---------------------------------------------------- + def test_retain_samples(self): + """tests if aln.obj.retain_samples removes all sample + information apart from specified indices in + alignment object""" + + self.aln_file.retain_samples([1]) + assert self.aln_file.nsamples == 1 + assert len(self.aln_file.sample_ids) == 1 + assert len(self.aln_file.sample_descriptions) == 1 + assert len(self.aln_file.sample_sequences) == 1 + assert 
self.aln_file.nmarkers == 1 + assert len(self.aln_file.marker_ids) == 1 + assert len(self.aln_file.marker_descriptions) == 1 + assert len(self.aln_file.marker_sequences) == 1 +#---------------------------------------------------- + def test_remove_sites(self): + """tests if aln.obj.remove_sites removes all one or more + sequences from the alignment sequences""" + + self.aln_file.remove_sites([2]) + assert self.aln_file.nsites == (25) +#---------------------------------------------------- + def test_retain_sites(self): + """tests if aln.obj.retain_sites all sequences + apart from specified sequences in alignment sequences""" + self.aln_file.retain_sites([0,1,2]) + assert self.aln_file.nsites == 3 + #TODO- should assert to that the positions are not ATG once + # get samples sequences is fixes +#---------------------------------------------------- + def test_from_fasta(cls): + """Create an Alignment object from a FASTA-formatted file.""" + aln_obj = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') + assert aln_obj.nsites == 26 + assert aln_obj.nsamples == 3 + assert aln_obj.nmarkers == 1 +#---------------------------------------------------- + # Format converters + # tested, remove hashtag when done + #def test_to_fasta(self): + """Saves the alignment as a FASTA-formatted text file.""" + #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file + #TODO- check if len(currentdir) increases by one, + #check if test_aln_file in dir + #use from_fasta to create new alingment object + + # How does this work? + + # Block-related methods + + #def test_set_blocklists(self, ref_seq, description_encoder=None): +# """Creates new block information for the sequences given a reference. 
""" +#---------------------------------------------------- + # def test_parse_description_as_blocks(self, description_decoder=None): +# """Parses sample description into block data.""" +#---------------------------------------------------- + # def test_write_blocks_to_description(self, description_encoder): +# """Writes each sample's block data as a string, replacing its + # description.""" +#---------------------------------------------------- \ No newline at end of file diff --git a/alignmentrs/aln/test_alignment_b.txt b/alignmentrs/aln/test_alignment_b.txt new file mode 100644 index 0000000..4811f60 --- /dev/null +++ b/alignmentrs/aln/test_alignment_b.txt @@ -0,0 +1,8 @@ +>marker_0 |91 sp| +CCCCCCCCCCCCCCCCCCCCCCCCCC +>Dmel_528_2597 |10 sp| +ATGAAGAGCAAGGTGGGGGGGGGGGG +>Dmel_RG2 |47 sp| +ATGAAGAGCAAGGTGGACCCCCCCCC +>Dmel_RG4N |15 sp| +ATGAAGAGCAAGGTGGAAAAAAAAAA \ No newline at end of file From 32d72e1566316710d14b53c753158994c8131368 Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Tue, 12 Feb 2019 03:44:24 +0900 Subject: [PATCH 04/12] changed name adjusted name to match version 0.8.2 --- test_alignment_0_8_b.py => test_alignment_0_8_2_b.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) rename test_alignment_0_8_b.py => test_alignment_0_8_2_b.py (99%) diff --git a/test_alignment_0_8_b.py b/test_alignment_0_8_2_b.py similarity index 99% rename from test_alignment_0_8_b.py rename to test_alignment_0_8_2_b.py index da3baa6..09323f5 100644 --- a/test_alignment_0_8_b.py +++ b/test_alignment_0_8_2_b.py @@ -327,4 +327,4 @@ def test_from_fasta(cls): # def test_write_blocks_to_description(self, description_encoder): # """Writes each sample's block data as a string, replacing its # description.""" -#---------------------------------------------------- \ No newline at end of file +#---------------------------------------------------- From d2839e12d152a71e729e7fb5d4d81b8136bef3c6 Mon Sep 17 00:00:00 2001 From: Hassan 
Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Tue, 12 Feb 2019 03:44:51 +0900 Subject: [PATCH 05/12] Rename test_alignment_0_8_2_b.py to test_alignment_0_8_2.py --- test_alignment_0_8_2_b.py => test_alignment_0_8_2.py | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename test_alignment_0_8_2_b.py => test_alignment_0_8_2.py (100%) diff --git a/test_alignment_0_8_2_b.py b/test_alignment_0_8_2.py similarity index 100% rename from test_alignment_0_8_2_b.py rename to test_alignment_0_8_2.py From 3582ba88724688c2116fe274239d1a63ca43ae59 Mon Sep 17 00:00:00 2001 From: kent Date: Tue, 12 Feb 2019 15:22:05 +0900 Subject: [PATCH 06/12] Moves test to tests folder --- .../test_alignment.py} | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) rename alignmentrs/{aln/test_alignment_0_8_b.py => tests/test_alignment.py} (94%) diff --git a/alignmentrs/aln/test_alignment_0_8_b.py b/alignmentrs/tests/test_alignment.py similarity index 94% rename from alignmentrs/aln/test_alignment_0_8_b.py rename to alignmentrs/tests/test_alignment.py index da3baa6..1069bda 100644 --- a/alignmentrs/aln/test_alignment_0_8_b.py +++ b/alignmentrs/tests/test_alignment.py @@ -5,6 +5,24 @@ class TestAlignment: # basic test for expected outputs def setup(self): + # Create an alignment for testing + self.temp_filename = 'temp.aln' + with open(self.temp_filename, 'w') as fp: + print('>marker_0 |91 sp|\n', file=fp) + print('CCCCCCCCCCCCCCCCCCCCCCCCCC\n', file=fp) + print('>Dmel_528_2597 |10 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGGGGGGGGGGG\n', file=fp) + print('>Dmel_RG2 |47 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGACCCCCCCCC\n', file=fp) + print('>Dmel_RG4N |15 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGAAAAAAAAAA\n', file=fp) + # initiates alignment object for tests + self.aln_file = Alignment.from_fasta(self.temp_file.name, 'test_align', marker_kw='marker') + + def teardown(self): + if os.path.exists(self.temp_filename): + os.remove(self.temp_filename) + # initiates alignment object 
for tests self.aln_file = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') From ab0429313cf14977e0073ea48ff9b17d2986e4ca Mon Sep 17 00:00:00 2001 From: kent Date: Tue, 12 Feb 2019 15:43:49 +0900 Subject: [PATCH 07/12] Adds .noseids to files to ignore --- .gitignore | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index a5dc885..8e757ec 100644 --- a/.gitignore +++ b/.gitignore @@ -175,4 +175,7 @@ Cargo.lock # End of https://www.gitignore.io/api/rust,macos,python,visualstudiocode # Ignores .cargo/config which is specific to MacOS -/.cargo/config \ No newline at end of file +/.cargo/config + +# Ignores noseids +.noseids \ No newline at end of file From e90456ab76be973eb68062c9537ee94f91a103a4 Mon Sep 17 00:00:00 2001 From: kent Date: Tue, 12 Feb 2019 15:54:23 +0900 Subject: [PATCH 08/12] Refactors test_nrows and test_nsamples and adds comments --- alignmentrs/tests/test_alignment.py | 331 +++++++++++++++------------- 1 file changed, 174 insertions(+), 157 deletions(-) diff --git a/alignmentrs/tests/test_alignment.py b/alignmentrs/tests/test_alignment.py index 1069bda..984de60 100644 --- a/alignmentrs/tests/test_alignment.py +++ b/alignmentrs/tests/test_alignment.py @@ -1,8 +1,14 @@ -#! 
/usr/env/bin/ Python3 -from alignmentrs_imports import * -#---------------------------------------------------- -class TestAlignment: - +import os +from alignmentrs.aln import Alignment + +def type_error(expected, actual): + return 'Expected type {}, instead got {}'.format(expected, actual) + +def value_error(expected, actual): + return 'Expected value {}, instead got {}'.format(expected, actual) + +class TestAlignmentGetters: + # basic test for expected outputs def setup(self): # Create an alignment for testing @@ -17,118 +23,121 @@ def setup(self): print('>Dmel_RG4N |15 sp|\n', file=fp) print('ATGAAGAGCAAGGTGGAAAAAAAAAA\n', file=fp) # initiates alignment object for tests - self.aln_file = Alignment.from_fasta(self.temp_file.name, 'test_align', marker_kw='marker') + self.aln_file = Alignment.from_fasta(self.temp_filename, 'test_align', marker_kw='marker') def teardown(self): if os.path.exists(self.temp_filename): os.remove(self.temp_filename) - - # initiates alignment object for tests - self.aln_file = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') - - def teardown(self): - pass -#---------------------------------------------------- - def test_nrows(self): - """checks if aln.obj.nrows output matches expected rows - of alignment""" - nrows = self.aln_file.nrows - expected_nrows = 4 - - assert isinstance(nrows,int) - assert nrows == expected_nrows -#---------------------------------------------------- - def test_nsamples(self): - """checks if aln.obj.nsamples output matches - number of samples being tested""" - - nsamples = self.aln_file.nsamples - expected_nsamples = 3 - - assert isinstance(nsamples,int) - assert nsamples == expected_nsamples -#---------------------------------------------------- - def test_nmarkers(self): - """checks if aln.obj.nmarkers matches - expected number of markers in the sample""" - + + def test_nrows_type(self): + """Checks if aln.obj.nrows output matches expected rows + of alignment + """ + expected = int + result 
= type(self.aln_file.nrows) + assert expected == result, type_error(expected, result) + + def test_nrows_value(self): + """Checks if aln.obj.nrows output matches expected rows + of alignment + """ + expected = 4 + result = self.aln_file.nrows + assert expected == result, value_error(expected, result) + + def test_nsamples_type(self): + """Checks if aln.obj.nrows output matches expected rows + of alignment + """ + expected = int + result = type(self.aln_file.nsamples) + assert expected == result, type_error(expected, result) + + def test_nsamples_value(self): + """Checks if aln.obj.nrows output matches expected rows + of alignment + """ + expected = 3 + result = self.aln_file.nsamples + assert expected == result, value_error(expected, result) + + # TODO: Refactor tests so that each test is very simple and + # multiple assertions are minimized, see test_nrows* and test_nsamples* + # TODO: Make "printer" functions like type_error and value_error + # above to standardize errors when the assertion + + def test_nmarkers(self): + """Checks if aln.obj.nmarkers matches + expected number of markers in the sample + """ nmarkers = self.aln_file.nmarkers expected_nmarkers = 1 - - assert isinstance(nmarkers, int) - assert nmarkers == expected_nmarkers -#---------------------------------------------------- + assert isinstance(nmarkers, int) # TODO: Text shown when assertion fails + assert nmarkers == expected_nmarkers # TODO: Text shown when assertion fails + def test_nsites(self): """checks if aln.obj.nsites output matches expected number - of sites in alignment(i.e sequence length) file""" - + of sites in alignment(i.e sequence length) file + """ nsites = self.aln_file.nsites expected_nsites = 26 - - assert isinstance(nsites, int) - assert nsites == expected_nsites -#---------------------------------------------------- + assert isinstance(nsites, int) # TODO: Text shown when assertion fails + assert nsites == expected_nsites # TODO: Text shown when assertion fails + def 
test_sample_ids(self): - """checks if all aln.obj.sample_ids match output - ids in alignment file""" - + """Checks if all aln.obj.sample_ids match output + ids in alignment file + """ sample_ids = self.aln_file.sample_ids expected_sample_ids = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] - - assert isinstance(sample_ids,list) - assert sample_ids == expected_sample_ids -#---------------------------------------------------- - def test_sample_descriptions(self): - """checks if aln.obj.sample_descriptions output matches sample - descriptions in alignment file""" - - sample_descriptions = self.aln_file.sample_descriptions + assert isinstance(sample_ids, list) # TODO: Text shown when assertion fails + assert sample_ids == expected_sample_ids # TODO: Text shown when assertion fails + + def test_sample_descriptions(self): + """Checks if aln.obj.sample_descriptions output matches sample + descriptions in alignment file + """ + sample_descriptions = self.aln_file.sample_descriptions expected_descriptions = ['|10 sp|', '|47 sp|', '|15 sp|'] - - assert isinstance(sample_descriptions,list) - assert sample_descriptions == expected_descriptions -#---------------------------------------------------- - def test_sample_sequences(self): - """checks if aln.obj.sample_sequences output match sequences - in alignment file""" - - sample_sequences = self.aln_file.sample_sequences - expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', - 'ATGAAGAGCAAGGTGGACCCCCCCCC', - 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] - - assert isinstance(sample_sequences,list) - assert sample_sequences == expected_sample_sequences -#---------------------------------------------------- + assert isinstance(sample_descriptions, list) # TODO: Text shown when assertion fails + assert sample_descriptions == expected_descriptions # TODO: Text shown when assertion fails + + def test_sample_sequences(self): + """Checks if aln.obj.sample_sequences output match sequences + in alignment file + """ + sample_sequences = 
self.aln_file.sample_sequences + expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', + 'ATGAAGAGCAAGGTGGACCCCCCCCC', + 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] + assert isinstance(sample_sequences, list) # TODO: Text shown when assertion fails + assert sample_sequences == expected_sample_sequences # TODO: Text shown when assertion fails + def test_marker_ids(self): - """checks if aln.obj.marker_ids matches output marker ids in - alignment file""" - - marker_ids = self.aln_file.marker_ids + """Checks if aln.obj.marker_ids matches output marker ids in + alignment file + """ + marker_ids = self.aln_file.marker_ids expected_marker_ids = ['marker_0'] - - assert isinstance(marker_ids, list) - assert marker_ids == expected_marker_ids -#---------------------------------------------------- + assert isinstance(marker_ids, list) # TODO: Text shown when assertion fails + assert marker_ids == expected_marker_ids # TODO: Text shown when assertion fails + def test_marker_descriptions(self): - """checks if aln.obj.marker_descriptions output + """checks if aln.obj.marker_descriptions output matches descriptions in alignment file""" - - marker_descriptions = self.aln_file.marker_descriptions + marker_descriptions = self.aln_file.marker_descriptions expected_marker_descriptions = ['|91 sp|'] - - assert isinstance(marker_descriptions,list) - assert marker_descriptions == expected_marker_descriptions -#---------------------------------------------------- + assert isinstance(marker_descriptions, list) # TODO: Text shown when assertion fails + assert marker_descriptions == expected_marker_descriptions # TODO: Text shown when assertion fails + def test_marker_sequences(self): - """checks if align.obj.marker_sequences output - matches marker sequences alignment file""" - - marker_sequences = self.aln_file.marker_sequences + """Checks if align.obj.marker_sequences output + matches marker sequences alignment file + """ + marker_sequences = self.aln_file.marker_sequences expected_marker_sequences 
= ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - - assert isinstance(marker_sequences,list) - assert marker_sequences == expected_marker_sequences + assert isinstance(marker_sequences, list) # TODO: Text shown when assertion fails + assert marker_sequences == expected_marker_sequences # TODO: Text shown when assertion fails #---------------------------------------------------- # class methods @@ -144,7 +153,7 @@ def test_marker_sequences(self): # test_subset = #---------------------------------------------------- def test_get_samples(self): - """tests aln.object.get_samples returns expected + """Tests aln.object.get_samples returns expected sequences sample of an alignment file tests: valid input @@ -158,7 +167,12 @@ def test_get_samples(self): expected_markers = 0 expected_sequence = ['ATGAAGAGCAAGGTGGGGGGGGGGGG'] test_sample_list = [get_sample_str,get_sample_index] - + + # TODO: Do not make compound tests! + # Each assertion should be a separate test so that it will fail for + # that specific test. 
+ # For example, test.nsites == expected_sites is unnecessary because it + # duplicates an existing test - test_nsites for test in test_sample_list: assert isinstance(test, object) assert test.nsites == expected_sites @@ -167,53 +181,56 @@ def test_get_samples(self): assert test.sample_sequences == expected_sequence # invalid sample_id + # TODO: This should be a separate test try: invalid_sample_name_str = self.aln_file.get_samples('Dmel_528_259700') invalid_sample_name_lst = self.aln_file.get_samples(['Dmel_528_259700']) invalid_sample_id_int = self.aln_file.get_samples(-1) invalid_sample_id_lst = self.aln_file.get_samples([-1]) - except: - assert ValueError + assert ValueError # TODO: Text shown when assertion fails # invalid type - test_invalid_types = [{'Dmel_528_2597':0 },('Dmel_528_2597')] + # TODO: This should be a separate test + test_invalid_types = [{'Dmel_528_2597': 0},('Dmel_528_2597')] try: - for invalid_input in test_invalid_types: - invalid_id = self.aln_file.get_samples(invalid_input) + invalid_id = self.aln_file.get_samples(invalid_input) except: - assert ValueError - + assert ValueError # TODO: Text shown when assertion fails + + # TODO: This should be a separate test try: test_invalid_list_items = [[],[{'Dmel_528_2597':0 }]] - for invalid_input in test_invalid_list_items: invalid_id = self.aln_file.get_samples(invalid_input) except: - assert ValueError -#---------------------------------------------------- + assert ValueError # TODO: Text shown when assertion fails + def test_get_markers(self): - """tests if aln.object.get_markers returns expected + """Tests if aln.object.get_markers returns expected marker sequences of an alignment file tests: valid input invalid sample id - invalid types""" + invalid types + """ # VI get_markers_str = self.aln_file.get_markers('marker_0') get_markers_int = self.aln_file.get_markers(0) + # TODO: testing single char and list should be different tests as they are two scenarios of calling the method 
get_markers_list_str = self.aln_file.get_markers(['marker_0']) get_markers_list_int = self.aln_file.get_markers([0]) expected_marker_sequence = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] tests = [get_markers_str, get_markers_int, get_markers_list_str, get_markers_list_int] for test in tests: - assert isinstance(test,object) + assert isinstance(test, object) assert test.sequences == ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] assert test.nsites == 26 #assert test.nsamples == 1 # attribute error + # What is VI, IVI, IVT?? # IVI try: inv_markers_str = self.aln_file.get_markers('marker_01') @@ -221,7 +238,6 @@ def test_get_markers(self): inv_markers_list_str = self.aln_file.get_markers(['marker_01']) inv_markers_list_int = self.aln_file.get_markers([1]) tests = [inv_markers_str, inv_markers_int, inv_markers_list_str, inv_markers_list_int] - except ValueError: pass @@ -237,10 +253,10 @@ def test_get_markers(self): # #by the given list of column numbers.""" #---------------------------------------------------- # Setter/Replacer - def test_replace_samples(self): # - """tests if aln.object.replace_samples replaces the sequence - of one or more sample in the aln.object""" - + def test_replace_samples(self): + """Tests if aln.object.replace_samples replaces the sequence + of one or more sample in the aln.object + """ new_sample = 'AT' * 13 prev_sample_sequence = self.aln_file.sample_sequences[0] self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) @@ -248,81 +264,82 @@ def test_replace_samples(self): # assert not prev_sample_sequence == curr_sequence assert curr_sequence == new_sample -#---------------------------------------------------- + def test_insert_samples_from_lists(self): - """tests if aln.object.insert_samples_from_lists adds one or - more sequences in the aln.object""" - + """Tests if aln.object.insert_samples_from_lists adds one or + more sequences in the aln.object + """ new_sample_id = 'Dsim99201' new_sample_desc = '|CH2912|' new_sample_sequence = 'G' * 26 
self.aln_file.insert_samples_from_lists(1, [new_sample_id], [new_sample_desc], [new_sample_sequence]) - - assert self.aln_file.sample_ids[1] == new_sample_id - assert self.aln_file.sample_descriptions[1] == new_sample_desc + assert self.aln_file.sample_ids[1] == new_sample_id # TODO: Text shown when assertion + assert self.aln_file.sample_descriptions[1] == new_sample_desc # TODO: Text shown when assertion # error here, returns does not insert expected sequence value #assert self.aln_file.sample_sequences[1] == new_sample_sequence -#---------------------------------------------------- + def test_append_sample_from_lists(self): - """tests if append_sample_from_lists adds one or - more sequences in the last index of aln.object""" - + """Tests if append_sample_from_lists adds one or + more sequences in the last index of aln.object + """ new_sample_id = 'Dere_lastind' new_sample_desc = '|last_ind|' new_sample_sequence = 'G' * 26 - self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) - assert self.aln_file.sample_sequences[-1] == new_sample_sequence - assert self.aln_file.sample_ids[-1] == new_sample_id - assert self.aln_file.sample_descriptions[-1] == new_sample_desc -#---------------------------------------------------- + self.aln_file.append_sample_from_lists([new_sample_id],[new_sample_desc], [new_sample_sequence]) + assert self.aln_file.sample_sequences[-1] == new_sample_sequence # TODO: Text shown when assertion + assert self.aln_file.sample_ids[-1] == new_sample_id # TODO: Text shown when assertion + assert self.aln_file.sample_descriptions[-1] == new_sample_desc # TODO: Text shown when assertion + def test_remove_samples(self): - """tests if aln.obj.remove_samples removes all sample - information of one or more indices from the alignment object""" - + """Tests if aln.obj.remove_samples removes all sample + information of one or more indices from the alignment object + """ index_to_remove = 1 sequence_to_remove = 
self.aln_file.sample_sequences[index_to_remove] self.aln_file.remove_samples(index_to_remove) - assert sequence_to_remove != self.aln_file.sample_sequences[1] -#---------------------------------------------------- + assert sequence_to_remove != self.aln_file.sample_sequences[1] # TODO: Text shown when assertion + def test_retain_samples(self): - """tests if aln.obj.retain_samples removes all sample + """Tests if aln.obj.retain_samples removes all sample information apart from specified indices in - alignment object""" - + alignment object + """ self.aln_file.retain_samples([1]) - assert self.aln_file.nsamples == 1 - assert len(self.aln_file.sample_ids) == 1 - assert len(self.aln_file.sample_descriptions) == 1 - assert len(self.aln_file.sample_sequences) == 1 - assert self.aln_file.nmarkers == 1 - assert len(self.aln_file.marker_ids) == 1 - assert len(self.aln_file.marker_descriptions) == 1 - assert len(self.aln_file.marker_sequences) == 1 -#---------------------------------------------------- + assert self.aln_file.nsamples == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.sample_ids) == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.sample_descriptions) == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.sample_sequences) == 1 # TODO: Text shown when assertion fails + assert self.aln_file.nmarkers == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.marker_ids) == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.marker_descriptions) == 1 # TODO: Text shown when assertion fails + assert len(self.aln_file.marker_sequences) == 1 # TODO: Text shown when assertion fails + + # TODO: Other than count, test whether the correct sample was retained + def test_remove_sites(self): """tests if aln.obj.remove_sites removes all one or more sequences from the alignment sequences""" self.aln_file.remove_sites([2]) - assert self.aln_file.nsites == (25) 
-#---------------------------------------------------- + assert self.aln_file.nsites == (25) # TODO: Text shown when assertion fails + def test_retain_sites(self): """tests if aln.obj.retain_sites all sequences apart from specified sequences in alignment sequences""" self.aln_file.retain_sites([0,1,2]) - assert self.aln_file.nsites == 3 + assert self.aln_file.nsites == 3 # TODO: Text shown when assertion fails #TODO- should assert to that the positions are not ATG once # get samples sequences is fixes -#---------------------------------------------------- + def test_from_fasta(cls): """Create an Alignment object from a FASTA-formatted file.""" aln_obj = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') - assert aln_obj.nsites == 26 - assert aln_obj.nsamples == 3 - assert aln_obj.nmarkers == 1 -#---------------------------------------------------- + assert aln_obj.nsites == 26 # TODO: Text shown when assertion fails + assert aln_obj.nsamples == 3 # TODO: Text shown when assertion fails + assert aln_obj.nmarkers == 1 # TODO: Text shown when assertion fails + # Format converters # tested, remove hashtag when done #def test_to_fasta(self): From c4a97d34da09daedf639b4778b7c3ec88773e011 Mon Sep 17 00:00:00 2001 From: kent Date: Tue, 12 Feb 2019 16:02:27 +0900 Subject: [PATCH 09/12] Removes mock aln file --- alignmentrs/aln/test_alignment_b.txt | 8 -------- 1 file changed, 8 deletions(-) delete mode 100644 alignmentrs/aln/test_alignment_b.txt diff --git a/alignmentrs/aln/test_alignment_b.txt b/alignmentrs/aln/test_alignment_b.txt deleted file mode 100644 index 4811f60..0000000 --- a/alignmentrs/aln/test_alignment_b.txt +++ /dev/null @@ -1,8 +0,0 @@ ->marker_0 |91 sp| -CCCCCCCCCCCCCCCCCCCCCCCCCC ->Dmel_528_2597 |10 sp| -ATGAAGAGCAAGGTGGGGGGGGGGGG ->Dmel_RG2 |47 sp| -ATGAAGAGCAAGGTGGACCCCCCCCC ->Dmel_RG4N |15 sp| -ATGAAGAGCAAGGTGGAAAAAAAAAA \ No newline at end of file From eb93b131ebe5eb8afae13fa2fc877e2452812640 Mon Sep 17 00:00:00 2001 From: kent Date: 
Tue, 12 Feb 2019 16:03:26 +0900 Subject: [PATCH 10/12] Removes unnecessary files --- alignmentrs_imports.py | 9 - test_alignment.txt | 132 ------------- test_alignment_0_8.py | 413 ---------------------------------------- test_alignment_0_8_2.py | 330 -------------------------------- test_alignment_b.txt | 8 - 5 files changed, 892 deletions(-) delete mode 100644 alignmentrs_imports.py delete mode 100644 test_alignment.txt delete mode 100644 test_alignment_0_8.py delete mode 100644 test_alignment_0_8_2.py delete mode 100644 test_alignment_b.txt diff --git a/alignmentrs_imports.py b/alignmentrs_imports.py deleted file mode 100644 index 1b82b75..0000000 --- a/alignmentrs_imports.py +++ /dev/null @@ -1,9 +0,0 @@ -import sys -sys.path.append('../') -from os import getcwd -from numpy import matrix, array, array_equal -import nose -import random -from classes import * -from funcs import * -from alignmentrs_test_funcs import * \ No newline at end of file diff --git a/test_alignment.txt b/test_alignment.txt deleted file mode 100644 index e26dc19..0000000 --- a/test_alignment.txt +++ /dev/null @@ -1,132 +0,0 @@ ->marker_0 |91 sp| 
-CCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
CCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCNNNNNNNNN ->Dmel_528_2597 |10 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCTAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTTACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACAAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG2 |47 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTCCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGCAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG3 |22 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG4N |15 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAACAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCNCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- ->Dmel_RG5 |45 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTNACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGACGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG7 |32 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAACAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- ->Dmel_RG9 |108 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCTGTCGGTCAATTGGTTACAGCCTTCTGCATTTTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAACCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG18N |8 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAGGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGNGTNTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGAAAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG19 |54 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG22 |6 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGANGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG24 |43 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCATCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGNNNNNNNNNNNNNNNNNNNNNNTGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGATCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG25 |71 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTAGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGAAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGACCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG28 |74 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTCCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGCAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG32N |56 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGGCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGTCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTAAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG33 |64 sp| 
-ATGAAGAGCAAGGTAGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTNAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGNCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGNGGNGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGANNNNTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTNCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTNCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAACTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGNCACCGCTTTGATTCCGCANCTTGAGCACGGTAACCTAGAACNGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTNAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAGGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTNNNNNTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCNTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG34 |58 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGNCAACCTGAAGGTGTCTCACATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGTCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAACGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCAAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGACGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_RG36 |128 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTAGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTTCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATTGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCAGA--- ->Dmel_RG38N |27 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGGAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCCAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTAGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGGCAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCGGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCATCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACGAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTCTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAGGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dmel_FBtr0070119 |30 sp| 
-ATGAAGAGCAAGGTGGATAAACCCGTAACCAATGGTGCACCAAATGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAAAAATCCGAAGCGGACTCGCAAATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGAGAAGCCGGCGGAGACCGAGGAAAAGGAAAATACCGCAAGCAACGCCAACCTGAAGGTGTCTCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGATACAAATGCTGAGCAGCGCACTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAAACGCCGTGCCCGCCATTGATGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAATTGGTTACAGCCTTCTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTGAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTTTTCGTCCGTACTGGGACGGGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTTTTCGATTTGTATTTCTCCGGTTCCACCATTCACAGCGATGGCGTATATGCCAGATTGGCTAGTTTTCTTGTTAATGGCGGAAAGGATATGCTCGCCGCCTGGCAGCAATATATCGATTCTAAGCAGCCACTCAAACTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCCACGTGCTCCTCAACTTTAAGCCAAGGGAAGAACAACTCATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGTTGCATGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTTGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCACCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATTTCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTCAGCGTCGAGAGCCTTCACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTTAGTCAGACAGCCAAATGGCGACAGAAACAGTTGAACTACTTGTTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACATTGAGTTACCTTAACAAAGAGTTGGGACAACCGGATGCGGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGAGCGGCCCAGCAAGGAATCCGATGTCGTTGGCCAATCATTCGAGGCTCTTATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCATCACCGTGTTGGAAGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGAGCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTTACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGCTCAACATGAACAAAAATCCCCTGAGCAAAAAGAGCGATGGC------GAGGAGGAGAGCGATGACGAACTCGACAAGGAAGAATCGTTGAAGGATTCAAGCGATGATTCAGAAGATGAAGATGAAGATGAAGAGGAGGAC---GAGGGCGAGGACGATGCAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCGAACGCTTGAATGCTGCTTTGGAGCGGTCTTTTCAGATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAGCACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAACCAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTACATTGCGTGTTCCAGGTGTACAGCCATTGCGCCGCAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTCGCTAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAAGAGACATCATTATTTGGCGGGACAGGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAAAAGTGCCGTCTGGCCCCTTCTAGTCGAATTCCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGCCAATGGCAGGGAGTTGCTCCGCTGGCCGTTGTCCTGGCCTCTCACTTGGACGTACAGAAAACACGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGTCGCTTTCAAGGACAACAACTCGTCTTCCAAGAAATTTGAGAAGCAGATAGCCAGATATGTAAATCAGCTAGAAACGAAGGCTAGCAGTTCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGTGGCAGAAACTGCGTGAACAAATTCAGCTCGTCGCCAAGGATCTTCAACCCAACAAGAAGGTGGCGAAGCAGAAGAAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGAAGATGAAGAGTCCACA--- ->Dsim_ref2 |106 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGATGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTATCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGGAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAATTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCCCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD03 |0 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTACCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD06 |87 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD105 |108 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGTCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTATAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD106 |118 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCGGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD146 |57 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD15 |77 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTGACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTATCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACCTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD197 |86 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD199 |87 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTATCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD201 |47 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGAGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD221 |76 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD224 |103 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCTCCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD225 |0 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGACAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD233 |45 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCGGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD235 |4 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGACCAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD238 |83 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD243 |100 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACAGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAAATGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD251 |39 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD255 |95 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAAAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD63 |81 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD72 |130 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCGGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_MD73 |112 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS05 |55 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS11 |6 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTACTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS111 |107 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS113 |129 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS116 |73 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGGCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGAGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS137 |2 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS19 |95 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS33 |50 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTATGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS37 |115 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS39 |121 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS40 |2 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCAAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS49 |45 sp| 
-ATGAAAAGCAAGGGGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS50 |95 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGTGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS63 |23 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS64 |20 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS67 |16 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS78 |93 sp| 
-ATGAAAAGCAAGGGGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS79 |52 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS89 |128 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTTAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCAAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCTATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS95 |25 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGNNNNNNNNNATGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCAAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTTAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAAGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTAGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dsim_NS96 |98 sp| 
-ATGAAAAGCAAGGTGGATAAACCCATAACCACTGGTGCACCAAGTGCAACCAAGACAAAGGCCAAGGAGGACCGCAAGCGGGCAAAAACTCAGAAATCCGACGCGGACACGCAGATACCGGCCAAGATTTTGAAGAAGTCCAAG------------AAGGTGAAGCCGGCGGAGACCGAGGAAAAGGAAAATATCGCGAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAGGCCGTTTTTGTGGTCTTCAAAAAGATGCAGGGCAGTCAACTGACCAAGAAGATGATCAATTCGCTCATAACACTGCTGCGCGATGACACAAATGCTGAGCAGCGCGCTGCGACCACCGGCTACGTGCTCAAGCGCCTGATCCGCTCCACAGGAGCAGATGACATGAAGACGGTGAGCCTGGCCGCCAGTTACATACACTGCATCCTAACCGCCGTGCCCGCCATCGACGCTTTTGAGGTTCTGGAGACTCTGAAGCGAGACCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCGGCCGTCGGTCAAGTGGTTACAGCCTTCGGCATTTTGCAGAGCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTACGGCAGTCTTCCAGATTCTGGCAGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCTCTGTGTGGTGATATCCTGGCGGTCTCCTTTAAACAGCTACCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAANAAGCCGTTGAGTGGCTTGAAAGTAAACACTTGCGATGTCTTGCTCGCCGTGCATCTGACCTATTCGTCCGTACTGGGACGAGAGAACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACTCACAGCTTTTCGATTTGTATTTCTCCGGCTCCACCATTCACAGCGATGACGTATACGCCAGATTGGCTAGTTTTCTTATGAATGGCGGAAAGGAAATGCTCGCCGCCTGGCAGCAGTATATTGATTCCAAGCAGCCACTCAAATTGAATGCAGCCAAGGCGTGTGCCATCCAAGTACTGAGCAACGTGCTCCGCAACTTTAAGCCAAGGGAAGAACAACTTATCCTGGATATCTTTACACCGACCTGTGTACAGTTCCTGCTGCAGGAATGTTCATCTGTGAAATGGGACAAAGGTGAGGGCAAGAAACCGTCGCTAAAGAAGCTGAAGGAGATTTGCTTCAAGTTCGAGGGATCCTTGGTTTCGTGTTACGAAAAGCAGTTCCAAAACGATGATAACAAACTTCAGCTGCTGCTCAAACTGCTGGAGCACACACTGCAGCTGGACTCGGTGATATCCTTGCCGCGTTTCTGCCAGAAACTGATAAATCAACTAAGCGTCGAGAGCCTTTACAAGCTGTACGACTACTACAACAACAAGCTGTACTCATTGGAGGACGAGGACAGAGTCAGCCGAGTGCATTGCCTTAACCAGATGCAATTGATACTGAACCACTCAAAGCTGAGCCAGGCAACACAATGGCGACAGAAGCAGTTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAGGAAGCCGTGTGAAGCTGCCCAAGCCAGCGCTTTTAGTCGCCAGTGCGCGGCGCGTTGTGAGGAGATATTCCTGGGCTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCACTTGCTGCAGAAGACATTGAGTTACCTTAACAAAAAGTTGGGGGAACCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCACTGCAAAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGCGGCCCAGCAAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTAATCCTGTTTGTTTCTTTGGCTTTGTGCACAAAGATTCCCCCATCCGTCACCGTGTTGGAGGATCTGATTNTCTGCCGTAAGAATGCACTGCAAAAGAGCAAGGATCAAGTTAACGAAG
AGCTCAAATGGCAGGACGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTACTGGCGGGAGTTTGTTCAACTGGTGGCCACCGCTTTGATTCCGCACCTTGAGCACGGTAACCTAGAACAGGTCCTCGAAGTGTTCAACATGAACAAAAATCCCTTGAGCAAGAAGGACGATGGC------GAGGAGGAGAGCGAAGACGAAGTCGACGAGGAAGAATCGTTGAAGGATTCGAGCGATGATTCAGACGATGAAGATGAAGATGAAGAGGAGNAC---GAAGACGAGGACGATGAAGAGTCCCATTTGGCCCAAANTCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCTGATGACGATGGCGCCAGCAGCGTGGATTGGAACGATGTGGACGAGGAGCAGGGCAAACGCTTGAATGCTGCTTTGGAGCAGTCTTTTCAAATGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCCACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTCCGCATTCGTGCCTTGGATTTGTTGGAGCTCTTCATAAACAAGAAACCAACTCAATCGGTAATCCTGGNCGTGCTGCATTGCGTCTTCCAGGTGTACCGCCATTGCGCCACAGACAGCAAACTACAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTCAAAAAGATACTTGCCAGGAATATCGAACTCGAGGAAAATCAGAGCACCGCACCCATTCTGGAAGCCATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCGCCAGCCGACAGGCCAAAGGAGACATCATTATTTGGCGGGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCAAGCCCAAGGAAAGTGCTGTCTGGCCNCTTCTAGTCGAATTTCTGGAGCTGTGGGTAGCCAAGCGACGTAGTCGCCTCTCTCTGGCCAGTTTCGAAGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCACTGGCTGTTGTCCTGGCCTCCCACTTGGACGTACAGAAAACGCGCAGTTTTCGGCGGGCACAGATACTGAAGCTGCTCAGCGAGCAAGGTCGCCGGCTCGAAGCCGCTTTCAAGGACAACTGCTCGTCTTCCAACAAATTTGAGAAGAAGATAGCCAGATACGTAAATCAGCTAGAAACGGAGACTAGTAGTCCCAAGGAACTCAATCTGCTGCTTAAGATCCTCGCCCAAGGAGGCGAGAAGCGTCAGAAACTGCGTGAACAGATTCAGCTCGTCGCCAAAAACCTTCAACCCAACAAGAAGGCGGCGAAGCAG---AAGCAGGCAGCCGCC---------AAACCTATGGTCGTGGATGATGAAGAGTCCACA--- ->Dyak_528_2597 |32 sp| 
-ATGAAGAGCAAAGTGGACAAACCCATAACCAATGGTGCACCCGCCAAGACAAAGACC------AAGGAGGAGCGCAAACGGACGAAATCCCTGAAATCCGACGCGGACACCGAGATACCGGCCAAGATTTCCAAGGTGTCCAAGACCAAGAAGGAGAAGCCGAAGCCATCGGAGGCCGAGGAAAAGGAGAACACCGCAAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAAGCCGTGTTTGTGGTTTTCAAGAAGTTGCAGGGCAGCCAGCTGACCAAGAAGATGATCAATTCCCTTATAACGCTGCTGCGCGACGACACAAATGCGGAGCAGCGCGCTGCGACCATCTGCTACGTGCTCAAACGCTTGATCCGCTCCACAGGCGCAGATGACATGAAGGCGGTGGGCCTGGCCGCCAGTTATATACACTGCATCCTAGCCGCCGTGCCCGCCATTGACGCACTTGAGGTTCTGGACACTCTAAAGCGCGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGATAACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTTCGGCGGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGCGGCGATATCCTAGCGGACTCCTTCAAACAGCTGCCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGCTGAGTGGCTTGAAAGTCAACACCTGCGATGTCTTGCTGGCCGTGCACCTGACCTATTCGTCCGTGCTGGGACGGGAGAACATTCTGGCCAGCTTGTGGCCCAAGAAACCGGTGTACACGCAGCTTTTCGATCTGTACTTCGCCGGCTCCACCATTCACAGTGATGGCGTGTACGCCAGATTGGCTATTTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGCAGCAGTACATCGCTTCCAAGCAGCCACTGAAACTAAACGCAGCCAAGGCGTGTGCGATCCAAGTGCTGAGTCACATACTCCTCAACTTTAAGCCAGCGGACGAAGAACTCATCCTGGATATTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGCTCTGCTGTAAAATGGGACAAAGCTGAGGCCAAGAAGCCGTCCCAAAAGAAGCTGAGGGAGATTTGCTTCAAGTTCGAGGCCTCCTTGGTGCTATGTTTCGAAAAGCAGTTCCAAAACGATGAAAGCAAGCTTCAGCTGCTGCTCAAACTGCTGGACCACACACTGCAGTTGGACTCGGTGATTTGCTTGCCGCGCTTCTGCCAGCAACTGATAGGTCAGTTGAGCGTCGAGAGCCTCCAGAAGCTGTACGACTTCTACAACAACAAGCTGTACTCGTTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTCAACCAGATGCAGGTTATACTGCACCACCCAACGCTCAGCCAGGCAACCAAATGGCGTCAGAAGCAGCTGAACTACTTGCTGCTCGCTGGCCTTTTCCACGTAGATGCCAGTAAGAAGCCGTGCGAGGCCTCCAAAGCCAGCGCGTTCAGTCGCCAGTGCTCGGCGCGTTGCGAGGAGATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACACTGAGTTACCTTAACAAGGAGTTGGGACAACCGGATGCAGAAAACAAGCTGCGTTCGCCGAGGGATGAGTCACTGCAGAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGAAGCCCAGCGAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTGTCGTTGGCTTTGTGCACGAAGATTCCCCTGTCCGTCACCGTGCTGGACGATCTGATTATCTGCCGCAAGAACGCACTGCAAAAGAGCAAGAAACAGGTCAACGAAG
AGCTCCAATGGCAGGATGTGCTCACGGATGCCCTGCTCCAGTTACTCCTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCATCTGGTGGCCACCGCTCTGATTCCCCACCTCGAGCATGGTAACCTCGAACAGGTCCTCGAAGTGCTCAATATGAACAGGAATCCCCTGAGCAAGAAGGACGAGGGCGAGGAGGAGGAGGAGAGCGACGAGGAAGTCGAGGGGGAAGAATCGCCGAAAGATTCGAGCGACGACTCA---GACGGCGATGAAGATGAAGACGAAGATGGAGAGGACGAGGACGATGAGGAGTCCCATTTGGCCCAGATCCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGACGATGATGGCGCCAGCAGCGTGGACTGGAACGATGTTGGCGAGGAGCAGGGTGAACGCCTGAATGCTGCTCTGGAGCGATCCTTCCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAGCGCATTGACAACACCAACCTGCTGCACTTCCGCATTCGCGCCTTGGATTTGTTGGAGCTGTTCATAAGCAAGAAACCAACTCAGTCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCACTGTAGCGGCGACAGCAAGCTGCAATCCCTGCGAGAAGCCAGCTTGAAGTTGCTTAAGAAGATACTCGCCAAGAATATTGAACTCAACGAGCAGCAGAGTAACGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCACCAACCGACAGGCCAAAGGAGACATCATTGTTTGGCGAGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAATAGCACCGTGTGGCCTCTGCTGGTCGAGTTCCTGGAGCTGTGGGTAGCCAAGCGTCGCAGTCGCCTCTCCCTGGCGAGTTTCGAAGCCCTCTTTCAGTCTGCCCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGTCCTGGCCTCCCATTTGGACGTGAAGAAAACACGCAGTTTTCGGCGAGCCCAGATATTGAAGCTTCTCAGTGAGCAGTGCCGCCGACTCGAGTCCGCTTTCAAGGACAACAGCTCGTCTGCCAAGGAGTTTGAGAAGCAGATAGCACGATATGTGAACCAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAGGCCAGAAGCGGCAGAAACTGCGCGAAAAGATCCAACTCGTCGCTAAGAACCTTCAGCCCACCAAGAAGGCGACGAAGCAGAAGGAGCAGGCAGCCGCCGAACCCACAGAACCCATGGATGTGGAAGATGAGGAGCAGGCCACA ->Dyak_FBgn0234128 |108 sp| 
-ATGAAGAGCAAAGTGGACAAACCCATAACCAATGGTGCACCCGCCAAGACAAAGACC------AAGGAGGAGCGCAAACGGACGAAATCCCTGAAATCCGACGCGGACACCGAGATACCGGCCAAGATTTCCAAGGTGTCCAAGACCAAGAAGGAGAAGCCGAAGCCATCGGAGGCCGAGGAAAAGGAGAACACCGCAAGCAACGGCAACCTGAAGGTGTCGCAGATCAACAAAGCCGTGTTTGTGGTTTTCAAGAAGTTGCAGGGCAGCCAGCTGACCAAGAAGATGATCAATTCCCTTATAACGCTGCTGCGCGACGACACAAATGCGGAGCAGCGCGCTGCGACCATCTGCTACGTGCTCAAACGCTTGATCCGCTCCACAGGCGCAGATGACATGAAGGCGGTGGGCCTGGCCGCCAGTTATATACACTGCATCCTAGCCGCCGTGCCCGCCATTGACGCACTTGAGGTTCTGGACACTCTAAAGCGCGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGATAACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCCAAGGCCGAGCCCAAGCTGGTTTCGGCGGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGCGGCGATATCCTAGCGGACTCCTTCAAACAGCTGCCCGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGCTAAACAAGCCGCTGAGTGGCTTGAAAGTCAACACCTGCGATGTCTTGCTGGCCGTGCACCTGACCTATTCGTCCGTGCTGGGACGGGAGAACATTCTGGCCAGCTTGTGGCCCAAGAAACCGGTGTACACGCAGCTTTTCGATCTGTACTTCGCCGGCTCCACCATTCACAGTGATGGCGTGTACGCCAGATTGGCTATTTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGCAGCAGTACATCGCTTCCAAGCAGCCACTGAAACTAAACGCAGCCAAGGCGTGTGCGATCCAAGTGCTGAGTCACATACTCCTCAACTTTAAGCCAGCGGACGAAGAACTCATCCTGGATATTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGCTCTGCTGTAAAATGGGACAAAGCTGAGGCCAAGAAGCCGTCCCAAAAGAAGCTGAGGGAGATTTGCTTCAAGTTCGAGGCCTCCTTGGTGCTATGTTTCGAAAAGCAGTTCCAAAACGATGAAAGCAAGCTTCAGCTGCTGCTCAAACTGCTGGACCACACACTGCAGTTGGACTCGGTGATTTGCTTGCCGCGCTTCTGCCAGCAACTGATAGGTCAGTTGAGCGTCGAGAGCCTCCAGAAGCTGTACGACTTCTACAACAACAAGCTGTACTCGTTGGAGGACGAGGACAGAGTCAGCCGAGTGCACTGCCTCAACCAGATGCAGGTTATACTGCACCACCCAACGCTCAGCCAGGCAACCAAATGGCGTCAGAAGCAGCTGAACTACTTGCTGCTCGCTGGCCTTTTCCACGTAGATGCCAGTAAGAAGCCGTGCGAGGCCTCCAAAGCCAGCGCGTTCAGTCGCCAGTGCTCGGCGCGTTGCGAGGAGATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTGCTGCAGAAGACACTGAGTTACCTTAACAAGGAGTTGGGACAACCGGATGCAGAAAACAAGCTGCGTTCGCCGAGGGATGAGTCACTGCAGAAGGCATGGAAGCAGGTCGAGAAACTGCTGGCGAAGCCCAGCGAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTGTCGTTGGCTTTGTGCACGAAGATTCCCCTGTCCGTCACCGTGCTGGACGATCTGATTATCTGCCGCAAGAACGCACTGCAAAAGAGCAAGAAACAGGTCAACGAAG
AGCTCCAATGGCAGGATGTGCTCACGGATGCCCTGCTCCAGTTACTCCTGCAAACAGGTCACTTCTGGCGGGAGTTTGTTCATCTGGTGGCCACCGCTCTGATTCCCCACCTCGAGCATGGTAACCTCGAACAGGTCCTCGAAGTGCTCAATATGAACAGGAATCCCCTGAGCAAGAAGGACGAGGGCGAGGAGGAGGAGGAGAGCGACGAGGAAGTCGAGGGGGAAGAATCGCCGAAAGATTCGAGCGACGACTCA---GACGGCGATGAAGATGAAGACGAAGATGGAGAGGACGAGGACGATGAGGAGTCCCATTTGGCCCAGATCCGAGAGAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGACGATGATGGCGCCAGCAGCGTGGACTGGAACGATGTTGGCGAGGAGCAGGGTGAACGCCTGAATGCTGCTCTGGAGCGATCCTTCCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAGCGCATTGACAACACCAACCTGCTGCACTTCCGCATTCGCGCCTTGGATTTGTTGGAGCTGTTCATAAGCAAGAAACCAACTCAGTCGGTAATCCTGGACGTGCTGCATTGCGTCTTCCAGGTGTACCGCCACTGTAGCGGCGACAGCAAGCTGCAATCCCTGCGAGAAGCCAGCTTGAAGTTGCTTAAGAAGATACTCGCCAAGAATATTGAACTCAACGAGCAGCAGAGTAACGCACCCATTCTGGAAGCAATTGAGCAGCTGATGTCGTCTGGCGAGGAGCATTCAGAAGAGGACCAAGAGAACGGCAAGCAGCCCACCAACCGACAGGCCAAAGGAGACATCATTGTTTGGCGAGACAAGTGCTTCGCCTACCTGGTCAGCCAGGCATCAGCAGATGGCGAGCCCAAGAATAGCACCGTGTGGCCTCTGCTGGTCGAGTTCCTGGAGCTGTGGGTAGCCAAGCGTCGCAGTCGCCTCTCCCTGGCGAGTTTCGAAGCCCTCTTTCAGTCTGCCCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGTCCTGGCCTCCCATTTGGACGTGAAGAAAACACGCAGTTTTCGGCGAGCCCAGATATTGAAGCTTCTCAGTGAGCAGTGCCGCCGACTCGAGTCCGCTTTCAAGGACAACAGCTCGTCTGCCAAGGAGTTTGAGAAGCAGATAGCACGATATGTGAACCAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAGGCCAGAAGCGGCAGAAACTGCGCGAAAAGATCCAACTCGTCGCTAAGAACCTTCAGCCCACCAAGAAGGCGACGAAGCAGAAGGAGCAGGCAGCCGCCGAACCCACAGAACCCATGGATGTGGAAGATGAGGAGCAGGCCACA ->Dere_528_2597 |50 sp| 
-ATGAAGAGCAAAGTGGACAAAGCCATGACCAATGGTGCACCCGCCATGACAAAAACC------AAGGAGGACCGCAAACGGACAAAATCCCTGAAATCGAATGCGGACACGGGGGGACCGGCCAAGATTGCGCGGGTGTCCAAG------CAGGAGAAGCCAAAGCCATCGGAAACCGATGAGAAGGAAAACACGGCGAGCAACGGGAACCTGAAGATGTCGCAAATCAACAAAGCCGTGTTTGTGGTCTTCAAGAAGATGCAGGGCAGTCAACTAACCAAGAAGATGATCAATTCCCTCGTAACGCTGCTACGCGACGACACAAATGCTGAACAGCGTACTGCGACCACTTGTTACGTGCTCAAGCGCTTGATCCGCTCCACAGGTGCAGATGACATGAATGCGGTCGTCCTGGCCGCCAGTTATATACACTGCATCCTAACCGCCGTGCCCGCCATTGACGCATTTGAGGTTCTGGAGACGCTAAAGCGAGATCTGGCCGTTGGCAGCCAGCAGAGGGGCAAGGAGGACTCACTAGCTGCCGTCGGTCAGTTGGTTACAGCCTTTTGCATTCTGCAGACCCCGCAGTTCGCTAAGGCGGAGCCCAAGCTGGTAACGGCAGTCTTCCAGATTCTAGCGGCCCAGCTAAAGGGCAGGGAGTACTTGGTGTCCATGTGTGGCGATATCCTAGCAGACTCCTTCAAACAGCTACCTGCTGCGATCTTCGAGGAGTACGTGTGGCCACTTCTGCAACCCGAGTTAAACAAGCCCCTGAGTGGCTTGAAAGTAAACACCTGCGATGTTTTGCTGGCCGTGCACTTGACCTATTCGTCCGTACTGGGACGGGCGGACATTCTAGCCAGCTTGTGGCCCAAGAAACCAGTGTACACACAGCTCTTCGATCTGTATTTCTCCGGCTCCACCATTCACAGTGATGGCGTATACACTAGATTGGCTATCTTTCTTGTAAATGGTGGGAAGGAAATGCTCGCCGCCTGGGAGCAGTACATCGCTTCCAAGCAGCCACTAAAAGTAAATGCAGCCAAGGCGTGTGCGATCCAAGTACTGAGCCACGTTCTCCTCAACTTTAAGCCAACGGAAGAGCAGCTCATCCTGGATGTTTTTACACCTACCTGTGTACAATTTCTGCTGCAGGAATGTTCATCTGTAAAATGGGATAAAGGTGAGGCCAAGAAACCCTCCCAAAAGAAGCTGAGGGAGATTTGCTTTAAGTTCGAGGCATCCTTGGTTTTATGTTTCGAAAATCAGTTCCAAAACGATTATATCAAGCTTCAGCTGCTGCTCAAATTACTGGACCACACATTGCAGTTGGACTCGGTGATTAGCTTGCCGCGCTTCTGCCAGCAGCTAATAAATCAATTGAGCGTCGAGAGTCTCCAGAAGCTGTACGATTTCTACAACAATAAATTGTACTCATTGGAGGATGAGGATAGAGTCAGCCGAGTGCACTGCCTGAACCAGATGCAGTTGATACTGCACCATTCAGCGCTTAGCCAGGCAACCAAATGGCGTCAGAAGCAATTGAACTACTTGCTGCTCGCTGGCCTTTTCCACTTAGATGCCAGTAAGAAGCCGTGCGAAGCCTCAAAAGCCAGCGCTTTCAGTCGCCAGTGTTCGGCGCGTTGTGAGGAAATATTCCTGGGTTCCCTGCTGCACAAGTGCTCGGGTCTGCCAGGACTTTGCCAGTTACTGCAGAAGACGTTGAGTTATCTTAACAAAGAGTTGGCACAGGCGGATGCAGAGAGCAAATTGCGTTCGCCGAGAGACGAATCTCTGCAGAAAGCATGGAAACAGGTCGAGAAACTGCTGGCAAAGCCCAGCCAGGAAACGGATGTCGTTGGCCAAACATTCGAGGCTCTCATCCTGTTTGTTTCTTTGGCTTTGTGCGCAAAGATTCCCCTATCCGTCACCGTGTTGGATGATCTGATTATCTGCCGTAAAAACGCACTGCAAAAGAGCAAGAAACAGGATAACGAAG
AGCTCCAATGGCAGGATGTGCTCACAGATGCCCTACTCCAGTTACTTTTGCAAACAGGTCACTTCTGGCGTGAGTTTGTCCATCTGGTGGCCACCGCTTTGATTCCCCACCTCGAGCACGGTAACCTCGAACAGGTCCTCGAAGTGCTCAACATGAACAGAAATCCTTTGAGCAAGAAGGATGAGGGC------GAGGAGGAGAGCGACGAGGAAATCGAGGAGGAGGAATCGTTGAAAGATTCGAGCGATGACTCG---GACGGCGATGAAGATGAAGAGGAG------GAGGACGAGAACGATGAGGAGTCCCATTTGGCCCAGATTCGAGAAAGCGTTCGCCAGGCTTTGGTCAACGATGGCGACGCAGATGACGACGGCGCCAGCAGCGTGGACTGGAACGATGTTGACGAGGAGCAGGGTGAACGCCTAAATGCTGCTTTGGAGCGCTCTTTTCAGTTGTTCCGACCCAAGTCGCGCAAAGCCCAGGAGAAGGAGCGTCCGACCAAATCGGAACGCATTGATAACACCAACCTGCTGCACTTTCGCATTCGTGCCTTGGATTTGTTGGAGCTGTTCATAACCAAGAAACCAACTCAGTCGGTTATCCTGGACGTGCTGCATTGCGTTTTCCAGGTGTACCGCCATTGCAGCGGAGATAGCAAACTGCAATCCTTGCGAGAAGCCAGTTTGAAGTTGCTTAAAAAGATACTCGCCAGAAACATTGAACTCCAGGAAAATCAGAGTAACGCACCCATTCTGGGAGCCATTGAGCAGTTGATGTCGTCTGGCGAGGAGCATTCAGAAGAAGACCAGGAGAATAGCAAGCAACCCGCCAACCGACAGGCCAAAGCAGACATCATAGTTTGGCGAGATAAGTGCTTCGCTTACCTGGTCAGCCAGGCATCAGCAGGTGGCGAGCCCAAGAATAGCACCGTATGGCCTCTTCTGGTGGAATTCCTGGAGCTGTGGGTAGCCAAACGTCGTAGTCGCCTATCTCTGGCTAGTTTCGAGGCCCTCTTTCAGTCTGGTCAATGGCAGGGCGTTGCTCCGCTGGCCGTTGCCCTGGCCTCCCATTTGGACGTGAAAAAAACACGCAGTTTTCGGCGGGCACAGATATTGAAGCTTCTCAGTGAGCAATGTCGCCGACTCGAATCCGCCTTTAAGGACAACAGCTCGTCTTCCAAGGAGTTTGAGAAACAGATAGCCAGATATGTGAATGAACTGGAAACGGAGGCCAGTAGTTCCAAGGAACTCAATCTGCTGCTCAAGATCCTCGCCCAAGGAAACCAGAAGAGGCAGAAACTGCGTGAAAAGATCCAAATCGTCGCTAAAAGTCTTCAGCCCACCAAGAAGGCGATGAAG---------CAGGCAGCCGCT---------GAACCCATGGTTGTGGAAGATGAGGAGCACGTCACA \ No newline at end of file diff --git a/test_alignment_0_8.py b/test_alignment_0_8.py deleted file mode 100644 index 991494d..0000000 --- a/test_alignment_0_8.py +++ /dev/null @@ -1,413 +0,0 @@ -#! /usr/env/bin/ Python3 -from alignmentrs_imports import * -# TODO - check valid ids, check invalid ids, - # check mixed type input (list, int, str) - # check invalid type - # check invalid optional arg. 
input -#---------------------------------------------------- -class TestAlignment: - """This is a TestClass for alignmentrs v0.8 library - - test type: nosetests - input file name: test_alignment.txt This is an - alignment text file - - strategy - -------- - - created dictionary from test file - dict.keys = sample ids, dict.values = [sample_description, sample_sequence] - this enables comparisons between dict items - (expected outputs) and alignentrs output - - tests applied - ------------- - tests for expected output for valid input #(EVI) - tests for output type (EOT) - tests for expected errors (EE)""" - - # basic test for expected outputs - def setup(self): - # initiates alignment object for tests - self.aln_file = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') - self.test_aln_file = fasta_to_dict('test_alignment.txt') # for test_dict - #for methods that exclude marker sequence - self.test_aln_file_wo_marker = fasta_to_dict('test_alignment.txt') - del self.test_aln_file_wo_marker['marker_0'] - - def teardown(self): - pass -#---------------------------------------------------- - def test_nrows(self): - """checks if algn_obj.nrow returns expected type - and number of rows in alignment. - compares number of keys in test_dict(sample_ids) - against algn_obj.nrow output. - - pass if: - algn_obj.nrow returns int and matches - len(dict.keys)""" - - nrows = self.aln_file.nrows - test_nrows = len(list(row for row in self.test_aln_file.keys())) #checks number of ids in dict.keys - - assert isinstance(nrows,int) #(EOT) - assert nrows == test_nrows -#---------------------------------------------------- - def test_nsamples(self): - """checks if algn_obj.nsamples returns expected type - and number of samples in alignment. - compares algn_obj.nsamples against len(dict.items). 
- - pass if: - algn_obj.nrow returns int and matches - len(dict.items)""" - - nsamples = self.aln_file.nsamples - test_nsamples = len(list(sample for sample in \ - self.test_aln_file_wo_marker.items())) - - assert isinstance(nsamples,int) #(EOT) - assert nsamples == test_nsamples -#---------------------------------------------------- - def test_nmarkers(self): - """checks if algn_obj.nmarkers returns expected - output type and number of markers in alignment. - compares number of markers in algn_obj. against - number of test_dict keys with 'marker' keyword - - pass if: - output is int - number of markers in aln.obj == number of markers - in test_dict""" - - nmarkers = self.aln_file.nmarkers - test_nmarkers = len(list(sample for sample in self.test_aln_file.items() \ - if 'marker' in sample[0])) - - assert isinstance(nmarkers, int) - assert nmarkers == test_nmarkers -#---------------------------------------------------- - def test_nsites(self): - """checks if algn_obj.nsites returns expected - output type and number of sites in alignment. - compares number of sites in algn_obj. against - sequence length of a random key in test_dict. - *note: assumes all samples have same len - - pass if: - output is int - number of sites in aln.obj == sequence length - of any test_dict.key()""" - - nsites = self.aln_file.nsites - # extracts random test_dict id to use for seq len - random_seq_id = random.choice(list(self.test_aln_file.keys())) - random_seq_len = self.test_aln_file[random_seq_id][1] - test_nsites = len(random_seq_len) - - assert isinstance(nsites, int) - assert nsites == test_nsites -#---------------------------------------------------- - def test_sample_ids(self): - """checks if all sample ids in align.obj matches - ids in test_dictr. 
checks if method returns - expected type: (list) - pass if: - sample_ids in align.obj matches keys in test_dict""" - sample_ids = self.aln_file.sample_ids - test_sample_ids = list(sample_id for sample_id in \ - self.test_aln_file.keys() if not 'marker' in sample_id) - - assert isinstance(sample_ids,list) - assert sample_ids == test_sample_ids -#---------------------------------------------------- - def test_sample_descriptions(self): - """checks if descriptions in align.obj match descriptions - in test_dict. checks if expected type is returned - pass if: - expected type : list - descriptions in align.obj matches descriptions - in test_dict.""" - - sample_descriptions = self.aln_file.sample_descriptions - # description is first index pos in test_dict.values - test_descriptions = list(self.test_aln_file[desc][0] for desc in \ - self.test_aln_file.keys() if 'marker' not in desc) - - assert isinstance(sample_descriptions,list) - assert sample_descriptions == test_descriptions -#---------------------------------------------------- - def test_sample_sequences(self): - """checks if sequences in align.obj match sequences - in test_dict. checks if expected type is returned - pass if: - expected type : list - sequences in align.obj matches sequences - in test_dict.""" - - sample_sequences = self.aln_file.sample_sequences - # sequence is second index pos in test_dict.values - test_sample_sequences = list(self.test_aln_file[sample_id][1] for sample_id in \ - self.test_aln_file.keys() if not 'marker' in sample_id) - - assert isinstance(sample_sequences,list) - assert sample_sequences == test_sample_sequences -#---------------------------------------------------- - def test_marker_ids(self): - """checks if marker_ids in align.obj match marker_ids - in test_dict. 
checks if expected type is returned - pass if: - expected type : list - marker_ids in align.obj matches marker_ids - in test_dict.""" - - marker_ids = self.aln_file.marker_ids - # marker ids are considered as any key that has 'marker keyword in test_dict' - test_marker_ids = list(marker_id for marker_id in \ - self.test_aln_file.keys() \ - if 'marker' in marker_id) - - assert isinstance(marker_ids,list) - assert marker_ids == test_marker_ids -#---------------------------------------------------- - def test_marker_descriptions(self): - """checks if marker_descriptions in align.obj and - test_dict match. checks if expected type is returned - pass if: - expected type : list - marker_descriptions in align.obj matches marker_descriptions - in test_dict.""" - - marker_descriptions = self.aln_file.marker_descriptions - test_marker_descriptions = list(self.test_aln_file[marker_desc][0] \ - for marker_desc in self.test_aln_file.keys() \ - if 'marker' in marker_desc) - - assert isinstance(marker_descriptions,list) - assert marker_descriptions == test_marker_descriptions -#---------------------------------------------------- - def test_marker_sequences(self): - """checks if marker_sequences in align.obj and - test_dict match. 
checks if expected type is returned - pass if: - expected type : list - marker_sequences in align.obj matches marker_sequences - in test_dict.""" - - marker_sequences = self.aln_file.marker_sequences - test_marker_sequences = list(self.test_aln_file[marker_id][1] \ - for marker_id in self.test_aln_file.keys() \ - if 'marker' in marker_id) - - assert isinstance(marker_sequences,list) - assert marker_sequences == test_marker_sequences -#---------------------------------------------------- - # class methods - - # Does not work properly - - #def test_subset(cls): - # """Returns a subset of the alignment by samples, markers and sites.""" - # sample_ids = [1,2,3] - # marker_ids = ['marker_0'] - # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') - - # subset = (aln_obj,sample_ids, marker_ids) - # test_subset = -#---------------------------------------------------- - def test_get_samples(self): - # TODO - check valid ids, check invalid ids, - # check mixed type input (list, int, str) - # check invalid type - # check invalid optional arg. 
input - - """Returns a list of sequence strings containing only the samples - specified by the index.""" - test_names = ['Dmel_RG4N', 'Dmel_RG7'] - get_samples = self.aln_file.get_samples(test_names) - - test_list = [] - #extracts expected sequences from test dictionary - for index in range(len(self.test_aln_file['Dmel_RG4N'][1])): - nuc1 = self.test_aln_file['Dmel_RG4N'][1][index] - nuc2 = self.test_aln_file['Dmel_RG7'][1][index] - test_list = test_list + [[nuc1,nuc2]] - - assert [sample for sample in get_samples] == test_list -#---------------------------------------------------- - # can't test yet becausse returns an object - #def test_get_markers(self, i, match_prefix=False, match_suffix=False): - #"""Returns a list of sequence strings containing only the markers - #specified by the index.""" - - # error with row and column posisiton - #def test_get_sites(self): - #"""Returns a new alignment containing only the sites specified - #by the given list of column numbers.""" -#---------------------------------------------------- - # Setter/Replacer - def test_replace_samples(self): - """Replaces the sequence for a given row in the alignment matrix.""" - new_sample = 'A' * 3432 - replace_sample = self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) - sample_sequences = self.aln_file.sample_sequences - - assert new_sample in sample_sequences -#---------------------------------------------------- - def test_insert_samples_from_lists(self): - """Inserts new sequences in the alignment matrix at the specifiedrow position inplace.""" - - new_sample_id = 'Dsim99201' - new_sample_desc = '|CH2912|' - new_sample_sequence = 'GCCGATGT' * 429 - self.aln_file.insert_samples_from_lists(1, [new_sample_id], [new_sample_desc], [new_sample_sequence]) - #assert self.aln_file.sample_sequences[1:2] == new_sample_sequence # error here - assert self.aln_file.sample_ids[1] == new_sample_id - assert self.aln_file.sample_descriptions[1] == new_sample_desc 
-#---------------------------------------------------- - def test_append_sample_from_lists(self): - """Inserts new sequences after the last row of the alignment matrix - inplace. This increases the total number of samples.""" - - new_sample_id = 'Dere_lastind' - new_sample_desc = '|last_ind|' - new_sample_sequence = 'GCCGAAAA' * 429 - self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) - assert self.aln_file.sample_sequences[-1] == new_sample_sequence - assert self.aln_file.sample_ids[-1] == new_sample_id - assert self.aln_file.sample_descriptions[-1] == new_sample_desc -#---------------------------------------------------- - def test_remove_samples(self): - """Removes sample sequences based on the given index.""" - index_to_remove = 1 - sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] - self.aln_file.remove_samples(index_to_remove) - assert sequence_to_remove != self.aln_file.sample_sequences[1] - - - def test_retain_samples(self): - """Keeps sample sequences based on the given index.""" - - self.aln_file.retain_samples([1,2,3,4,5]) - assert self.aln_file.nsamples == 5 - assert len(self.aln_file.sample_ids) == 5 - assert len(self.aln_file.sample_descriptions) == 5 - assert len(self.aln_file.sample_sequences) == 5 - assert self.aln_file.nmarkers == 1 - assert len(self.aln_file.marker_ids) == 1 - assert len(self.aln_file.marker_descriptions) == 1 - assert len(self.aln_file.marker_sequences) == 1 -#---------------------------------------------------- - def test_remove_sites(self): - """Removes sites based on the given list of column numbers.""" - self.aln_file.remove_sites([0,1,2]) - - assert self.aln_file.nsites == (3432-3) - #TODO- should assert to that the positions are not ATG once - # get samples sequences is fixes -#---------------------------------------------------- - def test_retain_sites(self): - """Keeps sites based on the given list of column numbers.""" - 
self.aln_file.retain_sites([0,1,2]) - assert self.aln_file.nsites == 3 - #TODO- should assert to that the positions are not ATG once - # get samples sequences is fixes -#---------------------------------------------------- - def test_from_fasta(cls): - """Create an Alignment object from a FASTA-formatted file.""" - aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') - assert aln_obj.nsites == 3432 - assert aln_obj.nsamples == 65 - assert aln_obj.nmarkers == 1 -#---------------------------------------------------- - # Format converters - # tested, remove hashtag when done - #def test_to_fasta(self): - """Saves the alignment as a FASTA-formatted text file.""" - #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file - #TODO- check if len(currentdir) increases by one, - #check if test_aln_file in dir - #use from_fasta to create new alingment object -#---------------------------------------------------- - def test_to_sample_matrix(self): - """Converts sequences into a numpy matrix.""" # is this matrix or array? 
- seq_matrix = self.aln_file.to_sample_matrix() - test_seq_matrix = array([list(key[1]) for key in self.test_aln_file.values() if 'A' in key[1]]) # use key names - assert array_equal(seq_matrix, test_seq_matrix) -#---------------------------------------------------- - def test_to_marker_matrix(self, size=1): - """Converts sequences into a numpy matrix.""" - mseq_matrix = self.aln_file.to_marker_matrix() - test_mseq_matrix = array([list(self.test_aln_file[marker][1]) for marker in \ - self.test_aln_file.keys() if 'marker' in marker]) - assert array_equal(mseq_matrix, test_mseq_matrix) -#---------------------------------------------------- - # Iterators - def test_iter_sites(self): - """Iterates column-wise over the alignment""" - iter_seq = list(self.aln_file.iter_sites(0,1)) - - test_cols = [] - seqs = [] - for num in range(0,1): - for value in self.test_aln_file.values(): - seq = value[1] - #if not 'A' in seq: - #continue - seqs.append(seq[num]) - - test_cols.append(sorted(seqs)) - seqs = [] - - print(test_cols, iter_seq) - assert test_cols == iter_seq -#---------------------------------------------------- - def test_iter_sample_sites(self, start=0, stop=None, size=1): - """Iterates column-wise over the sample alignment. Excludes markers. """ - iter_seq = list(self.aln_file.iter_sample_sites(0,10)) - - test_cols = [] - seqs = [] - for num in range(0,10): - for value in self.test_aln_file_wo_marker.values(): - seq = value[1] - seqs.append(seq[num]) - - test_cols.append(seqs) - seqs = [] - - assert test_cols == iter_seq -#---------------------------------------------------- - def test_iter_marker_sites(self): - """Iterates column-wise over the marker alignment. Excludes samples. 
""" - iter_seq = list(self.aln_file.iter_marker_sites(0,10)) - - test_cols = [] - seqs = [] - for num in range(0,10): - for value in self.test_aln_file.values(): - - seq = value[1] - if set(seq) != {'C', 'N'}: - continue - seqs.append(seq[num]) - - test_cols.append(seqs) - seqs = [] - - assert test_cols == iter_seq -#---------------------------------------------------- - # How does this work? - - # Block-related methods - - #def test_set_blocklists(self, ref_seq, description_encoder=None): -# """Creates new block information for the sequences given a reference. """ -#---------------------------------------------------- - # def test_parse_description_as_blocks(self, description_decoder=None): -# """Parses sample description into block data.""" -#---------------------------------------------------- - # def test_write_blocks_to_description(self, description_encoder): -# """Writes each sample's block data as a string, replacing its - # description.""" -#---------------------------------------------------- \ No newline at end of file diff --git a/test_alignment_0_8_2.py b/test_alignment_0_8_2.py deleted file mode 100644 index 09323f5..0000000 --- a/test_alignment_0_8_2.py +++ /dev/null @@ -1,330 +0,0 @@ -#! 
/usr/env/bin/ Python3 -from alignmentrs_imports import * -#---------------------------------------------------- -class TestAlignment: - - # basic test for expected outputs - def setup(self): - # initiates alignment object for tests - self.aln_file = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') - - def teardown(self): - pass -#---------------------------------------------------- - def test_nrows(self): - """checks if aln.obj.nrows output matches expected rows - of alignment""" - nrows = self.aln_file.nrows - expected_nrows = 4 - - assert isinstance(nrows,int) - assert nrows == expected_nrows -#---------------------------------------------------- - def test_nsamples(self): - """checks if aln.obj.nsamples output matches - number of samples being tested""" - - nsamples = self.aln_file.nsamples - expected_nsamples = 3 - - assert isinstance(nsamples,int) - assert nsamples == expected_nsamples -#---------------------------------------------------- - def test_nmarkers(self): - """checks if aln.obj.nmarkers matches - expected number of markers in the sample""" - - nmarkers = self.aln_file.nmarkers - expected_nmarkers = 1 - - assert isinstance(nmarkers, int) - assert nmarkers == expected_nmarkers -#---------------------------------------------------- - def test_nsites(self): - """checks if aln.obj.nsites output matches expected number - of sites in alignment(i.e sequence length) file""" - - nsites = self.aln_file.nsites - expected_nsites = 26 - - assert isinstance(nsites, int) - assert nsites == expected_nsites -#---------------------------------------------------- - def test_sample_ids(self): - """checks if all aln.obj.sample_ids match output - ids in alignment file""" - - sample_ids = self.aln_file.sample_ids - expected_sample_ids = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] - - assert isinstance(sample_ids,list) - assert sample_ids == expected_sample_ids -#---------------------------------------------------- - def test_sample_descriptions(self): - 
"""checks if aln.obj.sample_descriptions output matches sample - descriptions in alignment file""" - - sample_descriptions = self.aln_file.sample_descriptions - expected_descriptions = ['|10 sp|', '|47 sp|', '|15 sp|'] - - assert isinstance(sample_descriptions,list) - assert sample_descriptions == expected_descriptions -#---------------------------------------------------- - def test_sample_sequences(self): - """checks if aln.obj.sample_sequences output match sequences - in alignment file""" - - sample_sequences = self.aln_file.sample_sequences - expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', - 'ATGAAGAGCAAGGTGGACCCCCCCCC', - 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] - - assert isinstance(sample_sequences,list) - assert sample_sequences == expected_sample_sequences -#---------------------------------------------------- - def test_marker_ids(self): - """checks if aln.obj.marker_ids matches output marker ids in - alignment file""" - - marker_ids = self.aln_file.marker_ids - expected_marker_ids = ['marker_0'] - - assert isinstance(marker_ids, list) - assert marker_ids == expected_marker_ids -#---------------------------------------------------- - def test_marker_descriptions(self): - """checks if aln.obj.marker_descriptions output - matches descriptions in alignment file""" - - marker_descriptions = self.aln_file.marker_descriptions - expected_marker_descriptions = ['|91 sp|'] - - assert isinstance(marker_descriptions,list) - assert marker_descriptions == expected_marker_descriptions -#---------------------------------------------------- - def test_marker_sequences(self): - """checks if align.obj.marker_sequences output - matches marker sequences alignment file""" - - marker_sequences = self.aln_file.marker_sequences - expected_marker_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - - assert isinstance(marker_sequences,list) - assert marker_sequences == expected_marker_sequences -#---------------------------------------------------- - # class methods - - # Does not work 
properly - - #def test_subset(cls): - # """Returns a subset of the alignment by samples, markers and sites.""" - # sample_ids = [1,2,3] - # marker_ids = ['marker_0'] - # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') - - # subset = (aln_obj,sample_ids, marker_ids) - # test_subset = -#---------------------------------------------------- - def test_get_samples(self): - """tests aln.object.get_samples returns expected - sequences sample of an alignment file - tests: - valid input - invalid sample id - invalid types""" - # valid input - get_sample_str = self.aln_file.get_samples('Dmel_528_2597') - get_sample_index = self.aln_file.get_samples(0) - expected_sites = 26 - expected_samples = 1 - expected_markers = 0 - expected_sequence = ['ATGAAGAGCAAGGTGGGGGGGGGGGG'] - test_sample_list = [get_sample_str,get_sample_index] - - for test in test_sample_list: - assert isinstance(test, object) - assert test.nsites == expected_sites - assert test.nsamples == expected_samples - assert test.nmarkers == expected_markers - assert test.sample_sequences == expected_sequence - - # invalid sample_id - try: - invalid_sample_name_str = self.aln_file.get_samples('Dmel_528_259700') - invalid_sample_name_lst = self.aln_file.get_samples(['Dmel_528_259700']) - invalid_sample_id_int = self.aln_file.get_samples(-1) - invalid_sample_id_lst = self.aln_file.get_samples([-1]) - - except: - assert ValueError - - # invalid type - test_invalid_types = [{'Dmel_528_2597':0 },('Dmel_528_2597')] - try: - - for invalid_input in test_invalid_types: - invalid_id = self.aln_file.get_samples(invalid_input) - except: - assert ValueError - - try: - test_invalid_list_items = [[],[{'Dmel_528_2597':0 }]] - - for invalid_input in test_invalid_list_items: - invalid_id = self.aln_file.get_samples(invalid_input) - except: - assert ValueError -#---------------------------------------------------- - def test_get_markers(self): - """tests if aln.object.get_markers returns expected - marker 
sequences of an alignment file - tests: - valid input - invalid sample id - invalid types""" - - # VI - get_markers_str = self.aln_file.get_markers('marker_0') - get_markers_int = self.aln_file.get_markers(0) - get_markers_list_str = self.aln_file.get_markers(['marker_0']) - get_markers_list_int = self.aln_file.get_markers([0]) - expected_marker_sequence = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - tests = [get_markers_str, get_markers_int, get_markers_list_str, get_markers_list_int] - for test in tests: - assert isinstance(test,object) - assert test.sequences == ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - assert test.nsites == 26 - #assert test.nsamples == 1 # attribute error - - # IVI - try: - inv_markers_str = self.aln_file.get_markers('marker_01') - inv_markers_int = self.aln_file.get_markers(1) - inv_markers_list_str = self.aln_file.get_markers(['marker_01']) - inv_markers_list_int = self.aln_file.get_markers([1]) - tests = [inv_markers_str, inv_markers_int, inv_markers_list_str, inv_markers_list_int] - - except ValueError: - pass - - # IVT - try: - test_invalid_types = [{'marker_0':0 },('marker_0')] - except ValueError: - pass - -#---------------------------------------------------- - #def test_get_sites(self): # row error - # """Returns a new alignment containing only the sites specified - # #by the given list of column numbers.""" -#---------------------------------------------------- - # Setter/Replacer - def test_replace_samples(self): # - """tests if aln.object.replace_samples replaces the sequence - of one or more sample in the aln.object""" - - new_sample = 'AT' * 13 - prev_sample_sequence = self.aln_file.sample_sequences[0] - self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) - curr_sequence = self.aln_file.sample_sequences[0] - - assert not prev_sample_sequence == curr_sequence - assert curr_sequence == new_sample -#---------------------------------------------------- - def test_insert_samples_from_lists(self): - """tests if 
aln.object.insert_samples_from_lists adds one or - more sequences in the aln.object""" - - new_sample_id = 'Dsim99201' - new_sample_desc = '|CH2912|' - new_sample_sequence = 'G' * 26 - self.aln_file.insert_samples_from_lists(1, [new_sample_id], - [new_sample_desc], - [new_sample_sequence]) - - assert self.aln_file.sample_ids[1] == new_sample_id - assert self.aln_file.sample_descriptions[1] == new_sample_desc - # error here, returns does not insert expected sequence value - #assert self.aln_file.sample_sequences[1] == new_sample_sequence -#---------------------------------------------------- - def test_append_sample_from_lists(self): - """tests if append_sample_from_lists adds one or - more sequences in the last index of aln.object""" - - new_sample_id = 'Dere_lastind' - new_sample_desc = '|last_ind|' - new_sample_sequence = 'G' * 26 - self.aln_file.append_sample_from_lists([new_sample_id], [new_sample_desc], [new_sample_sequence]) - assert self.aln_file.sample_sequences[-1] == new_sample_sequence - assert self.aln_file.sample_ids[-1] == new_sample_id - assert self.aln_file.sample_descriptions[-1] == new_sample_desc -#---------------------------------------------------- - def test_remove_samples(self): - """tests if aln.obj.remove_samples removes all sample - information of one or more indices from the alignment object""" - - index_to_remove = 1 - sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] - self.aln_file.remove_samples(index_to_remove) - assert sequence_to_remove != self.aln_file.sample_sequences[1] -#---------------------------------------------------- - def test_retain_samples(self): - """tests if aln.obj.retain_samples removes all sample - information apart from specified indices in - alignment object""" - - self.aln_file.retain_samples([1]) - assert self.aln_file.nsamples == 1 - assert len(self.aln_file.sample_ids) == 1 - assert len(self.aln_file.sample_descriptions) == 1 - assert len(self.aln_file.sample_sequences) == 1 - assert 
self.aln_file.nmarkers == 1 - assert len(self.aln_file.marker_ids) == 1 - assert len(self.aln_file.marker_descriptions) == 1 - assert len(self.aln_file.marker_sequences) == 1 -#---------------------------------------------------- - def test_remove_sites(self): - """tests if aln.obj.remove_sites removes all one or more - sequences from the alignment sequences""" - - self.aln_file.remove_sites([2]) - assert self.aln_file.nsites == (25) -#---------------------------------------------------- - def test_retain_sites(self): - """tests if aln.obj.retain_sites all sequences - apart from specified sequences in alignment sequences""" - self.aln_file.retain_sites([0,1,2]) - assert self.aln_file.nsites == 3 - #TODO- should assert to that the positions are not ATG once - # get samples sequences is fixes -#---------------------------------------------------- - def test_from_fasta(cls): - """Create an Alignment object from a FASTA-formatted file.""" - aln_obj = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') - assert aln_obj.nsites == 26 - assert aln_obj.nsamples == 3 - assert aln_obj.nmarkers == 1 -#---------------------------------------------------- - # Format converters - # tested, remove hashtag when done - #def test_to_fasta(self): - """Saves the alignment as a FASTA-formatted text file.""" - #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file - #TODO- check if len(currentdir) increases by one, - #check if test_aln_file in dir - #use from_fasta to create new alingment object - - # How does this work? - - # Block-related methods - - #def test_set_blocklists(self, ref_seq, description_encoder=None): -# """Creates new block information for the sequences given a reference. 
""" -#---------------------------------------------------- - # def test_parse_description_as_blocks(self, description_decoder=None): -# """Parses sample description into block data.""" -#---------------------------------------------------- - # def test_write_blocks_to_description(self, description_encoder): -# """Writes each sample's block data as a string, replacing its - # description.""" -#---------------------------------------------------- diff --git a/test_alignment_b.txt b/test_alignment_b.txt deleted file mode 100644 index 4811f60..0000000 --- a/test_alignment_b.txt +++ /dev/null @@ -1,8 +0,0 @@ ->marker_0 |91 sp| -CCCCCCCCCCCCCCCCCCCCCCCCCC ->Dmel_528_2597 |10 sp| -ATGAAGAGCAAGGTGGGGGGGGGGGG ->Dmel_RG2 |47 sp| -ATGAAGAGCAAGGTGGACCCCCCCCC ->Dmel_RG4N |15 sp| -ATGAAGAGCAAGGTGGAAAAAAAAAA \ No newline at end of file From 3f6cb61bf44f3f4062f43f2e0c5e47629caebf4f Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Wed, 13 Feb 2019 22:54:06 +0900 Subject: [PATCH 11/12] Add files via upload --- alignmentrs/tests/test_alignment_0_8_5.py | 1071 +++++++++++++++++++++ 1 file changed, 1071 insertions(+) create mode 100644 alignmentrs/tests/test_alignment_0_8_5.py diff --git a/alignmentrs/tests/test_alignment_0_8_5.py b/alignmentrs/tests/test_alignment_0_8_5.py new file mode 100644 index 0000000..edf0ad3 --- /dev/null +++ b/alignmentrs/tests/test_alignment_0_8_5.py @@ -0,0 +1,1071 @@ +import os +from alignmentrs.aln import Alignment + +#TODO- aln.subset: test invalid inputs +# aln.subset: test int and str input +# iter__xxx: write tests +# to_xxx_matrix_: write tests +# block_functions: write tests +# description editing + +def type_error(expected, actual): + return 'Expected type {}, instead got {}'.format(expected, actual) + +def value_error(expected, actual): + return 'Expected value {}, instead got {}'.format(expected, actual) + +def index_error(expected, actual): + return 'Expected type {}, instead got 
{}'.format(expected, actual) + +TypeError_msg = 'Expected TypeError' +ValueError_msg = 'Expected ValueError' +IndexError_msg = 'Expected IndexError' +Error_msg = 'Expected Error' + +class TestAlignmentGetters: + + # TODO: Refactor tests so that each test is very simple and + # multiple assertions are minimized, see test_nrows* and test_nsamples* + # TODO: Make "printer" functions like type_error and value_error + # above to standardize errors when the assertion + + # basic test for expected outputs + def setup(self): + # Create an alignment for testing + self.temp_filename = 'temp.aln' + with open(self.temp_filename, 'w') as fp: + print('>marker_0 |91 sp|\n', file=fp) + print('CCCCCCCCCCCCCCCCCCCCCCCCCC\n', file=fp) + print('>Dmel_528_2597 |10 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGGGGGGGGGGG\n', file=fp) + print('>Dmel_RG2 |47 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGACCCCCCCCC\n', file=fp) + print('>Dmel_RG4N |15 sp|\n', file=fp) + print('ATGAAGAGCAAGGTGGAAAAAAAAAA\n', file=fp) + # initiates alignment object for tests + self.aln_file = Alignment.from_fasta(self.temp_filename, 'test_align', marker_kw='marker') + + def teardown(self): + if os.path.exists(self.temp_filename): + os.remove(self.temp_filename) + + def test_nrows_type(self): + """Checks if aln.obj.nrows output type matches expected + type + """ + expected = int + result = type(self.aln_file.nrows) + assert expected == result, type_error(expected, result) + + def test_nrows_value(self): + """Checks if aln.obj.nrows output value matches expected + value + """ + expected = 4 + result = self.aln_file.nrows + assert expected == result, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_nsamples_type(self): + """Checks if aln.obj.nrows output type matches expected + type + """ + expected = int + result = type(self.aln_file.nsamples) + assert expected == result, type_error(expected, result) + + def test_nsamples_value(self): + """Checks 
if aln.obj.nrows output value matches expected
+        value
+        """
+        expected = 3
+        result = self.aln_file.nsamples
+        assert expected == result, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_nmarkers_type(self):
+        """Check that aln.nmarkers is an int."""
+        expected = int
+        result = self.aln_file.nmarkers
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_nmarkers_value(self):
+        """Check that aln.nmarkers equals the number of markers in the fixture."""
+        expected = 1
+        result = self.aln_file.nmarkers
+        assert expected == result, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_nsites_type(self):
+        """Check that aln.nsites is an int."""
+        expected = int
+        result = self.aln_file.nsites
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_nsites_value(self):
+        """Check that aln.nsites equals the alignment length (sequence length)."""
+        expected = 26
+        result = self.aln_file.nsites
+        assert expected == result, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_sample_ids_type(self):
+        """Check that aln.sample_ids is a list."""
+        expected = list
+        result = self.aln_file.sample_ids
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_sample_ids_value(self):
+        """Check that aln.sample_ids lists the fixture's sample ids in order."""
+        expected = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N']
+        result = self.aln_file.sample_ids
+        assert expected == result, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_sample_descriptions_type(self):
+        """Check that aln.sample_descriptions is a list."""
+        expected = list
+        result = self.aln_file.sample_descriptions
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_sample_descriptions_value(self):
+        """Check that aln.sample_descriptions matches the fixture descriptions."""
+        expected = ['|10 sp|', '|47 sp|', '|15 sp|']
+        result = self.aln_file.sample_descriptions
+        assert expected == result, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_sample_sequences_type(self):
+        """Check that aln.sample_sequences is a list."""
+        expected = list
+        result = self.aln_file.sample_sequences
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_sample_sequences_value(self):
+        """Check that aln.sample_sequences matches the fixture sequences."""
+        expected = ['ATGAAGAGCAAGGTGGGGGGGGGGGG',
+                    'ATGAAGAGCAAGGTGGACCCCCCCCC',
+                    'ATGAAGAGCAAGGTGGAAAAAAAAAA']
+        result = self.aln_file.sample_sequences
+        assert result == expected, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_marker_ids_type(self):
+        """Check that aln.marker_ids is a list."""
+        expected = list
+        result = self.aln_file.marker_ids
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_marker_ids_value(self):
+        """Check that aln.marker_ids lists the fixture's single marker id."""
+        expected = ['marker_0']
+        result = self.aln_file.marker_ids
+        assert result == expected, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_marker_descriptions_type(self):
+        """Check that aln.marker_descriptions is a list."""
+        expected = list
+        result = self.aln_file.marker_descriptions
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_marker_descriptions_value(self):
+        """Check that aln.marker_descriptions matches the fixture description."""
+        expected = ['|91 sp|']
+        result = self.aln_file.marker_descriptions
+        assert result == expected, value_error(expected, result)
+#-----------------------------------------------------------------------------
+    def test_marker_sequences_type(self):
+        """Check that aln.marker_sequences is a list."""
+        expected = list
+        result = self.aln_file.marker_sequences
+        assert isinstance(result, expected), type_error(expected, result)
+
+    def test_marker_sequences_value(self):
+        """Check that aln.marker_sequences matches the fixture marker sequence."""
+        expected = ['CCCCCCCCCCCCCCCCCCCCCCCCCC']
+        result = self.aln_file.marker_sequences
+        assert result == expected, value_error(expected, result)
+#----------------------------------------------------
+    # class methods
+    def test_subset_input_sample_id(self):
+        """Check that subsetting by sample indices keeps only those samples.
+
+        The expected values are the first two samples of the fixture, as
+        pinned by test_sample_ids_value, test_sample_descriptions_value and
+        test_sample_sequences_value.
+        """
+        sample_ids = [0, 1]
+        expected_nsamples = 2
+        expected_names = ['Dmel_528_2597', 'Dmel_RG2']
+        expected_descriptions = ['|10 sp|', '|47 sp|']
+        expected_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG',
+                              'ATGAAGAGCAAGGTGGACCCCCCCCC']
+        # fails for some reason
+        # NOTE(review): the alignment is passed explicitly, which presumes
+        # subset() is a classmethod/staticmethod taking it -- confirm.
+        result_subset = self.aln_file.subset(self.aln_file, sample_ids)
+        result_nsamples = result_subset.nsamples
+        result_ids = result_subset.sample_ids
+        result_desc = result_subset.sample_descriptions
+        result_seq = result_subset.sample_sequences
+        assert expected_nsamples == result_nsamples, value_error(expected_nsamples, result_nsamples)
+        assert expected_names == result_ids, value_error(expected_names, result_ids)
+        assert expected_descriptions == result_desc, value_error(expected_descriptions, result_desc)
+        assert expected_sequences == result_seq, value_error(expected_sequences, result_seq)
+
+    def test_subset_input_marker_id(self):
+        """Check that subsetting by marker indices keeps only those markers."""
+        marker_index = [0]
+        expected_nmarkers = 1
+        expected_names = ['marker_0']
+        expected_descriptions = ['|91 sp|']
+        expected_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC']
+        result_subset = self.aln_file.subset(self.aln_file, marker_ids = marker_index)
+        result_nmarkers = result_subset.nmarkers
+        result_ids = result_subset.marker_ids
+        result_desc = result_subset.marker_descriptions
+        result_seq = result_subset.marker_sequences
+        assert expected_nmarkers == result_nmarkers, value_error(expected_nmarkers, result_nmarkers)
+        assert expected_names == result_ids, value_error(expected_names, result_ids)  # fails, gives wrong expected marker
+        assert expected_descriptions == result_desc, value_error(expected_descriptions, result_desc)
+        assert expected_sequences == result_seq, value_error(expected_sequences, result_seq)
+
+    # HSD: TODO- test invalid inputs
+    # HSD: TODO- test int and str input
+
+    # def test_subset(self):
+    #     """Returns a subset of the alignment by samples, markers and sites."""
+    #     expected_sample_ids = [0,1]
+    #     result_subset = (self.aln_file,sample_ids)
+
+    #     result_sample_ids = result_subset.get_markers
+    #     result_sample_desc =
+    #     result_sample_seq =
+    #     assert
+#----------------------------------------------------
+    def test_get_samples_valid_str(self):
+        """Check that get_samples accepts a single sample id or a single index."""
+        result = self.aln_file.get_samples('Dmel_528_2597')
+        result_0 = self.aln_file.get_samples(0)
+        # NOTE(review): isinstance(x, object) is always true, so these
+        # assertions only prove the calls do not raise; tighten `expected`
+        # once the intended return type is confirmed.
+        expected = object
+        assert isinstance(result, expected), type_error(expected, result)
+        assert isinstance(result_0, expected), type_error(expected, result_0)
+
+    def test_get_samples_valid_list(self):
+        """Check that get_samples accepts a list of sample ids or of indices."""
+        result = self.aln_file.get_samples(['Dmel_528_2597'])
+        result_0 = self.aln_file.get_samples([0])
+        # NOTE(review): vacuous type check, see test_get_samples_valid_str.
+        expected = object
+        assert isinstance(result, expected), type_error(expected, result)
+        assert isinstance(result_0, expected), type_error(expected, result_0)
+#-----------------------------------------------------------------------------
+    def test_get_samples_str_in_invalid_type(self):
+        """Check that get_samples raises TypeError for an unsupported input type.
+
+        Inputs tried: an empty dict (``{}`` is a dict literal, not a set),
+        an empty tuple and None.
+        """
+        for invalid_input in ({}, (), None):
+            try:
+                self.aln_file.get_samples(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    def test_get_samples_invalid_list_items(self):
+        """Check that get_samples raises TypeError for unsupported list items.
+
+        Items tried: an empty dict, an empty tuple and None.
+        """
+        for invalid_input in ([{}], [()], [None]):
+            try:
+                self.aln_file.get_samples(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    def test_get_samples_invalid_str_sample_id(self):
+        """Check that get_samples raises ValueError for an unknown sample id."""
+        try:
+            self.aln_file.get_samples('Dmel_528_259700')
+        except ValueError:
+            pass
+        else:
+            raise Exception(ValueError_msg)
+
+    def test_get_samples_invalid_int_sample_id(self):
+        """Check that get_samples raises ValueError for an invalid sample index."""
+        # NOTE(review): the list variant below expects IndexError for [-1];
+        # confirm which exception a bare -1 is meant to raise.
+        try:
+            self.aln_file.get_samples(-1)
+        except ValueError:
+            pass
+        else:
+            raise Exception(ValueError_msg)
+
+    # Renamed: this used to reuse the name of the single-string test above,
+    # which silently replaced it in the class body.
+    def test_get_samples_invalid_str_sample_id_in_list(self):
+        """Check that get_samples raises ValueError for an unknown id in a list."""
+        try:
+            self.aln_file.get_samples(['Dmel_528_259700'])
+        except ValueError:
+            pass
+        else:
+            raise Exception(ValueError_msg)
+
+    # Renamed: this used to reuse the name of the single-index test above,
+    # which silently replaced it in the class body.
+    def test_get_samples_invalid_int_sample_id_in_list(self):
+        """Check that get_samples raises IndexError for an invalid index in a list."""
+        try:
+            self.aln_file.get_samples([-1])
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+
+    # TODO: Do not make compound tests!
+    # Each assertion should be a separate test so that it will fail for
+    # that specific test.
+    # For example, test.nsites == expected_sites is unnecessary because it
+    # duplicates an existing test - test_nsites
+#-----------------------------------------------------------------------------
+    def test_get_markers_valid_input(self):
+        """Check that get_markers accepts a single marker id or a single index."""
+        result = self.aln_file.get_markers('marker_0')
+        result_0 = self.aln_file.get_markers(0)
+        # NOTE(review): isinstance(x, object) is always true; this only
+        # proves the calls do not raise.
+        expected = object
+        assert isinstance(result, expected), type_error(expected, result)
+        assert isinstance(result_0, expected), type_error(expected, result_0)
+
+    def test_get_markers_valid_list_input(self):
+        """Check that get_markers accepts a list of marker ids or of indices."""
+        result = self.aln_file.get_markers(['marker_0'])
+        result_0 = self.aln_file.get_markers([0])
+        # NOTE(review): vacuous type check, see test_get_markers_valid_input.
+        expected = object
+        assert isinstance(result, expected), type_error(expected, result)
+        assert isinstance(result_0, expected), type_error(expected, result_0)
+        # TODO: testing single char and list should be different tests as they are two scenarios of calling the method
+
+    def test_get_markers_valid_invalid_type(self):
+        """Check that get_markers raises TypeError for an unsupported input type.
+
+        Inputs tried: an empty dict, an empty tuple and None.
+        """
+        for invalid_input in ({}, (), None):
+            try:
+                self.aln_file.get_markers(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    def test_get_markers_valid_invalid_list_items(self):
+        """Check that get_markers raises TypeError for unsupported list items.
+
+        Items tried: an empty dict, an empty tuple and None.
+        """
+        for invalid_input in ([{}], [()], [None]):
+            try:
+                self.aln_file.get_markers(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+#----------------------------------------------------
+    #def test_get_sites(self): # row error
+    #    """Returns a new alignment containing only the sites specified
+    #    #by the given list of column numbers."""
+
+#----------------------------------------------------
+    # Setter/Replacer
+    #TODO- could test invalid input types
+    def test_insert_samples_from_lists_valid_inputs(self):
+        """Check that insert_samples_from_lists inserts a sample at the given index."""
+        expected_id = 'Dsim99201'
+        expected_desc = '|CH2912|'
+        expected_sequence = 'G' * 26
+        self.aln_file.insert_samples_from_lists(1, [expected_id], [expected_desc], [expected_sequence])
+        result_id = self.aln_file.sample_ids[1]
+        result_description = self.aln_file.sample_descriptions[1]
+        result_sequence = self.aln_file.sample_sequences[1]
+        assert expected_id == result_id, value_error(expected_id, result_id)
+        assert expected_desc == result_description, value_error(expected_desc, result_description)
+        assert result_sequence == expected_sequence, value_error(expected_sequence, result_sequence)
+
+    def test_insert_samples_from_lists_valid_invalid_index(self):
+        """Check that insert_samples_from_lists raises IndexError for index -1."""
+        invalid_index = -1
+        valid_id = 'Dsim99201'
+        valid_desc = '|CH2912|'
+        valid_sequence = 'G' * 26
+        try:
+            self.aln_file.insert_samples_from_lists(invalid_index, [valid_id], [valid_desc], [valid_sequence])
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+
+    def test_insert_samples_from_lists_valid_invalid_id(self):
+        """Check that insert_samples_from_lists raises TypeError for a non-str id."""
+        valid_index = 1
+        invalid_id = 1
+        valid_desc = '|CH2912|'
+        valid_sequence = 'G' * 26
+        try:
+            self.aln_file.insert_samples_from_lists(valid_index, [invalid_id], [valid_desc], [valid_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+
+    def test_insert_samples_from_lists_valid_invalid_description(self):
+        """Check that insert_samples_from_lists raises TypeError for a non-str description."""
+        valid_index = 1
+        valid_id = 'Dsim99201'
+        invalid_desc = 1
+        valid_sequence = 'G' * 26
+        try:
+            self.aln_file.insert_samples_from_lists(valid_index, [valid_id], [invalid_desc], [valid_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+
+    def test_insert_samples_from_lists_valid_invalid_sequence(self):
+        """Check that insert_samples_from_lists raises TypeError for a non-str sequence."""
+        valid_index = 1
+        valid_id = 'Dsim99201'
+        # The description must be valid here so that the sequence is the
+        # only argument that can trigger the TypeError.
+        valid_desc = '|CH2912|'
+        invalid_sequence = 26
+        try:
+            self.aln_file.insert_samples_from_lists(valid_index, [valid_id], [valid_desc], [invalid_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+#-----------------------------------------------------------------------------
+    def test_append_sample_from_lists_valid_inputs(self):
+        """Check that append_sample_from_lists adds a sample at the last index."""
+        expected_id = 'Dere_lastind'
+        expected_desc = '|last_ind|'
+        expected_sequence = 'G' * 26
+        self.aln_file.append_sample_from_lists([expected_id], [expected_desc], [expected_sequence])
+        result_id = self.aln_file.sample_ids[-1]
+        result_desc = self.aln_file.sample_descriptions[-1]
+        result_sequence = self.aln_file.sample_sequences[-1]
+        # These compare values, so report them with value_error.
+        assert result_id == expected_id, value_error(expected_id, result_id)
+        assert result_desc == expected_desc, value_error(expected_desc, result_desc)
+        assert result_sequence == expected_sequence, value_error(expected_sequence, result_sequence)
+
+    def test_append_sample_from_lists_invalid_id_type(self):
+        """Check that append_sample_from_lists raises TypeError for a non-str id."""
+        sample_id = 1
+        sample_desc = '|last_ind|'
+        sample_sequence = 'G' * 26
+        try:
+            self.aln_file.append_sample_from_lists([sample_id], [sample_desc], [sample_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+
+    def test_append_sample_from_lists_invalid_description_type(self):
+        """Check that append_sample_from_lists raises TypeError for a non-str description."""
+        sample_id = 'Dere_lastind'
+        invalid_desc = 1
+        sample_sequence = 'G' * 26
+        try:
+            self.aln_file.append_sample_from_lists([sample_id], [invalid_desc], [sample_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+
+    def test_append_sample_from_lists_invalid_sequence_type(self):
+        """Check that append_sample_from_lists raises TypeError for a non-str sequence."""
+        sample_id = 'Dere_lastind'
+        sample_desc = '|last_ind|'
+        invalid_sequence = 26
+        try:
+            self.aln_file.append_sample_from_lists([sample_id], [sample_desc], [invalid_sequence])
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+#-----------------------------------------------------------------------------
+    def test_remove_samples_valid_sample_name(self):
+        """Check that remove_samples drops the sample named by a str id.
+
+        'Dmel_RG2' sits at index 1 of the fixture; once it is removed the
+        following sample ('Dmel_RG4N') is expected at that index.
+        NOTE(review): presumes remove_samples mutates the alignment in
+        place, as the original test did -- confirm.
+        """
+        sample_name_to_remove = 'Dmel_RG2'
+        sample_index = 1
+        self.aln_file.remove_samples(sample_name_to_remove)
+        result_sample_id = self.aln_file.sample_ids[sample_index]
+        result_desc = self.aln_file.sample_descriptions[sample_index]
+        result_sequence = self.aln_file.sample_sequences[sample_index]
+        expected_sample_id = 'Dmel_RG4N'
+        expected_desc = '|15 sp|'
+        expected_sequence = 'ATGAAGAGCAAGGTGGAAAAAAAAAA'
+        assert expected_sample_id == result_sample_id, value_error(expected_sample_id, result_sample_id)
+        assert expected_desc == result_desc, value_error(expected_desc, result_desc)
+        assert expected_sequence == result_sequence, value_error(expected_sequence, result_sequence)
+
+    def test_remove_samples_valid_index(self):
+        """Check that remove_samples drops the sample at a given index.
+
+        After removing index 1 the following sample ('Dmel_RG4N') is
+        expected at that index.
+        NOTE(review): presumes in-place mutation -- confirm.
+        """
+        index_to_remove = 1
+        self.aln_file.remove_samples(index_to_remove)
+        result_sample_id = self.aln_file.sample_ids[index_to_remove]
+        result_desc = self.aln_file.sample_descriptions[index_to_remove]
+        result_sequence = self.aln_file.sample_sequences[index_to_remove]
+        expected_sample_id = 'Dmel_RG4N'
+        expected_desc = '|15 sp|'
+        expected_sequence = 'ATGAAGAGCAAGGTGGAAAAAAAAAA'
+        assert expected_sample_id == result_sample_id, value_error(expected_sample_id, result_sample_id)
+        assert expected_desc == result_desc, value_error(expected_desc, result_desc)
+        assert expected_sequence == result_sequence, value_error(expected_sequence, result_sequence)
+
+    def test_remove_samples_invalid_str(self):
+        """Check that remove_samples raises ValueError for an unknown sample id."""
+        sample_name_to_remove = 'Dmel_RG4N0'
+        try:
+            self.aln_file.remove_samples(sample_name_to_remove)
+        except ValueError:
+            pass
+        else:
+            raise Exception(ValueError_msg)
+
+    def test_remove_samples_invalid_index(self):
+        """Check that remove_samples raises IndexError for index -1."""
+        index_to_remove = -1
+        try:
+            self.aln_file.remove_samples(index_to_remove)
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+
+    def test_remove_samples_invalid_type(self):
+        """Check that remove_samples raises TypeError for unsupported input types.
+
+        Inputs tried: float, dict, set and tuple.
+        """
+        float_type = 1.1
+        dict_type = {1: 'w'}
+        set_type = set()  # `{}` would be an empty dict, not a set
+        tuple_type = ()
+        for invalid_input in (float_type, dict_type, set_type, tuple_type):
+            try:
+                self.aln_file.remove_samples(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+#-----------------------------------------------------------------------------
+    # Renamed: this used to share its name with the test that follows,
+    # which silently replaced it in the class body.
+    def test_retain_samples_valid_input_counts(self):
+        """Check the sample and marker counts after retaining a single sample."""
+        self.aln_file.retain_samples([1])
+        expected_len = 1
+        result_sample_num = self.aln_file.nsamples
+        result_sample_id_num = len(self.aln_file.sample_ids)
+        result_sample_desc_num = len(self.aln_file.sample_descriptions)
+        result_sample_seq_num = len(self.aln_file.sample_sequences)
+        result_marker_num = self.aln_file.nmarkers
+        result_marker_id_num = len(self.aln_file.marker_ids)
+        result_marker_desc_num = len(self.aln_file.marker_descriptions)
+        result_marker_seq_num = len(self.aln_file.marker_sequences)
+
+        assert result_sample_num == expected_len, value_error(expected_len, result_sample_num)
+        assert result_sample_id_num == expected_len, value_error(expected_len, result_sample_id_num)
+        assert result_sample_desc_num == expected_len, value_error(expected_len, result_sample_desc_num)
+        assert result_sample_seq_num == expected_len, value_error(expected_len, result_sample_seq_num)
+        assert result_marker_num == expected_len, value_error(expected_len, result_marker_num)
+        assert result_marker_id_num == expected_len, value_error(expected_len, result_marker_id_num)
+        assert result_marker_desc_num == expected_len, value_error(expected_len, result_marker_desc_num)
+        assert result_marker_seq_num == expected_len, value_error(expected_len, result_marker_seq_num)
+
+    def test_retain_samples_valid_input(self):
+        """Check that retain_samples keeps exactly the requested sample."""
+        self.aln_file.retain_samples([1])
+        result_sample_id = self.aln_file.sample_ids[0]
+        result_sample_description = self.aln_file.sample_descriptions[0]
+        result_sequence = self.aln_file.sample_sequences[0]
+        expected_sample_id = 'Dmel_RG2'
+        expected_sample_description = '|47 sp|'
+        expected_sequence = 'ATGAAGAGCAAGGTGGACCCCCCCCC'
+
+        assert expected_sample_id == result_sample_id, value_error(expected_sample_id, result_sample_id)
+        assert expected_sample_description == result_sample_description, value_error(expected_sample_description, result_sample_description)
+        assert expected_sequence == result_sequence, value_error(expected_sequence, result_sequence)
+
+    def test_retain_samples_invalid_list_input(self):
+        """Check that retain_samples raises TypeError for invalid list inputs."""
+        for invalid_input in (['1.1'], [1.1], [-1], [{}], [], [None]):
+            try:
+                self.aln_file.retain_samples(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    def test_retain_samples_invalid_input(self):
+        """Check that retain_samples raises TypeError for invalid non-list inputs.
+
+        Also covers calling it with no argument at all.
+        """
+        for invalid_input in ('1.1', 1.1, -1, {}):
+            try:
+                self.aln_file.retain_samples(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+        try:
+            self.aln_file.retain_samples()
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+        try:
+            self.aln_file.retain_samples(None)
+        except TypeError:
+            pass
+        else:
+            raise Exception(TypeError_msg)
+        # TODO: Other than count, test whether the correct sample was retained
+#-----------------------------------------------------------------------------
+    def test_remove_sites_list_input(self):
+        """Check that remove_sites drops one site when given a one-item list."""
+        self.aln_file.remove_sites([2])
+        expected = 25
+        result = self.aln_file.nsites
+        assert expected == result, value_error(expected, result)
+
+    def test_remove_sites_int_input(self):
+        """Check that remove_sites drops one site when given a single int."""
+        self.aln_file.remove_sites(2)
+        expected = 25
+        result = self.aln_file.nsites
+        assert expected == result, value_error(expected, result)
+
+    def test_remove_sites_empty_input(self):
+        """Check that remove_sites leaves nsites unchanged for an empty tuple."""
+        self.aln_file.remove_sites(())
+        expected = 26
+        result = self.aln_file.nsites
+        assert expected == result, value_error(expected, result)
+
+    def test_remove_sites_empty_list_input(self):
+        """Check that remove_sites leaves nsites unchanged for an empty list."""
+        self.aln_file.remove_sites([])
+        expected = 26
+        result = self.aln_file.nsites
+        assert expected == result, value_error(expected, result)
+
+    def test_remove_sites_invalid_input(self):
+        """Check that remove_sites rejects invalid non-list inputs.
+
+        -2 must raise IndexError; an empty dict and None must raise TypeError.
+        """
+        try:
+            self.aln_file.remove_sites(-2)
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+        for invalid_input in ({}, None):
+            try:
+                self.aln_file.remove_sites(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    def test_remove_sites_invalid_list_input(self):
+        """Check that remove_sites rejects invalid list inputs.
+
+        [-2] must raise IndexError; a tuple, dict or None item must raise
+        TypeError.
+        """
+        try:
+            self.aln_file.remove_sites([-2])
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+        for invalid_input in ([()], [{}], [None]):
+            try:
+                self.aln_file.remove_sites(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+#-----------------------------------------------------------------------------
+    def test_retain_sites_valid_input(self):
+        """Check nsites after calling retain_sites with three positional ints."""
+        # NOTE(review): the expectation is that nsites stays at 26 here,
+        # while the list form below expects 3 -- confirm this is intended.
+        self.aln_file.retain_sites(0,1,2)
+        expected = 26
+        result = self.aln_file.nsites
+
+        assert expected == result, value_error(expected, result)
+
+    def test_retain_sites_valid_list_input(self):
+        """Check that retain_sites keeps only the sites listed."""
+        self.aln_file.retain_sites([0,1,2])
+        expected = 3
+        result = self.aln_file.nsites
+
+        assert expected == result, value_error(expected, result)
+
+    def test_retain_sites_invalid_input(self):
+        """Check that retain_sites rejects invalid non-list inputs.
+
+        -1 must raise IndexError; a tuple, an empty dict and an empty
+        string must raise TypeError.
+        """
+        try:
+            self.aln_file.retain_sites(-1)
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+        # The original also demanded TypeError for the same -1 input, which
+        # contradicts the IndexError check above and could never pass.
+        for invalid_input in ((1,), {}, ''):
+            try:
+                self.aln_file.retain_sites(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+
+    # Renamed: this used to reuse the name test_retain_sites_invalid_input,
+    # which silently replaced the non-list test above.
+    def test_retain_sites_invalid_list_input(self):
+        """Check that retain_sites rejects invalid list inputs.
+
+        [-1] must raise IndexError; a tuple, dict or str item must raise
+        TypeError.
+        """
+        try:
+            self.aln_file.retain_sites([-1])
+        except IndexError:
+            pass
+        else:
+            raise Exception(IndexError_msg)
+        # The contradictory TypeError check on [-1] was dropped, see above.
+        for invalid_input in ([(1,)], [{}], ['']):
+            try:
+                self.aln_file.retain_sites(invalid_input)
+            except TypeError:
+                continue
+            raise Exception(TypeError_msg)
+#-----------------------------------------------------------------------------
+    def test_from_fasta(cls):
+        """Check that Alignment.from_fasta builds an alignment of the expected size.
+
+        NOTE(review): the first parameter is named `cls` although this is
+        a plain test method, and the test reads 'temp.aln' -- presumably
+        written by the class setup; confirm.
+        """
+        aln_obj = Alignment.from_fasta('temp.aln', 'test_align_from_faster', 'marker')
+        result_nsites = aln_obj.nsites
+        result_nsamples = aln_obj.nsamples
+        result_nmarkers = aln_obj.nmarkers
+        expected_nsites = 26
+        expected_nsamples = 3
+        expected_nmarkers = 1
+        assert result_nsites == expected_nsites, value_error(expected_nsites, result_nsites)
+        assert result_nsamples == expected_nsamples, value_error(expected_nsamples, result_nsamples)
+        assert result_nmarkers == expected_nmarkers, value_error(expected_nmarkers, result_nmarkers)
+#-----------------------------------------------------------------------------
+    # Format converters
+    # tested, remove hashtag when done
+    #def test_to_fasta(self):
+#        """Saves the alignment as a FASTA-formatted text file."""
+        #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file
+        #TODO- check if len(currentdir) increases by one,
+        #check if test_aln_file in dir
+        #use from_fasta to create new alingment object
+#-----------------------------------------------------------------------------
+#----------------------------------------------------
+#    def test_to_sample_matrix(self):
+#        """Converts sequences into a numpy matrix.""" # is this matrix or array?
+#        seq_matrix = self.aln_file.to_sample_matrix()
+#        test_seq_matrix = array([list(key[1]) for key in self.test_aln_file.values() if 'A' in key[1]]) # use key names
+#        assert array_equal(seq_matrix, test_seq_matrix)
+#----------------------------------------------------
+#    def test_to_marker_matrix(self, size=1):
+#        """Converts sequences into a numpy matrix."""
+#        mseq_matrix = self.aln_file.to_marker_matrix()
+#        test_mseq_matrix = array([list(self.test_aln_file[marker][1]) for marker in \
+#                          self.test_aln_file.keys() if 'marker' in marker])
+#        assert array_equal(mseq_matrix, test_mseq_matrix)
+#----------------------------------------------------
+#    # Iterators
+#    def test_iter_sites(self):
+#        """Iterates column-wise over the alignment"""
+#        iter_seq = list(self.aln_file.iter_sites(0,1))
+#
+#        test_cols = []
+#        seqs = []
+#        for num in range(0,1):
+#            for value in self.test_aln_file.values():
+#                seq = value[1]
+#                #if not 'A' in seq:
+#                    #continue
+#                seqs.append(seq[num])
+#
+#            test_cols.append(sorted(seqs))
+#            seqs = []
+#
+#        print(test_cols, iter_seq)
+#        
assert test_cols == iter_seq +#---------------------------------------------------- +## def test_iter_sample_sites(self, start=0, stop=None, size=1): +## """Iterates column-wise over the sample alignment. Excludes markers. """ +## iter_seq = list(self.aln_file.iter_sample_sites(0,10)) +## +## test_cols = [] +## seqs = [] +## for num in range(0,10): +## for value in self.test_aln_file_wo_marker.values(): +## seq = value[1] +## seqs.append(seq[num]) +## +## test_cols.append(seqs) +## seqs = [] +## +## assert test_cols == iter_seq +#---------------------------------------------------- +### def test_iter_marker_sites(self): +### """Iterates column-wise over the marker alignment. Excludes samples. """ +### iter_seq = list(self.aln_file.iter_marker_sites(0,10)) +### +### test_cols = [] +### seqs = [] +### for num in range(0,10): +### for value in self.test_aln_file.values(): +### +### seq = value[1] +### if set(seq) != {'C', 'N'}: +### continue +### seqs.append(seq[num]) +### +### test_cols.append(seqs) +### seqs = [] +### +### assert test_cols == iter_seq +#---------------------------------------------------- +# How does this work? Not yet available for v.85 + + # Block-related methods + + #def test_set_blocklists(self, ref_seq, description_encoder=None): +# """Creates new block information for the sequences given a reference. 
""" +#---------------------------------------------------- + # def test_parse_description_as_blocks(self, description_decoder=None): +# """Parses sample description into block data.""" +#---------------------------------------------------- + # def test_write_blocks_to_description(self, description_encoder): +# """Writes each sample's block data as a string, replacing its + # description.""" +#---------------------------------------------------- \ No newline at end of file From 1c980e9c4f68bada14e3be8d944bd66a7f9ae2d0 Mon Sep 17 00:00:00 2001 From: Hassan Daanaa <45001829+hsdaanaa@users.noreply.github.com> Date: Thu, 14 Feb 2019 16:08:02 +0900 Subject: [PATCH 12/12] Add files via upload --- alignmentrs/tests/test_alignment.py | 1208 +++++++++++++++++++++------ 1 file changed, 957 insertions(+), 251 deletions(-) diff --git a/alignmentrs/tests/test_alignment.py b/alignmentrs/tests/test_alignment.py index 984de60..758feda 100644 --- a/alignmentrs/tests/test_alignment.py +++ b/alignmentrs/tests/test_alignment.py @@ -1,14 +1,34 @@ import os from alignmentrs.aln import Alignment +#TODO- aln.subset: test invalid inputs +# aln.subset: test int and str input +# iter__xxx: write tests +# to_xxx_matrix_: write tests +# block_functions: write tests +# description editing + def type_error(expected, actual): return 'Expected type {}, instead got {}'.format(expected, actual) def value_error(expected, actual): return 'Expected value {}, instead got {}'.format(expected, actual) -class TestAlignmentGetters: +def index_error(expected, actual): + return 'Expected type {}, instead got {}'.format(expected, actual) + +TypeError_msg = 'Expected TypeError' +ValueError_msg = 'Expected ValueError' +IndexError_msg = 'Expected IndexError' +Error_msg = 'Expected Error' +class TestAlignmentGetters: + + # TODO: Refactor tests so that each test is very simple and + # multiple assertions are minimized, see test_nrows* and test_nsamples* + # TODO: Make "printer" functions like type_error and 
value_error + # above to standardize errors when the assertion + # basic test for expected outputs def setup(self): # Create an alignment for testing @@ -30,326 +50,1012 @@ def teardown(self): os.remove(self.temp_filename) def test_nrows_type(self): - """Checks if aln.obj.nrows output matches expected rows - of alignment + """Checks if aln.obj.nrows output type matches expected + type """ expected = int result = type(self.aln_file.nrows) assert expected == result, type_error(expected, result) def test_nrows_value(self): - """Checks if aln.obj.nrows output matches expected rows - of alignment + """Checks if aln.obj.nrows output value matches expected + value """ expected = 4 result = self.aln_file.nrows assert expected == result, value_error(expected, result) - +#----------------------------------------------------------------------------- def test_nsamples_type(self): - """Checks if aln.obj.nrows output matches expected rows - of alignment + """Checks if aln.obj.nrows output type matches expected + type """ expected = int result = type(self.aln_file.nsamples) assert expected == result, type_error(expected, result) def test_nsamples_value(self): - """Checks if aln.obj.nrows output matches expected rows - of alignment + """Checks if aln.obj.nrows output value matches expected + value """ expected = 3 result = self.aln_file.nsamples assert expected == result, value_error(expected, result) - - # TODO: Refactor tests so that each test is very simple and - # multiple assertions are minimized, see test_nrows* and test_nsamples* - # TODO: Make "printer" functions like type_error and value_error - # above to standardize errors when the assertion - - def test_nmarkers(self): - """Checks if aln.obj.nmarkers matches +#----------------------------------------------------------------------------- + def test_nmarkers_type(self): + """Checks if aln.obj.nmarkers output type matches + expected type + """ + expected = int + result = self.aln_file.nmarkers + assert isinstance(result, 
expected), type_error(expected, result) + + def test_nmarkers_value(self): + """Checks if aln.obj.nmarkers value matches expected number of markers in the sample """ - nmarkers = self.aln_file.nmarkers - expected_nmarkers = 1 - assert isinstance(nmarkers, int) # TODO: Text shown when assertion fails - assert nmarkers == expected_nmarkers # TODO: Text shown when assertion fails - - def test_nsites(self): - """checks if aln.obj.nsites output matches expected number - of sites in alignment(i.e sequence length) file + expected = 1 + result = self.aln_file.nmarkers + assert expected == result, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_nsites_type(self): + """checks if aln.obj.nsites output type matches + expected type """ - nsites = self.aln_file.nsites - expected_nsites = 26 - assert isinstance(nsites, int) # TODO: Text shown when assertion fails - assert nsites == expected_nsites # TODO: Text shown when assertion fails - - def test_sample_ids(self): - """Checks if all aln.obj.sample_ids match output - ids in alignment file - """ - sample_ids = self.aln_file.sample_ids - expected_sample_ids = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] - assert isinstance(sample_ids, list) # TODO: Text shown when assertion fails - assert sample_ids == expected_sample_ids # TODO: Text shown when assertion fails - - def test_sample_descriptions(self): - """Checks if aln.obj.sample_descriptions output matches sample - descriptions in alignment file - """ - sample_descriptions = self.aln_file.sample_descriptions - expected_descriptions = ['|10 sp|', '|47 sp|', '|15 sp|'] - assert isinstance(sample_descriptions, list) # TODO: Text shown when assertion fails - assert sample_descriptions == expected_descriptions # TODO: Text shown when assertion fails - - def test_sample_sequences(self): - """Checks if aln.obj.sample_sequences output match sequences - in alignment file + expected = int + result = 
self.aln_file.nsites + assert isinstance(result, expected), type_error(expected, result) + + def test_nsites_value(self): + """checks if aln.obj.nsites value matches expected number + of sites in alignment(i.e sequence length) + """ + expected = 26 + result = self.aln_file.nsites + assert expected == result, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_sample_ids_type(self): + """Checks if aln.obj.sample_ids type matches + expected type + """ + expected = list + result = self.aln_file.sample_ids + assert isinstance(result, expected), type_error(expected, result) + + def test_sample_ids_value(self): + """Checks if all aln.obj.sample_ids match expected + sample ids + """ + expected = ['Dmel_528_2597', 'Dmel_RG2', 'Dmel_RG4N'] + result = self.aln_file.sample_ids + assert expected == result, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_sample_descriptions_type(self): + """Checks if aln.obj.sample_descriptions output type + matches expected type + """ + expected = list + result = self.aln_file.sample_descriptions + assert isinstance(result, expected), type_error(expected, result) + + def test_sample_descriptions_value(self): + """Checks if aln.obj.sample_descriptions value matches + expected value + """ + expected = ['|10 sp|', '|47 sp|', '|15 sp|'] + result = self.aln_file.sample_descriptions + assert expected == result, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_sample_sequences_type(self): + """Checks if aln.obj.sample_sequences output type + matches expected type + """ + expected = list + result = self.aln_file.sample_sequences + assert isinstance(result, expected), type_error(expected, result) + + def test_sample_sequences_value(self): + """Checks if aln.obj.sample_sequences value output matches + expected value """ - sample_sequences = 
self.aln_file.sample_sequences - expected_sample_sequences = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', + expected = ['ATGAAGAGCAAGGTGGGGGGGGGGGG', 'ATGAAGAGCAAGGTGGACCCCCCCCC', 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] - assert isinstance(sample_sequences, list) # TODO: Text shown when assertion fails - assert sample_sequences == expected_sample_sequences # TODO: Text shown when assertion fails - - def test_marker_ids(self): - """Checks if aln.obj.marker_ids matches output marker ids in - alignment file - """ - marker_ids = self.aln_file.marker_ids - expected_marker_ids = ['marker_0'] - assert isinstance(marker_ids, list) # TODO: Text shown when assertion fails - assert marker_ids == expected_marker_ids # TODO: Text shown when assertion fails - - def test_marker_descriptions(self): + result = self.aln_file.sample_sequences + assert result == expected, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_marker_ids_type(self): + """Checks if aln.obj.marker_ids output type matches expected + type + """ + expected = list + result = self.aln_file.marker_ids + assert isinstance(result, expected), type_error(expected, result) + + def test_marker_ids_value(self): + """Checks if aln.obj.marker_ids value matches + expected value + """ + expected = ['marker_0'] + result = self.aln_file.marker_ids + assert result == expected, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_marker_descriptions_type(self): + """checks if aln.obj.marker_descriptions output type + matches expected output + """ + expected = list + result = self.aln_file.marker_descriptions + assert isinstance(result, expected), type_error(expected, result) + + def test_marker_descriptions_value(self): """checks if aln.obj.marker_descriptions output - matches descriptions in alignment file""" - marker_descriptions = self.aln_file.marker_descriptions - expected_marker_descriptions = ['|91 sp|'] - 
assert isinstance(marker_descriptions, list) # TODO: Text shown when assertion fails - assert marker_descriptions == expected_marker_descriptions # TODO: Text shown when assertion fails - - def test_marker_sequences(self): - """Checks if align.obj.marker_sequences output - matches marker sequences alignment file - """ - marker_sequences = self.aln_file.marker_sequences - expected_marker_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - assert isinstance(marker_sequences, list) # TODO: Text shown when assertion fails - assert marker_sequences == expected_marker_sequences # TODO: Text shown when assertion fails + value expected output + """ + expected = ['|91 sp|'] + result = self.aln_file.marker_descriptions + assert result == expected, value_error(expected, result) +#----------------------------------------------------------------------------- + def test_marker_sequences_type(self): + """Checks if align.obj.marker_sequences output type + matches expected output + """ + expected = list + result = self.aln_file.marker_sequences + assert isinstance(result, expected), type_error(expected, result) + + def test_marker_sequences_value(self): + """Checks if align.obj.marker_sequences value + matches expected output + """ + expected = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + result = self.aln_file.marker_sequences + assert result == expected, value_error(expected, result) #---------------------------------------------------- # class methods + def test_subset_input_sample_id(self): + """Returns a subset of the alignment by samples, markers and sites.""" + sample_ids = [0,1] + expected_nsamples = 2 + expected_names = ['Dmel_528_2597', 'Dmel_RG2'] + expected_descriptions = ['|10 sp| ', '|47 sp| '] + expected_sequences = ['ATGAAGAGCAAGGTGGACCCCCCCCC', 'ATGAAGAGCAAGGTGGAAAAAAAAAA'] + result_subset = self.aln_file.subset(self.aln_file, sample_ids) # fails for sume reason + result_nsamples = result_subset.nsamples + result_ids = result_subset.sample_ids + result_desc = 
result_subset.sample_descriptions + result_seq = result_subset.sample_sequences + assert expected_nsamples == result_nsamples, value_error(expected_nsamples,result_nsamples) + assert expected_names == result_ids, value_error(expected_names ,result_ids) + assert expected_descriptions == result_desc, value_error(expected_descriptions ,result_desc) + assert expected_sequences == result_seq, value_error(expected_sequences ,result_seq) + + def test_subset_input_marker_id(self): + """Returns a subset of the alignment by samples, markers and sites.""" + marker_index = [0] + expected_nsamples = 1 + expected_names = ['marker_0'] + expected_descriptions = ['|91 sp|'] + expected_sequences = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] + result_subset = self.aln_file.subset(self.aln_file, marker_ids = marker_index) + result_nmarkers = result_subset.nmarkers + result_ids = result_subset.marker_ids + result_desc = result_subset.marker_descriptions + result_seq = result_subset.marker_sequences + assert expected_nsamples == result_nmarkers, value_error(expected_nsamples,result_nmarkers) + assert expected_names == result_ids, value_error(expected_names ,result_ids) # fails, gives wrong expected marker + assert expected_descriptions == result_desc, value_error(expected_descriptions ,result_desc) + assert expected_sequences == result_seq, value_error(expected_sequences ,result_seq) + + # HSD: TODO- test invalid invalid inputs + # HSD: TODO- test int and str input - # Does not work properly - - #def test_subset(cls): - # """Returns a subset of the alignment by samples, markers and sites.""" - # sample_ids = [1,2,3] - # marker_ids = ['marker_0'] - # aln_obj = Alignment.from_fasta('test_alignment.txt', 'test_align', 'marker') - - # subset = (aln_obj,sample_ids, marker_ids) - # test_subset = + # def test_subset(self): + # """Returns a subset of the alignment by samples, markers and sites.""" + # expected_sample_ids = [0,1] + # result_subset = (self.aln_file,sample_ids) + + # result_sample_ids = 
result_subset.get_markers + # result_sample_desc = + # result_sample_seq = + # assert #---------------------------------------------------- - def test_get_samples(self): - """Tests aln.object.get_samples returns expected - sequences sample of an alignment file - tests: - valid input - invalid sample id - invalid types""" - # valid input - get_sample_str = self.aln_file.get_samples('Dmel_528_2597') - get_sample_index = self.aln_file.get_samples(0) - expected_sites = 26 - expected_samples = 1 - expected_markers = 0 - expected_sequence = ['ATGAAGAGCAAGGTGGGGGGGGGGGG'] - test_sample_list = [get_sample_str,get_sample_index] - + def test_get_samples_valid_str(self): + """checks if aln.object.get_samples returns expected + output type given an input str or int""" + + result = self.aln_file.get_samples('Dmel_528_2597') + result_0 = self.aln_file.get_samples(0) + expected = object + assert isinstance(result,expected), type_error(expected, result) + assert isinstance(result_0,expected), type_error(expected, result_0) + + def test_get_samples_valid_list(self): + """checks if aln.object.get_samples returns expected + output type given an input list_str or list_int""" + + result = self.aln_file.get_samples(['Dmel_528_2597']) + result_0 = self.aln_file.get_samples([0]) + expected = object + assert isinstance(result,expected), type_error(expected, result) + assert isinstance(result_0,expected), type_error(expected, result_0) +#----------------------------------------------------------------------------- + def test_get_samples_str_in_invalid_type(self): + """checks if aln.object.get_samples raises error, given + an invalid type i.e set, tuple or none""" + try: + valid_str_invalid_type_set_str = self.aln_file.get_samples({}) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + valid_str_invalid_type_tuple_str = self.aln_file.get_samples(()) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + None_type = 
self.aln_file.get_samples(None) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_get_samples_invalid_list_items(self): + """checks if aln.object.get_samples raises error, given + an invalid type in a list i.e tuple, set none in list""" + try: + set_in_list = self.aln_file.get_samples([{}]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + tuple_in_list = self.aln_file.get_samples([()]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + none_in_list = self.aln_file.get_samples([None]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_get_samples_invalid_str_sample_id(self): + """checks if aln.object.get_samples raises error, given + an invalid string sample id""" + try: + invalid_str = self.aln_file.get_samples('Dmel_528_259700') + except ValueError: + pass + else: + raise Exception(ValueError_msg) + + def test_get_samples_invalid_int_sample_id(self): + """checks if aln.object.get_samples raises error, given + an invalid index of a sample id""" + try: + invalid_str = self.aln_file.get_samples(-1) + except ValueError: + pass + else: + raise Exception(ValueError_msg) + + def test_get_samples_invalid_str_sample_id(self): + """checks if aln.object.get_samples raises error, given + an invalid string sample id in list""" + try: + invalid_str = self.aln_file.get_samples(['Dmel_528_259700']) + except ValueError: + pass + else: + raise Exception(ValueError_msg) + + def test_get_samples_invalid_int_sample_id(self): + """checks if aln.object.get_samples raises error, given + an invalid index of a sample id in list""" + try: + invalid_index = self.aln_file.get_samples([-1]) + except IndexError: + pass + else: + raise Exception(IndexError_msg) + # TODO: Do not make compound tests! # Each assertion should be a separate test so that it will fail for # that specific test. 
# For example, test.nsites == expected_sites is unnecessary because it # duplicates an existing test - test_nsites - for test in test_sample_list: - assert isinstance(test, object) - assert test.nsites == expected_sites - assert test.nsamples == expected_samples - assert test.nmarkers == expected_markers - assert test.sample_sequences == expected_sequence - - # invalid sample_id - # TODO: This should be a separate test - try: - invalid_sample_name_str = self.aln_file.get_samples('Dmel_528_259700') - invalid_sample_name_lst = self.aln_file.get_samples(['Dmel_528_259700']) - invalid_sample_id_int = self.aln_file.get_samples(-1) - invalid_sample_id_lst = self.aln_file.get_samples([-1]) - except: - assert ValueError # TODO: Text shown when assertion fails - - # invalid type - # TODO: This should be a separate test - test_invalid_types = [{'Dmel_528_2597': 0},('Dmel_528_2597')] - try: - for invalid_input in test_invalid_types: - invalid_id = self.aln_file.get_samples(invalid_input) - except: - assert ValueError # TODO: Text shown when assertion fails - - # TODO: This should be a separate test - try: - test_invalid_list_items = [[],[{'Dmel_528_2597':0 }]] - for invalid_input in test_invalid_list_items: - invalid_id = self.aln_file.get_samples(invalid_input) - except: - assert ValueError # TODO: Text shown when assertion fails - - def test_get_markers(self): - """Tests if aln.object.get_markers returns expected +#----------------------------------------------------------------------------- + def test_get_markers_valid_input(self): + """checks if aln.object.get_markers returns expected marker sequences of an alignment file - tests: - valid input - invalid sample id - invalid types """ + result = self.aln_file.get_markers('marker_0') + result_0 = self.aln_file.get_markers(0) + expected = object + assert isinstance(result,expected), type_error(expected, result) + assert isinstance(result_0,expected), type_error(expected, result_0) - # VI - get_markers_str = 
self.aln_file.get_markers('marker_0') - get_markers_int = self.aln_file.get_markers(0) + def test_get_markers_valid_list_input(self): + """Tests if aln.object.get_markers returns expected + marker sequences of an alignment file, given a list + input + """ + result = self.aln_file.get_markers(['marker_0']) + result_0 = self.aln_file.get_markers([0]) + expected = object + assert isinstance(result,expected), type_error(expected, result) + assert isinstance(result_0,expected), type_error(expected, result_0) # TODO: testing single char and list should be different tests as they are two scenarios of calling the method - get_markers_list_str = self.aln_file.get_markers(['marker_0']) - get_markers_list_int = self.aln_file.get_markers([0]) - expected_marker_sequence = ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - tests = [get_markers_str, get_markers_int, get_markers_list_str, get_markers_list_int] - for test in tests: - assert isinstance(test, object) - assert test.sequences == ['CCCCCCCCCCCCCCCCCCCCCCCCCC'] - assert test.nsites == 26 - #assert test.nsamples == 1 # attribute error - - # What is VI, IVI, IVT?? 
- # IVI - try: - inv_markers_str = self.aln_file.get_markers('marker_01') - inv_markers_int = self.aln_file.get_markers(1) - inv_markers_list_str = self.aln_file.get_markers(['marker_01']) - inv_markers_list_int = self.aln_file.get_markers([1]) - tests = [inv_markers_str, inv_markers_int, inv_markers_list_str, inv_markers_list_int] - except ValueError: - pass - - # IVT - try: - test_invalid_types = [{'marker_0':0 },('marker_0')] - except ValueError: - pass + + def test_get_markers_valid_invalid_type(self): + """checks if aln.object.get_markers raises error, given + an invalid type i.e tuple, set none""" + try: + valid_str_invalid_type_0 = self.aln_file.get_markers({}) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + valid_str_invalid_type_00 = self.aln_file.get_markers(()) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + None_type = self.aln_file.get_markers(None) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + def test_get_markers_valid_invalid_list_items(self): + """checks if aln.object.get_markers raises error, given + an invalid type in a list i.e tuple, set or none""" + try: + valid_str_invalid_type_0 = self.aln_file.get_markers([{}]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + valid_str_invalid_type_00 = self.aln_file.get_markers([()]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + None_type = self.aln_file.get_markers([None]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) #---------------------------------------------------- #def test_get_sites(self): # row error # """Returns a new alignment containing only the sites specified # #by the given list of column numbers.""" + #---------------------------------------------------- # Setter/Replacer - def test_replace_samples(self): - """Tests if aln.object.replace_samples replaces the sequence - of one or more sample in the aln.object + #TODO- could test 
invalid input types + def test_insert_samples_from_lists_valid_inputs(self): + """checks if aln.object.insert_samples_from_lists inserts a + new sample into the aln.object """ - new_sample = 'AT' * 13 - prev_sample_sequence = self.aln_file.sample_sequences[0] - self.aln_file.replace_samples(['Dmel_528_2597'], [new_sample]) - curr_sequence = self.aln_file.sample_sequences[0] + expected_id = 'Dsim99201' + expected_desc = '|CH2912|' + expected_sequence = 'G' * 26 + self.aln_file.insert_samples_from_lists(1, [expected_id],[expected_desc],[expected_sequence]) + result_id = self.aln_file.sample_ids[1] + result_description = self.aln_file.sample_descriptions[1] + result_sequence = self.aln_file.sample_sequences[1] + assert expected_id == result_id, value_error(expected_id,result_id) + assert expected_desc == result_description , value_error(expected_desc,result_description) + assert result_sequence == expected_sequence, value_error(expected_sequence,result_sequence) - assert not prev_sample_sequence == curr_sequence - assert curr_sequence == new_sample - - def test_insert_samples_from_lists(self): - """Tests if aln.object.insert_samples_from_lists adds one or - more sequences in the aln.object - """ - new_sample_id = 'Dsim99201' - new_sample_desc = '|CH2912|' - new_sample_sequence = 'G' * 26 - self.aln_file.insert_samples_from_lists(1, [new_sample_id], - [new_sample_desc], - [new_sample_sequence]) - assert self.aln_file.sample_ids[1] == new_sample_id # TODO: Text shown when assertion - assert self.aln_file.sample_descriptions[1] == new_sample_desc # TODO: Text shown when assertion - # error here, returns does not insert expected sequence value - #assert self.aln_file.sample_sequences[1] == new_sample_sequence - - def test_append_sample_from_lists(self): - """Tests if append_sample_from_lists adds one or - more sequences in the last index of aln.object - """ - new_sample_id = 'Dere_lastind' - new_sample_desc = '|last_ind|' - new_sample_sequence = 'G' * 26 - 
self.aln_file.append_sample_from_lists([new_sample_id],[new_sample_desc], [new_sample_sequence]) - assert self.aln_file.sample_sequences[-1] == new_sample_sequence # TODO: Text shown when assertion - assert self.aln_file.sample_ids[-1] == new_sample_id # TODO: Text shown when assertion - assert self.aln_file.sample_descriptions[-1] == new_sample_desc # TODO: Text shown when assertion + def test_insert_samples_from_lists_valid_invalid_index(self): + """checks if aln.object.insert_samples_from_lists raises + index error given an invalid index + """ + invalid_index = -1 + valid_id = 'Dsim99201' + valid_desc = '|CH2912|' + valid_sequence = 'G' * 26 + try: + self.aln_file.insert_samples_from_lists(invalid_index, [valid_id],[valid_desc], [valid_sequence]) + except IndexError: + pass + else: + raise Exception(IndexError_msg) + + def test_insert_samples_from_lists_valid_invalid_id(self): + """checks if aln.object.insert_samples_from_lists raises + Type error given an invalid type for sample id + """ + valid_index = 1 + invalid_id = 1 + valid_desc = '|CH2912|' + valid_sequence = 'G' * 26 + try: + self.aln_file.insert_samples_from_lists(valid_index,[invalid_id],[valid_desc],[valid_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_insert_samples_from_lists_valid_invalid_description(self): + """checks if aln.object.insert_samples_from_lists raises + Type error given an invalid type for sample description + """ + valid_index = 1 + valid_id = 'Dsim99201' + invalid_desc = 1 + valid_sequence = 'G' * 26 + try: + self.aln_file.insert_samples_from_lists(valid_index,[valid_id],[invalid_desc],[valid_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_insert_samples_from_lists_valid_invalid_sequence(self): + """checks if aln.object.insert_samples_from_lists raises + Type error given an invalid type for sample sequence + """ + valid_index = 1 + valid_id = 'Dsim99201' + valid_desc = 1 + invalid_sequence = 26 
+ try: + self.aln_file.insert_samples_from_lists(valid_index, [valid_id],[valid_desc],[invalid_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) +#----------------------------------------------------------------------------- + def test_append_sample_from_lists_valid_inputs(self): + """Tests if append_sample_from_lists appends a + to the last index of aln.object + """ + expected_id = 'Dere_lastind' + expected_desc = '|last_ind|' + expected_sequence = 'G' * 26 + self.aln_file.append_sample_from_lists([expected_id],[expected_desc], [expected_sequence]) + result_id = self.aln_file.sample_ids[-1] + result_desc = self.aln_file.sample_descriptions[-1] + result_sequence = self.aln_file.sample_sequences[-1] + assert result_id == expected_id, type_error(expected_id, result_id) + assert result_desc == expected_desc, type_error(expected_desc, result_desc) + assert result_sequence == expected_sequence, type_error(expected_sequence, result_sequence) + + def test_append_sample_from_lists_invalid_id_type(self): + """checks if aln.object.append_sample_from_lists raises + Type error given an invalid type for sample id + """ + sample_id = 1 + sample_desc = '|last_ind|' + sample_sequence = 'G' * 26 + + try: + result = self.aln_file.append_sample_from_lists([sample_id],[sample_desc], [sample_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_append_sample_from_lists_invalid_description_type(self): + """checks if aln.object.append_sample_from_lists raises + Type error given an invalid type for sample description + """ + expected_id = 'Dere_lastind' + expected_desc = 1 + expected_sequence = 'G' * 26 + try: + result = self.aln_file.append_sample_from_lists([expected_id],[expected_desc], [expected_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) - def test_remove_samples(self): - """Tests if aln.obj.remove_samples removes all sample - information of one or more indices from the alignment 
object + def test_append_sample_from_lists_invalid_sequence_type(self): + """checks if aln.object.append_sample_from_lists raises + Type error given an invalid type for sample sequence + """ + expected_id = 'Dere_lastind' + expected_desc = '|last_ind|' + expected_sequence = 26 + try: + result = self.aln_file.append_sample_from_lists([expected_id],[expected_desc], [expected_sequence]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) +#----------------------------------------------------------------------------- + def test_remove_samples_valid_sample_name(self): + """checks if aln.obj.remove_samples removes sample + information of a sample in the alignment object + given a str sample id + """ + sample_name_to_remove = 'Dmel_RG2' + sample_index = 1 + self.aln_file.remove_samples(sample_name_to_remove) + result_sample_id = self.aln_file.sample_ids[sample_index] + result_sequence = self.aln_file.sample_sequences[sample_index] + result_desc = self.aln_file.sample_descriptions[sample_index] + expected_sample_id = ['Dmel_RG4N'] + expected_sequence = ['|15 sp|'] + expected_desc = 'ATGAAGAGCAAGGTGGAAAAAAAAAA' + assert expected_sample_id != result_sample_id, value_error(expected_sample_id,result_sequence) + assert expected_sequence != result_desc, value_error(expected_sequence,result_sample_id) + assert expected_desc != result_desc,type_error(expected_desc,result_desc) + + def test_remove_samples_valid_index(self): + """checks if aln.obj.remove_samples removes sample + information of a sample in the alignment object + given the sample index position """ index_to_remove = 1 - sequence_to_remove = self.aln_file.sample_sequences[index_to_remove] self.aln_file.remove_samples(index_to_remove) - assert sequence_to_remove != self.aln_file.sample_sequences[1] # TODO: Text shown when assertion + result_sample_id = self.aln_file.sample_ids[index_to_remove] + result_sequence = self.aln_file.sample_sequences[index_to_remove] + result_desc = 
self.aln_file.sample_descriptions[index_to_remove] + expected_sample_id = ['Dmel_RG4N'] + expected_sequence = ['|15 sp|'] + expected_desc = 'ATGAAGAGCAAGGTGGAAAAAAAAAA' + assert expected_sample_id != result_sample_id, value_error(expected_sample_id,result_sequence) + assert expected_sequence != result_desc, value_error(expected_sequence,result_sample_id ) + assert expected_desc != result_desc,type_error(expected_desc,result_desc ) - def test_retain_samples(self): - """Tests if aln.obj.retain_samples removes all sample - information apart from specified indices in - alignment object + def test_remove_samples_invalid_str(self): + """checks if aln.obj.remove_samples gives a + TypeError given an invalid sample id + """ + sample_name_to_remove = 'Dmel_RG4N0' + try: + self.aln_file.remove_samples(sample_name_to_remove) + except ValueError: + pass + else: + raise Exception(TypeError_msg) + + def test_remove_samples_invalid_index(self): + """checks if aln.obj.remove_samples gives an + IndexError given an invalid input index + """ + index_to_remove = -1 + try: + self.aln_file.remove_samples(index_to_remove) + except IndexError: + pass + else: + raise Exception(index_error) + + def test_remove_samples_invalid_type(self): + """checks if aln.obj.remove_samples gives a + ValueError given an invalid input type i.e + dict, float, set and tuple + """ + float_type = 1.1 + dict_type = {1:'w'} + set_type = {} + tuple_type = () + try: + self.aln_file.remove_samples(float_type) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + try: + self.aln_file.remove_samples(dict_type) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.remove_samples(set_type) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.remove_samples(tuple_type) + except TypeError: + pass + else: + raise Exception(TypeError_msg) +#----------------------------------------------------------------------------- + def 
test_retain_samples_valid_input(self): + """checks if aln.obj.retain_samples changes + properties of the alignment object """ self.aln_file.retain_samples([1]) - assert self.aln_file.nsamples == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.sample_ids) == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.sample_descriptions) == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.sample_sequences) == 1 # TODO: Text shown when assertion fails - assert self.aln_file.nmarkers == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.marker_ids) == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.marker_descriptions) == 1 # TODO: Text shown when assertion fails - assert len(self.aln_file.marker_sequences) == 1 # TODO: Text shown when assertion fails - - # TODO: Other than count, test whether the correct sample was retained - - def test_remove_sites(self): - """tests if aln.obj.remove_sites removes all one or more - sequences from the alignment sequences""" + expected_len = 1 + result_sample_num = self.aln_file.nsamples + result_sample_id_num = len(self.aln_file.sample_ids) + result_sample_desc_num = len(self.aln_file.sample_descriptions) + result_sample_seq_num = len(self.aln_file.sample_sequences) + result_marker_num = self.aln_file.nmarkers + result_marker_id_num = len(self.aln_file.marker_ids) + result_marker_desc_num = len(self.aln_file.marker_descriptions) + result_marker_seq_num = len(self.aln_file.marker_sequences) + assert result_sample_num == expected_len, value_error(expected_len, result_sample_num ) + assert result_sample_id_num == expected_len, value_error(expected_len, result_sample_id_num ) + assert result_sample_desc_num == expected_len, value_error(expected_len, result_sample_desc_num ) + assert result_sample_seq_num == expected_len, value_error(expected_len, result_sample_seq_num) + assert result_marker_num == expected_len, value_error(expected_len, result_marker_num 
) + assert result_marker_id_num == expected_len, value_error(expected_len, result_marker_id_num ) + assert result_marker_desc_num == expected_len, value_error(expected_len, result_marker_desc_num) + assert result_marker_seq_num == expected_len, value_error(expected_len, result_marker_seq_num) + + def test_retain_samples_expected_sample(self): + """checks if aln.obj.retain_samples retains + expected sample in the alignment + """ + self.aln_file.retain_samples([1]) + expected_len = 1 + result_sample_id = self.aln_file.sample_ids[0] + result_sample_description = self.aln_file.sample_descriptions[0] + result_sequence = self.aln_file.sample_sequences[0] + expected_sample_id = 'Dmel_RG2' + expected_sample_description = '|47 sp|' + expected_sequence = 'ATGAAGAGCAAGGTGGACCCCCCCCC' + + assert expected_sample_id == result_sample_id, value_error(expected_sample_id, result_sample_id) + assert expected_sample_description == result_sample_description, value_error(expected_sample_description, result_sample_description) + assert expected_sequence == result_sequence, value_error(expected_sequence, result_sequence) + + def test_retain_samples_invalid_list_input(self): + """checks if aln.obj.retain_samples raises + an error given the wrong input type in list + """ + try: + self.aln_file.retain_samples(['1.1']) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples([1.1]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples([-1]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples([{}]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples([]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples([None]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_retain_samples_invalid_input(self): + """checks 
if aln.obj.retain_samples raises + an error given the wrong input type + """ + try: + self.aln_file.retain_samples('1.1') + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples(1.1) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples(-1) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples({}) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples() + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_samples(None) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + # TODO: Other than count, test whether the correct sample was retained +#----------------------------------------------------------------------------- + def test_remove_sites_list_input(self): + """tests if aln.obj.remove_sites makes expected change + to number of sites in alignment given int in list""" self.aln_file.remove_sites([2]) - assert self.aln_file.nsites == (25) # TODO: Text shown when assertion fails - - def test_retain_sites(self): + expected = 25 + result = self.aln_file.nsites + assert expected == result, value_error(expected, result) + + def test_remove_sites_int_input(self): + """tests if aln.obj.remove_sites makes expected change + to number of sites in alignment given an input int""" + self.aln_file.remove_sites(2) + expected = 25 + result = self.aln_file.nsites + assert expected == result, value_error(expected, result) + + def test_remove_sites_empty_input(self): + """tests if aln.obj.remove_sites makes expected change + to number of sites in alignment given an empty tuple""" + self.aln_file.remove_sites(()) + expected = 26 + result = self.aln_file.nsites + assert expected == result, value_error(expected, result) + + def test_remove_sites_empty_list_input(self): + """tests if aln.obj.remove_sites makes expected change + 
to number of sites in alignment given an empty list""" + self.aln_file.remove_sites([]) + expected = 26 + result = self.aln_file.nsites + assert expected == result, value_error(expected, result) + + def test_remove_sites_invalid_input(self): + """tests if aln.obj.remove_sites raises an + error given invalid input""" + try: + self.aln_file.remove_sites(-2) + except IndexError: + pass + else: + raise Exception(IndexError_msg) + try: + self.aln_file.remove_sites({}) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.remove_sites(None) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_remove_sites_invalid_list_input(self): + """tests if aln.obj.remove_sites raises an + error given an invalid list input""" + try: + self.aln_file.remove_sites([-2]) + except IndexError: + pass + else: + raise Exception(IndexError_msg) + + try: + self.aln_file.remove_sites([()]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + try: + self.aln_file.remove_sites([{}]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.remove_sites([None]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) +#----------------------------------------------------------------------------- + def test_retain_sites_valid_input(self): + """tests if aln.obj.retain_sites removes all + but specified sites in the alignment object""" + self.aln_file.retain_sites(0,1,2) + expected = 26 + result = self.aln_file.nsites + + assert expected == result, value_error(expected, result) + + def test_retain_sites_valid_list_input(self): + """tests if aln.obj.retain_sites removes all + but specified sites in the alignment object""" + self.aln_file.retain_sites([0,1,2]) + expected = 3 + result = self.aln_file.nsites + + assert expected == result, value_error(expected, result) + + def test_retain_sites_invalid_input(self): """tests if aln.obj.retain_sites all sequences apart from 
specified sequences in alignment sequences""" - self.aln_file.retain_sites([0,1,2]) - assert self.aln_file.nsites == 3 # TODO: Text shown when assertion fails - #TODO- should assert to that the positions are not ATG once - # get samples sequences is fixes - + try: + self.aln_file.retain_sites(-1) + except IndexError: # Expected index error + pass + else: + raise Exception(IndexError_msg) + try: + self.aln_file.retain_sites((1,)) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites({}) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites(None) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites('') + except TypeError: + pass + else: + raise Exception(TypeError_msg) + + def test_retain_sites_invalid_list_input(self): + """tests if aln.obj.retain_sites all sequences + apart from specified sequences in alignment sequences + given an input list""" + try: + self.aln_file.retain_sites([-1]) + except IndexError: # Expected index error + pass + else: + raise Exception(IndexError_msg) + try: + self.aln_file.retain_sites([(1,)]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites([{}]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites([None]) + except TypeError: + pass + else: + raise Exception(TypeError_msg) + try: + self.aln_file.retain_sites(['']) + except TypeError: + pass + else: + raise Exception(TypeError_msg) +#----------------------------------------------------------------------------- def test_from_fasta(cls): """Create an Alignment object from a FASTA-formatted file.""" - aln_obj = Alignment.from_fasta('test_alignment_b.txt', 'test_align', 'marker') - assert aln_obj.nsites == 26 # TODO: Text shown when assertion fails - assert aln_obj.nsamples == 3 # TODO: Text shown when assertion fails - assert aln_obj.nmarkers == 1 
# TODO: Text shown when assertion fails - + aln_obj = Alignment.from_fasta('temp.aln', 'test_align_from_faster', 'marker') + result_nsites = aln_obj.nsites + result_samples = aln_obj.nsamples + results_nmarkers = aln_obj.nmarkers + expected_nsites = 26 + expected_nsamples = 3 + expected_nmarkers = 1 + assert result_nsites == expected_nsites,value_error(expected_nsites, result_nsites) + assert result_samples == expected_nsamples,value_error(expected_nsamples, result_samples) + assert results_nmarkers == expected_nmarkers,value_error(expected_nmarkers, results_nmarkers) +#----------------------------------------------------------------------------- # Format converters # tested, remove hashtag when done #def test_to_fasta(self): - """Saves the alignment as a FASTA-formatted text file.""" +# """Saves the alignment as a FASTA-formatted text file.""" #create_aln_file = self.aln_file.to_fasta('test_aln_file') # should change input to path_to_file #TODO- check if len(currentdir) increases by one, #check if test_aln_file in dir #use from_fasta to create new alingment object - - # How does this work? +#----------------------------------------------------------------------------- +#---------------------------------------------------- +# def test_to_sample_matrix(self): +# """Converts sequences into a numpy matrix.""" # is this matrix or array? 
+# seq_matrix = self.aln_file.to_sample_matrix() +# test_seq_matrix = array([list(key[1]) for key in self.test_aln_file.values() if 'A' in key[1]]) # use key names +# assert array_equal(seq_matrix, test_seq_matrix) +#---------------------------------------------------- +# def test_to_marker_matrix(self, size=1): +# """Converts sequences into a numpy matrix.""" +# mseq_matrix = self.aln_file.to_marker_matrix() +# test_mseq_matrix = array([list(self.test_aln_file[marker][1]) for marker in \ +# self.test_aln_file.keys() if 'marker' in marker]) +# assert array_equal(mseq_matrix, test_mseq_matrix) +#---------------------------------------------------- +# # Iterators +# def test_iter_sites(self): +# """Iterates column-wise over the alignment""" +# iter_seq = list(self.aln_file.iter_sites(0,1)) +# +# test_cols = [] +# seqs = [] +# for num in range(0,1): +# for value in self.test_aln_file.values(): +# seq = value[1] +# #if not 'A' in seq: +# #continue +# seqs.append(seq[num]) +# +# test_cols.append(sorted(seqs)) +# seqs = [] +# +# print(test_cols, iter_seq) +# assert test_cols == iter_seq +#---------------------------------------------------- +## def test_iter_sample_sites(self, start=0, stop=None, size=1): +## """Iterates column-wise over the sample alignment. Excludes markers. """ +## iter_seq = list(self.aln_file.iter_sample_sites(0,10)) +## +## test_cols = [] +## seqs = [] +## for num in range(0,10): +## for value in self.test_aln_file_wo_marker.values(): +## seq = value[1] +## seqs.append(seq[num]) +## +## test_cols.append(seqs) +## seqs = [] +## +## assert test_cols == iter_seq +#---------------------------------------------------- +### def test_iter_marker_sites(self): +### """Iterates column-wise over the marker alignment. Excludes samples. 
""" +### iter_seq = list(self.aln_file.iter_marker_sites(0,10)) +### +### test_cols = [] +### seqs = [] +### for num in range(0,10): +### for value in self.test_aln_file.values(): +### +### seq = value[1] +### if set(seq) != {'C', 'N'}: +### continue +### seqs.append(seq[num]) +### +### test_cols.append(seqs) +### seqs = [] +### +### assert test_cols == iter_seq +#---------------------------------------------------- +# How does this work? Not yet available for v.85 # Block-related methods