-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmsa.fasta
186 lines (186 loc) · 6.75 KB
/
msa.fasta
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
>XP_007318498.1
MAT--PVIVGVGAITAALVGRQLLRNGVIG--------KRAAEEDGPTLRTKLKDAHRHI
MLANHPDRGGSPYLASKINEAKDLLDKTDGRSR---
>KFV57707.1
----------------------YYKGGFEQKMSSPEASLILGVSA-SAGKAKVRTAHRRI
MILNHPDKGGSPYLATKINEAKDLLESTPK------
>VDM53570.1
-------------------------------MTRREAAMILGIPA-TANPARIKEAHRRI
MIVNHPDRGGSPYIASKINEAKDLLESSKS------
>XP_015749139.1
----------IF-FLTQE-FSHYYRGGFEPKMTKREAGLVLGISP-SANKVKIREAHRRI
MLINHPDRGGSPYLAAKINEAKDLLEGSNKS-----
>EZA53442.1
MAET----VKRL-DSESLANSKYYKGGFEPRMTKREASLILGVSP-TASKAKVKDQFKKV
MSVNHPDRGGSPYVAAKINEAKDMLEK---------
>RIA99233.1
--------------------KNYYKGGFNNKINKREAALILGLKETSINKAKIKEAHKRM
IMLNHPDHGGSPYLTYKINEAKAFLEKTVKY-----
>query
---------------------GFLKGGFDPKMNSKEALQILNLTENTLTKKKLKEVHRKI
MLANHPDKGGSPFLATKINEAKDFLEKRGISK----
>XP_009983229.1
------------------SLSLYYKGGFEQKMSRREASLILGVSP-SASKAKIRTAHRRI
MILNHPDKGGSPYLATKINEAKDMLESTANN-----
>XP_024747594.1
------------------MGKAFYKGGFEPRMTKKEASLILSLNERSITKDKVRKAHRTL
MLLNHPDRGGSPYLATKVNEAKELLDKTV-------
>KZP00621.1
---------MGKT-----ATEEWARGGFKAKMDRKEAIAILGLKDNATLRNRLKDAHRHI
MLANHPDRGGSPYLASKINEAKDLLEKLDGKGR---
>OSD06571.1
MRRGL---IGGKN-----AAEQWVKGGFKAKMDRKEAIAILGLKDGPSLKKQLKDAHRHI
MLANHPDRGGSPYLASKINEAKDLLEKMEGRSR---
>KZM94488.1
-------------------------------MTRREASLILGVRE-STAMEKVREAHRRV
MVANHPDAGGSHYLASKINEAKDMMLRKTQGGGSAF
>ELU17463.1
-----------MDSIPGGLTSKYYKGGFDAKMSKREASLILGVSP-SANKNKVKDAHKRI
MLLNHPDRGGSPYLATKINEAKDMLDK---------
>VDO13032.1
-------------------------------MTRREAALVLGISP-SAPASKVKEAHKRI
MIANHPDRGGSPYLAAKINEAKDKLESTRHD-----
>XP_018187597.1
--------------------MCRILGGFAPKMHRKEAALILSLNERGVTREILRKKHRQL
MLLNHPDRGGSPYLATKINEAKEFLEKETS------
>PRW57663.1
-------------------MRAFYKGGFQPEMNRREAALILGVRE-SAPEEKVKEAHRRI
MIANHPDAGGSSFIAAKVNEAKDMLLGKKTGGSSIF
>XP_009038106.1
--------------------KRYYEGPFEAAMTRREAALILGVRE-SATAQRIKDAHRRI
LRINHPDMGGSAFLSAKVNEAKELLI----------
>CDP04286.1
-------------------------------MTRREAALILGIRE-NVTADKVKEAHRKV
MVANHPDAGGSHYLASKINEAKDVMLGKKRDSGSPF
>XP_009544617.1
LRRGI---IGGKG-----AAEQWVKGGFKAKMDRKEAIAILGLKDGPLLKTKLKDAHRHI
MLANHPDRGGAPYLASKINEAKDLLER---------
>PRD27054.1
MSEI----FNNLIVFQSFANSKYYKGGFETQMTKREAGLILGVSP-SASKNRIKDAHKRI
MLLNHPDRGGSPYLAAKINEAKDMLDK---------
>PZD16322.1
-------------------------------MTRREAALILEMPERGITKELLRKKHRSL
MLLNHPDRGGSPYLATKVNEAKELLEKEVK------
>XP_007003183.1
-------------------AEQFLRGGFKSKMDRSEAIAILGLRE-PITSIRLKEAHRRL
MLANHPDRGGAPYLAGKVNEAKAMLE----------
>XP_001743879.1
----------------------YYKGGFEETMSRREAGLILGCSP-SAPYKKIQEAHKRI
MIANHPDRGGSPFLAAKINEAKTLLDKIHQNQASV-
>EPT05582.1
-------RAGQR-----AAEQRRVASRQRHDVDRKEAIAILGLKDGPQLTIRFTEAHRHI
MIANYPDRGGSPYLASRINEANDSFEK---------
>OCH94377.1
MRRGL---LGGKN-----AAEQWVKGGFKAKMDRKEAFAILGLKDGPQLRNRLKDAHRQI
MLANHPDRGGSPYLASKINEAKDLLEKTEARGR---
>AQK40733.1
-------------------MRKFYEGGFQPTMTRREAALILGVRE-TASAEKVKEAHKRV
MVANHPDAGGSHYLASKINEAKDVMTGKTKGGGSAF
>XP_005419065.1
-------------MEPQAFSGGYYRGGFEPKMTKREAALILGVSP-TANRNKIREAHRRI
MLLNHPDKGGSPYVAAKINEAKDLLEDQAKK-----
>PRQ73050.1
-------------------KEEWVKGGFQAKMDRKEAVQILGLRESHMTITRLKDAHRRI
MLANHPDRGGSPYIASKVNEAK--------------
>XP_011400851.1
-------------------MRQFYKGGFLPEMTRREAALILGIRE-SAAEAKVKEAHRRI
MIANHPDAGGSSYIATKVNEAKDMLVGKKRSGSSMF
>CBI31499.3
-------------------------------MTKREAALILGIRE-NATADKVKEAHRRV
MVANHPDAGGSHYLASKINEAKDVMLGKTRGNESPF
>XP_001880856.1
MRRGI---LGGKA-----AADQWVKGGFKAKMDRKEAIEILGLKDGPLLRNKLKDAHRHI
MLANHPDRGGSPYLASKINEAKDLLDKTEGRGR---
>XP_007765267.1
MFRNG---MLGRR-----AAEEWAKGGFKAKMDRKEAIQILGLKDGPTMKLRLKDAHRHI
MLANHPDRGGSPYLASKINEAKDMLDKENRR-----
>EKC26761.1
-------------------------------MSKREAGLILGVSP-SANKNRLKEAHKRI
MILNHPDKGGSPYLAAKINEAKDLLDSTGKKQGK--
>XP_008039700.1
MRRGM---LGGKN-----AAEQWVKGGFKAKMDRKEAIAILGLKDGPQLRKQLKDAHRHI
MLANHPDRGGSPYIASKINEAKDLLDKSEGKAR---
>KFM09175.1
-------------------------GRFEQKMSRREASLILGVSP-SAGKAKIRRAHRTI
MISNHPDKGGSPYLATKINEAKDLLESTAK------
>KLO09234.1
-------------------------------MDRKEAIAILGLKDGPQLSTKLKDAHRQI
MIANHPDRGGSPYLASKINEAKELLDKTDGTRGR--
>EMD31316.1
MRRGL---LGGKN-----AAEQWVKGGFKAKMDRKEAIAILGLKDGSQVRTRLKDAHRHI
MLANHPDRGGSPYLASKINEAKDLLEKMDGKGR---
>XP_020578133.1
-------------------MRKFYEGGFQPSMTRREAALILGVRE-STPPDKIREAHRKV
MVANHPDAGGSHYLASKINEAKDVLLGKSKGGGSAF
>CDW53600.1
-------------------------------MTRREAFLILGVSP-SASKLRVREAHKRV
MLLNHPDRGGSPYIAAKINEAKDFLDKSNTR-----
>XP_005821764.1
----------------MAGIGGGVDKGFEDPMSRTEAAKILGISA-SADKDTVAKVHRKL
MILNHPDRGGSPYLASKVNEAKDVLSGKMRSNPFR-
>XP_007416648.1
MVAGKPRPTRIGD-----LKGPWAIGGFQARMDRREAKDILGLKESQVTKNRLKDAHRKI
MLANHPDRGGSPYLASKINEAKDLLEKSLR------
>XP_016202840.1
-------------------MRKFYEGGFQVTMTRREAALILGVRE-HTPTDKVKEAHRRV
MIANHPDAGGSHYLASKINEAKDVLLGKTKGGGSAF
>RMY97156.1
------------------MGKAFYKGGFEKQMTRREAALILETSERGVTRDMIRKKHRQM
MLLNHPDRGGSPYLATKINEAKEFLEKGAT------
>XP_002180499.1
-----------------GVGSKYYEGGFEDTMTRSEAALILGVRE-SSDPKRIKDAHRKL
LILNHPDTGGSTYMAGKINEAKELL-----------
>EYC43511.1
MLLT----FICS-PNTFFLFEKYHRGGFEPKMTRREAAMILGLPA-TAKPNRIKEAHKRI
MIANHPDRGGSPYLAAKINEAKDLLESSKS------
>KFV15611.1
-----------AKRISASSPSLYYEGGFEQKMSRREAGLILGVSP-SAGKAKIRTAHRRI
IILNHPGKDGSPSVATKINEAKDMLESTVKN-----
>ERN14836.1
-------------------------------MSRREAALILGVRE-SAVMEKIKEAHRRV
MVVNHPDAGGSHYLASKINEAKDMLIGRSKGGGSAF
>XP_002423617.1
---------MKS-FPTMDVNNKYYKGGFEPQMTKREACLILGISP-SANKLKIKEAHKRI
MLLNHPDKGGSPYLAAKINEAKDFIENNK-------
>XP_001622900.1
----------------------YYRGGFEPKMTKREAALILGISP-ASQKNKVREAHRRI
MLINHPDRGGSPYIAAKINEAKDLLDEASK------
>ORY32509.1
-------------------ADKFVKGGFKAKMDRNEAMQVLGLRD-PITSTRLKDAHRRL
MLANHPDRGGSPYLAGKVNEARVFLE----------
>XP_003031565.1
---------GAQK-----GAEQWVKGGFKARMDRKEALQILGLKDNNTVPLRLKDAHRHI
MLANHPDRGGSPYIASKINEAKDLLDKTDGK-----
>XP_019017947.1
----------------------FVKGGFDPKMNAREALRILELKEASLSLKKLKDNHRRI
MLLNHPDKGGSPYLATKINEAKDFLVK---------
>RKP00924.1
---------------GFSAGSKFLRGGFEPKMSRREAALILGVRE-TVSAQKLKEAHRQV
MLANHPDRSGTPFLASKVNEAKDLLEKSRR------
>OBT52395.1
-----MRKYRGGAGAVGALGKAYYKGGFEPKMNRKEAALILQLSERNLTKERIRKNHRTL
MMLNHPDRGGSPYLATKVNEAKEFLEKTS-------
>KJH47276.1
-------------------------------MTKREAALILGVQV-TAKPNKIKEAHRRI
MLINHPDRGGSPYIASKINEAKDLLDSSKS------
>RPD60075.1
MRRGL---LGGKN-----AAEQWVKGGFKAKMDRKEALQILGLKR---LKTKLKDAHRQI
MLANHPDRGGSPYLASKINEAKDLLEKEG-RSR---
>XP_009013064.1
--------------------SKFYRGGFDVKMSKREASLILGVSP-AASKTKIKEAHKRI
MLLNHPDRGGSPYLAAKINEAKDLMDKPGGGG----
>EDM02331.1
-------------------------------MSRREASLILGVSP-SAGKAKIRTAHKRI
MILNHPDKGGSPYLASKINEAKDLLEASSKAN----
>XP_002777593.1
------------MSTLFRASNLRGLEGFDQTMSRSEARKILNLGQTQLSRENIQKHHRQL
LLSNHPDRGGSTYIASKINEAKDVLLGKRR------
>KYM95277.1
MAET----VKKL-DSQSLANSKYYKGGFEPKMTRREASLILSVSP-TASKSKMKEQFKKV
MAVNHPDRGGSPYIAAKINEAKDLLEK---------
>KWU43360.1
-------------------KSDWAKGGFNAKMDRNEAAQILGVPESHMTMTKLKDAHRRI
MLANHPDRGGSPYIASKVNEAKDLLGQS--------
>EEC69977.1
-------------------MRKFYEGGFQPAMTRREAGLILGVRE-NVHPEKVKEAHKKV
MVANHPDAGGSHYLASKINEAKDVLLGKTKGGGSVF