/examples/data/ensembl_pax.fasta

http://github.com/sbotond/phylosim · Unknown · 8505 lines · 8505 code · 0 blank · 0 comment · 0 complexity · 19115dabad5ca713ecfa17b5df20b68d MD5 · raw file

Large files are truncated click here to view the full file

  1. >ENSOGAP00000011965
  2. F-------SCP-------------------------------------------------
  3. ------------------------------------------------------------
  4. ------------------------------------------------------------
  5. ------------------------------------------------------------
  6. ------------------------------------------------------------
  7. ------------------------------------------------------------
  8. ------------------------------------------------------------
  9. ------------------------------------------------------------
  10. -GISSMNQLGGLFVNGRPL--------------PLDTRQQIVQLAVS-GMRPCDISRSLK
  11. ------------------VSNGCVSKILG--------RYYRTGVLEPKGI------GGSK
  12. PR-LATPPVVARIAQLKGECPALFAWEI----------------------QHQLRAEGVC
  13. ------------------------------------------------------------
  14. ------------------------------------------------------------
  15. TQDKTPS------------------------VSSINRVLRTLQ-----------------
  16. ------------------------------------------------------------
  17. ------------------------------------------------------------
  18. ------------------------------------------------------------
  19. ------------------------------------------------------------
  20. ------------------------------------------------------------
  21. --------------------------------------------------EDQGLPWAQ-
  22. -LRSPAVLALAPPNPQSGSEAPRGP-------PGTGHRNRTIFSPGQA------------
  23. --------------EALEKE-FQRGQYPDSVVRGKL------AAATSLPEDTV-RVWFSN
  24. RRAKWRR-------QEKLKWEMQLP-----------------------------------
  25. ------------------------------------------------------------
  26. ------------------------------------------------------------
  27. ------------------------------GATQGLTVPKFSSGIISAQ---QAPGSVPT
  28. AALPA-------------------------------------------------------
  29. ------------------------------------------------------------
  30. -----------------------------------------------------LELLDPS
  31. CCQLCWAIAPDRFLSDTPPQVGLKPCWGYFSPQ-------LSSQDSALLYCPRPS-----
  32. TSFGAPQALFRPGSLLLDLG----------------------------------------
  33. ------------------------------------------------------------
  34. ------------------------------------------------------------
  35. ----------------------------------
  36. >ENSOPRP00000001544
  37. -------------------MQN--------------------------------------
  38. ------------------------------------------------------------
  39. ------------------------------------------------------------
  40. ------------------------------------------------------------
  41. ------------------------------------------------------------
  42. ------------------------------------------------------------
  43. ------------------------------------------------------------
  44. ------------------------------------------------------------
  45. -SHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  46. ----THADAKVQVLDNQNVSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  47. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  48. ------------------------------------------------------------
  49. ------------------------------------------------------------
  50. TNDNIPS------------------------VSSINRVLRNLA-----------------
  51. ------------------------------------------------------------
  52. ------------------------------------------------------------
  53. ------------------------------------------------------------
  54. ------------------------------------------------------------
  55. --------------------------------------------------------SEKQ
  56. Q------MGADGMYDKLRMLNGQTGS-----WGTRPGWYPGTSVPGQPTQ--DGCQPQE-
  57. -GAGENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  58. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  59. RRAKWRR-------EEKLRNQRRQASNTPSHIPISS------------------------
  60. ------------------------------------------------------------
  61. -SFSTSVYQPIPQPTTPV-SSFTSGSMLGRTDTALTNTYSALPPMPSFTMANNLPMQPPV
  62. ---TNQTSS---YSNMLPPSPSVN------GRSYDTYTPPHMQTHMNSQPMGTSGTTSTG
  63. LISPGVSVPVQVPGSEPDMSQYWPRLQ---------------------------------
  64. ------------------------------------------------------------
  65. ------------------------------------------------------------
  66. ------------------------------------------------------------
  67. ------------------------------------------------------------
  68. ------------------------------------------------------------
  69. ------------------------------------------------------------
  70. ----------------------------------
  71. >ENSRNOP00000006302
  72. -------------------MQN--------------------------------------
  73. ------------------------------------------------------------
  74. ------------------------------------------------------------
  75. ------------------------------------------------------------
  76. ------------------------------------------------------------
  77. ------------------------------------------------------------
  78. ------------------------------------------------------------
  79. ------------------------------------------------------------
  80. -SHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  81. ----THADAKVQVLDSENVSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  82. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  83. ------------------------------------------------------------
  84. ------------------------------------------------------------
  85. TNDNIPS------------------------VSSINRVLRNLA-----------------
  86. ------------------------------------------------------------
  87. ------------------------------------------------------------
  88. ------------------------------------------------------------
  89. ------------------------------------------------------------
  90. --------------------------------------------------------SEKQ
  91. Q------MGADGMYDKLRMLNGQTGS-----WGTRPGWYPGTSVPGQPTQ--DGCQQQE-
  92. -GQGENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  93. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  94. RRAKWRR-------EEKLRNQRRQASNTPSHIPISS------------------------
  95. ------------------------------------------------------------
  96. -SFSTSVYQPIPQPTTPV-SSFTSGSMLGRTDTALTNTYSALPPMPSFTMANNLPMQPPV
  97. ---PSQTSS---YSCMLPTSPSVN------GRSYDTYTPPHMQTHMNSQPMGTSGTTSTG
  98. LISPGVSVPVQVPGSEPDMSQYWPRLQ---------------------------------
  99. ------------------------------------------------------------
  100. ------------------------------------------------------------
  101. ------------------------------------------------------------
  102. ------------------------------------------------------------
  103. ------------------------------------------------------------
  104. ------------------------------------------------------------
  105. ----------------------------------
  106. >ENSP00000350844
  107. MDLEKNYPTPRTSRT---------------------------------------------
  108. ------------------------------------------------------------
  109. ------------------------------------------------------------
  110. ------------------------------------------------------------
  111. ------------------------------------------------------------
  112. ------------------------------------------------------------
  113. ------------------------------------------------------------
  114. ------------------------------------------------------------
  115. -GHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  116. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  117. PK-VATPKVVEKIAEYKRQNPTMFAWEI----------------------RDRLLAERVC
  118. ------------------------------------------------------------
  119. ------------------------------------------------------------
  120. DNDTVPS------------------------VSSINRIIRTKV-----------------
  121. ----------------------QQP-----------------------------------
  122. ------------------------------------------------------------
  123. ---------------------------------------------------PNQPVPASS
  124. --HSIVSTGSVTQVS----------------SVS-------------TDSAGSS--YSIS
  125. GILGI----TSPSADTN-------------KRKRDEGI----------------------
  126. --QESPV----------------------------PNGHSLPGRD---------------
  127. -------------------------F------LRKQMRGDLF-TQQQL------------
  128. --------------EVLDRV-FERQHYSDIFTTTE-------PIKPEQ--TTE-YSAM--
  129. ASLAG-G-------LDDMKANLASP-TPADIG----------------------------
  130. -------------------------------------------------------SSVP-
  131. -GPQSYP--------------IVT------------------------------------
  132. ---------------------------------------------------GRDLASTT-
  133. --LPG--------------------------------------------------YPPHV
  134. PP----------------------------------------------------------
  135. --------------------------------------------------------AGQG
  136. S----YSAPT-----L-----------TGMVP----------------------------
  137. ------------------GS---------------------------------EFSGSPY
  138. SHP------QYSSYND-SWRFPNP------------GLL-------------------GS
  139. PYYYSAA-----------------------------ARGAAP----PAAAT--AYDRH--
  140. ----------------------------------
  141. >ENSDARP00000043209
  142. ----------------------MDIHCKADP---FSAM----H-----------------
  143. ------------------------------------------------------------
  144. ------------------------------------------------------------
  145. ------------------------------------------------------------
  146. ------------------------------------------------------------
  147. ------------------------------------------------------------
  148. ------------------------------------------------------------
  149. ------------------------------------------------------------
  150. -RHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  151. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  152. PK-VATPKVVDKIADYKRQNPTMFAWEI----------------------RDRLLAEGIC
  153. ------------------------------------------------------------
  154. ------------------------------------------------------------
  155. DNDTVPS------------------------VSSINRIIRTKV-----------------
  156. ----------------------QQPFH---------------------------------
  157. ------------------------------------------------------------
  158. ---------------------------------------------PSPDG---TSLSTPG
  159. --HTIIPSTASPPVS----------------SSS-------------NDPVGS---YSIN
  160. GILGI------PRSNGE-------------KRKRDADG----------------------
  161. --SEGSA----------------------------QSSDSQGSVE---------------
  162. -------------------------S------LRKHLRADAF-TQQQL------------
  163. --------------EALDRV-FERPVFPDVFPTSE-------HIKPEQ--ASE-YS-L--
  164. PALNT-G-------LDEVKPSLSSS-AASDLG----------------------------
  165. -------------------------------------------------------ASVS-
  166. ---QSYP--------------V--------------------------------------
  167. ---------------------------------------------------GRDMANTT-
  168. --LPG--------------------------------------------------YPPHV
  169. PP----------------------------------------------------------
  170. --------------------------------------------------------TGQG
  171. S----YATST-----L-----------AGMVP----------------------------
  172. ------------------GS---------------------------------EFSGNPY
  173. SHP------QYTTYNE-AWRFSNP------------AIL-------------------SS
  174. PYYYSA------------------------------SRGSAP----PTAAT--AYDRH--
  175. ----------------------------------
  176. >ENSMMUP00000020235
  177. L-------SRP-------------------------------------------------
  178. ------------------------------------------------------------
  179. ------------------------------------------------------------
  180. ------------------------------------------------------------
  181. ------------------------------------------------------------
  182. ------------------------------------------------------------
  183. ------------------------------------------------------------
  184. ------------------------------------------------------------
  185. -GISSMNQLGGLFVNGRPL--------------PLDTRQQIVRLAVR-GMRPCDISRSLK
  186. ------------------VSNGCVSKILG--------RYYRTGVLEPKGI------GGSK
  187. PR-LATPPVVARIAQLKGECPALFAWEI----------------------QRQLCAEGLC
  188. ------------------------------------------------------------
  189. ------------------------------------------------------------
  190. TQDKTPS------------------------VSSINRVLRALQ-----------------
  191. ------------------------------------------------------------
  192. ------------------------------------------------------------
  193. ------------------------------------------------------------
  194. ------------------------------------------------------------
  195. ------------------------------------------------------------
  196. --------------------------------------------------EDQGLPWTQ-
  197. -LRSPAVLAPALLTPHSGSETPRGPH------PGTGHRNRTIFSPSQA------------
  198. --------------EALEKE-FQRGQYPDSVARGKL------AAATSLPEDTV-RVWFSN
  199. RRAKWRR-------QEKLKWEMQLP-----------------------------------
  200. ------------------------------------------------------------
  201. ------------------------------------------------------------
  202. ------------------------------GASQGLTVPRVAPGIISAQ---QSPGSVPT
  203. AVLPA-------------------------------------------------------
  204. ------------------------------------------------------------
  205. -----------------------------------------------------LEPLGLL
  206. CLP-CPPTVP------WPVLVAVRPCSG------------------LAAHYYCGSFLFPV
  207. IAPSCVDLAWPCLDAFLAYYLIGGAGEATPTHFSHWP-----------------------
  208. ------------------------------------------------------------
  209. ------------------------------------------------------------
  210. ----------------------------------
  211. >ENSMICP00000000087
  212. F-------SCP-------------------------------------------------
  213. ------------------------------------------------------------
  214. ------------------------------------------------------------
  215. ------------------------------------------------------------
  216. ------------------------------------------------------------
  217. ------------------------------------------------------------
  218. ------------------------------------------------------------
  219. ------------------------------------------------------------
  220. -GISSVNQLGGLFVNGRPL--------------PLDTRQQIVQLAVR-GMRPCDISRSLK
  221. ------------------VSNGCVSKILG--------RYYRTGVLEPKGI------GGSK
  222. PR-LATPPVVARIAQLKGECPALFAWEI----------------------QRQLCAEGLC
  223. ------------------------------------------------------------
  224. ------------------------------------------------------------
  225. TQDKTPS------------------------VSSINRVLRALQ-----------------
  226. ------------------------------------------------------------
  227. ------------------------------------------------------------
  228. ------------------------------------------------------------
  229. ------------------------------------------------------------
  230. ------------------------------------------------------------
  231. --------------------------------------------------EDQGLSWAQ-
  232. -LRSPAVLAPAPPTRQSGFEAPRGPH------PGTGHRNRTIFSPGQA------------
  233. --------------EALEKE-FQRGQYPDSVARGKL------AAATSLPEDTV-RVWFSN
  234. RRAKWRR-------QEKLKWEMQLP-----------------------------------
  235. ------------------------------------------------------------
  236. ------------------------------------------------------------
  237. ------------------------------GAPQGLTVQKVSPGIVSAQ---QSPGSAPT
  238. AALPA-------------------------------------------------------
  239. ------------------------------------------------------------
  240. -----------------------------------------------------LEPLAAP
  241. CCQLCWATVPDRFLSDAQPQAPLKPCWGYLPPQ-------PSSWDSVLLCCPCPS-----
  242. SSLGAPQALPPPGSGLLGLGG---------------------------------------
  243. ------------------------------------------------------------
  244. ------------------------------------------------------------
  245. ----------------------------------
  246. >ENSTNIP00000006290
  247. LSSIPDLPLFRLLCLA--------------------------------------------
  248. ------------------------------------------------------------
  249. ------------------------------------------------------------
  250. ------------------------------------------------------------
  251. ------------------------------------------------------------
  252. ------------------------------------------------------------
  253. ------------------------------------------------------------
  254. ------------------------------------------------------------
  255. -GHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  256. ------------------VSHGCVSKILG--------RYYETGSIRPGVI------GGSK
  257. PK-VATPKVVDKIADYKRQNPTMFAWEI----------------------RDRLLAERVC
  258. ------------------------------------------------------------
  259. ------------------------------------------------------------
  260. DNDSVPS------------------------VSSINRIIRTKV-----------------
  261. ----------------------QQQ-----------------------------------
  262. ------------------------------------------------------------
  263. ---------------------------------------------------PGQTGSVSA
  264. --HNLATSVAATQVS----------------AVT-------------SDSAGSS--YSIS
  265. GILGI----SSA-ADVG-------------KRKRDEGK----------------------
  266. --SNSPK----------------------------RSARNARGKD---------------
  267. -------------------------R------LRVKPCGDLCPQPKQR------------
  268. --------------EVGCRW-APHPPKYIIYTPKH---------PPPPHQTSD-YSAM--
  269. ASLTG-G-------LDEMKNSLANPGTGAEIG----------------------------
  270. -------------------------------------------------------ASVT-
  271. -GPQSYS--------------LVP------------------------------------
  272. ---------------------------------------------------GRDLASTT-
  273. --LPG--------------------------------------------------YPPHV
  274. PP----------------------------------------------------------
  275. --------------------------------------------------------TGQG
  276. S----YSTPS-----L-----------TGMVP----------------------------
  277. ------------------GG---------------------------------DFSGSPY
  278. SHP------QYSTYNE-SWRFPNP------------SLL-------------------GS
  279. PYYYSAT-----------------------------SRGAGP----AATATASAYDRH--
  280. ----------------------------------
  281. >ENSSSCP00000014151
  282. -------------------MQN--------------------------------------
  283. ------------------------------------------------------------
  284. ------------------------------------------------------------
  285. ------------------------------------------------------------
  286. ------------------------------------------------------------
  287. ------------------------------------------------------------
  288. ------------------------------------------------------------
  289. ------------------------------------------------------------
  290. -SHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  291. ------------------VSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  292. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  293. ------------------------------------------------------------
  294. ------------------------------------------------------------
  295. TNDNIPS------------------------VSSINRVLRNLA-----------------
  296. ------------------------------------------------------------
  297. ------------------------------------------------------------
  298. ------------------------------------------------------------
  299. ------------------------------------------------------------
  300. --------------------------------------------------------SEKQ
  301. Q------MGADGMYDKLRMLNGQTGS-----WGTRPGWYPGTSVPGQPTQ--DGCQQQE-
  302. -GGGENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  303. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  304. RRAKWRR-------EEKLRNQRRQASNTPSHIPISS------------------------
  305. ------------------------------------------------------------
  306. -SFSTSVYQPIPQPTTPV-SSFTSGSMLGRTDTALTNTYSALPPMPSFTMANNLPMQPPV
  307. ---PSQTSS---YSCMLPTSPSVN------GRSYDTYTPPHMQTHMNSQPMGTSGTTSTG
  308. LISPGVSVPVQVPGSEPDMSQYWPRLQ---------------------------------
  309. ------------------------------------------------------------
  310. ------------------------------------------------------------
  311. ------------------------------------------------------------
  312. ------------------------------------------------------------
  313. ------------------------------------------------------------
  314. ------------------------------------------------------------
  315. ----------------------------------
  316. >ENSPPYP00000003888
  317. -------------------LSS--------------------------------------
  318. ------------------------------------------------------------
  319. ------------------------------------------------------------
  320. ------------------------------------------------------------
  321. ------------------------------------------------------------
  322. ------------------------------------------------------------
  323. ------------------------------------------------------------
  324. ------------------------------------------------------------
  325. -GHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  326. ----THADAKVQVLDNQNVSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  327. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  328. ------------------------------------------------------------
  329. ------------------------------------------------------------
  330. TNDNIPS------------------------VSSINRVLRNLA-----------------
  331. ------------------------------------------------------------
  332. ------------------------------------------------------------
  333. ------------------------------------------------------------
  334. ------------------------------------------------------------
  335. --------------------------------------------------------SEKQ
  336. Q------MGADGMYDKLRMLNGQTGS-----WGTRPGWYPGTSVPGQPTQ--DGCQQQE-
  337. -GGGENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  338. --------------EALEKE-FERTHYPDVFALERL------AAKIDLPEA---------
  339. ------------------------------------------------------------
  340. ------------------------------------------------------------
  341. ------------------------------------------------------------
  342. ------------------------------------------------------------
  343. ------------------------------------------------------------
  344. ------------------------------------------------------------
  345. ------------------------------------------------------------
  346. ------------------------------------------------------------
  347. ------------------------------------------------------------
  348. ------------------------------------------------------------
  349. ------------------------------------------------------------
  350. ----------------------------------
  351. >ENSSARP00000010317
  352. -------------------MQN--------------------------------------
  353. ------------------------------------------------------------
  354. ------------------------------------------------------------
  355. ------------------------------------------------------------
  356. ------------------------------------------------------------
  357. ------------------------------------------------------------
  358. ------------------------------------------------------------
  359. ------------------------------------------------------------
  360. -SHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  361. ----THADAKVQVLDNQNVSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  362. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  363. ------------------------------------------------------------
  364. ------------------------------------------------------------
  365. TNDNIPS------------------------XXXXXXXXXXXX-----------------
  366. ------------------------------------------------------------
  367. ------------------------------------------------------------
  368. ------------------------------------------------------------
  369. ------------------------------------------------------------
  370. --------------------------------------------------------XXXX
  371. X------XXXXXXXXXXXXXXXXXXX-----XXXXXXXXXXXXXXXXXXX--XGCQQQE-
  372. -GGGENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  373. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  374. RRAKWRR-------EEKLRNQRRQASNTPSHIPISS------------------------
  375. ------------------------------------------------------------
  376. -SFSTSVYQPIPQPTTPV-SSFTSGSVLGRTDTALTNTYSALPPMPSFTMANNLPMQPPV
  377. ---PSQTSS---YSCMLPTSPSVN------GRSYDTYTPPHMQTHMNSQPMGTSGTTSTG
  378. LISPGVSVPVQVPGSEPDMSQYWPRLQ---------------------------------
  379. ------------------------------------------------------------
  380. ------------------------------------------------------------
  381. ------------------------------------------------------------
  382. ------------------------------------------------------------
  383. ------------------------------------------------------------
  384. ------------------------------------------------------------
  385. ----------------------------------
  386. >ENSDARP00000067247
  387. MPQKEYHNQPTWESGVASMMQN--------------------------------------
  388. ------------------------------------------------------------
  389. ------------------------------------------------------------
  390. ------------------------------------------------------------
  391. ------------------------------------------------------------
  392. ------------------------------------------------------------
  393. ------------------------------------------------------------
  394. ------------------------------------------------------------
  395. -SHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  396. ------------------VSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  397. PR-VATPEVVGKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  398. ------------------------------------------------------------
  399. ------------------------------------------------------------
  400. TNDNIPS------------------------VSSINRVLRNLA-----------------
  401. ------------------------------------------------------------
  402. ------------------------------------------------------------
  403. ------------------------------------------------------------
  404. ------------------------------------------------------------
  405. --------------------------------------------------------SEKQ
  406. Q------MGADGMYDKLRMLNGQSGT-----WGTRPGWYPGTSVPGQPNQ--DGCQQQD-
  407. -NGGENTNSISSNGEDSDETQMRLQL------KRKLQRNRTSFTQEQI------------
  408. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  409. RRAKWRR-------EEKLRNQRRQASNSSSHIPISS------------------------
  410. ------------------------------------------------------------
  411. -SFNTSVYQAIPQPTTPV--SFTTGSMLGRPDTALTNTYTGLPPMPSFTMANNLPMQ---
  412. ---PSQTSS---YSCMLPSSPSVN------GRSFDTYTPPHMQAHMNSQTMATSGTASTG
  413. LISPGVSVPVQVPGTEPDMSQYWSRLQ---------------------------------
  414. ------------------------------------------------------------
  415. ------------------------------------------------------------
  416. ------------------------------------------------------------
  417. ------------------------------------------------------------
  418. ------------------------------------------------------------
  419. ------------------------------------------------------------
  420. ----------------------------------
  421. >ENSTNIP00000016123
  422. P-----------------------------------------------------------
  423. ------------------------------------------------------------
  424. ------------------------------------------------------------
  425. ------------------------------------------------------------
  426. ------------------------------------------------------------
  427. ------------------------------------------------------------
  428. ------------------------------------------------------------
  429. ------------------------------------------------------------
  430. -GNSGVNQLGGVFINGRPL--------------PPVVRQSIVELAGR-GARPSDISRRLR
  431. ------------------VSHGCVSKILA--------RY---------------------
  432. ------------------------------------------------------------
  433. ------------------------------------------------------------
  434. ------------------------------------------------------------
  435. ------------------------------------------------------------
  436. ------------------------------------------------------------
  437. ------------------------------------------------------------
  438. ------------------------------------------------------------
  439. ------------------------------------------------------------
  440. ------------------------------------------------------------
  441. ------------------------------------------------------------
  442. ------------------------------------------------------------
  443. ------------------------------------------------------------
  444. ------------------------------------------------------------
  445. ------------------------------------------------------------
  446. ------------------------------------------------------------
  447. ------------------------------------------------------------
  448. ------------------------------------------------------------
  449. ------------------------------------------------------------
  450. ------------------------------------------------------------
  451. ------------------------------------------------------------
  452. ------------------------------------------------------------
  453. ------------------------------------------------------------
  454. ------------------------------------------------------------
  455. ----------------------------------
  456. >ENSOGAP00000008434
  457. ISVNV-SV----------------------------------------------------
  458. ------------------------------------------------------------
  459. ------------------------------------------------------------
  460. ------------------------------------------------------------
  461. ------------------------------------------------------------
  462. ------------------------------------------------------------
  463. ------------------------------------------------------------
  464. ------------------------------------------------------------
  465. -GHGGLNQLGGAFVNGRPL--------------PEVVRQRIVDLAHQ-GVRPCDISRQLR
  466. ------------------VSHGCVSKILG--------RYYETGSIRPGVI------GGSK
  467. PK-VATPKVVEKIGDYKRQNPTMFAWEI----------------------RDRLLAEXXX
  468. ------------------------------------------------------------
  469. ------------------------------------------------------------
  470. XXXXXXX------------------------XXXXXXXXXXXX-----------------
  471. ----------------------XXXXX---------------------------------
  472. ------------------------------------------------------------
  473. ---------------------------------------------XXXXXXXXXXXXXXX
  474. --XXXXXXXXXXXPE----------------SPQ-------------SDSLGST--YSIN
  475. GLLGI----AQPGSDS--------------KRKMDDSD----------------------
  476. --QDSCR----------------------------LSIDSQSSST---------------
  477. -------------------------G------PRKHLRTDAF-SQHHL------------
  478. --------------EPLECP-FERQHYPEAYASPSH------T-KGEQ--XXX-XP-L--
  479. -LLNS-A-------LDDGKATLTP--SNTPLG----------------------------
  480. -------------------------------------------------------RNLS-
  481. -THQTYP--------------VVADPH--SPFAIKQE-TPEVSSSSSTPSSL-SSSAFLD
  482. ---LQQV-GSG------V----------PPFNAFPHAASVYGQFTGQALLSGREMVGPT-
  483. --LPG--------------------------------------------------YPPHI
  484. PT----------------------------------------------------------
  485. --------------------------------------------------------SGQG
  486. S----YASSA-----I-----------AGMV-----------------------------
  487. -----------------AXX---------------------------------XXXXXXX
  488. XXX------XXXXXXX-XXXXXXX------------XXX-------------------XS
  489. PYYYSST-----------------------------SRPNAP----PTTAT--AFDHL--
  490. ----------------------------------
  491. >ENSCINP00000013350
  492. MATYDSCRQASSMALCFNRESLPHK-----------------------------------
  493. ------------------------------------------------------------
  494. ------------------------------------------------------------
  495. ------------------------------------------------------------
  496. ------------------------------------------------------------
  497. ------------------------------------------------------------
  498. ------------------------------------------------------------
  499. ------------------------------------------------------------
  500. -GHSGMNQLGGMFVNGRPL--------------PDSIRQKIVEFAHN-GARPCDISRILQ
  501. ------------------VSNGCVSKILA--------RYYETGTIRPRAI------GGSK
  502. PR-VATPEVVNKIASYKRECPSIFAWEI----------------------RDRLLNEGIC
  503. ------------------------------------------------------------
  504. ------------------------------------------------------------
  505. NNDNIPS------------------------VSSINRVLRNLN-----------------
  506. ------------------------------------------------------------
  507. ------------------------------------------------------------
  508. ------------------------------------------------------------
  509. ------------------------------------------------------------
  510. ------------------------------------------------------------
  511. ----------GDHQTGGFIETTGRDPKSGSQLGLEWSLTCNGWLPQQTMCQEQIAAEGL-
  512. -MGLKGKESVVESEAKDGSSEARLQL------KRKLQRNRTSFTQIQV------------
  513. --------------EALEKE-FERTHYPDVFARERL------ATKIDLPEARI-QVWFSN
  514. RRAKWRR-------EEKIRSQRSSAASDGSDVMRRTNDQQSIG-QCGVYSSVTQQHA---
  515. -QGSMIY-------GINSFIYSFVSNLTFY-----SEVEHFPPMHRMHEAPYLYGLSSGG
  516. PSNLTPPPHYTSYDHDRRVEEPSHNTIPTPPSSANQPSPDHDHHGSHMQPLDGGIYQASL
  517. SGMHVGHQHHALVGAQATDQSAS-SMIVPPMTALQNPANFH-TAEGYWQSGVQG------
  518. ------------------------------------------------------------
  519. ------------------------------------------------------------
  520. ------------------------------------------------------------
  521. ------------------------------------------------------------
  522. ------------------------------------------------------------
  523. ------------------------------------------------------------
  524. ------------------------------------------------------------
  525. ----------------------------------
  526. >K06B9.5
  527. MFTKTFSNNYMTSSQSAYCNLQQYHDSRVCLLKCCRVQKVDPYFPRIALNSATSYPTVSG
  528. TVSLPKAETVEPDLWIKSFKGNEDPLLSDG------------------------------
  529. ------------------------------------------------------------
  530. ------------------------------------------------------------
  531. ------------------------------------------------------------
  532. ------------------------------------------------------------
  533. ------------------------------------------------------------
  534. ------------------------------------------------------------
  535. -SHTGVNQLGGVFVNGRPL--------------PDTIRAQIVEMSQH-GTRPCDISRQLK
  536. ------------------VSHGCVSKILG--------RYYSTGSVRPGVI------GGSK
  537. PK-VATPRVVECIAGYKRANPTMFAWEI----------------------RQKLIEDQIC
  538. ------------------------------------------------------------
  539. ------------------------------------------------------------
  540. GEENVPS------------------------VSSINRIVRNKS-----------------
  541. ------------------------------------------------------------
  542. ------------------------------------------------------------
  543. ------------------------------------------------------------
  544. ------------------------------------------------------------
  545. ------------------------------------------------------------
  546. ------------------------------------------------------------
  547. ---------------FMAQLATPTSV------TPSVARPSSATSQNQR------------
  548. -----------SPPRGVQQH-MQQSTSVQQLQQFQL------TSAATV------------
  549. ------------------------------------------------------------
  550. ------------------------------------------------------------
  551. ------------------------------------------------------------
  552. ----------------------------------------------------NSLISRPA
  553. FAIPG-------------------------------------------------------
  554. ------------------------------------------------------------
  555. ------------------------------------------------------------
  556. -----TTHSINGLLGTFPHSSLLDDKFTNLSTHSADMSLVYPTGLVGEHDWAMRTPMVIL
  557. PQNYCGQL----------------------------------------------------
  558. ------------------------------------------------------------
  559. ------------------------------------------------------------
  560. ----------------------------------
  561. >ENSMLUP00000011514
  562. MDLEKNYPTPRTGRT---------------------------------------------
  563. ------------------------------------------------------------
  564. ------------------------------------------------------------
  565. ------------------------------------------------------------
  566. ------------------------------------------------------------
  567. ------------------------------------------------------------
  568. ------------------------------------------------------------
  569. ------------------------------------------------------------
  570. -GHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  571. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  572. PK-VATPKVVEKIAEYKRQNPTMFAWEI----------------------RDRLLAERVC
  573. ------------------------------------------------------------
  574. ------------------------------------------------------------
  575. DNDTVPS------------------------VSSINRIIRTKV-----------------
  576. ----------------------QQP-----------------------------------
  577. ------------------------------------------------------------
  578. ---------------------------------------------------PNQPVPASS
  579. --HSIVSTGSVTQVS----------------SVS-------------TDSAGSS--YSIS
  580. GILGI----TSPSADTN-------------KRKRDEXX----------------------
  581. --XXXXX----------------------------XXXXXXXXXX---------------
  582. -------------------------X------XXXXXXXXXX-XXXXX------------
  583. --------------XXXXXX-XXXXXXXXXXXXXX-------XXXXXX--XXX-XXXX--
  584. XXXXX-X-------XXXXXXXXXXX-XXXXXX----------------------------
  585. -------------------------------------------------------XXXX-
  586. -XXXXXX--------------XXX------------------------------------
  587. ---------------------------------------------------XRDLASTT-
  588. --LPG--------------------------------------------------YPPHV
  589. PP----------------------------------------------------------
  590. --------------------------------------------------------AGQG
  591. S----YSAPT-----L-----------TGMVP----------------------------
  592. ------------------GS---------------------------------EFSGSPY
  593. SHP------QYPSYND-SWRFPNP------------GLL-------------------GS
  594. PYYYSAA-----------------------------ARGAAP----PAAAT--AYDRH--
  595. ----------------------------------
  596. >ENSSSCP00000011247
  597. ------------------------------------------------------------
  598. ------------------------------------------------------------
  599. ------------------------------------------------------------
  600. ------------------------------------------------------------
  601. ------------------------------------------------------------
  602. ------------------------------------------------------------
  603. ------------------------------------------------------------
  604. ------------------------------------------------------------
  605. ------------------------------------------------------------
  606. ------------------------------------------------------------
  607. ------------------------------------------------------------
  608. ------------------------------------------------------------
  609. ------------------------------------------------------------
  610. ------------------------------------------------------------
  611. ------------------------------------------------------------
  612. ------------------------------------------------------------
  613. ------------------------------------------------------------
  614. ------------------------------------------------------------
  615. ------------------------------------------------------------
  616. ------------------------------------------------------------
  617. ------------------------------------------------------------
  618. -------------------V-FERPSYPDVFQASEH---------------------IKS
  619. EQGNEYSLPALTPGLDEVKSSLSAS-----------------------------------
  620. ------------------------------------------------------------
  621. ------------------------------------------------------------
  622. --------------------------------TNPELGSNVSGTQTYPVVTGRDMASTTL
  623. PGYPP-------------------------------------------------------
  624. ------------------------------------------------------------
  625. ------------------------------------------------------------
  626. ------------------------------------------------------------
  627. ----------------HVPPTGQGSYPTSTLAGMVP----------------------GS
  628. EFSGNPYSHPQYTAYNEAWRFSNPALLSSPYYYSAAPRGSLPLLPLPMTATSYRGDHIKL
  629. QADSFGLHIVPV------------------------------------------------
  630. ----------------------------------
  631. >ENSTGUP00000007459
  632. MELEKTYATPRASRT---------------------------------------------
  633. ------------------------------------------------------------
  634. ------------------------------------------------------------
  635. ------------------------------------------------------------
  636. ------------------------------------------------------------
  637. ------------------------------------------------------------
  638. ------------------------------------------------------------
  639. ------------------------------------------------------------
  640. -GHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  641. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  642. PK-VATPKVVEKIAEYKRQNPTMFAWEI----------------------RDRLLAERVC
  643. ------------------------------------------------------------
  644. ------------------------------------------------------------
  645. DNDTVPS------------------------VSSINRIIRTKV-----------------
  646. ----------------------QQP-----------------------------------
  647. ------------------------------------------------------------
  648. ---------------------------------------------------PNQQVPASS
  649. --HSIASTGSVTQVS----------------SVT-------------TDSAGSS--YSIS
  650. GILGI----ASPGTESN-------------KRKRDEGI----------------------
  651. --QESPV----------------------------PNGHSLPSRD---------------
  652. -------------------------F------LRKQMRGDLF-TQQQL------------
  653. --------------EVLDRV-FERQHYSDIFTTTE-------PIKPEQ--ATE-YSAM--
  654. ASLAG-G-------LDDMKANITSP-TSADLG----------------------------
  655. -------------------------------------------------------ASVP-
  656. -GPQSYP--------------IVT------------------------------------
  657. ---------------------------------------------------GRELASTT-
  658. --LPG--------------------------------------------------YPPHV
  659. PP----------------------------------------------------------
  660. --------------------------------------------------------AGQG
  661. S----YSTPA-----L-----------TGMVP----------------------------
  662. ------------------GD---------------------------------EFSGSPY
  663. SHP------QYSTYND-SWRFPNP------------GLL-------------------GS
  664. PYYYSAT-----------------------------ARGAAA----PAAAA--AYDRH--
  665. ----------------------------------
  666. >ENSSSCP00000011246
  667. ----------------------MDMHCKADP---FSAM----HP----------------
  668. ------------------------------------------------------------
  669. ------------------------------------------------------------
  670. ------------------------------------------------------------
  671. ------------------------------------------------------------
  672. ------------------------------------------------------------
  673. ------------------------------------------------------------
  674. ------------------------------------------------------------
  675. -GHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  676. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  677. PK-VATPKVVDKIAEYKRQNPTMFAWEI----------------------RDRLLAEGIC
  678. ------------------------------------------------------------
  679. ------------------------------------------------------------
  680. DNDTVPS------------------------VSSINRIIRTKV-----------------
  681. ----------------------QQPFH---------------------------------
  682. ------------------------------------------------------------
  683. ---------------------------------------------PTPDG-AGTGVTAPG
  684. --HTIVPSTASPPVS----------------SAS-------------NDPVGS---YSIN
  685. GILGI------PRSNGE-------------KRKRDEVEVYTDPAHIRGGGGLHLVWTLRG
  686. MGARGTM----------------------------VRGQGK-------------------
  687. ------------------------------------------------------------
  688. ------------------------------------------------------------
  689. ------------------------------------------------------------
  690. ------------------------------------------------------------
  691. ------------------------------------------------------------
  692. ------------------------------------------------------------
  693. ------------------------------------------------------------
  694. ------------------------------------------------------------
  695. ------------------------------------------------------------
  696. ------------------------------------------------------------
  697. ------------------------------------------------------------
  698. ------------------------------------------------------------
  699. ------------------------------------------------------------
  700. ----------------------------------
  701. >ENSTBEP00000014786
  702. ----------------------KNMHCKEEP---FSAK----PT----------------
  703. ------------------------------------------------------------
  704. ------------------------------------------------------------
  705. ------------------------------------------------------------
  706. ------------------------------------------------------------
  707. ------------------------------------------------------------
  708. ------------------------------------------------------------
  709. ------------------------------------------------------------
  710. -GHGGVNQLGGV-VNGRPL--------------PDVV-QRIVELTHQ-GVRPCDISRQLR
  711. ------------------VSHGCVSKI-G--------RYYETGSIKPGVI------GGSK
  712. PK-VATPKVVDKIAEYKRQNPTMFAWET----------------------HGRLLAEGIC
  713. ------------------------------------------------------------
  714. ------------------------------------------------------------
  715. DNDTVPS------------------------VSTINXXXXXXX-----------------
  716. ----------------------XXXXX---------------------------------
  717. ------------------------------------------------------------
  718. ---------------------------------------------XXXXX-XXXXXXXXX
  719. --XXXXPSTASPPVS----------------SAS-------------NDPVGS---YSIN
  720. GILGI------PRSNGE-------------KRKRDEVEVYTDPAHIRGGGGLHLVWTLR-
  721. ------------------------------------------------------------
  722. ------------------------------------------------------------
  723. ------------------------------------------------------------
  724. ------------------------------------------------------------
  725. ------------------------------------------------------------
  726. ------------------------------------------------------------
  727. ------------------------------------------------------------
  728. ------------------------------------------------------------
  729. ------------------------------------------------------------
  730. ------------------------------------------------------------
  731. ------------------------------------------------------------
  732. ------------------------------------------------------------
  733. ------------------------------------------------------------
  734. ------------------------------------------------------------
  735. ----------------------------------
  736. >ENSACAP00000002317
  737. --------------------PA--------------------------------------
  738. ------------------------------------------------------------
  739. ------------------------------------------------------------
  740. ------------------------------------------------------------
  741. ------------------------------------------------------------
  742. ------------------------------------------------------------
  743. ------------------------------------------------------------
  744. ------------------------------------------------------------
  745. -GHSGVNQLGGVFVNGRPL--------------PDSTRQKIVELAHS-GARPCDISRILQ
  746. ----THADAKVQVLDNQNVSNGCVSKILG--------RYYETGSIRPRAI------GGSK
  747. PR-VATPEVVSKIAQYKRECPSIFAWEI----------------------RDRLLSEGVC
  748. ------------------------------------------------------------
  749. ------------------------------------------------------------
  750. TNDNIPS------------------------VSSINRVLRNLA-----------------
  751. ------------------------------------------------------------
  752. ------------------------------------------------------------
  753. ------------------------------------------------------------
  754. ------------------------------------------------------------
  755. --------------------------------------------------------SEKQ
  756. Q------MGADGMYDKLRMLNGQSGT-----WGTRPGWYPGTSVPGQPAP--DGCPQQE-
  757. -GGAENTNSISSNGEDSDEAQMRLQL------KRKLQRNRTSFTQEQI------------
  758. --------------EALEKE-FERTHYPDVFARERL------AAKIDLPEARI-QVWFSN
  759. RRAKWRR-------EEKLRNQRRQASNTPSHIPISS------------------------
  760. ------------------------------------------------------------
  761. -SFSTSVYQPIPQPTTPV-SSFTSGSMLGRTDTALTNTYSALPPMPSFTMANNLPMQPPV
  762. ---PSQTSS---YSCMLPTSPSVN------GRSYDTYTPPHMQTHMNSQPMGTSGTTSTG
  763. LISPGVSVPVQVPGSEPDMSQYWPRLQ---------------------------------
  764. ------------------------------------------------------------
  765. ------------------------------------------------------------
  766. ------------------------------------------------------------
  767. ------------------------------------------------------------
  768. ------------------------------------------------------------
  769. ------------------------------------------------------------
  770. ----------------------------------
  771. >ENSGACP00000003177
  772. ----------------------MDIHCKADP---FTAM----H-----------------
  773. ------------------------------------------------------------
  774. ------------------------------------------------------------
  775. ------------------------------------------------------------
  776. ------------------------------------------------------------
  777. ------------------------------------------------------------
  778. ------------------------------------------------------------
  779. ------------------------------------------------------------
  780. -RHGGVNQLGGVFVNGRPL--------------PDVVRQRIVELAHQ-GVRPCDISRQLR
  781. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  782. PK-VATPKVVDKIADYKRQNPTMFAWEI----------------------RDRLLAEGVC
  783. ------------------------------------------------------------
  784. ------------------------------------------------------------
  785. DNDTVPS------------------------VSSINRIIRTKV-----------------
  786. ----------------------QQPFH---------------------------------
  787. ------------------------------------------------------------
  788. ---------------------------------------------PSPDG---SSLSTPG
  789. --HTIVPSTTSPPVT----------------SAS-------------NDPAGS---YSIN
  790. GILGI------PRSNGE-------------KRKRDE------------------------
  791. ------------------------------------------------------------
  792. ------------------------------------------------------------
  793. ------------------------------------------------------------
  794. ------------------------------------------------------------
  795. ------------------------------------------------------------
  796. ------------------------------------------------------------
  797. ---------------------------------------------------GRDMANTT-
  798. --LPG--------------------------------------------------YPPHV
  799. PP----------------------------------------------------------
  800. --------------------------------------------------------TGQG
  801. S----YPTST-----L-----------AGMVP----------------------------
  802. ------------------GS---------------------------------EFSGNPY
  803. SHP------QYTTYND-AWRFSNP------------ALL-------------------SS
  804. PYYYSAA-----------------------------SRGSAP----HTAAT--AYDRH--
  805. ----------------------------------
  806. >ENSGACP00000022114
  807. IPPPPP------------------------------------------------------
  808. ------------------------------------------------------------
  809. ------------------------------------------------------------
  810. ------------------------------------------------------------
  811. ------------------------------------------------------------
  812. ------------------------------------------------------------
  813. ------------------------------------------------------------
  814. ------------------------------------------------------------
  815. -GHGGLNQLGGMFVNGRPL--------------PEVIRQRIVDMAHQ-GVRPCDISRQLR
  816. ------------------VSHGCVSKILG--------RYYETGSIKPGVI------GGSK
  817. PK-VATPKVVDKIAEYKRQNPTMFAWEI----------------------RDRLLAEEVC
  818. ------------------------------------------------------------
  819. ------------------------------------------------------------
  820. DSDTVPS------------------------VSSINRIIRTKV-----------------
  821. ----------------------QQPFN---------------------------------
  822. ------------------------------------------------------------
  823. ---------------------------------------------LPLDG----KGLSPG
  824. --HTLIPSSAVTPPE----------------SPH-------------SDSLGST--YSIS
  825. GLLGI----PQPSAEG--------------KRSHDDSD----------------------
  826. --QESCR----------------------------HSVDSQGSGG---------------
  827. -------------------------V------PRKQMRMDHF-SA-AT------------
  828. --------------PHLDCG-FDRHQYPPDSFGSAS------SSKTEQ---TL-YP-L--
  829. SLING-S-------LDEAKASLST--CGSAIG----------------------------
  830. -------------------------------------------------------RNLT-
  831. -AHQSYA--------------MVTESRQPLPLCLKQEMSPEVTSTSPSPNMALSNLAFME
  832. LQALQKPLSAGGGGGSSC---SNSNHYPNAFNSFSHHAPVYGQFSSQSIISGRDMVSST-
  833. --LPG--------------------------------------------------YPPHI
  834. PS----------------------------------------------------------
  835. --------------------------------------------------------PAQS
  836. G----YSSSA-----I-----------TGMVA----------------------------
  837. -----------------AGT---------------------------------DYSGQTY
  838. SHS------PYT-YSE-AWRFTNS------------SIL-------------------GS
  839. PYYYSTA-----------------------------SRTAPP----P--AA--AYDHL--
  840. ----------------------------------
  841. >ENSOCUP00000019685
  842. -------------------PSS--------------------------------------
  843. ------------------------------------------------------------
  844. ------------------------------------------------------------
  845. ------------------------------------------------------------
  846. ------------------------------------------------------------
  847. ---------------------------------------------------------