Merge pull request #231 from bioperl/pir-no-desc-line
[bioperl-live.git] / t / data / pfam_tests.stk
blobb4badb56865f1b3ec87c281fa0399bdf31db576e
1 # STOCKHOLM 1.0
2 #=GF ID   14-3-3
3 #=GF AC   PF00244.9
4 #=GF DE   14-3-3 protein
5 #=GF AU   Finn RD
6 #=GF SE   Prosite
7 #=GF GA   25.00 25.00; 25.00 25.00;
8 #=GF TC   28.50 28.50; 30.20 29.80;
9 #=GF NC   22.70 22.70; 20.60 20.60;
10 #=GF TP   Domain
11 #=GF BM   hmmbuild -F HMM_ls SEED
12 #=GF BM   hmmcalibrate --seed 0 HMM_ls
13 #=GF BM   hmmbuild -f -F HMM_fs SEED
14 #=GF BM   hmmcalibrate --seed 0 HMM_fs
15 #=GF AM   globalfirst
16 #=GF RN   [1]
17 #=GF RM   95327195
18 #=GF RT   Structure of a 14-3-3 protein and implications for
19 #=GF RT   coordination of multiple signalling pathways. 
20 #=GF RA   Xiao B, Smerdon SJ, Jones DH, Dodson GG, Soneji Y, Aitken
21 #=GF RA   A, Gamblin SJ; 
22 #=GF RL   Nature 1995;376:188-191.
23 #=GF RN   [2]
24 #=GF RM   95327196
25 #=GF RT   Crystal structure of the zeta isoform of the 14-3-3
26 #=GF RT   protein. 
27 #=GF RA   Liu D, Bienkowska J, Petosa C, Collier RJ, Fu H, Liddington
28 #=GF RA   R; 
29 #=GF RL   Nature 1995;376:191-194.
30 #=GF RN   [3]
31 #=GF RM   96182649
32 #=GF RT   Interaction of 14-3-3 with signaling proteins is mediated
33 #=GF RT   by the recognition of phosphoserine. 
34 #=GF RA   Muslin AJ, Tanner JW, Allen PM, Shaw AS; 
35 #=GF RL   Cell 1996;84:889-897.
36 #=GF RN   [4]
37 #=GF RM   97424374
38 #=GF RT   The 14-3-3 protein binds its target proteins with a common
39 #=GF RT   site located towards the C-terminus. 
40 #=GF RA   Ichimura T, Ito M, Itagaki C, Takahashi M, Horigome T,
41 #=GF RA   Omata S, Ohno S, Isobe T 
42 #=GF RL   FEBS Lett 1997;413:273-276.
43 #=GF RN   [5]
44 #=GF RM   96394689
45 #=GF RT   Molecular evolution of the 14-3-3 protein family. 
46 #=GF RA   Wang W, Shakes DC 
47 #=GF RL   J Mol Evol 1996;43:384-398.
48 #=GF RN   [6]
49 #=GF RM   96300316
50 #=GF RT   Function of 14-3-3 proteins. 
51 #=GF RA   Jin DY, Lyu MS, Kozak CA, Jeang KT 
52 #=GF RL   Nature 1996;382:308-308.
53 #=GF RN   [7]
54 #=GF RM   12184815
55 #=GF RT   The 14-3-3s. 
56 #=GF RA   Ferl RJ, Manak MS, Reyes MF; 
57 #=GF RL   Genome Biol 2002;3:REVIEWS3010.
58 #=GF DR   PROSITE; PDOC00633;
59 #=GF DR   SMART; 14_3_3;
60 #=GF DR   PRINTS; PR00305;
61 #=GF DR   SCOP; 1a4o; fa;
62 #=GF DR   INTERPRO; IPR000308;
63 #=GF SQ   16
64 #=GS RAD25_SCHPO/5-240  AC P42657
65 #=GS RAD24_SCHPO/6-241  AC P42656
66 #=GS BMH1_YEAST/4-240   AC P29311
67 #=GS 1433E_SHEEP/4-239  AC P62262
68 #=GS 1433B_VICFA/7-242  AC P42654
69 #=GS 14334_LYCES/6-243  AC P42652
70 #=GS 14333_LYCES/9-246  AC P93209
71 #=GS 14336_ARATH/7-240  AC P48349
72 #=GS 14332_ENTHI/4-238  AC P42649
73 #=GS 14331_ENTHI/4-239  AC P42648
74 #=GS 1433T_HUMAN/3-236  AC P27348
75 #=GS 1433_XENLA/1-227   AC P29309
76 #=GS 1433Z_DROME/6-239  AC P29310
77 #=GS 14331_CAEEL/5-237  AC P41932
78 #=GS 1433F_RAT/3-240    AC P68511
79 #=GS 1433S_HUMAN/3-238  AC P31947
80 RAD25_SCHPO/5-240            RENSVYLAKLAEQAERYEEMVENMKKVACSND...KLSVEERNLLSVAYKNIIGARRASWRIISSIEQKEESRG.NTRQAALIKEYRKKIEDELSDICHDVLSVLEKHLIPAA..TTGESKVFYYKMKGDYYRYLAEFTVGEVCKEAADSSLEAYKAASDIAVAELPPTDPMRLGLALNFSVFYYEILDSPESACHLAKQVFDEAISELDSLSEESYKDSTLIMQLLRDNLTLWTSDAEYNQ
81 RAD24_SCHPO/6-241            REDAVYLAKLAEQAERYEGMVENMKSVASTDQ...ELTVEERNLLSVAYKNVIGARRASWRIVSSIEQKEESKG.NTAQVELIKEYRQKIEQELDTICQDILTVLEKHLIPNA..ASAESKVFYYKMKGDYYRYLAEFAVGEKRQHSADQSLEGYKAASEIATAELAPTHPIRLGLALNFSVFYYEILNSPDRACYLAKQAFDEAISELDSLSEESYKDSTLIMQLLRDNLTLWTSDAEYSA
82 BMH1_YEAST/4-240             REDSVYLAKLAEQAERYEEMVENMKTVASSGQ...ELSVEERNLLSVAYKNVIGARRASWRIVSSIEQKEESKEKSEHQVELICSYRSKIETELTKISDDILSVLDSHLIPSA..TTGESKVFYYKMKGDYHRYLAEFSSGDAREKATNASLEAYKTASEIATTELPPTHPIRLGLALNFSVFYYEIQNSPDKACHLAKQAFDDAIAELDTLSEESYKDSTLIMQLLRDNLTLWTSDMSESG
83 1433E_SHEEP/4-239            REDLVYQAKLAEQAERYDEMVESMKKVAGMDV...ELTVEERNLLSVAYKNVIGARRASWRIISSIEQKEENKG.GEDKLKMIREYRQMVETELKLICCDILDVLDKHLIPAA..NTGESKVFYYKMKGDYHRYLAEFATGNDRKEAAENSLVAYKAASDIAMTELPPTHPIRLGLALNFSVFYYEILNSPDRACRLAKAAFDDAIAELDTLSEESYKDSTLIMQLLRDNLTLWTSDMQGDG
84 1433B_VICFA/7-242            RENFVYIAKLAEQAERYEEMVDSMKNVANLDV...ELTIEERNLLSVGYKNVIGARRASWRILSSIEQKEESKG.NDVNAKRIKEYRHKVETELSNICIDVMRVIDEHLIPSA..AAGESTVFYYKMKGDYYRYLAEFKTGNEKKEAGDQSMKAYESATTAAEAELPPTHPIRLGLALNFSVFYYEILNSPERACHLAKQAFDEAISELDTLNEESYKDSTLIMQLLRDNLTLWTSDIPEDG
85 14334_LYCES/6-243            REENVYLAKLAEQAERYEEMIEFMEKVAKTADV.EELTVEERNLLSVAYKNVIGARRASWRIISSIEQKEESRG.NEDHVNTIKEYRSKIEADLSKICDGILSLLESNLIPSA..STAESKVFHLKMKGDYHRYLAEFKTGTERKEAAENTLLAYKSAQDIALAELAPTHPIRLGLALNFSVFYYEILNSPDRACNLAKQAFDEAISELDTLGEESYKDSTLIMQLLRDNLTLWTSDNADDV
86 14333_LYCES/9-246            REENVYMAKLADRAESDEEMVEFMEKVSNSLGS.EELTVEERNLLSVAYKNVIGARRASWRIISSIEQKEESRG.NEEHVNSIREYRSKIENELSKICDGILKLLDSKLIPSA..TSGDSKVFYLKMKGDYHRYLAEFKTGAERKEAAESTLTAYKAAQDIASAELAPTHPIRLGLALNFSVFYYEILNSPDRACNLAKQAFDEAIAELDTLGEESYKDSTLIMQLLRDNLTLWTSDMQDDG
87 14336_ARATH/7-240            RDQYVYMAKLAEQAERYEEMVQFMEQLVTGATPAEELTVEERNLLSVAYKNVIGSLRAAWRIVSSIEQKEESRK.NDEHVSLVKDYRSKVESELSSVCSGILKLLDSHLIPSA..GASESKVFYLKMKGDYHRYMAEFKSGDERKTAAEDTMLAYKAAQDIAAADMAPTHPIRLGLALNFSVFYYEILNSSDKACNMAKQAFEEAIAELDTLGEESYKDSTLIMQLLRDNLTLWTSD.....
88 14332_ENTHI/4-238            REDLVYLSKLAEQSERYEEMVQYMKQVAEMGT...ELSVEERNLISVAYKNVVGSRRASWRIISSLEQKEQAKG.NTQRVELIKTYRAKIEQELSQKCDDVLKIITEFLLKNS..TSIESKVFFKKMEGDYYRYYAEFTVDEKRKEVADKSLAAYQEATDTA.ASLVPTHPIRLGLALNFSVFYYQIMNDADKACQLAKEAFDEAIQKLDEVPEESYKESTLIMQLLRDNLTLWTSDMGDDE
89 14331_ENTHI/4-239            REDCVYTAKLAEQSERYDEMVQCMKQVAEMEA...ELSIEERNLLSVAYKNVIGAKRASWRIISSLEQKEQAKG.NDKHVEIIKGYRAKIEKELSTCCDDVLKVIQENLLPKA..STSESKVFFKKMEGDYYRYFAEFTVDEKRKEVADKSLAAYTEATEISNAELAPTHPIRLGLALNFSVFYFEIMNDADKACQLAKQAFDDAIAKLDEVPENMYKDSTLIMQLLRDNLTLWTSDACDEE
90 1433T_HUMAN/3-236            KTELIQKAKLAEQAERYDDMATCMKAVTEQGA...ELSNEERNLLSVAYKNVVGGRRSAWRVISSIEQKTDT...SDKKLQLIKDYREKVESELRSICTTVLELLDKYLIANA..TNPESKVFYLKMKGDYFRYLAEVACGDDRKQTIDNSQGAYQEAFDISKKEMQPTHPIRLGLALNFSVFYYEILNNPELACTLAKTAFDEAIAELDTLNEDSYKDSTLIMQLLRDNLTLWTSDSAGEE
91 1433_XENLA/1-227             .......AKLSEQAERYDDMAASMKAVTELGA...ELSNEERNLLSVAYKNVVGARRSSWRVISSIEQKTEG...NDKRQQMAREYREKVETELQDICKDVLDLLDRFLVPNA..TPPESKVFYLKMKGDYYRYLSEVASGDSKQETVASSQQAYQEAFEISKSEMQPTHPIRLGLALNFSVFYYEILNSPEKACSLAKSAFDEAIRELDTLNEESYKDSTLIMQLLRDNLTLWTSENQGEE
92 1433Z_DROME/6-239            KEELVQKAKLAEQSERYDDMAQAMKSVTETGV...ELSNEERNLLSVAYKNVVGARRSSWRVISSIEQKTEA...SARKQQLAREYRERVEKELREICYEVLGLLDKYLIPKA..SNPESKVFYLKMKGDYYRYLAEVATGDARNTVVDDSQTAYQDAFDISKGKMQPTHPIRLGLALNFSVFYYEILNSPDKACQLAKQAFDDAIAELDTLNEDSYKDSTLIMQLLRDNLTLWTSDTQGDE
93 14331_CAEEL/5-237            VEELVQRAKLAEQAERYDDMAAAMKKVTEQGQ...ELSNEERNLLSVAYKNVVGARRSSWRVISSIEQKTEG...SEKKQQLAKEYRVKVEQELNDICQDVLKLLDEFLIVKA..GAAESKAFYLKMKGDYYRYLAEVAS.EDRAAVVEKSQKAYQEALDIAKDKMQPTHPIRLGLALNFSVFYYEILNTPEHACQLAKQAFDDAIAELDTLNEDSYKDSTLIMQLLRDNLTLWTSDVGAED
94 1433F_RAT/3-240              REQLLQRARLAEQAERYDDMASAMKAVTELNE...PLSNEDRNLLSVAYKNVVGARRSSWRVISSIEQKTMADG.NEKKLEKVKAYREKIEKELETVCNDVLALLDKFLIKNCNDFQYESKVFYLKMKGDYYRYLAEVASGEKKNSVVEASEAAYKEAFEISKEHMQPTHPIRLGLALNFSVFYYEIQNAPEQACLLAKQAFDDAIAELDTLNEDSYKDSTLIMQLLRDNLTLWTSDQQDEE
95 1433S_HUMAN/3-238            RASLIQKAKLAEQAERYEDMAAFMKGAVEKGE...ELSCEERNLLSVAYKNVVGGQRAAWRVLSSIEQKSNEEG.SEEKGPEVREYREKVETELQGVCDTVLGLLDSHLIKEA..GDAESRVFYLKMKGDYYRYLAEVATGDDKKRIIDSARSAYQEAMDISKKEMPPTNPIRLGLALNFSVFHYEIANSPEEAISLAKTTFDEAMADLHTLSEDSYKDSTLIMQLLRDNLTLWTADNAGEE
96 #=GC seq_cons                RE-hVYhAKLAEQAERY--MlpsMKpVsptss...ELSlEERNLLSVAYKNVlGARRASWRIISSIEQKEEu+G.N-c+lphIKEYRpKlEsELssICsDVLplLDcaLIPsA..ssuESKVFYhKMKGDYYRYLAEFsoG-cRKcss-sShtAYppApDIApuEhsPTHPIRLGLALNFSVFYYEILNSP-+ACpLAKQAFDEAIAELDTLsEESYKDSTLIMQLLRDNLTLWTSDhts-t
98 # STOCKHOLM 1.0
99 #=GF ID   2-ph_phosp
100 #=GF AC   PF04029.4
101 #=GF DE   2-phosphosulpholactate phosphatase
102 #=GF AU   Kerrison ND, Finn RD
103 #=GF SE   COG2045
104 #=GF GA   25.00 25.00; 25.00 25.00;
105 #=GF TC   43.30 43.30; 28.00 28.00;
106 #=GF NC   3.00 3.00; 22.60 22.00;
107 #=GF TP   Family
108 #=GF BM   hmmbuild -F HMM_ls SEED
109 #=GF BM   hmmcalibrate --seed 0 HMM_ls
110 #=GF BM   hmmbuild -f -F HMM_fs SEED
111 #=GF BM   hmmcalibrate --seed 0 HMM_fs
112 #=GF AM   globalfirst
113 #=GF RN   [1]
114 #=GF RM   21474017
115 #=GF RT   Identification of coenzyme M biosynthetic
116 #=GF RT   2-phosphosulfolactate phosphatase. A member of a new class
117 #=GF RT   of Mg(2+)-dependent acid phosphatases. 
118 #=GF RA   Graham DE, Graupner M, Xu H, White RH; 
119 #=GF RL   Eur J Biochem 2001;268:5176-5188.
120 #=GF DR   INTERPRO; IPR005238;
121 #=GF CC   Thought to catalyse 2-phosphosulpholactate = sulpholactate + phosphate.
122 #=GF CC   Probable magnesium cofactor.  Involved in the second step of coenzyme M
123 #=GF CC   biosynthesis.  Inhibited by vanadate in Methanococcus jannaschii.  Also
124 #=GF CC   known as the ComB family [1].
125 #=GF SQ   10
126 #=GS COMB_CLOAB/6-235   AC Q97E82
127 #=GS COMB_THEMA/1-224   AC Q9WZQ4
128 #=GS COMB_METTH/2-219   AC O27250
129 #=GS COMB_METJA/1-219   AC Q58540
130 #=GS COMB_DEIRA/2-232   AC Q9RUI6
131 #=GS COMB_SYNY3/2-241   AC P73849
132 #=GS COMB_THEVO/1-211   AC Q97CK6
133 #=GS COMB_THEAC/1-211   AC Q9HIA9
134 #=GS COMB_BACSU/2-223   AC O06738
135 #=GS COMB_STRCO/12-227  AC Q9F3E6
136 COMB_CLOAB/6-235             IISADDIKE.EKVKN..KTAVVIDMLRATSVITTALNNGCKRVVPVLTVEEALKKVKEY.GKDAILGGERKGLKIEGFDFSNSPMEY.TEDVV......KGKTLIMTTTNGTRAIKGSET.ARDILIGSVLNGEAVAEKIVELN.NDVVIVNAGTYGEFSIDDFICSGYIINCVMDRMKKLELT.DAATTA..QYVYKTNEDIKGFVKYAK.HYKRIMELGLKKDFEYCCKKDIVKLVPQYTN.GEIL..
137 COMB_THEMA/1-224             MVDVVMAPC.SPVEC..RTAVVIDVLRATSTIVTALSNGASGVIPVKTIEEALEKKK....EGVLICGERNAQKPKGFNLGNSPLEY.RKEKI......SGKTIVLTTTNGTQVIEKIRS..EEIIAASFLNLSAVVEYLKSKE..DILLVCAGTNGRFSLEDFLLAGAIV..KRLKRNDLG...DGAHAA..ERYFESVENTREEIKKHSSHAKRLISLGFENDIEFCTTEDLFKTVPALVN.GVFILK
138 COMB_METTH/2-219             AMRIRLSFE.RPEGS..GLCIMVDLLRASATITAALDR.FREVIPVADIEEAMEYSR....KGYLVAGERGGETLPGF.IANSPLEV.KNYR........GDVLVLTTSNGTRILESVKS...DALVGCLNNLDAVAEAARELS.DEVEVVMAGVNGRFAIEDFLCAGEIIAAIDGEMDEYA...EASVLA..VQDRSLVDDAIRRSRSAER....LGGLGFMDDVEYCIKRNITGNVPVYRD.GRIELM
139 COMB_METJA/1-219             MITLCNRFT..EYKC.GNVAIVVDVLRASTTITTLLSF.IDEVYITTST.....SKK....ENAIYIGERKGRKIEGFDFGNSPTEILANKDIIKERYENGEKVILTTTNGTRVLKSLDA..EHIFIGAIVNAKYVAKAVEDFE..DVSLVPCHRENNFAIDDFIGCGVIAKYLNGEFDEF.....IKAAL..ELTKHDWMSLILNSSSAEN....LKNLGYEKDVTFAILENSIDAVGIYKK...DKSK
140 COMB_DEIRA/2-232             RLRVDLLPD..SHYP..DVALVIDVLRATTTAVTLLEQGAAELLLTRTTEAALAVRETV..PDVLLAGERGGLTIPGFDLGNSPVEV.SGGAV......AGRRVVMTTTNGTIAAHRAAQTARHVVLAALVNAHAVARHALAVASEEIAIVCAGTDGRVGLDDVYAAGVIA.EYLLALGDFQVD.DGARIA..LTMRRGGGDPGEALRSSG.HGATLARLGLSSDVDYAAQLSTSRLIPTLVP.GDDVPA
141 COMB_SYNY3/2-241             EIFVYHTPELTPDQSLPDCAVVIDVLRATTTIATALKVGAEAVQVFSSLDDLMATSESWPGEKRLRAGERGGAAVAGYDLGNSPLDC.TSELM......AGKRLFLSTTNGTRALQRVKDC.PQLVTASLVNRGAAVDYLAQTQPKTVWLLGSGWEGGYSLEDTVCAGAIASLLREKGIDFTVGNDEVVAA..QSLYRQWRSDLLNLFKQASHGQRLLKLDRLEDLRYCATEDLIDILPKQVSPGVLTAA
142 COMB_THEVO/1-211             MIRIADGRK.EENWS..SINIIIDIFRSTTTIPVILSRGARYIVPFKDVTSALNFKRKN..KNVVLIGEKYGIKPPFFDYDNSPAQI.INADL......EGKIIAFTSTNGMYVLSRIKR..GRILFSSLVNMSATIKKVKGKD..DILVVPSNRPIGKAVEDNIFAEMLK..LALEGKNY....DREILV..NRIRETKENTVVSISTQ..............DLEICLKLDLLDCVPEYIE.GKIVND
143 COMB_THEAC/1-211             MIRIGDGRK.SDSWA..EINVVVDIFRSTTTIPMILFRGAKYILPFRDVRKAIEFKRRN..PGTILVGEKYGIKPPYFDYDNSPAEI.AEADL......SGKVVAFTSTNGTYVLSRIRS..GRIIFSSYVNLSATVAMIRSQR..DVLILPSNRPIGKAPEDILFANLLK..LMAEGHEV....DVSEYT..RKTEEINRNIIAGVGER..............DLEFCLRVDHTNIVPEYID.GRIVQS
144 COMB_BACSU/2-223             PIAIYQGHH..HSLAPADINIVIDVIRAFTVAHYAFIGGAKEILLVRTADEAFALKDTY..PDYVLTGEEKGVGISGFDLDNSPKRM.AGQNM......TDKSLIQKTTNGVTAALGALN.AKHLFVTGFSNAKTTAQHVKKLVANDCVINIVASHP.SGDDDMACAEYIK..GIIEGTNV.....VTAAE..AIERIKGSSVAEKFFDCR......QPLFDSEDIVYCTKELTGDFVMKVKQDGEVPTI
145 COMB_STRCO/12-227            DTRFVGIPE..VGEA.PAVAVVVDVMRAFTVAAWAFARGAEKIVLAGSLDEALALKERD..PARVAL..KDGPLTPGFDLVNSPGLL.RSADL......AGRTVVQKTTAGTVGALAVRD.ASLVLCAGFVVAEATARVLRARAPEHVTFVVTGEDG.RADEDLACARYIA..RRAAGHDA....DAAGFLGRAAESRAATELVQGVRQGVH..........PDDVALCLELDRFPFAMVAAP..EDSLM
146 #=GC seq_cons                hIclspshc.psstu..clAlVIDVLRATTTIssALspGAccllsspol--AlthK+p...cssllsGERtGhplsGFDluNSPhEl.sstcl......sGKsllhTTTNGTpslppl+s..pcllhuulVNtcAsActl+shs.pDVhlVsuGpsGthulEDhlsAGhIt..lttctc-h....Dsushs..pphccsscssltslppst.....lhtLsh.cDl-aChccDhhchVPphhs.Gcls.t
148 # STOCKHOLM 1.0
149 #=GF ID   3-alpha
150 #=GF AC   PF03475.3
151 #=GF DE   3-alpha domain
152 #=GF AU   Aravind L, Anantharaman V
153 #=GF SE   Aravind L, Anantharaman V
154 #=GF GA   25.00 25.00; 25.00 25.00;
155 #=GF TC   25.40 25.40; 25.00 25.00;
156 #=GF NC   24.40 24.40; 24.60 24.60;
157 #=GF TP   Domain
158 #=GF BM   hmmbuild -F HMM_ls SEED
159 #=GF BM   hmmcalibrate --seed 0 HMM_ls
160 #=GF BM   hmmbuild -f -F HMM_fs SEED
161 #=GF BM   hmmcalibrate --seed 0 HMM_fs
162 #=GF AM   globalfirst
163 #=GF RC   See figure 2.
164 #=GF RN   [1]
165 #=GF RM   11886751
166 #=GF RT   MOSC domains: ancient, predicted sulfur-carrier domains,
167 #=GF RT   present in diverse metal--sulfur cluster biosynthesis
168 #=GF RT   proteins including Molybdenum cofactor sulfurases. 
169 #=GF RA   Anantharaman V, Aravind L; 
170 #=GF RL   FEMS Microbiol Lett 2002;207:55-61.
171 #=GF DR   SCOP; 1o67; fa;
172 #=GF DR   INTERPRO; IPR005163;
173 #=GF DR   PDB; 1o65 A; 178; 224;
174 #=GF DR   PDB; 1o65 B; 178; 224;
175 #=GF DR   PDB; 1o65 C; 178; 224;
176 #=GF DR   PDB; 1o67 A; 178; 224;
177 #=GF DR   PDB; 1o67 B; 178; 224;
178 #=GF DR   PDB; 1o67 C; 178; 224;
179 #=GF CC   This small triple helical domain has been predicted
180 #=GF CC   to assume a topology similar to helix-turn-helix
181 #=GF CC   domains. These domains are found at the C-terminus
182 #=GF CC   of proteins related to Swiss:P32157.
183 #=GF SQ   11
184 #=GS Y278_HAEIN/174-219    AC P43976
185 #=GS Q99RT6_STAAM/171-217  AC Q99RT6
186 #=GS Q9PHR4_CAMJE/164-215  AC Q9PHR4
187 #=GS Q9RT82_DEIRA/181-226  AC Q9RT82
188 #=GS Q9KF70_BACHD/170-214  AC Q9KF70
189 #=GS Q9I1P0_PSEAE/174-219  AC Q9I1P0
190 #=GS Q9I607_PSEAE/169-215  AC Q9I607
191 #=GS O86804_STRCO/189-233  AC O86804
192 #=GS P95151_MYCTU/201-244  AC P95151
193 #=GS YIIM_ECOLI/168-214    AC P32157
194 #=GS O34542_BACSU/173-219  AC O34542
195 #=GS YIIM_ECOLI/168-214 DR PDB; 1o65 A; 178; 224;
196 #=GS YIIM_ECOLI/168-214 DR PDB; 1o65 B; 178; 224;
197 #=GS YIIM_ECOLI/168-214 DR PDB; 1o65 C; 178; 224;
198 #=GS YIIM_ECOLI/168-214 DR PDB; 1o67 A; 178; 224;
199 #=GS YIIM_ECOLI/168-214 DR PDB; 1o67 B; 178; 224;
200 #=GS YIIM_ECOLI/168-214 DR PDB; 1o67 C; 178; 224;
201 Y278_HAEIN/174-219           QITIRHLNRLLSTP.....KNEAELDSALEIEV.LAEAFKRSIRSQISKFKQ
202 Q99RT6_STAAM/171-217         RLSVQQLNDLYYNDRQ....NQDMLRYALNNPF.LSPTRRDKLQKMYNRTLK
203 Q9PHR4_CAMJE/164-215         SLSVFELNQLFYSPHQILKQNPNLLDKLEKLNSLISQNWHETIHKRLKNTYD
204 Q9RT82_DEIRA/181-226         APTIGELFDADFAKSH....DPAELRAWLTFP..LGKRQRKEVEKWLAKAEG
205 Q9KF70_BACHD/170-214         HPTVLEVNQLYYPKDI....NKEQLRRMSQLPE.LADAWKKAFSKKLANA..
206 Q9I1P0_PSEAE/174-219         DWSLLRLSEVLFDRRA....DAELLRQCLPLP..LTPSWRRTLERRLEKGQV
207 Q9I607_PSEAE/169-215         ELTVARLLQWYFGDPL....EPLGLRQMMACDA.LSQRWRKTAAKRLSSGVV
208 O86804_STRCO/189-233         EVTVALQFRAVTTQ.......RELLPRLLAAGGALHPEALATARKYVAEYGA
209 P95151_MYCTU/201-244         NVTVGLVFRARTSE.......SELLPQLLAADA.LAAELKAYARERTPSPPP
210 YIIM_ECOLI/168-214           DVTVQEAAAIAWHMPF....DDDQYHRLLSAAG.LSKSWTRTMQKRRLSGKI
211 #=GR YIIM_ECOLI/168-214 SS   SCBHHHHHHHHHTSCC....CHHHHHHHHTSTT.CCHHHHHHHHHHHHHSSC
212 #=GR YIIM_ECOLI/168-214 SA   6000320010013274....3372052026033.108303630350385563
213 O34542_BACSU/173-219         GISVQFANRINYHDAK....NLTAIERILSEAA.LSESWRASFMKKKDRLLP
214 #=GC SS_cons                 SCBHHHHHHHHHTSCC....CHHHHHHHHTSTT.CCHHHHHHHHHHHHHSSC
215 #=GC SA_cons                 6000320010013274....3372052026033.108303630350385563
216 #=GC seq_cons                plTVtclsclhasc......stphLcphLshss.Lupsa+cohpK+lspshs