Add tests for memory leaks and weaken for Issue #81
[bioperl-live.git] / t / data / roa1.dat
bloba21c7ef67faf95ae94a95afed6de3bea47d768a8
1 ID HSHNCPA1 standard; RNA; HUM; 1198 BP.
2 XX
3 AC X79536;
4 XX
5 SV X79536.1
6 XX
7 DT 03-JUN-1994 (Rel. 39, Created)
8 DT 03-JUN-1994 (Rel. 39, Last updated, Version 1)
9 XX
10 DE H.sapiens mRNA for hnRNPcore protein A1
12 KW core protein.
14 OS Homo sapiens (human)
15 OC Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Mammalia; Eutheria;
16 OC Primates; Catarrhini; Hominidae; Homo.
18 RN [2]
19 RP 1-1198
20 RA Leffers H.;
21 RT ;
22 RL Submitted (01-JUN-1994) to the EMBL/GenBank/DDBJ databases.
23 RL H. Leffers, Inst. of Medical Research Biochemistry & Danish Centre for
24 RL Human Genome Research, Ole Worms Alle 170, Aarhus Univ., 8000 Aarhus C,
25 RL DENMARK
27 RN [3]
28 RA Knudsen S.M., Leffers H.;
29 RT "Cloning and sequencing of a splice variant of human hnRNP core protein
30 RT A1";
31 RL Unpublished.
33 DR SWISS-PROT; P09651; ROA1_HUMAN.
35 FH Key Location/Qualifiers
37 FT source 1..1198
38 FT /db_xref="taxon:9606"
39 FT /organism="Homo sapiens"
40 FT /tissue_type="lung"
41 FT /cell_type="fibroblast"
42 FT /cell_line="MRC5"
43 FT /clone_lib="lambda ZapII"
44 FT /clone="HDP1"
45 FT CDS 27..989
46 FT /db_xref="SWISS-PROT:P09651"
47 FT /product="hnRNPcore protein A1"
48 FT /protein_id="CAA56072.1"
49 FT /translation="MSKSESPKEPEQLRKLFIGGLSFETTDESLRSHFEQWGTLTDCVV
50 FT MRDPNTKRSRGFGFVTYATVEEVDAAMNARPHKVDGRVVEPKRAVSREDSQRPGAHLTV
51 FT KKIFVGGIKEDTEEHHLRDYFEQYGKIEVIEIMTDRGSGKKRGFAFVTFDDHDSVDKIV
52 FT IQKYHTVNGHNCEVRKALSKQEMASASSSQRGRSGSGNFGGGRGGGFGGNDNFGRGGNF
53 FT SGRGGFGGSRGGGGYGGSGDGYNGFGNDGSNFGGGGSYNDFGNYNNQSSNFGPMKGGNF
54 FT GGRSSGPYGGGGQYFAKPRNQGGYGGSSSSSSYGSGRRF"
55 FT misc_feature 995
56 FT /note="alternative splice site"
57 FT polyA_signal 1180..1185
59 SQ Sequence 1198 BP; 334 A; 216 C; 336 G; 312 T; 0 other;
60 ttaaagtctc tcttcaccct gccgtcatgt ctaagtcaga gtctcctaaa gagcccgaac 60
61 agctgaggaa gctcttcatt ggagggttga gctttgaaac aactgatgag agcctgagga 120
62 gccattttga gcaatgggga acgctcacgg actgtgtggt aatgagagat ccaaacacca 180
63 agcgctctag gggctttggg tttgtcacat atgccactgt ggaggaggtg gatgcagcta 240
64 tgaatgcaag gccacacaag gtggatggaa gagttgtgga accaaagaga gctgtctcca 300
65 gagaagattc tcaaagacca ggtgcccact taactgtgaa aaagatattt gttggtggca 360
66 ttaaagaaga cactgaagaa catcacctaa gagattattt tgaacagtat ggaaaaattg 420
67 aagtgattga aatcatgact gaccgaggca gtggcaagaa aaggggcttt gcctttgtaa 480
68 cctttgacga ccatgactcc gtggataaga ttgtcattca gaaataccat actgtgaatg 540
69 gccacaactg tgaagttaga aaagccctgt caaagcaaga gatggctagt gcttcatcca 600
70 gccaaagagg tcgaagtggt tctggaaact ttggtggtgg tcgtggaggt ggtttcggtg 660
71 ggaatgacaa cttcggtcgt ggaggaaact tcagtggtcg tggtggcttt ggtggcagcc 720
72 gtggtggtgg tggatatggt ggcagtgggg atggctataa tggatttggc aatgatggaa 780
73 gcaattttgg aggtggtgga agctacaatg attttgggaa ttacaacaat cagtcttcaa 840
74 attttggacc catgaaggga ggaaattttg gaggcagaag ctctggcccc tatggcggtg 900
75 gaggccaata ctttgcaaaa ccacgaaacc aaggtggcta tggcggttcc agcagcagca 960
76 gtagctatgg cagtggcaga agattttaat tagggaggag tctgctacta gtcttatcag 1020
77 ctcttaaaaa cagaaactca tctgtccaag ttcgtggcag aaaggaacgt ccttgtgaag 1080
78 acctttatct gagccactgt acttcgttat cacgccatgc agtttacatg agctgttctg 1140
79 cagctcgaaa ttccattttg tgaatgggtt ttttttttta ataaactgta tttaactt 1198
81 ID HSHNRNPA standard; DNA; HUM; 5368 BP.
83 AC X12671;
85 SV X12671.1
87 DT 23-NOV-1989 (Rel. 21, Created)
88 DT 24-APR-1993 (Rel. 35, Last updated, Version 3)
90 DE Human gene for heterogeneous nuclear ribonucleoprotein (hnRNP) core
91 DE protein A1
93 KW hnRNP A1 proten; ribonucleoprotein; RNA binding protein.
95 OS Homo sapiens (human)
96 OC Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Mammalia; Eutheria;
97 OC Primates; Catarrhini; Hominidae; Homo.
99 RN [1]
100 RP 1-5368
101 RA Riva S.;
102 RT ;
103 RL Submitted (23-AUG-1988) to the EMBL/GenBank/DDBJ databases.
104 RL Riva S., Consiglio Nazionale Delle Ricerche, Istituto Di Genetica
105 RL Biochimica Ed Evoluzionistica CNR, Via Abbiategrasso 2D7, 27100 Pavia,
106 RL Italy.
108 RN [2]
109 RP 1-5368
110 RA Biamonti G., Buvoli M., Bassi M.T., Morandi C., Cobianchi F., Riva S.;
111 RT "Isolation of an active gene encoding human hnRNP protein A1";
112 RL J. Mol. Biol. 207:491-503(1988).
114 DR SWISS-PROT; P09651; ROA1_HUMAN.
116 FH Key Location/Qualifiers
118 FT source 1..5368
119 FT /db_xref="taxon:9606"
120 FT /organism="Homo sapiens"
121 FT /clone="pES5"
122 FT /tissue_type="liver"
123 FT /clone_lib="lambdaCh4A."
124 FT mRNA join(695..813,1377..1493,1789..1935,2084..2294,2388..2480,
125 FT 2567..2659,2794..2868,3806..3961,4252..4311,4543..5240)
126 FT CDS join(799..813,1377..1493,1789..1935,2084..2294,2388..2480,
127 FT 2567..2659,2794..2868,3806..3961,4252..4307)
128 FT /db_xref="SWISS-PROT:P09651"
129 FT /product="hnrnp a1 protein"
130 FT /protein_id="CAA31191.1"
131 FT /translation="MSKSESPKEPEQLRKLFIGGLSFETTDESLRSHFEQWGTLTDCVV
132 FT MRDPNTKRSRGFGFVTYATVEEVDAAMNARPHKVDGRVVEPKRAVSREDSQRPGAHLTV
133 FT KKIFVGGIKEDTEEHHLRDYFEQYGKIEVIEIMTDRGSGKKRGFAFVTFDDHDSVDKIV
134 FT IQKYHTVNGHNCEVRKALSKQEMASASSSQRGRSGSGNFGGGRGGGFGGNDNFGRGGNF
135 FT SGRGGFGGSRGGGGYGGSGDGYNGFGNDGSNFGGGGSYNDFGNYNNQSSNFGPMKGGNF
136 FT GGRSSGPYGGGGQYFAKPRNQGGYGGSSSSSSYGSGRRF"
137 FT exon 695..813
138 FT /number=1
139 FT misc_feature 695..695
140 FT /note="mRNA initiation site"
141 FT misc_feature 715..715
142 FT /note="mRNA initiation site"
143 FT misc_feature 735..735
144 FT /note="mRNA initiation site"
145 FT intron 814..1376
146 FT /number=1
147 FT exon 1377..1493
148 FT /number=2
149 FT intron 1494..1788
150 FT /number=2
151 FT exon 1789..1935
152 FT /number=3
153 FT intron 1936..2083
154 FT /number=3
155 FT exon 2084..2294
156 FT /number=4
157 FT intron 2295..2387
158 FT /number=4
159 FT exon 2388..2480
160 FT /number=5
161 FT intron 2481..2566
162 FT /number=5
163 FT exon 2567..2659
164 FT /number=6
165 FT intron 2660..2793
166 FT /number=6
167 FT exon 2794..2868
168 FT /number=7
169 FT intron 2869..3805
170 FT /number=7
171 FT exon 3806..3961
172 FT /number=8
173 FT intron 3962..4251
174 FT /number=8
175 FT exon 4252..4311
176 FT /number=9
177 FT intron 4312..4542
178 FT /number=9
179 FT exon 4543..5240
180 FT /number=10
182 SQ Sequence 5368 BP; 1476 A; 1052 C; 1270 G; 1570 T; 0 other;
183 gggattgaga gtgatcactc acgctaacgt ctgccctgtt cctgtatggt gaggccgcac 60
184 cacaagccac caccgccgcc gccttctgcg caacgccaac cgcccgccaa aacggatcct 120
185 tccctgcgcc tgcgcaacca atcttgggac cggacctttt ttctccgccc actacgcatg 180
186 cgcaaagcta ggacaaactc ccgccaacac gcaggcgccg taggttcact gcctactcct 240
187 gcccgccatt tcacgtgttc tcagaggcag gtggaacttc ttaatgcgcc tgcgcaaaac 300
188 tcgccatttt actacacgtg cggtcaacaa gagttcattg caaaaaaatt gttacctcct 360
189 agctgcttgt ctaatacata gtgttaatca tgctttgcca agcgacttga ctgtaatatt 420
190 tgcgcgtgga agattaaaaa gatgttaaac acccaaggta gattcaaatg tgaatgattg 480
191 gtcggttggc caatcagact ggttaacaat aacattactc gggaaccaat ggactccaag 540
192 gggtggagac ggcgtagaac gaccgaagga atgacgttac acagcaatgt ggcaccacag 600
193 gccaatagca gggggaagcg atttcaagta tccaatcaga gctgttctag ggcggagtct 660
194 accaatgccg aaagcgagga ggcggggtaa aaaagagagg gcgaaggtag gctggcagat 720
195 acgttcgtca gcttgctcct ttctgcccgt ggacgccgcc gaagaagcat cgttaaagtc 780
196 tctcttcacc ctgccgtcat gtctaagtca gaggtgagtt aggcgcgctt tcccacttga 840
197 attttttcct ctccctttcc tgaatcggta agatgctgct gggtttcgtt ccttgcacca 900
198 gcccattcta cagttccttc ggtcgctgcc acggcctacc cctcccaaag ttcaagtcgc 960
199 cattttgtcc tcttgatcgc catgaggccg ctctccgcca accatgtgtt atcatgcggg 1020
200 actcgttact cgtagcaaaa ttcttaggca cacaggatct ttgtcttttt ttaaaccttg 1080
201 ccttggtgag cgagttttct aaagagcgat tagtcccatt gtggagatgc acccctaccg 1140
202 cccaagcctt tgttgcgcgt gcgtcggaag gcgactaggg acgcatgcgc ttgcgatttc 1200
203 ctagcactcc caactccagc atacggcctc ccttgatagg cagaagcacg tgtcttgttg 1260
204 cgacctgaac gaacaataag tgctaggtac acagttggtg tctagttttt cttttcctcg 1320
205 atggaaattg tttcgtgttg tagcccattt aacacttccc cctcccccca ctctagtctc 1380
206 ctaaagagcc cgaacagctg aggaagctct tcattggagg gttgagcttt gaaacaactg 1440
207 atgagagcct gaggagccat tttgagcaat ggggaacgct cacggactgt gtggtaagat 1500
208 ttggaaggga caaagcagta aaacagccga tttccttggc ttatcttggt gcagtcttct 1560
209 ccgaatgctt atgaaagtag ttaatagcat tatagttaga gctttgttgg caaaggaacg 1620
210 tcctgctttg attttaaaag ctaacctctt aaatctaagg gtagtgggaa actggacgaa 1680
211 ctttttataa aaggctggtg taaagtttcc tattgcccta ttcaaagtta aaataacaaa 1740
212 agcttttgcg gtcagacttt gtgttacata aattaacact gttctcaggt aatgagagat 1800
213 ccaaacacca agcgctctag gggctttggg tttgtcacat atgccactgt ggaggaggtg 1860
214 gatgcagcta tgaatgcaag gccacacaag gtggatggaa gagttgtgga accaaagaga 1920
215 gctgtctcca gagaagtgag tgggtttttt ttcttcttct tcttaaactt acttggatat 1980
216 gtgctgctat gaacttaaga ttcgggagtt ttctaaactt accaaaattt tttattcgag 2040
217 tataggcttt gctaatctaa acctatggtt tttctcctat taggattctc aaagaccagg 2100
218 tgcccactta actgtgaaaa agatatttgt tggtggcatt aaagaagaca ctgaagaaca 2160
219 tcacctaaga gattattttg aacagtatgg aaaaattgaa gtgattgaaa tcatgactga 2220
220 ccgaggcagt ggcaagaaaa ggggctttgc ctttgtaacc tttgacgacc atgactccgt 2280
221 ggataagatt gtcagtaagt atcagatagt ggcatttagt aagggttcca caatctgtat 2340
222 ggcattctaa accctgatac catgttgtat ctatgttttt tttttagttc agaaatacca 2400
223 tactgtgaat ggccacaact gtgaagttag aaaagccctg tcaaagcaag agatggctag 2460
224 tgcttcatcc agccaaagag gtatgcttgt tgcttaatta aaccttaaag gtaactttga 2520
225 gttactccag tatgaatgat ttaatgctta aacttcatgt cttaaggtcg aagtggttct 2580
226 ggaaactttg gtggtggtcg tggaggtggt ttcggtggga atgacaactt cggtcgtgga 2640
227 ggaaacttca gtggtcgtgg tatgtatggt ttatctacat gtagttctga cttctcacca 2700
228 tctttgctat gaagatttta cagtacggga actgcattca gaatgtcact ttaagtccaa 2760
229 gtcatactta aaacttgaaa ctttttctta caggtggctt tggtggcagc cgtggtggtg 2820
230 gtggatatgg tggcagtggg gatggctata atggatttgg caatgatggt aagtttttta 2880
231 ggaataagta gagaaaaatt cctggcaacc tggatcttta gaataggtta gtagagacta 2940
232 aaattctggt gcatgtcaaa ctcaactttg cccataacac gcatgctgtg agcaggcctt 3000
233 cagccgttac acttgcacaa gttttcattg tcaaatactt ttgtcttatt gagaagaatt 3060
234 gtattcttgt aggtggttat ggaggaggcg gccctggtta ctctggagga agcagaggct 3120
235 atggaagtgg tggacagggt tatggaaacc agggcagtgg ctatggcggg agtggcagct 3180
236 atgacagcta taacaacgga ggcggaggcg gctttggcgg tggtagtggt aggtatccag 3240
237 tgatccaagt acttggtgtg acagctagat tagcctttta gagcttgggt tctggtgctg 3300
238 ttgaagcatt gtgtggtaca ctgcatggta tattaaaaac aaatgggctt gctatgctac 3360
239 ctcctcctag ctttaagctg gggccgcctc actcccaaat agtagagata agtggatagt 3420
240 gttgtctttg agttagatta gtatcataga aggatttagt attttaactc ctttgggacc 3480
241 ttaggcgctt agttgatgta tccaagatac ttctgcttgc tgtggccctg gatccgtgaa 3540
242 ggccttcaag gctgaagggt atgcttgtgc cactctgaaa atctctttat tttatgtcat 3600
243 ggtgagttag gccagttttc tttgtattac tggattattc aactgaatgc ctttcccaga 3660
244 gaatgaaatg caaagattgg agtcaccata gtttgggaga aaggaaggct gataactcaa 3720
245 ccttatttta ttctgactgc taaacagaat tggaaactaa catcatcctc aggtaacaga 3780
246 taaaggccct ctttcccatt cataggaagc aattttggag gtggtggaag ctacaatgat 3840
247 tttgggaatt acaacaatca gtcttcaaat tttggaccca tgaagggagg aaattttgga 3900
248 ggcagaagct ctggccccta tggcggtgga ggccaatact ttgcaaaacc acgaaaccaa 3960
249 ggtatggtat ctatgtaatt ttggataatg tcaaaagagt gtctgtagct actgctggga 4020
250 agaaagccct ttaactgcta tgtctgggca gcaaaacgtt tatagtttag aaccttcaga 4080
251 aagtgataat ttgatcacaa attagaaaaa tcatgggacc tctttaccac ctcccttgta 4140
252 gtagggccat ttttaaatgg ccagacactt gaatttaact tttattatcc caaatatgaa 4200
253 aacattactg ttggcacttt gaaactttaa aagaaaaatt gtacttttca ggtggctatg 4260
254 gcggttccag cagcagcagt agctatggca gtggcagaag attttaatta ggtaagtaag 4320
255 cacctttttg tgtgttgaca taatttttta aattgctgat gaacccaata accctaatgt 4380
256 agctgagcag tgcaacatag ttaacattat aattgcagta attgtggata taaagttaat 4440
257 attcagatca gcaaaatttg tgggaaacaa acttgatatt ggattgtagc cttgagtctt 4500
258 aatatgttta gattaacaac tctattccat attgttcaac aggaaacaaa gcttagcagg 4560
259 agaggagagc cagagaagtg acagggaagc tacaggttac aacagatttg tgaactcagc 4620
260 caagcacagt ggtggcaggg cctagctgct acaaagaaga catgttttag acaaatactc 4680
261 atgtgtatgg gcaaaaaact cgaggactgt atttgtgact aattgtataa caggttattt 4740
262 tagtttctgt tctgtggaaa gtgtaaagca ttccaacaaa gggttttaat gtagattttt 4800
263 ttttttgcac cccatgctgt tgattgctaa atgtaacagt ctgatcgtga cgctgaataa 4860
264 atgtcttttt tttaatgtgc tgtgtaaagt tagtctactc ttaagccatc ttggtaaatt 4920
265 tccccaacag tgtgaagtta gaattccttc agggtgatgc caggttctat ttggaattta 4980
266 tatacaacct gcttgggtgg agaagccatt gtcttcggaa accttggtgt agttgaactg 5040
267 atagttactg ttgtgacctg aagttcacca ttaaaaggga ttacccaagc aaaatcatgg 5100
268 aatggttata aaagtgattg ttggcacatc ctatgcaata tatctaaatt gaataatggt 5160
269 accagataaa attatagatg ggaatgaagc ttgtgtatcc attatcatgt gtaatcaata 5220
270 aacgatttaa ttctcttgaa tgaaatgaca actgtatgga tttgggactg gcagagattt 5280
271 ggactttccc tacccactcc ccctgataat aatgttgaat gcttctatca caattcaagt 5340
272 tcaaagctct gctagggaat agaaacta 5368
274 ID HSRNPA1 standard; RNA; HUM; 1747 BP.
276 AC X06747;
278 SV X06747.1
280 DT 08-JUN-1988 (Rel. 16, Created)
281 DT 12-SEP-1993 (Rel. 36, Last updated, Version 2)
283 DE Human hnRNP core protein A1
285 KW hnRNP A1 protein; ribonucleoprotein.
287 OS Homo sapiens (human)
288 OC Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Mammalia; Eutheria;
289 OC Primates; Catarrhini; Hominidae; Homo.
291 RN [1]
292 RP 1-1747
293 RA Riva S.;
294 RT ;
295 RL Submitted (26-JAN-1988) to the EMBL/GenBank/DDBJ databases.
296 RL Riva S., Istituto Di Genetica Biochimica, Ed Evoluzionistica - CNR, Via
297 RL Abbiategrasso 207, 27100 Pavia, Italy.
299 RN [2]
300 RP 1-1747
301 RX MEDLINE; 88233978.
302 RA Buvoli M., Biamonti G., Ghetti A., Riva S., Bassi M.T., Horandi C.;
303 RT "cDNA cloning of human hnRNP protein A1 reveals the existence of multiple
304 RT mRNA isoforms.";
305 RL Nucleic Acids Res. 16:3751-3770(1988).
307 DR SWISS-PROT; P09651; ROA1_HUMAN.
309 CC pRP15 sequence encodes the protein A1 type alpha isoform,
310 CC pRP12 (truncated at the 5' end, respectively) the beta isoform
312 FH Key Location/Qualifiers
314 FT source 1..1747
315 FT /db_xref="taxon:9606"
316 FT /organism="Homo sapiens"
317 FT /tissue_type="fibroblast"
318 FT /clone_lib="lambdagt11"
319 FT /clone="pRP15"
320 FT CDS 86..1048
321 FT /db_xref="SWISS-PROT:P09651"
322 FT /note="protein A1-alpha (AA 1-320)"
323 FT /protein_id="CAA29922.1"
324 FT /translation="MSKSESPKEPEQLRKLFIGGLSFETTDESLRSHFEQWGTLTDCVV
325 FT MRDPNTKRSRGFGFVTYATVEEVDAAMNARPHKVDGRVVEPKRAVSREDSQRPGAHLTV
326 FT KKIFVGGIKEDTEEHHLRDYFEQFGKIEVIEIMTDRGSGKKKGFAFVTFDDHDSVDKIV
327 FT IQKYHTVNGHNCEVRKALSKQEMASASSSQRGRSGSGNFGGGRGGGFGGNDNFGRGGNF
328 FT SGRGGFGGSRGGGGYGGSGDGYNGFGNDGSNFGGGGSYNDFGNYNNQSSNFGPMKGGNF
329 FT GGRSSGPYGGGGQYFAKPRNQGGYGGSSSSSSYGSGRRF"
330 FT misc_feature 209..209
331 FT /note="5' end of clone pRP12"
332 FT variation 467..469
333 FT /note="uau (Tyr) is uuu (Phe) in pRP12 (protein A1-beta)"
334 FT variation 521..523
335 FT /note="agg (Arg) is aag (Lys) in pRP12 (protein A1-beta)"
336 FT misc_feature 1365..1370
337 FT /note="polyA signal"
338 FT misc_feature 1726..1731
339 FT /note="polyA signal"
340 FT polyA_site 1747..1747
341 FT /note="polyA site"
343 SQ Sequence 1747 BP; 512 A; 300 C; 466 G; 469 T; 0 other;
344 cgaaaggtta caaaggcaaa gccccttttc tgcccgtgga cgccgccgaa gaagcatcgt 60
345 taaagtctct cttcaccctg ccgtcatgtc taagtcagag tctcctaaag agcccgaaca 120
346 gctgaggaag ctcttcattg gagggttgag ctttgaaaca actgatgaga gcctgaggag 180
347 ccattttgag caatggggaa cgctcacgga ctgtgtggta atgagagatc caaacaccaa 240
348 gcgctctagg ggctttgggt ttgtcacata tgccactgtg gaggaggtgg atgcagctat 300
349 gaatgcaagg ccacacaagg tggatggaag agttgtggaa ccaaagagag ctgtctccag 360
350 agaagattct caaagaccag gtgcccactt aactgtgaaa aagatatttg ttggtggcat 420
351 taaagaagac actgaagaac atcacctaag agattatttt gaacagtttg gaaaaattga 480
352 agtgattgaa atcatgactg accgaggcag tggcaagaaa aagggctttg cctttgtaac 540
353 ctttgacgac catgactccg tggataagat tgtcattcag aaataccata ctgtgaatgg 600
354 ccacaactgt gaagttagaa aagccctgtc aaagcaagag atggctagtg cttcatccag 660
355 ccaaagaggt cgaagtggtt ctggaaactt tggtggtggt cgtggaggtg gtttcggtgg 720
356 gaatgacaac ttcggtcgtg gaggaaactt cagtggtcgt ggtggctttg gtggcagccg 780
357 tggtggtggt ggatatggtg gcagtgggga tggctataat ggatttggca atgatggaag 840
358 caattttgga ggtggtggaa gctacaatga ttttgggaat tacaacaatc agtcttcaaa 900
359 ttttggaccc atgaagggag gaaattttgg aggcagaagc tctggcccct atggcggtgg 960
360 aggccaatac tttgcaaaac cacgaaacca aggtggctat ggcggttcca gcagcagcag 1020
361 tagctatggc agtggcagaa gattttaatt aggaaacaaa gcttagcagg agaggagagc 1080
362 cagagaagtg acagggaagc tacaggttac aacagatttg tgaactcagc caagcacagt 1140
363 ggtggcaggg cctagctgct acaaagaaga catgttttag acaaatactc atgtgtatgg 1200
364 gcaaaaaact cgaggactgt atttgtgact aattgtataa caggttattt tagtttctgt 1260
365 tctgtggaaa gtgtaaagca ttccaacaaa gggttttaat gtagattttt tttttgcacc 1320
366 ccatgctgtt gattgctaaa tgtaacagtc tgatcgtgac gctgaataaa tgtctttttt 1380
367 ttaatgtgct gtgtaaagtt agtctactct taagccatct tggtaaattt ccccaacagt 1440
368 gtgaagttag aattccttca gggtgatgcc aggttctatt tggaatttat atacaacctg 1500
369 cttgggtgga gaagccattg tcttcggaaa ccttggtgta gttgaactga tagttactgt 1560
370 tgtgacctga agttcaccat taaaagggat tacccaagca aaatcatgga atggttataa 1620
371 aagtgattgt tggcacatcc tatgcaatat atctaaattg aataatggta ccagataaaa 1680
372 ttatagatgg gaatgaagct tgtgtatcca ttatcatgtg taatcaataa acgatttaat 1740
373 tctcttg 1747
375 ID HSUPIR1 standard; RNA; HUM; 924 BP.
377 AC X04347;
379 SV X04347.1
381 DT 18-NOV-1986 (Rel. 10, Created)
382 DT 12-JUL-1995 (Rel. 44, Last updated, Version 3)
384 DE Human liver mRNA fragment DNA binding protein UPI homologue
385 DE (C-terminus)
387 KW DNA binding protein.
389 OS Homo sapiens (human)
390 OC Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Mammalia; Eutheria;
391 OC Primates; Catarrhini; Hominidae; Homo.
393 RN [1]
394 RP 1-924
395 RX MEDLINE; 87053868.
396 RA Riva S., Morandi C., Tsoulfas P., Pandolfo M., Biamonti G., Merrill B.,
397 RA Williams K.R., Multhaup G., Beyreuther K., Werr H., Heinrich B.,
398 RA Schaefer K.P.;
399 RT "Mammalian single-stranded DNA binding protein UP I is derived from the
400 RT hnRNP cor protein A1";
401 RL EMBO J. 5:2267-2273(1986).
403 DR SWISS-PROT; P09651; ROA1_HUMAN.
405 CC Pos. 1-216 is homologous to UPI (aa 126-195); pos. 184-273 is
406 CC homologous to V8 protease peptide AI/II (aa 185-214)
408 CC Data kindly reviewed (08-NOV-1986) by K. Beyreuther
410 FH Key Location/Qualifiers
412 FT source 1..924
413 FT /db_xref="taxon:9606"
414 FT /organism="Homo sapiens"
415 FT CDS <1..591
416 FT /codon_start=1
417 FT /db_xref="SWISS-PROT:P09651"
418 FT /note="ORF protein; C-terminal (aa 125-319; 196aa)"
419 FT /protein_id="CAA27874.1"
420 FT /translation="FEQYGKIEVIEIMTDPGSGKKRGFAFVTFDDHDSVDKIVIQKYHT
421 FT VNGHNCEVRKALSKQEMASASSSQRGRSGSGNFGGGRGGGFGGNDNFGRGGNFSGRGGF
422 FT GGSRGGGGYGGSGDGYNGFGNDGSNFGGGGSYNDFGNYNNQSSNFGPMKGGNFGGRSSG
423 FT PYGGGGQYFAKPRNQGGYGGSSSSSSYGSGRRF"
424 FT misc_feature 208..210
425 FT /note="dimethylated arginin"
426 FT polyA_signal 908..913
427 FT /note="pot. polyA signal"
428 FT polyA_site 924..924
429 FT /note="polyA site"
431 SQ Sequence 924 BP; 262 A; 148 C; 266 G; 248 T; 0 other;
432 tttgaacagt atggaaaaat tgaagtgatt gaaatcatga ctgacccagg cagtggcaag 60
433 aaaaggggct ttgcctttgt aacctttgac gaccatgact ccgtggataa gattgtcatt 120
434 cagaaatacc atactgtgaa tggccacaac tgtgaagtta gaaaagccct gtcaaagcaa 180
435 gagatggcta gtgcttcatc cagccaaaga ggtcgaagtg gttctggaaa ctttggtggt 240
436 ggtcgtggag gtggtttcgg tgggaatgac aacttcggtc gtggaggaaa cttcagtggt 300
437 cgtggtggct ttggtggcag ccgtggtggt ggtggatatg gtggcagtgg ggatggctat 360
438 aatggatttg gcaatgatgg aagcaatttt ggaggtggtg gaagctacaa tgattttggg 420
439 aattacaaca atcagtcttc aaattttgga cccatgaagg gaggaaattt tggaggcaga 480
440 agctctggcc cctatggcgg tggaggccaa tactttgcaa aaccacgaaa ccaaggtggc 540
441 tatggcggtt ccagcagcag cagtagctat ggcagtggca gaagatttta attaggaaac 600
442 aagcttggca ggagaggaga gccagagaag tgacagggaa gctacaggtt acaacagatt 660
443 tgtgaactca gccaagcaca gtggtggcag ggcctagctg ctacaaagaa gacatgtttt 720
444 agacaaatac tcatgtgtat gggcaaaaaa ctcgaggact gtatttgtga ctaattgtat 780
445 aacaggttat tttagtttct gttctgtgga aagtgaaagc attccaacaa agggttttaa 840
446 tgtagatttt ttttttttgc accccatgct gttgattgct aaatgtaaca gtctgatcgt 900
447 gacgctgaat aaatgtcttt tttt 924