This file is indexed.

/usr/share/EMBOSS/test/embl/vrt.dat is in emboss-test 6.6.0-1.

This file is owned by root:root, with mode 0o644.

The actual contents of the file can be viewed below.

  1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
ID   L07770; SV 1; linear; mRNA; STD; VRT; 1684 BP.
XX
AC   L07770;
XX
DT   12-DEC-1992 (Rel. 34, Created)
DT   17-APR-2005 (Rel. 83, Last updated, Version 8)
XX
DE   Xenopus laevis rhodopsin mRNA, complete cds.
XX
KW   G protein-coupled receptor; phototransduction protein; retinal protein;
KW   rhodopsin; transmembrane protein.
XX
OS   Xenopus laevis (African clawed frog)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Amphibia;
OC   Batrachia; Anura; Pipoidea; Pipidae; Xenopodinae; Xenopus; Xenopus.
XX
RN   [1]
RP   1-1684
RA   Knox B.E., Scalzetti L.C., Batni S., Wang J.Q.;
RT   "Molecular cloning of the abundant rhodopsin and transducin from Xenopus
RT   laevis";
RL   Unpublished.
XX
RN   [2]
RP   1-1684
RX   DOI; 10.1074/jbc.271.6.3179.
RX   PUBMED; 8621718.
RA   Batni S., Scalzetti L., Moody S.A., Knox B.E.;
RT   "Characterization of the Xenopus rhodopsin gene";
RL   J Biol Chem 271(6):3179-3186(1996).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1684
FT                   /organism="Xenopus laevis"
FT                   /mol_type="mRNA"
FT                   /dev_stage="adult"
FT                   /tissue_lib="lambda-ZAPII"
FT                   /tissue_type="retina"
FT                   /db_xref="taxon:8355"
FT   CDS             110..1174
FT                   /codon_start=1
FT                   /product="rhodopsin"
FT                   /note="gene accession number U23808"
FT                   /db_xref="GOA:P29403"
FT                   /db_xref="InterPro:IPR000276"
FT                   /db_xref="InterPro:IPR000732"
FT                   /db_xref="InterPro:IPR001760"
FT                   /db_xref="InterPro:IPR017452"
FT                   /db_xref="InterPro:IPR019477"
FT                   /db_xref="UniProtKB/Swiss-Prot:P29403"
FT                   /protein_id="AAC42232.1"
FT                   /translation="MNGTEGPNFYVPMSNKTGVVRSPFDYPQYYLAEPWQYSALAAYMF
FT                   LLILLGLPINFMTLFVTIQHKKLRTPLNYILLNLVFANHFMVLCGFTVTMYTSMHGYFI
FT                   FGQTGCYIEGFFATLGGEVALWSLVVLAVERYMVVCKPMANFRFGENHAIMGVAFTWIM
FT                   ALSCAAPPLFGWSRYIPEGMQCSCGVDYYTLKPEVNNESFVIYMFIVHFTIPLIVIFFC
FT                   YGRLLCTVKEAAAQQQESATTQKAEKEVTRMVVIMVVFFLICWVPYAYVAFYIFTHQGS
FT                   NFGPVFMTVPAFFAKSSAIYNPVIYIVLNKQFRNCLITTLCCGKNPFGDEDGSSAATSK
FT                   TEASSVSSSQVSPA"
FT   misc_feature    189..1684
FT                   /note="sequenced from clone pXOP71"
FT   variation       1224
FT                   /note="clone pX0P5 contained deletion from bp 1224-1534"
XX
SQ   Sequence 1684 BP; 426 A; 431 C; 339 G; 488 T; 0 other;
     ggtagaacag cttcagttgg gatcacaggc ttctagggat cctttgggca aaaaagaaac        60
     acagaaggca ttctttctat acaagaaagg actttataga gctgctacca tgaacggaac       120
     agaaggtcca aatttttatg tccccatgtc caacaaaact ggggtggtac gaagcccatt       180
     cgattaccct cagtattact tagcagagcc atggcaatat tcagcactgg ctgcttacat       240
     gttcctgctc atcctgcttg ggttaccaat caacttcatg accttgtttg ttaccatcca       300
     gcacaagaaa ctcagaacac ccctaaacta catcctgctg aacctggtat ttgccaatca       360
     cttcatggtc ctgtgtgggt tcacggtgac aatgtacacc tcaatgcacg gctacttcat       420
     ctttggccaa actggttgct acattgaagg cttctttgct acacttggtg gtgaagtggc       480
     cctctggtca ctggtagtat tggccgttga aagatatatg gtggtctgca agcccatggc       540
     caacttccga ttcggggaga accatgctat tatgggtgta gccttcacat ggatcatggc       600
     tttgtcttgt gctgctcctc ctctcttcgg atggtccaga tacatcccag agggaatgca       660
     atgctcatgc ggagtagact actacacact gaagcctgag gtcaacaatg aatcctttgt       720
     tatctacatg ttcattgtcc acttcaccat tcccctgatt gtcatcttct tctgctatgg       780
     tcgcctgctc tgcactgtca aagaggctgc agcccagcaa caggaatctg ctaccaccca       840
     gaaggctgag aaagaggtca ccagaatggt tgttatcatg gtcgttttct tcctgatctg       900
     ttgggtgccc tatgcctatg tggcattcta catcttcacc caccagggct ctaactttgg       960
     cccagtcttc atgaccgtcc cagctttctt tgccaagagc tctgctatct acaatcctgt      1020
     catctacatt gtcttgaaca aacagttccg taactgcttg atcaccaccc tgtgctgtgg      1080
     aaagaatcca ttcggtgatg aagatggctc ctctgcagcc acctccaaga cagaagcttc      1140
     ttctgtctct tccagccagg tgtctcctgc ataagagctt caccagggct gtctcagggt      1200
     ccgctgcctc acacaattcc catcacttaa gccctgtcta cttgttgcga aggcaaagaa      1260
     ttccacagtt ttaatattta cccccattct gcccaacctt ggacactgta agagctgacc      1320
     ccattactgc tgggaaggcc caagctttgt tgcattctga tgtgatcctt tcagcagaaa      1380
     atgggtggat tcaatgaatt tcaccaaggc tgtacataac aataacatta gtctgaaggc      1440
     acctcccacc cagagaatgc aacacttatt tatctctgtc ttttcttgac atattgatgc      1500
     tgcttctatt catggtcact aacaaaaagt cccattttac aatgcaactg aaagtaatgt      1560
     atttttgtaa tataataaca tatttcatgc aatctcctct gcttattggc aaggtctgat      1620
     atagtgagga tagacagcca gaccccttgc attaaaatcc tgtattaaaa atttctttgc      1680
     aagt                                                                   1684
//
ID   U23808; SV 2; linear; genomic DNA; STD; VRT; 8914 BP.
XX
AC   U23808;
XX
DT   23-APR-1995 (Rel. 43, Created)
DT   21-APR-2006 (Rel. 87, Last updated, Version 9)
XX
DE   Xenopus laevis rhodopsin gene, complete cds.
XX
KW   .
XX
OS   Xenopus laevis (African clawed frog)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Amphibia;
OC   Batrachia; Anura; Pipoidea; Pipidae; Xenopodinae; Xenopus; Xenopus.
XX
RN   [1]
RP   1-8914
RX   DOI; 10.1074/jbc.271.6.3179.
RX   PUBMED; 8621718.
RA   Batni S., Scalzetti L., Moody S.A., Knox B.E.;
RT   "Characterization of the Xenopus rhodopsin gene";
RL   J Biol Chem 271(6):3179-3186(1996).
XX
RN   [2]
RP   1-8914
RA   Batni S., Scalzetti L., Knox B.E.;
RT   ;
RL   Submitted (30-MAR-1995) to the INSDC.
RL   Barry E. Knox, Biochemistry and Molecular Biology, SUNY HSC at Syracuse,
RL   750 E. Adams St., Syracuse, NY 13210, USA
XX
RN   [3]
RC   Sequence update by submitter
RP   1-8914
RA   Batni S., Scalzetti L., Knox B.E.;
RT   ;
RL   Submitted (20-APR-2006) to the INSDC.
RL   Barry E. Knox, Biochemistry and Molecular Biology, SUNY HSC at Syracuse,
RL   750 E. Adams St., Syracuse, NY 13210, USA
XX
CC   On Apr 20, 2006 this sequence version replaced gi:773645.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..8914
FT                   /organism="Xenopus laevis"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:8355"
FT   promoter        5128..5360
FT   misc_feature    5128..5158
FT                   /note="XOP4 cis element"
FT   misc_feature    5191..5215
FT                   /note="XOP3 cis element"
FT   misc_feature    5225..5239
FT                   /note="Ret1 cis element"
FT   misc_feature    5254..5270
FT                   /note="Bat1 cis element"
FT   misc_feature    5277..5302
FT                   /note="NRE cis element"
FT   misc_feature    5309..5318
FT                   /note="Ret4 cis element"
FT   mRNA            join(5361..5830,6079..6247,6849..7014,7265..7504,
FT                   8210..8867)
FT                   /product="rhodopsin"
FT   CDS             join(5470..5830,6079..6247,6849..7014,7265..7504,
FT                   8210..8338)
FT                   /codon_start=1
FT                   /product="rhodopsin"
FT                   /note="cDNA sequence deposited under GenBank Accession
FT                   Number L07770"
FT                   /db_xref="GOA:P29403"
FT                   /db_xref="InterPro:IPR000276"
FT                   /db_xref="InterPro:IPR000732"
FT                   /db_xref="InterPro:IPR001760"
FT                   /db_xref="InterPro:IPR017452"
FT                   /db_xref="InterPro:IPR019477"
FT                   /db_xref="UniProtKB/Swiss-Prot:P29403"
FT                   /protein_id="AAC59901.1"
FT                   /translation="MNGTEGPNFYVPMSNKTGVVRSPFDYPQYYLAEPWQYSALAAYMF
FT                   LLILLGLPINFMTLFVTIQHKKLRTPLNYILLNLVFANHFMVLCGFTVTMYTSMHGYFI
FT                   FGQTGCYIEGFFATLGGEVALWSLVVLAVERYMVVCKPMANFRFGENHAIMGVAFTWIM
FT                   ALSCAAPPLFGWSRYIPEGMQCSCGVDYYTLKPEVNNESFVIYMFIVHFTIPLIVIFFC
FT                   YGRLLCTVKEAAAQQQESATTQKAEKEVTRMVVIMVVFFLICWVPYAYVAFYIFTHQGS
FT                   NFGPVFMTVPAFFAKSSAIYNPVIYIVLNKQFRNCLITTLCCGKNPFGDEDGSSAATSK
FT                   TEASSVSSSQVSPA"
XX
SQ   Sequence 8914 BP; 2521 A; 1879 C; 1845 G; 2668 T; 1 other;
     ggatccatgt tagtagcctt caaatcgagt ttagtctaat ttgaatcaaa ttcgataaga        60
     gttttcaagt cagcaaaaat tgtacgagtt ttagatgtcc aatttttttt tctataagta       120
     atttagagta tattcgaatt taatcgagtt taaaaaaatt cacattaatt ccaaattcga       180
     cctttaatca atgtgcctcc caggatgagt gccagactat gaactcctcc aacctattta       240
     ttcatcaacc agatttgaca gtgggagacc taagaatcca gtgattgaat gagtttaatg       300
     catgaaaagg ttggcttggt tatttgcagc acagagagaa accaataagg agaaagtaga       360
     gttgaggtgg gacattcatg aatactcacc taaaggactt tgattgggat tcagccaata       420
     atatcccatc caccacattt actgagctta gaacattctc caaacatgag cagtaaaggg       480
     acaaagagta atggctttaa aggagaacta aaccctaaaa ctgaatgtgt aaaaatgtta       540
     tattttatag acagaactta ttgcaccagc ctaagtttca gcttgtcaat agcagcaatg       600
     atccagaact tcaaacttgt cacagggggt caccatcttg gacagtgtct gtgacactca       660
     catgctcagt gggctctgag cagctgttga gaagctaagc ttaggggtcg tcactaatta       720
     tccagcagaa aatgaggttg gtctgtaata aaagctgatg ctacagggct taaattctga       780
     tgctaattgc actggtttct gtgctgccat gtagtaatta tctgtattaa ttactaatca       840
     gccttatatt gtgacatttc tgttctatgt gtactgtata ttgtgagtgg gtccctaagc       900
     tcagtaagtg acagcagcac agagcatgtg cagtgaatca gcagaaaaga agacggggag       960
     ctactggggc atctttggag acacagatct ttactgctaa agggctgtgg ttgcattggg      1020
     ctggtacaga agcccaaaac ataatgtaca acatttctat ctaattcttt agttaagctt      1080
     tagttctcca ttaagtgtgc gtccatgttc tacatgcagg agatgcacat gcatagaatg      1140
     aaactgataa gtaaatttag gcaaatattt tgaacttgag attctggact gaccttctta      1200
     accaatgatt ccataggtgc atatgggaga tctttgacag cgggtattgt cactatagga      1260
     tagaaactcc acctcccttc tgatgatttg tgagctaact gatgtttggt catattcatg      1320
     taagaacgac tactccgcat gttatttggc tgctctgcaa atgcaatagc agcatgaaag      1380
     gtgtagtggt gtcaggctga ggaggagtag cacatttgta ctgtgcctgc atgtgtcttc      1440
     aaaggaagaa gatgaagaag ggactgaaga agtccagaga aatgagatgt taaatgttgc      1500
     aacacaaacc aactggagtt ttattccttt cacaaaaaca tgtaagattt ggggcagttc      1560
     ttaaaaataa gtcttgttta atttaccctg gtctccataa ctgtcttgac ccaagttgat      1620
     gatccaacag caggagcccg tgttgaagga tgacaattac aaatcacaag atgactgtag      1680
     tgatgggcga atctgacccg tttggcttta ccgaaaattt gggaaatgaa aatttgctaa      1740
     aattcattgg gcgtgatttt ttgatgtgtg acaatttttt tcacccattg cagtctatgg      1800
     gcatcctttt aagctttgaa acttgacgaa aaattttgct catgactatg atgggttatg      1860
     aatcaagggg ggattaggtt tcatattgtc cttccttcat tctactgacg tggaaggaaa      1920
     agccaaggtg tgtgcacctt ctaccttggc tgataacacc atcatcggcc ataatcatcc      1980
     atctaaatat ttataggaat gctatgcaga ttattaattt aagatccttc accccaataa      2040
     cttcaactac atacccatgc agaaatagcc atacatgtat tacatatgag cagcctagaa      2100
     tatgaattac tgtatttgga gtctggaata actggttctt aagtgaaagc tataggactt      2160
     gatgcatcaa ttcttttgtg gttatcccta taaaagtacc acttcactat tgtacctgtt      2220
     tggctaaact ctcaataata ctgaaaatgt tgccatatca gagtcgggtg tcacaatgtc      2280
     aggcatcttt acaattctct gcatcagagg acaaaaagga ggaaccattt ttgcacccat      2340
     tgtgcctagg gttgccacct gaccagtatt ttaccagcct ggctggtaaa aatgatggtt      2400
     gatcccaatg ttattaatag ggaaaacaga taaatatata ggaaggccgg tattttatcc      2460
     agaaaaggtg gcgaccctaa ttgtgccctc tgaaggtccc actgccctgg tgtgtatgcc      2520
     catttactgt gccctttacc cttcccacca ggaatgtcca acctgcaaca ctccagagga      2580
     tgttgctata caactcccag catatagtga tgggtgaatt tgcgccgttt cgcttcgccg      2640
     aaaaatgtgc gaatttccca ctaaatggcg tataattcac aaaactgcac cggcgtctcg      2700
     tttttgatgc tggcgtccgt tttttttacg ccgatgcccg tttttgatgc cgatgcctgt      2760
     ttttaacgcc agcgtccgtt tttttggacg cctgtgacaa tttttttgac gcccatttcg      2820
     caaatttatt caccggcggc gaatcacgca aattcgccac aaatttgcgc ctggcgaata      2880
     aattcgccca tcactacaca ggagtcagta gctattgatg ggatgctgct agttgtagag      2940
     caacaaccta tgttggttca ttgattgtct atctgtgatt ctggtacatg aaacatcact      3000
     ctcatagtct ctccctgtgc aatcacagtg gccttgtttc ctgttagact gcaagctctt      3060
     ggaccttgca gaactgttcc ctcctgctaa caaaccaatg ccktggttct cagctacaga      3120
     gaaagctgac tgatcacgtg taggaaagaa caggagcgct gggggcagag agactgttta      3180
     tttggttgca tcttaatccc cggatgattg acaggattag tgaaatgtat ctctaccctg      3240
     cactctctgt ctgctaatta caaccagttg ctgaatactt caccttcttg cccagggatt      3300
     ttaacctgca aattcactaa ctggccatgc aaagcaatga gcaactttgc tgactagtgc      3360
     cttgacataa ggcaagttat cagctaaaat aaaagatttt atttaccttc gaataccttt      3420
     gtcaaattct tatacagtat aattagattt gtttgaaaga tagatagatc atctactcta      3480
     aatgattact aaggtgctca ctaatcaacc cgcattactg ggggttaatt cttcttgcag      3540
     aaatgattgg ttccagcatg aaaaaattct tatctgaatc tttttttctc taagcgtgtg      3600
     atttgcatct gggagtcaat attgggctgg ataattgtgc agagttttga gggtctgggc      3660
     cagagttgga gagctttgag agtttataag cctataacga gctttatgtt ggatttgtca      3720
     caggtacgga tagacattaa atgcattcac atattctaaa tcagggcttt tccgcctgtc      3780
     ctctcaaatg ttttatgatt taccattaaa ctgccattct caggcataaa gagaaactga      3840
     ggtgtgttca ctagtactaa ttctgaggaa tacatgccca gtagtgctgt ttgaatgaca      3900
     agctgattta ttataggagt aggaagtaca aaaaaaatcc acaattaaaa atatttctac      3960
     tcacaattgg aatttttttc gcagttttcc agtataagtt tacgctcctc aatcaggcaa      4020
     ccttccagag gggcaaagat ctttatacat tgctcacaaa tgagttgaac tggcagctca      4080
     cgaatgggac atggagctgt catttactat gctccccaat gcaagtgcta gagcactaag      4140
     gggtgcaaaa agagagctcc ttcgtgctaa ttctaaaagc attgatcctg gggtccagct      4200
     gtgctgtgga agggaaaggg tcaataaagg ggacatctgc aatcttcccc ttccccacat      4260
     gaatacagtg ctgcttgatg caggaactga tgaatcccgg tctctctgct ccatttttga      4320
     gtacagagac ttgtgaaatc tagagaactg caagacatga ttcaaagtgc taagtgcaaa      4380
     aaacaatggt ggtttatatc tgtctttgta ctttacactt gttcacttac agtccctaca      4440
     attgtgtcta gtgcagtggt ccccaaccag tagctcgtta gtaacatgtt gctcccccaa      4500
     ccccttggat gttgctccca atggcctcaa aacaattgct tatttttcaa ttccaggcaa      4560
     gttttggttg cataaaaacc aggtctatgg ccaaacagag ccccctctgg gctgcaaatc      4620
     cacaaagggc taccaaatag acaatcatat tctttattag gcaccccaag ggcttttttc      4680
     acgcttgtgc tgctccgcaa ctctttttac atttgaatgt ggcttatggg ttaaaaaggt      4740
     gcaacacaaa caaataatct attatttaca cactagtcaa gactggtgct cagctgtggt      4800
     ttgaagattc taattcaatg aactaatggt aaccagggcc ggatttgtat ttctgcagcc      4860
     cctaggccat gcggtcctaa cgtctgtcca cgacgagtct tattgccatc cacccgcaac      4920
     tcccgcaagt gcaaattttg gagcactggt gctcttcagc aagtggctgg gcggcatgcc      4980
     gtccctaaaa gttcgccgcc ctaggcacag gcctttgtgg cctctccaca aatccaagcc      5040
     tgatggtaac taaatgtaga gggaactgag taaaccccaa aaatggctgc cctggctcct      5100
     acaatatgga attatctcct gtaggtcaga cctggatttc ttcctgtcac ttttaaatac      5160
     actttcttct tgtgtgttta acagagagag agattgacag gtgtagactt aatacgttta      5220
     agggaagcca attaacactt tgcaatttta gcttggatta cagtgattaa tagtgcgcta      5280
     aatcctttgt tgctgacgct gggggttgca agcttactcc aggtgggact ttaaaaggac      5340
     gaggggacag tgggtcatac tgtagaacag cttcagttgg gatcacaggc ttctagggat      5400
     cctttgggca aaaaagaaac acagaaggca ttctttctat acaagaaagg actttataga      5460
     gctgctacca tgaacggaac agaaggtcca aatttttatg tccccatgtc caacaaaact      5520
     ggggtggtac gaagcccatt cgattaccct cagtattact tagcagagcc atggcaatat      5580
     tcagcactgg ctgcttacat gttcctgctc atcctgcttg ggttaccaat caacttcatg      5640
     accttgtttg ttaccatcca gcacaagaaa ctcagaacac ccctaaacta catcctgctg      5700
     aacctggtat ttgccaatca cttcatggtc ctgtgtgggt tcacggtgac aatgtacacc      5760
     tcaatgcacg gctacttcat ctttggccaa actggttgct acattgaagg cttctttgct      5820
     acacttggtg gtaagttcca atgggctttc gtcactgata ttgttgtagc aataaattct      5880
     tggaaagctc gtaagggaac aagctaccag ggaaagggtt atagggctga aaaggaatat      5940
     cagtactttc tatgttctcc agcagagtgt agtgcatacc atgttagaga aagttcaaca      6000
     tgtaatactg tgaggggcca aattgcctgg gttgagtcat gttaaccttt tgccttttcc      6060
     tgttcttttt actaacaggt gaagtggccc tctggtcact ggtagtattg gccgttgaaa      6120
     gatatatggt ggtctgcaag cccatggcca acttccgatt cggggagaac catgctatta      6180
     tgggtgtagc cttcacatgg atcatggctt tgtcttgtgc tgctcctcct ctcttcggat      6240
     ggtccaggta aatatatata acatcagtca gcatatccct agaaaagtat atctaatgat      6300
     acaactacgg tatatataaa cttgtagaaa catccaccaa agttacagca tgagttaagg      6360
     aagagtacat agaaggtcag ctaatgcttt ggaaaaatac aatagaaggt cagctaatgc      6420
     agaggttacc aaactccttt gggggctcca agctttggat ggaagcccag tttgaggtca      6480
     aggtttgaga tttgttaatt actcctggaa ctagaaaaga gttagttgcc cacatcttat      6540
     aacagcgaga caatactgac aattggtagt tgttgctgaa attcagcttt ctacacccca      6600
     ctacagccat tggctgcaat attgagttca gcttggagag aactcaatcc aggattgcac      6660
     ttctacattt tattccagta ttctatttat cagatgagct tgtgcttaaa ccccaaggac      6720
     tcaatgctga tgaataatgt taggatttac agttcaataa caattgagag atacaggatg      6780
     tctattcctg taatgtgggt aacagagtat gtgcttgttg gctctgacac tatattgtcc      6840
     ttgtgcagat acatcccaga gggaatgcaa tgctcatgcg gagtagacta ctacacactg      6900
     aagcctgagg tcaacaatga atcctttgtt atctacatgt tcattgtcca cttcaccatt      6960
     cccctgattg tcatcttctt ctgctatggt cgcctgctct gcactgtcaa agaggtgagt      7020
     agtcattatc atttggtcat ggtcacaacc caatccaact agttctaaac atagaccctc      7080
     caggtgttat tgaactgtta ctacttcttg gacttctcta caaccttgtt tgactgactg      7140
     gagagagaaa gatcagtaaa atctgattat gaagagaaca aagtcctaca ccttgtatgc      7200
     ccaatatcta ctactagact gttgctcttc tgtcctaact tctcttatct tacccatttc      7260
     ataggctgca gcccagcaac aggaatctgc taccacccag aaggctgaga aagaggtcac      7320
     cagaatggtt gttatcatgg tcgttttctt cctgatctgt tgggtgccct atgcctatgt      7380
     ggcattctac atcttcaccc accagggctc taactttggc ccagtcttca tgaccgtccc      7440
     agctttcttt gccaagagct ctgctatcta caatcctgtc atctacattg tcttgaacaa      7500
     acaggtacta aactacttcc aagtctgttc ttatttttta atcagcagtt tgtcaacttt      7560
     atgtatattt cctctcctat atgggtttcc aagggtttct atgtaatata taggatacca      7620
     agaattctga ccaccagctc ttgttgagac tcccaccagt ctacagctgt catctaggaa      7680
     tggtggaagt ttcagttcaa ccaaagcaaa gagtgctaaa catgagctga ttaactatga      7740
     ctcccattgt ctatagctgc agttaaaaaa agtcatggag aatgttctgc tacttatgat      7800
     gactgtgttg ccttaggatc agcatacaac ttggggtagt aagggcattt gtcttaggtc      7860
     ccaaaatgga aggggctttt agaggagaaa cacagataaa actacaaaga ccaccagtgt      7920
     tttagtattt taaaacacgg gtaataaccc ttgagcaaac ttcgtgtgct ggattaatta      7980
     ttacgtacct ttcgttgggg gtgccgtcct cctatgatcc atgcaccgtg aacgttgaaa      8040
     gagggaccag gtgtgcatct gcatttcgtt tggcttagta ttttacaacc ttcgtataca      8100
     tcaatatgca atgcattact tatttttagg gtagtagaga ctaaatgagt acaacaatac      8160
     agaagagatg aatggactag ataatgactg ttctcctttc tctccccagt tccgtaactg      8220
     cttgatcacc accctgtgct gtggaaagaa tccattcggt gatgaagatg gctcctctgc      8280
     agccacctcc aagacagaag cttcttctgt ctcttccagc caggtgtctc ctgcataaga      8340
     gcttcaccag ggctgtctca gggtccgctg cctcacacaa ttcccatcac ttaagccctg      8400
     tctacttgtt gcgaaggcaa agaattccac agttttaata tttaccccca ttctgcccaa      8460
     ccttggacac tgtaagagct gaccccatta ctgctgggaa ggcccaagct ttgttgcatt      8520
     ctgatgtgat cctttcagca gaaaatgggt ggattcaatg aatttcacca aggctgtaca      8580
     taacaataac attagtctga aggcacctcc cacccagaga atgcaacact tatttatctc      8640
     tgtcttttct tgacatattg atgctgcttc tattcatggt cactaacaaa aagtcccatt      8700
     ttacaatgca actgaaagta atgtattttt gtaatataat aacatatttc atgcaatctc      8760
     ctctgcttat tggcaaggtc tgatatagtg aggatagaca gccagacccc ttgcattaaa      8820
     atcctgtatt aaaaatttct ttgcaagtaa aaaaaaaaac acaaaaagtc aaatgtctta      8880
     ttcgatttat ttcacacttt gattgtctgg ttat                                  8914
//
ID   AF123456; SV 2; linear; mRNA; STD; VRT; 1510 BP.
XX
AC   AF123456;
XX
DT   24-MAR-1999 (Rel. 59, Created)
DT   13-APR-2012 (Rel. 112, Last updated, Version 6)
XX
DE   Gallus gallus doublesex and mab-3 related transcription factor 1 (DMRT1)
DE   mRNA, partial cds.
XX
KW   .
XX
OS   Gallus gallus (chicken)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
OC   Archosauria; Dinosauria; Saurischia; Theropoda; Coelurosauria; Aves;
OC   Neognathae; Galliformes; Phasianidae; Phasianinae; Gallus.
XX
RN   [1]
RP   1-1510
RX   DOI; 10.1038/6769.
RX   PUBMED; 10080173.
RA   Nanda I., Shan Z.H., Schartl M., Burt D.V., Koehler M., Nothwang H.-G.,
RA   Gruetzner F., Paton I.R., Windsor D., Dunn I., Engel W., Staeheli P.,
RA   Mizuno S., Haaf T., Schmid M.;
RT   "300 million years of conserved synteny between chicken Z and human
RT   chromosome 9";
RL   Nat Genet 21(3):258-259(1999).
XX
RN   [2]
RP   1-1510
RX   PUBMED; 10894941.
RA   Nanda I., Zend-Ajusch E., Shan Z., Grutzner F., Schartl M., Burt D.W.,
RA   Koehler M., Fowler V.M., Goodwin G., Schneider W.J., Mizuno S., Dechant G.,
RA   Haaf T., Schmid M.;
RT   "Conserved synteny between the chicken Z sex chromosome and human
RT   chromosome 9 includes the male regulatory gene DMRT1: a comparative
RT   (re)view on avian sex determination";
RL   Cytogenet. Cell Genet. 89(1-2):67-78(2000).
XX
RN   [3]
RP   1-1510
RA   Haaf T., Shan Z.H.;
RT   ;
RL   Submitted (25-JAN-1999) to the INSDC.
RL   Max-Planck Institute for Molecular Genetics, Ihnestr. 73, Berlin 14195,
RL   Germany
XX
RN   [4]
RC   Sequence update by submitter
RP   1-1510
RA   Shan Z.;
RT   ;
RL   Submitted (23-DEC-1999) to the INSDC.
RL   MPI of Molecular Genetics, Ihnestr. 73, Berlin 14195, Germany
XX
CC   On Dec 23, 1999 this sequence version replaced gi:4454562.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1510
FT                   /organism="Gallus gallus"
FT                   /chromosome="Z"
FT                   /map="Zp21"
FT                   /mol_type="mRNA"
FT                   /db_xref="taxon:9031"
FT   gene            <1..1510
FT                   /gene="DMRT1"
FT                   /note="expressed in genital ridges of both males and
FT                   females prior to the sexual determination, restricted to
FT                   the male gonads after sex determination; DMRT1 is a
FT                   candidate sex determination factor in vertebrates"
FT   CDS             <1..936
FT                   /codon_start=1
FT                   /gene="DMRT1"
FT                   /product="doublesex and mab-3 related transcription factor
FT                   1"
FT                   /note="cDMRT1"
FT                   /db_xref="GOA:Q9PTQ7"
FT                   /db_xref="InterPro:IPR001275"
FT                   /db_xref="InterPro:IPR022114"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q9PTQ7"
FT                   /protein_id="AAF19666.1"
FT                   /translation="PAAGKKLPRLPKCARCRNHGYSSPLKGHKRFCMWRDCQCKKCSLI
FT                   AERQRVMAVQVALRRQQAQEEELGISHPVPLPSAPEPVVKKSSSSSSCLLQDSSSPAHS
FT                   TSTVAAAAASAPPEGRMLIQDIPSIPSRGHLESTSDLVVDSTYYSSFYQPSLYPYYNNL
FT                   YNYSQYQMAVATESSSSETGGTFVGSAMKNSLRSLPATYMSSQSGKQWQMKGMENRHAM
FT                   SSQYRMCSYYPPTSYLGQGVGSPTCVTQILASEDTPSYSESKARVFSPPSSQDSGLGCL
FT                   SSSESTKGDLECEPHQEPGAFAVSPVLEGE"
XX
SQ   Sequence 1510 BP; 320 A; 433 C; 472 G; 285 T; 0 other;
     ccggcggcgg gcaagaagct gccgcgtctg cccaagtgtg cccgctgccg caaccacggc        60
     tactcctcgc cgctgaaggg gcacaagcgg ttctgcatgt ggcgggactg ccagtgcaag       120
     aagtgcagcc tgatcgccga gcggcagcgg gtgatggccg tgcaggttgc actgaggagg       180
     cagcaagccc aggaagagga gctggggatc agccaccctg tacccctgcc cagtgcccct       240
     gagccagttg tcaagaagag cagcagcagc agctcctgtc tcctgcagga cagcagcagc       300
     cctgctcact ccacgagcac ggtggcagca gcagcagcga gcgcaccacc agagggacgg       360
     atgctcattc aggacatccc ttccatcccc agcagagggc acttggagag cacgtctgat       420
     ttggttgtgg actccaccta ctacagcagt ttttaccagc catccctgta tccttactat       480
     aacaacctgt acaactactc ccagtaccaa atggcagtgg ccactgagtc ttcctcaagt       540
     gagacagggg gtacgtttgt agggtcagcc atgaaaaaca gccttcgaag cctcccagca       600
     acatacatgt caagccagtc aggaaaacag tggcagatga agggaatgga gaaccgccat       660
     gccatgagct cccagtaccg gatgtgctcc tactacccgc ccacctcata cctgggccag       720
     ggggttggca gtcccacctg cgtcacacag atactggcct cggaggacac cccctcctac       780
     tcagagtcga aagcgagagt gttttcgccg cccagcagcc aggactcggg cctggggtgc       840
     ctgtcgagca gcgagagcac caagggagac ctggagtgcg agccccacca agagcccggc       900
     gccttcgcgg tgagcccggt tcttgagggc gagtaggcgc ggcgtcgggc ggctgctgcg       960
     cggcgttcac tgttgccttg ttctgttggg gttgcggggg ggcgttgggt ttcttctttc      1020
     cggggcgggg ggggcacggc ggggccgcgg ccgggccggc ggggcggggc ggggcgggac      1080
     ggggcggggc ggagccgcgc gggggccgca gtccgggccg gggccgccgt cgggtctcgg      1140
     cccgctcccg tcggggcgga gcgtccgacg atcggcctcc acgaaacgcg gtgccgtgat      1200
     gtgtttgtag tggttcctcg taggctccag acgttttctc ctcgtatcgc caaattaacg      1260
     cgttttgcat attacagttg agtgcctcga cttagattgc aatataagcg gccagcaaac      1320
     aagtctcaaa aaaaagttac gtgcgtttct gcgagtgtta ttttgttaag aacggctcac      1380
     agtgtcctct tcctgtgtta cagaagccaa cctgaaatga aactagtctg gaaaaattca      1440
     ttgttctctg tagttgcagc tgtacctgaa ataaaaatgt tattgatgac tgaaaaaaaa      1500
     aaaaaaaaaa                                                             1510
//
ID   AF123457; SV 1; linear; mRNA; STD; INV; 1634 BP.
XX
AC   AF123457;
XX
DT   31-JAN-2001 (Rel. 66, Created)
DT   15-APR-2005 (Rel. 83, Last updated, Version 3)
XX
DE   Toxoplasma gondii enolase (ENO2) mRNA, complete cds.
XX
KW   .
XX
OS   Toxoplasma gondii
OC   Eukaryota; Alveolata; Apicomplexa; Coccidia; Eucoccidiorida; Eimeriorina;
OC   Sarcocystidae; Toxoplasma.
XX
RN   [1]
RP   1-1634
RX   DOI; 10.1006/jmbi.2001.4730.
RX   PUBMED; 11399076.
RA   Dzierszinski F., Mortuaire M., Dendouga N., Popescu O., Tomavo S.;
RT   "Differential expression of two plant-like enolases with distinct enzymatic
RT   and antigenic properties during stage conversion of the protozoan parasite
RT   Toxoplasma gondii";
RL   J. Mol. Biol. 309(5):1017-1027(2001).
XX
RN   [2]
RP   1-1634
RA   Dzierszinski F., Tomavo S.;
RT   "Tachyzoite 76K strain enolase of Toxoplasma gondii";
RL   Unpublished.
XX
RN   [3]
RP   1-1634
RA   Dzierszinski F., Tomavo S.;
RT   ;
RL   Submitted (25-JAN-1999) to the INSDC.
RL   INSERM, 369, Rue Jules Guesde BP 39, Villeneuve D'Ascq 59651, France
XX
DR   EnsemblGenomes; TGME49_068850; Toxoplasma_gondii.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1634
FT                   /organism="Toxoplasma gondii"
FT                   /strain="76K"
FT                   /mol_type="mRNA"
FT                   /dev_stage="tachyzoite"
FT                   /db_xref="taxon:5811"
FT   CDS             27..1361
FT                   /codon_start=1
FT                   /gene="ENO2"
FT                   /product="enolase"
FT                   /db_xref="GOA:Q9BPL7"
FT                   /db_xref="InterPro:IPR000941"
FT                   /db_xref="InterPro:IPR020809"
FT                   /db_xref="InterPro:IPR020810"
FT                   /db_xref="InterPro:IPR020811"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q9BPL7"
FT                   /protein_id="AAG60329.1"
FT                   /translation="MVAIKDITARQILDSRGNPTVEVDLLTDGGCFRAAVPSGASTGIY
FT                   EALELRDKDQTKFMGKGVMKAVENIHKIIKPALIGKDPCDQKGIDKLMVEELDGTKNEW
FT                   GWCKSKLGANAILAVSMACCRAGAAAKGMPLYKYIATLAGNPTDKMVMPVPFFNVINGG
FT                   SHAGNKVAMQEFMIAPVGASTIQEAIQIGAEVYQHLKVVIKKKYGLDATNVGDEGGFAP
FT                   NISGATEALDLLMEAIKVSGHEGKVKIAADVAASEFFLQDDKVYDLDFKTPNNDKSQRK
FT                   TGEELRNLYKDLCQKYPFVSIEDPFDQDDFHSYAQLTNEVGEKVQIVGDDLLVTNPTRI
FT                   EKAVQEKACNGLLLKVNQIGTVSESIEACQLAQKNKWGVMVSHRSGETEDSFIADLVVG
FT                   LRTGQIKTGAPCRSERLCKYNQLMRIEESLGSDCQYAGAGFRHPN"
XX
SQ   Sequence 1634 BP; 396 A; 463 C; 457 G; 318 T; 0 other;
     tctaccgtta ctcaacttcc aacaaaatgg tggccatcaa ggacatcact gctcgtcaga        60
     tcctcgactc ccgaggaaac ccgaccgtcg aggttgactt gttgaccgat ggcggctgct       120
     tccgtgccgc tgtccccagc ggcgcatcca ctggcatcta cgaggcgctt gagctccgtg       180
     acaaggacca aactaagttc atgggcaagg gtgtgatgaa ggccgtggag aacatccaca       240
     agattatcaa gccggcgctt attggcaagg acccgtgcga ccagaagggt attgacaagc       300
     tgatggtcga ggagctcgat ggaactaaga acgagtgggg ctggtgcaag tcgaagctcg       360
     gcgcgaacgc gatcctggcc gtctcgatgg cttgctgccg cgccggcgct gctgccaagg       420
     gcatgcccct gtacaagtac attgccactt tggctggaaa cccgacagac aagatggtaa       480
     tgcccgtccc gttcttcaac gtcatcaacg gcggctccca cgcaggcaac aaggtcgcga       540
     tgcaggagtt catgatcgcc cccgtcggcg cctccacaat ccaagaggcg atccagatcg       600
     gcgcggaagt gtaccagcac ctgaaggtcg tcattaagaa gaagtatggc ctcgacgcca       660
     cgaacgtcgg cgacgagggt ggcttcgccc ccaacatcag cggcgccacg gaggccctcg       720
     acttgctgat ggaggccatc aaggtgtctg gtcacgaagg caaggtcaag attgccgccg       780
     acgtcgccgc ttccgagttc ttcctccagg acgacaaagt ctatgaccta gacttcaaga       840
     ctccgaacaa cgacaagtcg caacgcaaga ctggcgaaga gcttcgcaac ctgtacaagg       900
     acctgtgcca gaagtatccc ttcgtgtcca tcgaggaccc gttcgaccag gacgacttcc       960
     acagctacgc tcagctcacc aacgaggttg gcgagaaggt ccaaatcgtc ggcgacgacc      1020
     tcctggtcac caacccgacg cgcattgaga aggccgttca ggagaaagcg tgcaacggcc      1080
     tgcttctcaa ggtgaaccag attggcacag tcagcgagtc tatcgaggcc tgccagcttg      1140
     cccagaagaa caagtggggc gttatggttt ctcaccgctc cggtgagact gaggactcct      1200
     tcatcgctga cctcgtcgtc ggtctccgca ccgggcaaat caagactggc gccccgtgca      1260
     gatccgagcg tctctgcaag tacaaccagc tgatgcgtat cgaagagtcg ctcggctccg      1320
     actgtcagta cgccggcgct ggcttccgcc atcccaacta agtggaaacg gagtttcgac      1380
     tacccaactg ctcaattggg gctgggtggt ttgtccactc tgcaacaagg gcgtgacgag      1440
     atcgttgcac atgcaactgc cttttttgtg cttggtggga aggagcactt tcgcaggtgc      1500
     agcaccgagt tgcggttgat gggaatttcg gaactgattt gtttcttgca tgccatcacc      1560
     gaaggaacga gcagtttcgt tgataatatt ggaaagtctt ttgaaaaaaa aaaaaaaaaa      1620
     aaaaaaaaaa aaaa                                                        1634
//