File: inv.dat

package info (click to toggle)
emboss 6.6.0%2Bdfsg-9
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 571,548 kB
  • sloc: ansic: 460,579; java: 29,439; perl: 13,573; sh: 12,754; makefile: 3,284; csh: 706; asm: 351; xml: 239; pascal: 237; modula3: 8
file content (1665 lines) | stat: -rw-r--r-- 112,520 bytes parent folder | download | duplicates (7)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
1372
1373
1374
1375
1376
1377
1378
1379
1380
1381
1382
1383
1384
1385
1386
1387
1388
1389
1390
1391
1392
1393
1394
1395
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
1417
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
1484
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
1497
1498
1499
1500
1501
1502
1503
1504
1505
1506
1507
1508
1509
1510
1511
1512
1513
1514
1515
1516
1517
1518
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
1560
1561
1562
1563
1564
1565
1566
1567
1568
1569
1570
1571
1572
1573
1574
1575
1576
1577
1578
1579
1580
1581
1582
1583
1584
1585
1586
1587
1588
1589
1590
1591
1592
1593
1594
1595
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
1619
1620
1621
1622
1623
1624
1625
1626
1627
1628
1629
1630
1631
1632
1633
1634
1635
1636
1637
1638
1639
1640
1641
1642
1643
1644
1645
1646
1647
1648
1649
1650
1651
1652
1653
1654
1655
1656
1657
1658
1659
1660
1661
1662
1663
1664
1665
ID   Z11115; SV 3; linear; genomic DNA; STD; INV; 40700 BP.
XX
AC   Z11115;
XX
PR   Project:PRJNA13758;
XX
DT   04-MAY-1991 (Rel. 28, Created)
DT   18-MAY-2012 (Rel. 112, Last updated, Version 115)
XX
DE   Caenorhabditis elegans Cosmid ZK637
XX
KW   HTG.
XX
OS   Caenorhabditis elegans
OC   Eukaryota; Metazoa; Nematoda; Chromadorea; Rhabditida; Rhabditoidea;
OC   Rhabditidae; Peloderinae; Caenorhabditis.
XX
RN   [1]
RP   1-40700
RG   Caenorhabditis elegans Sequencing Consortium
RA   ;
RT   "Genome sequence of the nematode C. elegans: a platform for investigating
RT   biology";
RL   Science 282(5396):2012-2018(1998).
XX
RN   [2]
RP   1-40700
RG   WormBase Consortium
RA   Craxton M.;
RT   ;
RL   Submitted (04-MAY-1991) to the INSDC.
RL   Nematode Sequencing Project: Sanger Institute, Hinxton, Cambridge CB10 1SA,
RL   UK and The Genome Institute at Washington University, St. Louis, MO 63110,
RL   USA. E-mail: help@wormbase.org
XX
DR   EMBL-CON; BX284603.
DR   Ensembl-Gn; ZK637.1; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.10; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.11; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.12; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.13; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.14; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.15; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.2; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.3; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.4; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.5; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.7; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.8; Caenorhabditis_elegans.
DR   Ensembl-Gn; ZK637.9; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.1.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.1.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.10.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.10.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.11.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.11.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.12.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.12.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.13.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.13.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.14; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.15; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.2.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.2.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.3.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.3.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.4; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.5; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.7b.1; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.7b.2; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.8a; Caenorhabditis_elegans.
DR   Ensembl-Tr; ZK637.9b; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.10; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.10.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.10.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.11; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.11.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.11.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.12; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.12.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.12.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.13; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.13.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.13.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.14; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.15; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.2.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.2.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.3; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.3.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.3.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.4; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.5; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.7; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.7b.1; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.7b.2; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.8; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.8a; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.9; Caenorhabditis_elegans.
DR   EnsemblGenomes; ZK637.9b; Caenorhabditis_elegans.
DR   WormBase; WBGene00014987; ZK637.6.
DR   WormBase; WBGene00168562; ZK637.16.
DR   WormBase; WBGene00174886; ZK637.17.
DR   WormBase; WBGene00194716; ZK637.18.
DR   WormBase; WBGene00200181; ZK637.19.
DR   WormBase; WBGene00201389; ZK637.20.
XX
CC   Protein-coding gene structures below are the result of integration
CC   and manual review of the following types of data: ab initio
CC   predictions by Genefinder (P. Green and L. Hillier, pers. comm.);
CC   alignments to published proteins and cDNAs; genome sequence
CC   conservation with other nematodes (e.g. to C. briggsae using WABA:
CC   Genome Res. 2000. 10:1115-1125); sequence features (such as
CC   trans-splice and polyA sites).
CC   
CC   Sources of data: large-scale EST projects of Yuji Kohara
CC   (http://www.ddbj.nig.ac.jp/c-elegans/html/CE_INDEX.html); ORFeome
CC   cloning project (http://worfdb.dfci.harvard.edu); RST large-scale
CC   sequencing project (Genome Res. 2009. 19:2334-2342); IST library
CC   (Science. 2004. 303:540-3); RT-PCR EST set (Ewing B. Green P. 2010
CC   Unpublished); UTRome EST data submission (UTRome v1 Mangone M.
CC   Piano F. 2009); TEC-RED data (PNAS 2004. 101:1650-1655); RNA Deep
CC   sequencing data (454 read clusters - Makedonka Mitreva,
CC   unpublished; Illumina sequence data, Genome Res. 2009. 19:657-66);
CC   Numerous data sets from the modENCODE project (Science. 2010.
CC   330:1775-87); Individual C. elegans Nucleotide Database
CC   submissions; Personal communications with C. elegans researchers;
CC   
CC   Non-Coding gene structures below are derived using the following
CC   methods and data: ab initio prediction of tRNAs by tRNAscan-SE
CC   (Nucl. Acids. Res., 25, 955-964); integration and appraisal of
CC   miRNAs from miRBase (http://www.mirbase.org); integration and
CC   appraisal of RFAM predictions (rfam.sanger.ac.uk); 21U-RNAs (Cell.
CC   2006. 127:1193-1207); modENCODE data (Science. 2010. 330:1775-87);
CC   manual curation of novel published ncRNAs from the literature.
CC   
CC   Current sequence finishing criteria for the C. elegans genome
CC   sequencing consortium are that all bases are either sequenced
CC   unambiguously on both strands, or on a single strand with both a
CC   dye primer and dye terminator reaction, from distinct subclones.
CC   Exceptions are indicated by an explicit note.
CC   
CC   For a graphical representation of this sequence and its analysis
CC   see:- http://www.wormbase.org/perl/ace/elegans/seq/sequence?
CC   name=ZK637;class=Sequence
CC   
CC   IMPORTANT: This sequence is not the entire insert of clone ZK637.
CC   It may be shorter because we only sequence overlapping
CC   sections once, or longer because we arrange for a small
CC   overlap between neighbouring submissions.
CC   The start of this sequence (1..180) overlaps with the end of
CC   sequence Z22175.
CC   The end of this sequence (40697..40700) overlaps with the start of
CC   sequence Z11126.
CC   
CC   [040212 dl] Sequence correction: Substitution A-> @ 39218
CC   
CC   [100415] Sequence correction: insertion 1 bases aacacccgaGggggctca
CC   @ 4309
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..40700
FT                   /organism="Caenorhabditis elegans"
FT                   /strain="Bristol N2"
FT                   /mol_type="genomic DNA"
FT                   /clone="ZK637"
FT                   /db_xref="taxon:6239"
FT   ncRNA           10277..10297
FT                   /gene="21ur-14900"
FT                   /locus_tag="CELE_ZK637.16"
FT                   /standard_name="ZK637.16"
FT                   /product="RNA transcript 21ur-14900"
FT                   /note="21U RNA gene"
FT                   /ncRNA_class="other"
FT   ncRNA           complement(15810..15830)
FT                   /gene="21ur-13808"
FT                   /locus_tag="CELE_ZK637.17"
FT                   /standard_name="ZK637.17"
FT                   /product="RNA transcript 21ur-13808"
FT                   /note="21U RNA gene"
FT                   /ncRNA_class="other"
FT   ncRNA           complement(21488..21625)
FT                   /gene="ZK637.19"
FT                   /locus_tag="CELE_ZK637.19"
FT                   /standard_name="ZK637.19"
FT                   /product="RNA transcript ZK637.19"
FT                   /note="C. elegans probable non-coding RNA"
FT                   /ncRNA_class="other"
FT   ncRNA           complement(25111..25254)
FT                   /gene="ZK637.20"
FT                   /locus_tag="CELE_ZK637.20"
FT                   /standard_name="ZK637.20"
FT                   /product="RNA transcript ZK637.20"
FT                   /note="C. elegans probable non-coding RNA"
FT                   /ncRNA_class="other"
FT   CDS             join(29818..30078,30127..30263,30310..30394,30744..31280,
FT                   31331..31673,32243..32391)
FT                   /gene="trxr-2"
FT                   /locus_tag="CELE_ZK637.10"
FT                   /standard_name="ZK637.10"
FT                   /product="Protein TRXR-2"
FT                   /note="Partially confirmed by transcript evidence"
FT                   /note="Thioredoxin reductase"
FT                   /db_xref="GOA:P30635"
FT                   /db_xref="InterPro:IPR001327"
FT                   /db_xref="InterPro:IPR004099"
FT                   /db_xref="InterPro:IPR006338"
FT                   /db_xref="InterPro:IPR012999"
FT                   /db_xref="InterPro:IPR013027"
FT                   /db_xref="InterPro:IPR016156"
FT                   /db_xref="InterPro:IPR023753"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30635"
FT                   /db_xref="WormBase:WBGene00014028"
FT                   /protein_id="CAA77459.1"
FT                   /translation="MLLSTFKRHLPIRRLFSSNKFDLIVIGAGSGGLSCSKRAADLGAN
FT                   VALIDAVEPTPHGHSWGIGGTCANVGCIPKKLMHQAAIVGKELKHADKYGWNGIDQEKI
FT                   KHDWNVLSKNVNDRVKANNWIYRVQLNQKKINYFNAYAEFVDKDKIVITGTDKNKTKNF
FT                   LSAPNVVISTGLRPKYPNIPGAELGITSDDLFTLASVPGKTLIVGGGYVALECAGFLSA
FT                   FNQNVEVLVRSIPLKGFDRDCVHFVMEHLKTTGVKVKEHVEVERVEAVGSKKKVTFTGN
FT                   GGVEEYDTVIWAAGRVPNLKSLNLDNAGVRTDKRSGKILADEFDRASCNGVYAVGDIVQ
FT                   DRQELTPLAIQSGKLLADRLFSNSKQIVRFDGVATTVFTPLELSTVGLTEEEAIQKHGE
FT                   DSIEVFHSHFTPFEYVVPQNKDSGFCYVKAVCTRDESQKILGLHFVGPNAAEVIQGYAV
FT                   AFRVGISMSDLQNTIAIHPCSSEEFVKLHITKRSGQDPRTQGCCG"
FT   CDS             complement(join(32542..33021,33416..33785,33833..33933))
FT                   /gene="cdc-25.3"
FT                   /locus_tag="CELE_ZK637.11"
FT                   /standard_name="ZK637.11"
FT                   /product="Protein CDC-25.3"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="CDC25/string"
FT                   /db_xref="GOA:P30634"
FT                   /db_xref="InterPro:IPR000751"
FT                   /db_xref="InterPro:IPR001763"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30634"
FT                   /db_xref="WormBase:WBGene00000388"
FT                   /protein_id="CAA77456.1"
FT                   /translation="MCVDVPCENCIVRNDGLRLKCSECAEGSSKLFPRQNRQHSSAISH
FT                   ISNSSPPTRKRSIDGGYTSGTDSANTSEIVIKKRLTFSKKSHSTSEIETWNAHLQVDYH
FT                   LETVTPSCSTVYQKITSETLIEIMQKLSQIEFMQKYILIDCRYDYEYNGGHIKGAQSLF
FT                   NPETAADFFFNKDGSKKINRIPIFYCEYSQKRGPTMANNLREVDRKLNSNIYPRCDYEE
FT                   IYLLEGGYKNFYAFTRGLEKEQRVQLCEPDNYVIMFDDRYKAELRKHQFHKKNVSKPMK
FT                   KWSSTTSVISILTTSGTRISTLRQTCDPIHEHDAH"
FT   CDS             complement(join(38545..38830,39129..39322))
FT                   /gene="glb-1"
FT                   /locus_tag="CELE_ZK637.13"
FT                   /standard_name="ZK637.13"
FT                   /product="Protein GLB-1"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="Globin"
FT                   /db_xref="GOA:P30627"
FT                   /db_xref="InterPro:IPR000971"
FT                   /db_xref="InterPro:IPR009050"
FT                   /db_xref="InterPro:IPR012085"
FT                   /db_xref="InterPro:IPR012292"
FT                   /db_xref="PDB:2WTG"
FT                   /db_xref="PDB:2WTH"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30627"
FT                   /db_xref="WormBase:WBGene00014030"
FT                   /protein_id="CAA77458.2"
FT                   /translation="MSMNRQEISDLCVKSLEGRMVGTEAQNIENGNAFYRYFFTNFPDL
FT                   RVYFKGAEKYTADDVKKSERFDKQGQRILLACHLLANVYTNEEVFKGYVRETINRHRIY
FT                   KMDPALWMAFFTVFTGYLESVGCLNDQQKAAWMALGKEFNAESQTHLKNSNLPHV"
FT   CDS             complement(join(4452..4729,4826..4975,5022..5079))
FT                   /gene="ZK637.14"
FT                   /locus_tag="CELE_ZK637.14"
FT                   /standard_name="ZK637.14"
FT                   /product="Protein ZK637.14"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="Zinc finger, C3HC4 type (RING finger)"
FT                   /db_xref="GOA:P30631"
FT                   /db_xref="InterPro:IPR001841"
FT                   /db_xref="InterPro:IPR013083"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30631"
FT                   /db_xref="WormBase:WBGene00014031"
FT                   /protein_id="CAA77447.1"
FT                   /translation="MSERDAIRAFSHMLETIFVRMRAEGTGSQTDAMQRWLDLYNVGSL
FT                   PIDKKSYKALRLMDRETTDQQKEDATCAICLDNLQNNVDIPEDHVIKEELKIDPTTFGT
FT                   TVIVMPCKHRFHYFCLTLWLEAQQTCPTCRQKVKTDKEVEEEERQRNLEELHDSMYG"
FT   CDS             join(36148..36306,36471..36668,36720..36842,36887..36988,
FT                   37039..37197)
FT                   /gene="ZK637.15"
FT                   /locus_tag="CELE_ZK637.15"
FT                   /standard_name="ZK637.15"
FT                   /product="Protein ZK637.15"
FT                   /note="Predicted"
FT                   /db_xref="UniProtKB/TrEMBL:Q23556"
FT                   /db_xref="WormBase:WBGene00014032"
FT                   /protein_id="CAA77457.2"
FT                   /translation="MECVNCDCTVKTMDNLDQAIRALLQRGKHVNRMMDNEKLIREARR
FT                   MEDVQQLKMQIPKPVDKKPRPPPSENNLKLISCEETCMDETLKNSSKPRMIYNKQLGRA
FT                   ESIDFDVPSLSYESSEKCAGETSPYTSASVSNSKKATSSSKFTKSEITTITELTTSTFK
FT                   KSNNSSGGALVLDNHYLINNDDGTVKKLPMKVYVKQRLEDGSLDVQLVFFDENSQKVMD
FT                   ISMLVNGKKIRNVQFCGKDGKLVN"
FT   CDS             join(3794..3918,4033..4234,5884..5988)
FT                   /gene="ZK637.2"
FT                   /locus_tag="CELE_ZK637.2"
FT                   /standard_name="ZK637.2"
FT                   /product="Protein ZK637.2"
FT                   /note="contains similarity to Interpro domain IPR008560
FT                   (Protein of unknown function DUF842, eukaryotic)"
FT                   /note="Confirmed by transcript evidence"
FT                   /db_xref="InterPro:IPR008560"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30629"
FT                   /db_xref="WormBase:WBGene00014022"
FT                   /protein_id="CAA77449.2"
FT                   /translation="MSNSTMEATQMKVKLAVDEMIDDLDKTYLRDMQKSMFQCSARCCD
FT                   NKKTTRDAVENCVESCNDGMKKAQGYLEKELGGLQDQLSRCAMTCYDKLVQQFGPDVNK
FT                   YSESQKLSFNEKLDSCVSVCADDHIKLIPAIKKRFAKNT"
FT   CDS             join(6272..6466,6524..6643,7347..7659,7715..7776,
FT                   7825..8154,8768..9253,9312..9473,9780..9911)
FT                   /gene="tag-256"
FT                   /locus_tag="CELE_ZK637.3"
FT                   /standard_name="ZK637.3"
FT                   /product="Protein TAG-256"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="C. elegans TAG-256 protein; contains similarity to
FT                   Interpro domain IPR024881 (T-cell immunomodulatory
FT                   protein)"
FT                   /db_xref="GOA:P30639"
FT                   /db_xref="InterPro:IPR024881"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30639"
FT                   /db_xref="WormBase:WBGene00014023"
FT                   /protein_id="CAA77450.1"
FT                   /translation="MKKILPIIWLINLVSGSLSLEKKAPDLLGKVCAFGDFNADRNTDI
FT                   LVFANGTLTINYQETKLLDVLEASKFTPGTSFAISKPSLNADFVECSVGDFNGDSRLDV
FT                   LVSIRDKDTEIYNHTLWTSEIEDEKEIFRPFHVAMLQQHAMAIDVSDDGWTDVLGFYPN
FT                   GSMFCTGFNKEGKYNLLVNGCKHEFVAFPEKLNIYPGMPHLFVDLNSDLIADIVFMTKE
FT                   SDGSLFMSVWQKTKISWQFRDWVPKLTPAQYPFVGAPVVMDVDSDGELDILVPICREDE
FT                   CSHITQMASWSKTKLWGLVACDMQDYTVIKEPFSRVIFRVGEFSLDSFPDMVVIAQATR
FT                   ANTRPVIKVMDNAECTKCEKNGTRRFEIRAQENIQPKNMSLGVIKMGTFFDLLEDGSLD
FT                   LLVEYEYGGQTRFGFIYCPDKGDTTFLKVQVFTGVCSDRCNPKSNEIGSSISMTGACAS
FT                   FSMTDGWGGSTQSVACQVPASSNRALYLPFLLYGLGRSPNFVDELNIAIPKYADRKEDW
FT                   KHSLKQIVPNSRIIVLPPSDQYPHWTSRLYVTPSALIVQSLAVIALVCCMLLMVVVFLH
FT                   YREKKEDRYERQQQSHRFHFDAM"
FT   CDS             join(10249..10317,10370..10437,10487..10540,10596..10692)
FT                   /gene="ZK637.4"
FT                   /locus_tag="CELE_ZK637.4"
FT                   /standard_name="ZK637.4"
FT                   /product="Protein ZK637.4"
FT                   /note="Confirmed by transcript evidence"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30637"
FT                   /db_xref="WormBase:WBGene00014024"
FT                   /protein_id="CAA77451.1"
FT                   /translation="MKSNPKYFLMNDVERQSKYSPKYVPNNSLKERILEFLDYYIAPLK
FT                   LYLLSYPMPDCLWDNRKLRLKASGVQVTPSSEPVHIDDRLIHISQKQPSE"
FT   CDS             join(11125..11558,11607..11865,12074..12283,12412..12537)
FT                   /gene="asna-1"
FT                   /locus_tag="CELE_ZK637.5"
FT                   /standard_name="ZK637.5"
FT                   /product="Protein ASNA-1"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="ArsA"
FT                   /db_xref="GOA:P30632"
FT                   /db_xref="InterPro:IPR016300"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30632"
FT                   /db_xref="WormBase:WBGene00014025"
FT                   /protein_id="CAA77452.1"
FT                   /translation="MSDQLEASIKNILEQKTLKWIFVGGKGGVGKTTCSCSLAAQLSKV
FT                   RERVLLISTDPAHNISDAFSQKFTKTPTLVEGFKNLFAMEIDSNPNGEGVEMGNIEEML
FT                   QNAAQNEGGSGGFSMGKDFLQSFAGGLPGIDEAMSFGEMIKLIDSLDFDVVVFDTAPTG
FT                   HTLRLLQFPTLLEKVFTKILSLQGMFGPMMNQFGGMFGMGGGSMNEMIEKMTTTLESVK
FT                   KMNAQFKDPNCTTFVCVCIAEFLSLYETERLIQELSKQGIDTHNIIVNQLLFPDTDANG
FT                   TVSCRKCASRQAIQSKYLTDIDELYEDFHVVKLPLLEAEVRGGPAILQFSERMVDPEAN
FT                   KN"
FT   CDS             complement(join(16631..16828,17584..17733,17780..17884,
FT                   17963..18373,18849..19007,19052..19648,19695..19827,
FT                   19877..19995,20105..20161))
FT                   /gene="lin-9"
FT                   /locus_tag="CELE_ZK637.7"
FT                   /standard_name="ZK637.7a"
FT                   /product="Protein LIN-9, isoform a"
FT                   /note="C. elegans LIN-9 protein; contains similarity to
FT                   Pfam domain PF06584 DIRP contains similarity to Interpro
FT                   domain IPR010561 (DIRP)"
FT                   /note="Confirmed by transcript evidence"
FT                   /db_xref="GOA:P30630"
FT                   /db_xref="InterPro:IPR010561"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30630"
FT                   /db_xref="WormBase:WBGene00002998"
FT                   /protein_id="CAA77454.2"
FT                   /translation="MSSAVRSPRKKAASDTSDPDRTSSPYSLRETSKVPSRYRNEELYL
FT                   SPSRSIKRTGSPKKSPAKRLNGGRDSPSVNSLTRNSSLTMLAKAALDYESSSCALEYIP
FT                   KEERRPPRRALALSPPPAPSNDLLAKDLEMIEMHQNLVAGLDDLDNPANMTNEAVEHRD
FT                   TQSFFNMFSTDQERSAMMKQFKTYKNQTSEDVSTFMRANIKKLYNLLRYKKARQWVMCE
FT                   FFYSAIDEQIFKEENEFATIIRESFPNLKNWNLTRIEWRSIRKLLGKPRRCSKVFFEEE
FT                   RMYLEEKRMKIRSVYEGSYLNDPSIDLKDLPAKLPRPMVVGNRVFARIRNPYDGIYSGI
FT                   IDAVIPKGFRIIFDKPDIPPTLVSDTEILLDGKLDLLSIAYFIEQANSKLPSGVRPFVA
FT                   AVRDSSHPHLVRDVLVSRKIERSGGPLMGPNDERLNGKNAEMVGNFPLKFLVNLVKLTK
FT                   LIDIKKGLIRQLNELNADAEIQNMTSDKYSKAFQEKYAKTIIDLEHVNQNIDINMNGIQ
FT                   DHHMYFSSNDISTSNMKPEAVRQMCSQQAGRFVEHCNQGLNVENVHALTLIQSLTAVLL
FT                   QVRTMGTQKISAVDLQSLGDAISEIRTAIHPRNVAFFQDYVEVHMKQFHTIMLESGALA
FT                   GTVSNRK"
FT   CDS             complement(join(16631..16828,17584..17733,17780..17884,
FT                   17963..18373,18849..19007,19052..19654,19695..19827,
FT                   19877..19995,20105..20161))
FT                   /gene="lin-9"
FT                   /locus_tag="CELE_ZK637.7"
FT                   /standard_name="ZK637.7b"
FT                   /product="Protein LIN-9, isoform b"
FT                   /note="C. elegans LIN-9 protein; contains similarity to
FT                   Pfam domain PF06584 DIRP contains similarity to Interpro
FT                   domain IPR010561 (DIRP)"
FT                   /note="Partially confirmed by transcript evidence"
FT                   /db_xref="GOA:P30630"
FT                   /db_xref="InterPro:IPR010561"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30630"
FT                   /db_xref="WormBase:WBGene00002998"
FT                   /protein_id="CAC42391.1"
FT                   /translation="MSSAVRSPRKKAASDTSDPDRTSSPYSLRETSKVPSRYRNEELYL
FT                   SPSRSIKRTGSPKKSPAKRLNGGRDSPSVNSLTRNSSLTMLAKAALDYESSSCALEYIF
FT                   QPKEERRPPRRALALSPPPAPSNDLLAKDLEMIEMHQNLVAGLDDLDNPANMTNEAVEH
FT                   RDTQSFFNMFSTDQERSAMMKQFKTYKNQTSEDVSTFMRANIKKLYNLLRYKKARQWVM
FT                   CEFFYSAIDEQIFKEENEFATIIRESFPNLKNWNLTRIEWRSIRKLLGKPRRCSKVFFE
FT                   EERMYLEEKRMKIRSVYEGSYLNDPSIDLKDLPAKLPRPMVVGNRVFARIRNPYDGIYS
FT                   GIIDAVIPKGFRIIFDKPDIPPTLVSDTEILLDGKLDLLSIAYFIEQANSKLPSGVRPF
FT                   VAAVRDSSHPHLVRDVLVSRKIERSGGPLMGPNDERLNGKNAEMVGNFPLKFLVNLVKL
FT                   TKLIDIKKGLIRQLNELNADAEIQNMTSDKYSKAFQEKYAKTIIDLEHVNQNIDINMNG
FT                   IQDHHMYFSSNDISTSNMKPEAVRQMCSQQAGRFVEHCNQGLNVENVHALTLIQSLTAV
FT                   LLQVRTMGTQKISAVDLQSLGDAISEIRTAIHPRNVAFFQDYVEVHMKQFHTIMLESGA
FT                   LAGTVSNRK"
FT   CDS             join(21665..21817,21899..22075,22183..22311,22561..22715,
FT                   23630..23839,23894..25148,26118..26258,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8a"
FT                   /product="Protein UNC-32, isoform a"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAA77448.2"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEVDHDRWRILE
FT                   GGSGRRGRSTEREETRPLIDIGDMDDDSAARMSAQAAMLRLGFVAGVIQRERLPAFERL
FT                   LWRACRGNVFLRTSEIDDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLY
FT                   PCPDTPQERREMSIGVMTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIY
FT                   HTLNLFNIDVTQKCLIAEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPT
FT                   YNKTNKFTKGFQNIVDAYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALF
FT                   FILKEKQLEAARIKDEIFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQN
FT                   TIPESVIDYYLDDEKRSESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMK
FT                   MSVLFGIAQMTFGVLLSYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFF
FT                   GAVGGTVLGYKYPGSNCAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQA
FT                   TIEIILVVLALVQVPIMLFAKPYFLYRRDKQQSRYSTLTAESNQHQSVRADINQDDAEV
FT                   VHAPEQTPKPSGHGHGHGDGPLEMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAH
FT                   AQLSDVLWTMVFRNAFVLDGYTGAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHW
FT                   VEFQSKFYGGLGYEFAPFSFEKILAEEREAEENL"
FT   CDS             join(21665..21817,21899..22075,22183..22311,23004..23110,
FT                   23630..23839,23894..25148,25270..25392,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8b"
FT                   /product="Protein UNC-32, isoform b"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAA77453.2"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEAGTGEMLPPA
FT                   AVESEEGLELTQHAAAGGATMFANFGFVAGVIQRERLPAFERLLWRACRGNVFLRTSEI
FT                   DDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLYPCPDTPQERREMSIGV
FT                   MTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIYHTLNLFNIDVTQKCLI
FT                   AEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPTYNKTNKFTKGFQNIVD
FT                   AYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALFFILKEKQLEAARIKDE
FT                   IFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQNTIPESVIDYYLDDEKR
FT                   SESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMKMSVLFGIAQMTFGVLL
FT                   SYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFFGAVGGTVLGYKYPGSN
FT                   CAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQSFFETIFVLVAIACVPV
FT                   MLFGKPYFLWKEEKERREGGHRQLSVRADINQDDAEVVHAPEQTPKPSGHGHGHGDGPL
FT                   EMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAHAQLSDVLWTMVFRNAFVLDGYT
FT                   GAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHWVEFQSKFYGGLGYEFAPFSFEK
FT                   ILAEEREAEENL"
FT   CDS             join(21665..21817,21899..22075,22183..22311,23348..23469,
FT                   23630..23839,23894..25148,26118..26258,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8c"
FT                   /product="Protein UNC-32, isoform c"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAD30450.1"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEHEDMIASSAE
FT                   SSGIGEVLSADEEELSGRFSDAMSPLKLQLRFVAGVIQRERLPAFERLLWRACRGNVFL
FT                   RTSEIDDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLYPCPDTPQERRE
FT                   MSIGVMTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIYHTLNLFNIDVT
FT                   QKCLIAEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPTYNKTNKFTKGF
FT                   QNIVDAYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALFFILKEKQLEAA
FT                   RIKDEIFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQNTIPESVIDYYL
FT                   DDEKRSESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMKMSVLFGIAQMT
FT                   FGVLLSYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFFGAVGGTVLGYK
FT                   YPGSNCAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQATIEIILVVLAL
FT                   VQVPIMLFAKPYFLYRRDKQQSRYSTLTAESNQHQSVRADINQDDAEVVHAPEQTPKPS
FT                   GHGHGHGDGPLEMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAHAQLSDVLWTMV
FT                   FRNAFVLDGYTGAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHWVEFQSKFYGGL
FT                   GYEFAPFSFEKILAEEREAEENL"
FT   CDS             join(21665..21817,21899..22075,22183..22311,22561..22715,
FT                   23630..23839,23894..25148,25270..25392,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8d"
FT                   /product="Protein UNC-32, isoform d"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAD30451.1"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEVDHDRWRILE
FT                   GGSGRRGRSTEREETRPLIDIGDMDDDSAARMSAQAAMLRLGFVAGVIQRERLPAFERL
FT                   LWRACRGNVFLRTSEIDDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLY
FT                   PCPDTPQERREMSIGVMTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIY
FT                   HTLNLFNIDVTQKCLIAEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPT
FT                   YNKTNKFTKGFQNIVDAYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALF
FT                   FILKEKQLEAARIKDEIFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQN
FT                   TIPESVIDYYLDDEKRSESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMK
FT                   MSVLFGIAQMTFGVLLSYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFF
FT                   GAVGGTVLGYKYPGSNCAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQS
FT                   FFETIFVLVAIACVPVMLFGKPYFLWKEEKERREGGHRQLSVRADINQDDAEVVHAPEQ
FT                   TPKPSGHGHGHGDGPLEMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAHAQLSDV
FT                   LWTMVFRNAFVLDGYTGAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHWVEFQSK
FT                   FYGGLGYEFAPFSFEKILAEEREAEENL"
FT   CDS             join(21665..21817,21899..22075,22183..22311,23348..23469,
FT                   23630..23839,23894..25148,25270..25392,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8e"
FT                   /product="Protein UNC-32, isoform e"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAD30452.1"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEHEDMIASSAE
FT                   SSGIGEVLSADEEELSGRFSDAMSPLKLQLRFVAGVIQRERLPAFERLLWRACRGNVFL
FT                   RTSEIDDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLYPCPDTPQERRE
FT                   MSIGVMTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIYHTLNLFNIDVT
FT                   QKCLIAEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPTYNKTNKFTKGF
FT                   QNIVDAYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALFFILKEKQLEAA
FT                   RIKDEIFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQNTIPESVIDYYL
FT                   DDEKRSESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMKMSVLFGIAQMT
FT                   FGVLLSYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFFGAVGGTVLGYK
FT                   YPGSNCAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQSFFETIFVLVAI
FT                   ACVPVMLFGKPYFLWKEEKERREGGHRQLSVRADINQDDAEVVHAPEQTPKPSGHGHGH
FT                   GDGPLEMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAHAQLSDVLWTMVFRNAFV
FT                   LDGYTGAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHWVEFQSKFYGGLGYEFAP
FT                   FSFEKILAEEREAEENL"
FT   CDS             join(21665..21817,21899..22075,22183..22311,23004..23110,
FT                   23630..23839,23894..25148,26118..26258,26371..26590,
FT                   26755..26926,27146..27251)
FT                   /gene="unc-32"
FT                   /locus_tag="CELE_ZK637.8"
FT                   /standard_name="ZK637.8f"
FT                   /product="Protein UNC-32, isoform f"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="TJ6/proton pump"
FT                   /db_xref="GOA:P30628"
FT                   /db_xref="InterPro:IPR002490"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30628"
FT                   /db_xref="WormBase:WBGene00006768"
FT                   /protein_id="CAD30453.1"
FT                   /translation="MGDYVTPGEEPPQPGIYRSEQMCLAQLYLQSDASYQCVAELGELG
FT                   LVQFRDLNPDVSSFQRKYVNEVRRCDEMERKLRYLEREIKKDQIPMLDTGENPDAPLPR
FT                   EMIDLEATFEKLENELREVNKNEETLKKNFSELTELKHILRKTQTFFEEAGTGEMLPPA
FT                   AVESEEGLELTQHAAAGGATMFANFGFVAGVIQRERLPAFERLLWRACRGNVFLRTSEI
FT                   DDVLNDTVTGDPVNKCVFIIFFQGDHLKTKVKKICEGFRATLYPCPDTPQERREMSIGV
FT                   MTRIEDLKTVLGQTQDHRHRVLVAASKNVRMWLTKVRKIKSIYHTLNLFNIDVTQKCLI
FT                   AEVWCPIAELDRIKMALKRGTDESGSQVPSILNRMETNEAPPTYNKTNKFTKGFQNIVD
FT                   AYGIATYREINPAPYTMISFPFLFAVMFGDMGHGAIMLLAALFFILKEKQLEAARIKDE
FT                   IFQTFFGGRYVIFLMGAFSIYTGFMYNDVFSKSINTFGSSWQNTIPESVIDYYLDDEKR
FT                   SESQLILPPETAFDGNPYPIGVDPVWNLAEGNKLSFLNSMKMKMSVLFGIAQMTFGVLL
FT                   SYQNFIYFKSDLDIKYMFIPQMIFLSSIFIYLCIQILSKWLFFGAVGGTVLGYKYPGSN
FT                   CAPSLLIGLINMFMMKSRNAGFVDDSGETYPQCYLSTWYPGQATIEIILVVLALVQVPI
FT                   MLFAKPYFLYRRDKQQSRYSTLTAESNQHQSVRADINQDDAEVVHAPEQTPKPSGHGHG
FT                   HGDGPLEMGDVMVYQAIHTIEFVLGCVSHTASYLRLWALSLAHAQLSDVLWTMVFRNAF
FT                   VLDGYTGAIATYILFFIFGSLSVFILVLMEGLSAFLHALRLHWVEFQSKFYGGLGYEFA
FT                   PFSFEKILAEEREAEENL"
FT   CDS             join(28187..28353,28408..28488,28898..29084,29174..29285,
FT                   29335..29474)
FT                   /gene="tpk-1"
FT                   /locus_tag="CELE_ZK637.9"
FT                   /standard_name="ZK637.9a"
FT                   /product="Protein TPK-1, isoform a"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="C. elegans TPK-1 protein; contains similarity to
FT                   Pfam domains PF04265 (Thiamin pyrophosphokinase, vitamin B1
FT                   binding domain) , PF04263 (Thiamin pyrophosphokinase,
FT                   catalytic domain) contains similarity to Interpro domains
FT                   IPR007373 (Thiamin pyrophosphokinase, vitamin B1-binding
FT                   domain), IPR016966 (Thiamin pyrophosphokinase, eukaryotic),
FT                   IPR007371 (Thiamin pyrophosphokinase, catalytic domain),
FT                   IPR006282 (Thiamin pyrophosphokinase)"
FT                   /db_xref="GOA:P30636"
FT                   /db_xref="InterPro:IPR006282"
FT                   /db_xref="InterPro:IPR007371"
FT                   /db_xref="InterPro:IPR007373"
FT                   /db_xref="InterPro:IPR016966"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30636"
FT                   /db_xref="WormBase:WBGene00014027"
FT                   /protein_id="CAA77455.3"
FT                   /translation="MSKKLKPFEILEDSCASVCIWLNGEPTAISNRAENLWNKAKYRVA
FT                   TDGAVNEILKRKSFVEWPHIICGDFDSINKQIDTKNAKVVHLPDQDYTDLSKSVQWCLE
FT                   QKTLTSWEFENIVVLGGLNGRFDHTMSTLSSLIRFVDSQTPGDSNLDVNLEMTTKMCGI
FT                   IPIVQKETIVSSIGLKYEMENLALEFGKLISTSNEVTTSQVFLKSSSSLIFSIELENWV
FT                   YKLDSL"
FT   CDS             join(28187..28353,28408..28488,28898..29129,29174..29285,
FT                   29335..29474)
FT                   /gene="tpk-1"
FT                   /locus_tag="CELE_ZK637.9"
FT                   /standard_name="ZK637.9b"
FT                   /product="Protein TPK-1, isoform b"
FT                   /note="Confirmed by transcript evidence"
FT                   /note="C. elegans TPK-1 protein; contains similarity to
FT                   Pfam domains PF04265 (Thiamin pyrophosphokinase, vitamin B1
FT                   binding domain) , PF04263 (Thiamin pyrophosphokinase,
FT                   catalytic domain) contains similarity to Interpro domains
FT                   IPR007373 (Thiamin pyrophosphokinase, vitamin B1-binding
FT                   domain), IPR016966 (Thiamin pyrophosphokinase, eukaryotic),
FT                   IPR007371 (Thiamin pyrophosphokinase, catalytic domain),
FT                   IPR006282 (Thiamin pyrophosphokinase)"
FT                   /db_xref="GOA:P30636"
FT                   /db_xref="InterPro:IPR006282"
FT                   /db_xref="InterPro:IPR007371"
FT                   /db_xref="InterPro:IPR007373"
FT                   /db_xref="InterPro:IPR016966"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30636"
FT                   /db_xref="WormBase:WBGene00014027"
FT                   /protein_id="CAI46594.1"
FT                   /translation="MSKKLKPFEILEDSCASVCIWLNGEPTAISNRAENLWNKAKYRVA
FT                   TDGAVNEILKRKSFVEWPHIICGDFDSINKQIDTKNAKVVHLPDQDYTDLSKSVQWCLE
FT                   QKTLTSWEFENIVVLGGLNGRFDHTMSTLSSLIRFVDSQTPVIVLDSRNLVLAVPTGDS
FT                   NLDVNLEMTTKMCGIIPIVQKETIVSSIGLKYEMENLALEFGKLISTSNEVTTSQVFLK
FT                   SSSSLIFSIELENWVYKLDSL"
FT   CDS             complement(15020..15565)
FT                   /gene="ZK637.6"
FT                   /locus_tag="CELE_ZK637.6"
FT                   /standard_name="ZK637.6"
FT                   /product="Protein ZK637.6"
FT                   /note="C. elegans predicted pseudogene"
FT                   /pseudogene="unknown"
FT   CDS             complement(14361..14501)
FT                   /gene="ZK637.18"
FT                   /locus_tag="CELE_ZK637.18"
FT                   /standard_name="ZK637.18"
FT                   /product="Protein ZK637.18"
FT                   /note="C. elegans predicted pseudogene"
FT                   /pseudogene="unknown"
FT   CDS             complement(join(Z22175.1:18703..18714,
FT                   Z22175.1:18763..18876,Z22175.1:19006..19177,
FT                   Z22175.1:19292..19791,238..427,486..610,660..746,787..870,
FT                   1188..1374,1418..1509))
FT                   /gene="svop-1"
FT                   /locus_tag="CELE_ZK637.1"
FT                   /standard_name="ZK637.1"
FT                   /product="Protein SVOP-1"
FT                   /note="Partially confirmed by transcript evidence"
FT                   /note="Sugar transporter"
FT                   /db_xref="GOA:P30638"
FT                   /db_xref="InterPro:IPR004749"
FT                   /db_xref="InterPro:IPR005828"
FT                   /db_xref="InterPro:IPR016196"
FT                   /db_xref="InterPro:IPR020846"
FT                   /db_xref="UniProtKB/Swiss-Prot:P30638"
FT                   /db_xref="WormBase:WBGene00014021"
FT                   /protein_id="CAA77460.2"
FT                   /translation="MGDKAILTEVLEASNLTEAYVDLTAKQLIKEIRHVGDDFAVRYSN
FT                   LDDRTELGEPTDQRSPDSEKTFTVDEAVEALGFGRFQLKLSILTGMAWMADAMEMMLLS
FT                   LISPALACEWGISSVQQALVTTCVFSGMMLSSTFWGKICDRFGRRKGLTFSTLVACIMG
FT                   VISGMSPHFYVLLFFRGLTGFGIGGVPQSVTLYAEFLPTAQRAKCVVLIESFWAIGAVF
FT                   EALLAYFVMESFGWRALMFLSSLPLGIFAVASFWLPESARFDMASGHPERALETLQAAA
FT                   RMNRVQLPTGRLVSSTKAGSESRGDIANLLSPDLRKTTILLWCIWAITAFSYYGMVLFT
FT                   TVLFQSHDECHGGLFSNGTQMEVCQPLTRSDYFDLLSTTLAEFPGLIITVLIIEWFGRK
FT                   KTMALEYAVFAIFTFLLYFCLDRFTVTVLIFVARAFISGAFQCAYVYTPEVYPTTLRAV
FT                   GLGTCSAMARIGAIVTPFIAQVASEKSLSLPIGIYGTAAILGLIASLSLPIETKGRQMM
FT                   DSH"
FT   CDS             join(40329..40487,40572..40700,Z11126.1:5..73,
FT                   Z11126.1:120..242,Z11126.1:288..389,Z11126.1:440..598)
FT                   /gene="ZK637.12"
FT                   /locus_tag="CELE_ZK637.12"
FT                   /standard_name="ZK637.12"
FT                   /product="Protein ZK637.12"
FT                   /note="Confirmed by transcript evidence"
FT                   /db_xref="UniProtKB/Swiss-Prot:P34658"
FT                   /db_xref="WormBase:WBGene00014029"
FT                   /protein_id="CAA77461.2"
FT                   /translation="MECVNCDCTVKTMDNLDQAIRALLQRGKHVNRMMDNEKLIREARR
FT                   MEEVQQLKMQIPKPVDKKPRPPPSENNLKLISCEETCMDETLKNSSKPRMIYNKQLGRA
FT                   ESIDFDVPSLSYESSEKCAGETSPYTSASVSNSKKATSSSNFTKSETTTITELTTSTFK
FT                   KSNNSSGGALVLDNHYLINNDDGTVKKLPMKVYVKQRLEDGSLDVQLVFFDENSQKVMD
FT                   ISMLVNGKKIRNVQFCGKDAKLVN"
XX
SQ   Sequence 40700 BP; 12908 A; 7116 C; 7280 G; 13396 T; 0 other;
     gatccagctt ttgttgaaga cactaatctt ccagttggca actgtactct attcattctc        60
     gctgctgctt gaagtgtttc tagagctcgt tcgggatgtc cagaagccat gtcaaaacga       120
     gcagattctg ggagccactg aaacattttt gaagtttact tgtatactat acttgcatac       180
     tagctttcaa ttcagacatt tttgaatttc taactcgatt tttttgataa aacttacaaa       240
     agaagccact gcaaaaattc caagaggtag tgaagaaagg aacataagag ctctccaacc       300
     aaatgattcc atcacaaaat aagcaagaag agcttcgaaa actgctccga tagcccaaaa       360
     tgattctatc aaaactacac atttggcacg ttgagcagtt ggaagaaact cagcgtataa       420
     agtgacactg aaagatgaag ttttttaaaa atagggattt ggaatattct gattaaaaaa       480
     ctaacgactg gggtacacct ccgataccaa atccagtaag tccacggaaa aatagaagaa       540
     cgtaaaaatg aggtgacatt ccagaaatga cacccatgat acaagcaact agtgttgaaa       600
     atgttagtcc ctgaaatttt ttacagattt caattatata catttatatt tcaactaact       660
     tttcgtcgac caaatcgatc acatattttt ccccaaaatg tacttgacaa catcattcca       720
     ctgaacacgc acgtcgtcac aagagcctca acacaatttt ttttttttgc ttgatttgaa       780
     acttacctgt tgcactgacg atattcccca ttcacatgcc agagctggag aaatcaatga       840
     taataacatc atttccattg cgtcggccat ctgaaattct gcgcaaaggt gtgttaataa       900
     attttttttt aaatacatat tgaagattca ttgttttctg aggtgtttaa aatttctggt       960
     gcttttccgt gactattttt ttgatatttt taaaaaataa ttttgaatgt tttcattaca      1020
     gtcatgcaac agaaatctgc tctaaaatgt ttttttttat tttcaaaagt ttcaatctaa      1080
     attttggtaa atttccaaat tttccaattc aaattgtgaa aatatatttg taatataaaa      1140
     ctcatttgga ttgaacactc ttttttgaaa actccctcga aactcaccca tgccattcct      1200
     gtcaaaattg acagtttcag ctgaaatctt ccaaatccca atgcttcaac agcttcatca      1260
     actgtaaacg tcttttcact atctggtgat ctctgatctg taggttctcc aagttcagta      1320
     cgatcatcga ggtttgagta tcgaactgca aaatcatctc cgacatgacg aattctaaag      1380
     tttgtaaata ttaaggaaac tgtgaacaaa tatttactct tttatcaact gtttggccgt      1440
     taaatccaca tatgcttcag tgagatttga cgcttcaaga acttctgtta gaattgcttt      1500
     atctcccatt ttttgggtct gaaaattata attaattcta gattcagact ttttaacgaa      1560
     aatatataac taaagtattt ttttaagtgg taaaatgtag ttaattgcca agtttaccaa      1620
     gcatttaatt ttttaatatt cacagttttt tctttaacag cctttaacaa atttttttac      1680
     aaataaaaat aattaaaata caagtaggag tccctatttt tggtcagctt ccaaaattaa      1740
     aaaaagaaaa tgaaaagcaa atctcgatca aaatctattg agcttaatcg taagatcaaa      1800
     aaaaaatttc cgcagaaaaa tgtaccagca ctattattgg tgagaatttt tctaaaacat      1860
     aaacaaaata tgaacatttt tgcttcaaca atattgcaat ttttaataaa tattttttac      1920
     ctaaattcaa agttggagga tatttttcaa gtaaaataag tattctgcca attaaaaact      1980
     tttagtgaaa ttcaaaattt aaaaaatcta actttctaat caactttcta aaaaccatat      2040
     tcacaaatgc attcaacaaa tattatgtta atagtatgtt taaacgtttc cggtcgggtc      2100
     gtgacaaagt caaaaacatt ggtaattgaa caaaacattc caatttcaaa atgtttttat      2160
     ggctgcagtt attcaataga atactcaata atatatttcg ctaaaaaata attggaaatg      2220
     taatttttat tcaaataatt tttttcaaca aacaaaaaaa atttatagtt ttttttaaat      2280
     ttaaaatcac atttttcaaa aaatttgtaa agctgtttgc ggggaacagg agggaggtgg      2340
     ggattacgaa acaaacatga aatcgatgtg gttaagccgg gagacaaaat gacccaataa      2400
     tttgtccaat gacgtggatg tgtgacacca aattcagagc tcaaagcttc aaacggaaaa      2460
     gaataaaaac caggagagtt gctccagatt cagagagaga aagacgtctc catatatgac      2520
     tctacgtcta ttcataatgc gcactgtctc tctatttggc tcagctgagc atcattggct      2580
     tcgaagcagt agaagaaagc cgagaaatgg aaatggagga ggttaagaga gacagaacgt      2640
     gtgagaaaga gagagcgaga gggacaaaaa tgaaaagtag gcggtttaaa caaacaaaga      2700
     aaaacacaag gaatatcgga tcgaaaggat gctccgagga gcaatattcg ggaaaaaaag      2760
     gagctccggt ttcagaatgt cacttctgaa tttggaagtg tgacaattca aaagaattag      2820
     tataactcag cggcccgatt tttgtaccaa aaatacggtc tcgacacgac aaacttttgt      2880
     taattgcaat ttagctgtaa aatggtgtgc gcctttaaaa gagtactgta atttccattc      2940
     ccaagttgtg agaaaacagg agaaaaacga atatttatta aaacaggaga aaaaagatca      3000
     gaagatttga gtattttgtt tgaaataaca acaagttgac caaattattt gtttttttag      3060
     ttttcagaaa cagttttgtg aatgcatttc atgaatggtt tttgtgtcaa agcaacgtta      3120
     taataaaatt taaaaataaa atattttaat ctctatttat tataacgtat tgatttttac      3180
     aaacacttta ctatttataa tacaattact ttcttgattt tgggattttc ttgaaatttg      3240
     caatattttc gcaatatttt cggaacgaca ttttgaaatc tcgacatttc acacaatttt      3300
     tgcatgtaaa cgttgtattt gccaccgttt taattgattt ctctcaattt taatttcaga      3360
     ttcatcaact acagtatact cgcctttgac tttcaagctc atcgagaagt gcgccagctt      3420
     cgcataatca agaagtgcgt cagcactcga cttgcgcaat tcttgtcaac tgatatgatt      3480
     tctttttgtt ttttggttat tttttgcgcg ttctttgtgc ttttcgtttt ttttttgttc      3540
     gttggtttct ttctttaatg aaacgaaata ttttatttta gtttagactt ccaatatata      3600
     gaataattaa attgcatata acatgacgaa aggaagtata atctgggatt ataaattttg      3660
     agctttagct atcttccttt atcctttaat tcttgcgtca ttcataaatg acatatcgtt      3720
     tactttcgaa aattgatttt cacatgtccg ttaacaataa ataatttaat tttataatac      3780
     ttttagggta aatatgtcaa actcaacgat ggaggctact caaatgaaag taaagctggc      3840
     tgtcgatgag atgattgacg atttggataa gacctatttg agggatatgc agaagagcat      3900
     gtttcagtgc tcagctcggt aattattttc gaaattacac taaatatgtt tagtaagcaa      3960
     tttgtattac gctaaaccac ctgaaaatgt ctaatttaac ttcgcaattg aaaatttttt      4020
     gcattatttc aggtgctgtg acaacaagaa aaccacacgc gatgctgtcg agaactgcgt      4080
     tgaaagctgc aacgatggca tgaaaaaggc gcaaggctat cttgaaaaag agctcggagg      4140
     gcttcaagac cagctctcac gctgtgcaat gacttgctat gataagcttg ttcaacagtt      4200
     tggtccagat gtcaataagt attcagaatc acaggtgtga agatttatta aattttagaa      4260
     atcaaaaaat ttataaatta atttaggatt taaaaaatca acacccgagg gggctcatag      4320
     ctcacagctt ttggtggaac atttttttgg aattaaaaca aaagtatata cagtgaaaag      4380
     ctagtttggg ttgaaaatta atttagtttt gtcgaagaag aatttaatag aaataagatt      4440
     taaattataa atcatccata cattgaatcg tgaagctctt caagatttct ctgtctctcc      4500
     tcctcctcaa cttctttatc agttttgacc ttctgacggc atgttgggca agtttgttga      4560
     gcttcaagcc atagagtgag acaaaaataa tgaaagcgat gtttgcatgg catgacgata      4620
     actgtggttc cgaacgttgt tggatcaatt tttaattcct ctttgatgac atgatcttca      4680
     ggaatatcga cgttgttttg caagttatcc aaacaaattg cacaggttgc tgaaaaatag      4740
     attatttagg caaatagtca gcattttttc tgagtgtttt ttttttcaaa tacaagcttt      4800
     gctcaatttt aatagtttct cataccatct tctttctgtt gatctgtagt ctctcgatcc      4860
     atcagtctca gcgctttata tgattttttg tcaattggca aacttccaac attatacaaa      4920
     tccagccatc tttgcatcgc atctgtttgt gaaccagtac cttccgctcg cattccttaa      4980
     tttaatatat aatttgaatg ctttctcata aaataactta ctgacgaaga tggtttcgag      5040
     catatgcgaa aaagctctaa tagcgtctct ttccgacata tctaattgcc agataaaata      5100
     ttttaagaaa tgacgagaga tatggtgaca aaaggaaaac gtacttacgc aagtgcaacg      5160
     aaaaacgtgc aattcgtcgt aacggtgttt gcggattttt tgcgtgtctg tctcgcactc      5220
     tccattcttt catcacgagt tttgatgact atttatgcaa atttcggggg tttatgaatc      5280
     accaatcaag tgccacgctg ttcatcgatt tttagttttg tattactttt gctattttaa      5340
     tagttagacc ctcataagat ttgtatcgag gggtgttttt tttttaatgt aacattatga      5400
     aatctaaaat gattcatttt cttttctatt ctttctgtcg tctctaatta atgataatta      5460
     tcaatttggt agaaatttag cgatcgctaa agacgcacgg tattattcag aagggtctcg      5520
     gcgcggaaaa aagtttatgg tagtttttaa tattttttgc agctgctttt ccttacattt      5580
     ttcattgcaa ttacctcgat tttagcaaat tttgcctttt tttaaaacat tttcatgtta      5640
     aaaattgttg taaaccagtt ttttattaaa aatatgtgtt tttctgtttt ttggcgtgga      5700
     agaaacagaa aagtgaaata tattttcttt acgcgctgag ccccatctta ataaattccg      5760
     tgcgccttta gcaaggcatg gcaaaaatat ttataagaca catttctgtg atcctaacgc      5820
     ctctgatttc tcacaaaatt aaaaaaaaat tgatcaaaaa ttaagaaaat cctcgcattt      5880
     cagaagctca gtttcaacga gaagctcgat tcgtgtgtct ctgtttgtgc tgatgatcac      5940
     atcaaattaa ttccggcaat caagaagaga ttcgcgaaaa atacctgaga gccagccaca      6000
     cattttccac cgagtattgc catatcccct cttaatttcc catttatcaa aaaaatatcc      6060
     catttaggcg tattctccac tcattaggct ccctcattgt tgctcactat tatatcatta      6120
     tttttctttc atactttttt aataagtttt catgcattca gtcataaaat ctctatccca      6180
     attgatttaa actctcctta aacgttttga ccgtatttca tactttttcc accgaactta      6240
     ttctcttcaa acaaaacaac gttcaggtac tatgaaaaaa atattaccga tcatatggct      6300
     catcaatttg gttagtggaa gcctatcact cgagaaaaaa gctcccgatt tacttggaaa      6360
     agtatgtgca tttggagatt tcaatgcaga tcggaatact gatattctgg tttttgcgaa      6420
     tggaacattg acgattaatt atcaagaaac taaacttctt gatgtggtta gtttttattt      6480
     tttcttttgt tgaaatttca cataaaaatt ttgaaatttt cagctcgaag cttccaaatt      6540
     cacaccagga acatcgtttg ccatcagtaa acccagcctg aatgcagatt ttgttgaatg      6600
     ttcagttggc gatttcaatg gagactctag gcttgatgtt ttggtgagtt tattgaaaac      6660
     attgtcattt tgcttcattg aacttgaaat gccccgaaaa acgaaaaatt tcgaaagaaa      6720
     aaccaaattt tagctaaaat ctacattttg tcatgtttac agcggccgga aattgatttt      6780
     tttaaattaa atcaacaaaa aacgtaatgt aaacaacaat atatgcataa taagccaatc      6840
     ataaaataaa aatcaatttc cgacagctgt gaccaaaagt gccgtcaaaa aaaatttcaa      6900
     ttttgctttg agtaaattga aaatcgaaaa acgaaagttg ttatattcat cttttttttt      6960
     gatttcccgg aaaatcgaaa aaaaaaacaa aatttataaa attaacaatg aaattcaagt      7020
     tttattcatg ttgatgaaaa aacatgagaa gacataattt tcatcaaaaa agagcaaaaa      7080
     tgaccttaat tttatgatat atttcgaaaa aaactacttt tttcgaaata tcagtttttt      7140
     tactgtccgc gaaaaaaaac tatttagaga ttttagctca atttaaaaaa aaaatattta      7200
     gacaacatat gtattttgaa ccaaaaactt tttgacaaat ttttggaaag tctcgttttt      7260
     aaattcaggt tttgtgcata ttattctaat agagcaaatt tgtattgatt cttttaacaa      7320
     attaataatc tatgactttc ttctaggtat caattcgcga taaagacact gaaatctaca      7380
     atcacactct ctggacatca gaaattgaag acgagaagga aatattccgt ccattccacg      7440
     tggcaatgct tcaacaacat gcaatggcca ttgatgtttc tgatgatgga tggactgatg      7500
     ttcttggatt ctatccgaat ggatcaatgt tctgtaccgg attcaataaa gaaggaaaat      7560
     acaatctact ggtgaatggt tgcaaacatg aattcgtcgc ttttcccgaa aaattaaata      7620
     tttatccagg aatgccgcac ttgtttgttg acttgaattg tgagtttaaa tttttatatt      7680
     ttcttaattg gaatctaaca atttcacgtt ttagccgacc tgattgctga tattgtcttc      7740
     atgaccaaag aaagcgatgg atcacttttc atgagtgtaa gtctatttta acagtagtag      7800
     tttgaaatgc aatatatttt tcaggtttgg caaaagacaa aaatcagctg gcaatttaga      7860
     gattgggttc ctaaattgac tccagcacaa tatccattcg ttggtgctcc agttgttatg      7920
     gatgttgatt cggacggtga actcgacatt ctagtaccaa tctgccgtga agatgagtgc      7980
     tcacacatta ctcaaatggc ttcttggtcg aagactaaac tttggggatt ggtggcctgt      8040
     gatatgcaag attatacagt tattaaagaa ccattttcac gagttatatt ccgcgttgga      8100
     gaattctcgt tggacagttt ccctgatatg gtggttattg cgcaggcaac cagagtgagt      8160
     ttaacaattt ttattttaaa caggatgtgg ttgtatactt ttaaaaaatg ttctatggct      8220
     tgataaggcg ttatgtatat ctgattcttt aaaagttcca aaaatcaacc tcttcgtcta      8280
     ttgaatttga atttcgattt ttaattttct ttgagttttg taagaaacgc ggccgtgtac      8340
     tcttctcgga caattaacta attaaatttt tggatttcaa gtaatttttc gcattttctt      8400
     gatttccctc ggtatgttgt aacagatgca gagacgcatt ttactttaat taacagacca      8460
     ctcactccta aatacagtaa tgtatcttgt tctgctgatg aatgacactt ctaaaatcac      8520
     atagtttatt cattttcctg tttttcattg aataatcaat ttgatagtgt tatcgatttt      8580
     cattagaaat aacgggaagt aacgagaaaa tactaggaca tggcctaaaa ttcaaaaatt      8640
     taattaatta atagtacgag aagagtaaaa ataggaagat cagacttgat ttcccaaaaa      8700
     taacttcagt taactgaata atgcaaaaaa aattaccttt cattaatcaa aatttgaata      8760
     atttcaggcc aacactcgcc ctgtgatcaa agtaatggac aatgcagaat gtacaaaatg      8820
     tgaaaagaac ggaacacgac gattcgaaat ccgagctcaa gagaatattc aaccaaaaaa      8880
     tatgtctctc ggagtcatca aaatgggaac attttttgat cttcttgaag atggatcatt      8940
     ggatcttctt gttgagtatg aatacggtgg tcagacacgt tttggattca tctactgccc      9000
     tgataaagga gatacaacat tcttgaaagt tcaagttttc acaggagttt gcagtgatcg      9060
     atgcaatcca aaatcaaacg agattggatc gagtatcagt atgactggtg catgtgcttc      9120
     tttctcaatg acagatggat ggggaggtag tacacagagt gtagcatgtc aagttccggc      9180
     ttcatcaaat agagcacttt atctcccatt tttgttgtat ggtcttggaa gaagtccaaa      9240
     ttttgtggat gaggtaattt catatcttct agatattttc gttcaattat tccaaataat      9300
     ctttttttca gttgaatatt gccattccga aatacgcaga tcgtaaagaa gattggaaac      9360
     acagtcttaa acagattgtt ccaaattctc ggattattgt tctcccacca tcggatcaat      9420
     atccacactg gacgagtcgg ctctacgtca caccatcagc tcttattgtt caggtaagat      9480
     tattatggag acgtggacat acgctccaaa tgggaacgac ggaaattgat aaaataaaat      9540
     taaaaaataa aagaaaaaaa cttttcattt ttaatgcatt ctttaaacat aatttcggca      9600
     taaaaatcat taaaactaac gaaaaacatt tcaaaatggt tgcaaatacg aattcgttga      9660
     attcacgggt ttgctgccaa ataactaacg agacccatgg ctcgggggcg gagcgtagtc      9720
     agttggccat ggggcacatt tccacgtctc tataataaat cgatattctc attttccaga      9780
     gtcttgccgt cattgctctc gtatgctgta tgcttctaat ggttgtcgta ttcttacatt      9840
     atcgagagaa aaaggaagat cgatacgaac gacaacaaca atctcatcga ttccatttcg      9900
     atgccatgta gatttttttg tgaattttaa gatcatatct tcttgaagac gagatcgttt      9960
     tttacgggtt cccatcattt gtctcttttt ttgcatattt gaccttttga agcttcatcc     10020
     tgtgtttaga tttcccattt cgagctgtga ttgcacgtcg gagtattttt agagatcagc     10080
     tttaaatccg agttttcctt gtttgaaaat agaaacatta tttgaaaaca actgtaatat     10140
     ttattccacg tgacccctta ccctccatca ctctctttat aaactgaaca gagacttttt     10200
     cgtttttttg acgaactatt aaaataaaac tttttgaatt ttttcctaat gaagtcaaat     10260
     ccaaaatatt ttctaatgaa tgacgtggag cggcagagca aatattcgcc gaaatatgtg     10320
     agttttcttc aaatttttgt taactttaac aaaaagtttc caatttcagg ttccaaacaa     10380
     cagtctgaaa gagcgaattc tggagttttt ggattattac attgcgccat tgaaactgta     10440
     agtttcattt tatggaaaat tctcataaaa aactcaatat tttcaggtat cttctgtctt     10500
     acccgatgcc ggattgcctt tgggacaatc gaaaattgag gtattacatc ggaaaatcgt     10560
     tgcaatgaca tggaacccac attcattttt ttcagattga aggccagtgg tgtgcaagtg     10620
     actccgagct ccgaaccagt tcatatcgat gatcgtctaa ttcacatttc acagaaacaa     10680
     ccgtccgaat gatttttcga tttttattta ataaagtttt agaaattatt tcattttttt     10740
     caagttttat ccgtgttcta atggttttct attaccttat tattatttct tcagttctcc     10800
     aaaaaaaaat attacccaga cataaaatgt tgaggttttg taacctgggt ctcgccccga     10860
     gaaaattttg ttaaatgcag aaagttgtgc gcctttggag tactgtaata aacactttcg     10920
     gaattttcat aatcgaatca aaaaagttat ttattaaaga acttaactcc tatcaagtcg     10980
     agaaaacact gtagaaaaac aataaaaatt tgtatccatt tttacttgaa aaattaaaaa     11040
     aactgcaaaa ggctagacat ttctttttaa aatttcaaac tttaaatgca aataaaccta     11100
     aaacttcttt ttttttcaga aataatgtcg gatcagctgg aagcctctat caagaatatt     11160
     ctcgaacaaa aaacgctaaa atggattttt gtgggtggaa agggaggtgt cggaaagacg     11220
     acatgcagtt gctcattggc agctcaactc tcaaaagttc gtgagagagt tcttctcatc     11280
     tccaccgatc ccgcccacaa catttctgat gccttcagtc agaaattcac aaaaactcca     11340
     acactggtcg aaggtttcaa aaatctcttt gcaatggaaa tcgattcaaa tccgaacgga     11400
     gaaggcgtcg aaatggggaa tatcgaagaa atgctgcaaa atgctgcaca aaacgaaggt     11460
     ggaagcggtg gattctcgat gggaaaagat tttcttcaaa gttttgctgg aggacttcct     11520
     gggattgatg aggcaatgag tttcggggaa atgataaagt gagtgtcaat gattctgatt     11580
     tttaaaaaat ctattatttt tttcaggttg atagactctc ttgacttcga cgttgtggtc     11640
     tttgacaccg ctccaactgg gcacactctt cgtcttcttc aattcccaac acttttggaa     11700
     aaagtattta cgaaaattct gtcacttcaa ggaatgtttg gaccaatgat gaatcaattc     11760
     ggtggaatgt ttggaatggg aggtggatca atgaatgaaa tgattgaaaa gatgacaacg     11820
     actctagaat ctgtgaaaaa gatgaacgca cagtttaagg atcctgttag tttttcagat     11880
     tcaagtgata tttaaaatta ctacggagat atatcaccca gacgcgaaaa ttgtcgtaaa     11940
     attctgcatc ttggtaatat gtttttttaa ccttttcaat tatatcaagg gtaaattcta     12000
     gcttgatata tattgaattc agagatttta aatcatcaaa gtttctgcag agcattcaaa     12060
     tatgtattta cagaattgca ccacattcgt ctgcgtctgc attgccgaat tcctctctct     12120
     ttacgaaacc gaacgactta ttcaggagtt gtccaaacaa ggaatcgata ctcataatat     12180
     tattgtgaat caacttctct ttccggatac cgatgcaaat ggaacagttt catgcagaaa     12240
     atgtgcatcg agacaggcga ttcagtcgaa atacttgaca gatgtgagtt taaatgagaa     12300
     gtttgataaa ttattaaatt agaaactttg agcaaattaa tattgaataa ccacagtgca     12360
     tttttgactc tgtcgtgatt tgctagatgc ggaataaatc aatttttcca gatcgatgag     12420
     ctctacgagg atttccacgt cgtcaaactt ccacttcttg aggcagaagt gcgtggaggg     12480
     cccgcaattc ttcagttcag cgaacggatg gtggatcctg aagctaacaa aaactaaact     12540
     aatttgttct cctacaaaat caacttgttc tgtggttttt tatgttaaaa gattcttcct     12600
     atcccatgtt ttttctccaa aattccctgt ccccttattt ctcgctttat tgtgggtgcc     12660
     tttttcgaat caaatgaata atttatgata ttcattgttt tttacttagg attgaagtat     12720
     atttggaaca taattatctt tcaaacttca gcctggcaaa ctatttttgt caagtaatca     12780
     ttttaattag ctagatttta gacgtaattt ctttcaaata gtacctagta ttaggcagcc     12840
     gacaggtcat gggaccaagc agtacatttt tccgactgct agacttcatc cgacacttac     12900
     ctagattcag agaattcaat tttcacacaa cttgttaaaa tctctagttt acgagcttgt     12960
     ttttaaccag acttatggat cctgagaatg gagggccatg gagcctccat ggaggggatg     13020
     gcagttggag atacaatgat tttggagtaa ttttaccttc gtattatttt tcatgtgatt     13080
     tcattttcaa ttcacttagc cccgtttcct aatgttcaag ttgctatttc caatttattt     13140
     tccttggtcc acttcatatt ccttggaatt ttttctgcat tcaaattacc aaatagccac     13200
     gtgcaatatc ccattctctg cagttttgaa atttgaattt atacaataaa catgagttgt     13260
     caaatattca gtcttaatct gatattagtt caaatatatt ccaaatcaat tccaaatata     13320
     ttcgaaatat atttcaaata tattccaaat atatttaaaa tatattccaa atatattcca     13380
     aatctattcc aaatatattc caaatatatt tcctattcta ctaatctttt tctcaatttc     13440
     tgtgcgaaat tgtgttatta tcgtaccagg gaacagagat atgaccaaat ctgtactcac     13500
     tgttcagatt ttttataaaa atggtgaaaa aaggctttgg ataattccaa acattcattt     13560
     ggcagaagct ggaagttaat gaaacacaca ccgcagctgt taaaacttat ataaatatat     13620
     tttctgtttc caaaattata aacttgtaaa ataaaaccgt ttcaaaactt tcacgatcga     13680
     aaatatgatg cgtgccaaaa ggacgtcaga atatatttgg aatatatttg gaatatattt     13740
     gaaatatatt tggaatacat ttggaataga tttggaatat atttggaata gatttggaat     13800
     atatttggaa tatatttgga atatatttga aatatatttg gaatatatca gtttccggta     13860
     atttttgttt gtccgctaag atactttgtc acccaaaagt ttgttatcac ggagaattga     13920
     tcaactatgc ttgatttatt gcttttatac cccttatgat cctttgaagc tgaaggatca     13980
     gatcatcagg aggtacccat ctgatccttt gaagctgaag gaacagatca ccaggaggta     14040
     cccttctgat ccttcggagc tgaaggatca gatcaccagg aggtaccctt ctgatccttt     14100
     gaagctgaat aatcagatca tcaggaggga tcattgttca tacattcaat tgtgagtagt     14160
     caaggccgaa aatccatgga aaattgcatt taaaaactta ttccagtgaa aaaaaaacaa     14220
     aaatcgattg agaaatatat ataaaaaact agttgaaaaa gtttgtcacc gaagatacgc     14280
     ccggtcagag acaaatggca ctttgtcgac tggataccat gtcactttgg atactttgtc     14340
     cccaaaaata ccttgccacc ctaaaagttt gtcccctcgg aatgaaggcc attttgatgc     14400
     atctcaatca tctccagatt ctttgcaaga agatcattac ttggtgctgg aggcggagac     14460
     agagcaagag ctctgcgtgg agggcgtcgt tcttcttttg gctgaaactt gaagacatga     14520
     caacaataac gtcgcgtatt gcactttttt gagaacaaaa aatccacatt tcatctggaa     14580
     aatatttttt gaaaaacagt aaagaagaaa aagaaggaaa tagaaaacca ttggaacacg     14640
     aataaaatgt gaaaaataaa atcatttccc cgtttcattg aagcaaaagt attatgtaac     14700
     agagttaaaa agtgatggga aagtttggcg aactagtatt gactagtagt ataatagtgt     14760
     tacaagcata aagttcaaaa caaaagatga aaatttaagt aaaaaaaaat tctatttaat     14820
     gtacatggaa cttttgatgt ttatttctct gcgagcttct caaaagtcgc aggacaggag     14880
     ttttcggctc ttccacgtgt ggtgaaggtg ttcgttgagg cgttcctcta atttgcacaa     14940
     cagctttggc aggcggtgcc agaaaacaga agcgggcatt tgtcgatttt gcgatcggta     15000
     tctcagaatc cattgttcct tattttatag agtttctatg tgcatgaacg gatttcaacg     15060
     aaagataggt atgatggcaa cacgagcaca ccgtcggttg agtgatgtga tgcacatttc     15120
     tcatgtgctt cctcacatca tcggctcgag tcatcacaat ttggcacatc aggcattcct     15180
     gtggtgtcat atgatacttc aatcgatgat ggtttagtgc cgccaagtcc ttgagcttag     15240
     aactgcagac attatgcaac atttcttcca tattctccac ttcgacgtct tctccatctg     15300
     gttttgaatc gatttccatc acaaagagat ttttgaatcc ttcgaccagt gttggaaatt     15360
     tagtgaattc ctggctgaag gcatccgaga ttttgtgggc ggtatcggtg gacacgatta     15420
     gaacactctc acggactttt gagagttgcg ttgctaatga gcaactgcct gtcgtctttc     15480
     cgacaccttt tcaggctaca aaaatccgtt ttagcgtttt ttgttcgaga atattctcga     15540
     tagaggcttc caactgatct accatgctga aaaaagtatt tattgtattt gaaaaaataa     15600
     tcaaattgat tttggagcaa taccagagaa atggagaaat acggagagaa gcaaatagat     15660
     tttttgttaa tttttgcagc taaatataag aatgatatca atgtacttga aacattcaaa     15720
     aatttcataa aagattaaca gaaatttttt aaattttaac tattttttca aattttttaa     15780
     acagttttaa atgtattttt gtcggttttc agtgaaattt ttgttaaaaa ataagaaaat     15840
     taagaaaaaa agctaaaaat gacttttaaa aaaattgaaa ttcgtttttt ggcgcaaaaa     15900
     gttaaaggga catgagattt cgtagggagc gggtctcgcc acgattcctc ctatttttat     15960
     ttttactttc aaacgaaaca acgaagctcc gaaataacgc attcgtgata aatttaataa     16020
     agaaattagc agcaaaacag caaaaaatgc gaatggaatt caaatacgaa gcaaggcgcg     16080
     caacacacta taaaaattga tcaaaattac gcagcaaaga cagtttaaaa ctacagtaat     16140
     ctttgaaggc gcacatccgt ttgtatttaa cagacatttg tcgtgaccag ttaccgtact     16200
     tttagcgctc acttttgtgt ccgggctaat atcttctcac cgctggcaaa cataataaaa     16260
     tgaaaattca cctgaaactt taaaatttta tttattttct agacagtcag taaaataaaa     16320
     aatagtggag tataactgac aagggtttcg ttatttggct cgtttttctc gaaaactgat     16380
     gatgatgatg atgacaatga ggaagaaaat agaattttgg cacattcgaa ttatcaaggt     16440
     tgaactactt ttaaaaaata agaaaaatgg ggatgtgtct catgatcggg tacaattttg     16500
     aaaagacaca aagtgattga agaaggtggg gagagagaga gagcagagat gagagaactg     16560
     agaatattca gaaaaacaaa aactgacggg accggttggc gtttttttgg acaaaatgag     16620
     acgcttttag ttattttctg ttcgatacag ttccagctag tgctccactt tcgagcataa     16680
     ttgtgtgaaa ttgtttcata tgaacttcaa cgtagtcttg gaagaatgcc acgttgcggg     16740
     ggtgaatagc ggtccgaatt tcagatatgg cgtcaccaag tgattgaaga tcaactgcag     16800
     agatcttttg agttcccatt gtgcgaacct ggaaaaatat aatatttttt ctaatatttt     16860
     tctgcagtaa aaaaattttt taatagtgtt ttaccgatga ccaggtaatt ttgaattcta     16920
     ggaaacaatt ttagtttttt ttttgtaaaa tagtaatttg taattaattc taatgggacg     16980
     atgcaagtga acacgtgtat tcagctcgac caacgcctcg aaaattttca aaaaaggcgg     17040
     gaaaaaatat ttgaattcgc caagaggaat ttcaccgcag cgcgtgacgg tgtttgcaca     17100
     aattacaccg aatggtcgag ctgaaaacac gtggtgaatt tctcgtaatt tctcgacaca     17160
     ttttttgcaa tgcaagtgcg cggagaaatg acgagaaatg tcgtgaaatt tgcaatttct     17220
     ccgcatttct cgacatatga tgaacggtga gatacgcaga aacatgtgtc cccgcaggaa     17280
     actccgccta ctcaccgcac ttttaacagg gtgaaatgtc ttaccaccct gcgaggacac     17340
     atctcatatg tcgagaaacg cgtagaaatt gcgaatttca cgacatttct cgtcatttct     17400
     ccgcacactt gcattgcaaa aaatgtgtcg agaaatgacg agaaattcac ttgcatcgtc     17460
     ccataatgaa attaggaaag aggatttggt aaaaaccgaa gtttattttc taatgaattt     17520
     ttacattttc aatttttttt ttcattaata aattattatt ctgcagtcta tagtgccaca     17580
     aacctgtaaa aggacagctg tcaatgattg aataagtgtc aacgcatgca cattctctac     17640
     atttaatcct tgattacagt gctctacaaa tcttccagct tgttgagagc acatttgtct     17700
     aactgcttca ggtttcatat ttgacgttga aatctgcaaa caaatagatc tttcgaagaa     17760
     tcaggaaatg aaaaattaca tcattcgaag agaaatacat atggtgatct tgaattccat     17820
     tcatattgat atctatattc tgattcacat gttccagatc gatgatagtt ttggcgtatt     17880
     tctcctgaaa aaaaattgtt ttttagattc tatctagttg actttttcat atatcaaaaa     17940
     aaatttctaa ttaaaaatgt acctgaaaag ctttcgaata tttgtctgac gtcatatttt     18000
     gtatctcggc atccgcattc aattcgttca attgtcgtat caatcccttt ttgatatcaa     18060
     ttaatttcgt cagtttcaca agattcacaa ggaatttcag cgggaaattt ccaaccattt     18120
     ctgcattttt tccatttaat cgttcgtcgt tcggtcccat taatggtcca ccacttctct     18180
     cgatttttcg agaaaccagg acgtcacgaa caagatgtgg atgtgatgag tcacgaactg     18240
     ctgctacaaa tggacgaacg cctgatggaa gcttagagtt ggcttgttca atgaagtagg     18300
     cgatactcaa caaatcaagt tttccgtcga gaagtatttc cgtgtcacta accagtgttg     18360
     gtgggatatc tggctgaaag aataaaacat tggaatttat agaatttcaa atattcaaat     18420
     ttccctaaaa caaaataatt tatgatccaa aactaccgaa tatagtaata ggacgtctta     18480
     atttccaaag acttcctatt ttcagctaaa tcattaaatt ttgtcaattt ctcctaacac     18540
     tttttattgc atattttggt agtaattcga tgatttgagc acattttaag tcgataagaa     18600
     tcctactttg atatttttgg tgtctatcga cttaaagtga tcctaaatca tagaattaaa     18660
     gcgaaataaa ccactaaaat atgcaataac tgttgaaaat gcaataagaa ttgcattcca     18720
     gcatgtacaa aatggacaag ttggcgaagt tcacgaattt agctgaaaat aggtttgtgg     18780
     cgaaatttta agacatctcg ttacaaaatt cgggcgtttt gggtgatatt gagtctcctt     18840
     ttacaaacct tgtcaaaaat aattctgaat cctttcggaa tgacagcatc aataattcca     18900
     gaataaattc catcgtaggg atttcgaatt ctcgcaaata cacgatttcc aaccaccatt     18960
     ggacgtggaa gcttggctgg aagatctttt agatcaatcg atggatcctg aaagaacatt     19020
     tattgaaaat gatacacctc ttcagcctta cgttaagata acttccttca tagacacttc     19080
     gaatcttcat tcttttctct tccaggtaca ttctttcttc ttcaaaaaac actttcgagc     19140
     atctacgtgg ctttccgaga agttttcgaa tcgaccgcca ctcaatacgc gttaaattcc     19200
     aatttttcag atttgggaaa gattcgcgga taattgtggc aaactcgttt tcttctttga     19260
     aaatttgttc gtcgattgca gaatagaaga actcgcacat gacccattga cgagctttct     19320
     tatatcggag caaattgtag agtttcttta tattagctct cataaatgtg ctcacatctt     19380
     cacttgtttg atttttatac gttttgaatt gtttcatcat ggcacttcgt tcttgatctg     19440
     tactgaacat gttgaagaat gactgtgtat ctcgatgttc tacagcttca tttgtcatat     19500
     tcgcaggatt atctaaatca tcaagacctg ctacaaggtt ttgatgcatc tcaatcatct     19560
     ccagatcctt tgcgagaaga tcattacttg gtgctggagg cggagacaga gcaagagctc     19620
     tgcgtggagg gcgtcgttct tcttttggct ggaacttgga gacatgacaa caatacaatt     19680
     gttttaaaac ttacaatata ttccaaagca caactggaag attcataatc aagagctgcc     19740
     tttgcgagca ttgttagact tgagtttcgg gtcaatgagt tcactgaagg agaatctcta     19800
     cctccattca ggcgtttcgc gggagatctg taaaatcata agattagtcg gccacttttt     19860
     cggaacagct tgttactttt tgggagatcc ggtacgtttg atactgcgag acggtgatag     19920
     gtatagttct tcattacgat atctcgatgg aactttagat gtttcacgga gactgtatgg     19980
     tgagctggtg cgatcctgaa aataccgaat gtcatgcata ctttcaatat ctttctttaa     20040
     tttacaactt ctttattttt aaaaacacga aaacccaata aaatcaatat ttccaataac     20100
     ttacaggatc agacgtgtca cttgctgcct ttttccgcgg acttctcacc gcagacgaca     20160
     tttttatctg aaaaataaca aatttttgaa taatttcaga ccacgagaca aaaatcaatg     20220
     aaagaatgcg gacgcgcgcg cgcgaaaaaa actttgaaat ggcggttctt ttccccaacc     20280
     aacagccgat ttcaaacagc gtgatggtct cgacgcgatt gccctgcggc agtgtagcga     20340
     ggtacggtgg agcgctgtct gttggaaaac agaacacagc tgagagaagt gaatgtggtg     20400
     ggaaacggaa aaaagggaga gctgctgttt gacagtcgaa cgtcgtgaca ttccgttttt     20460
     ggattttctc gtgaaagttt tttttttttt tttatttgtt ttatttctta tttgtattga     20520
     ttttccatct ttcctgggtt atcattaaat tttaaacatg gttttacaca agatcatgcg     20580
     gtgaaacatg tttttttctt cctttccgca tttaaaacga attattttgt ttatattgtt     20640
     cttctctttc cattctcatg attcatttct ctccttattg gcaagaaaca ttataaaatt     20700
     gttcattcct actaagtgtt taccaaaatt tattttggcc gcaaagtttt aaaattgtag     20760
     aataaacttt tcattaaaaa tatttcgtct tcaatcactc atctttgttc cgaaaacatc     20820
     tcacaggttt tttcttcaaa gcaatattct tctttagtgt ttttagtcag cgtttttcgt     20880
     tctggatctg gattctatgg tttgatgtta ctttgaaaca ctatttataa aatctttttg     20940
     caaagaaaca attctcttaa atttaataca atttccgcat caaaattgaa gtttttgtgc     21000
     aaagttgacc tctcgcagcg taatcttatc gttttttcgc gttatcacca ctcaatctcc     21060
     cccactgctc tacaattatt tcatttctct caaccttttg atcgaatcga ttgaatttca     21120
     taatatccac gaaatgtgag tcgcccaatg tttacgtttc tccatcctat aacactgctt     21180
     acaaatggtt tcagtgttca aacattgcgg tgaatgaggc agacaatcag acattttctt     21240
     tcttttaaaa cctgtcctgt tcatttcttc ctcatctcct ttaggttttc ttattcgcca     21300
     tctgaaagtt tatttctctg cgtctagcta ttagactcct ggagaattac gctctaatgt     21360
     cgatgacgtg tcggctgatc gattagattg cgcaaattgt ttctttagtt ttttctagat     21420
     ttctctccct tttttcatga tattccaatg gagcacgttt gagcgcatgc tctcttcttg     21480
     ctcagtgctg ctccgtatcg atccctctcc gtcaatatct ggtcttcggt cctgaggcct     21540
     tcgctcctag cctcgtgctt ttcttaaatg ttttctctcg aaagaagcgt ttttgatttt     21600
     tttttccttc ttatttttga aatcttcata ttatttcatg gaaattctta cagaatcaac     21660
     tagaatgggt gattacgtga ctcccggcga ggagccacca caaccgggca tctatcgaag     21720
     tgagcagatg tgcctggctc aactctacct tcaatctgat gcttcctatc aatgcgttgc     21780
     tgaactggga gagctcggac ttgttcagtt tcgtgatgtg agtttgtgat atgtaaaaaa     21840
     ctattttcaa ttaataattt taaaaaaaag taaaacttca atttatttta attttcagct     21900
     taatcccgat gtgagctcct tccaacgaaa atatgtaaat gaagtcagac ggtgtgatga     21960
     aatggaacga aaattgagat atcttgaacg agaaattaaa aaagatcaga tcccgatgct     22020
     ggatactggt gagaatccag atgctccact tccacgagaa atgattgatt tggaggtttg     22080
     ttgaaaaaaa aatataggta tataaatatg tgttgcaatt tcacggtcta ttttttttga     22140
     atgtttaatt tttaaaaagt ttttaaaaat tctttcttac aggcaacatt cgaaaaactc     22200
     gagaacgaac ttcgcgaggt caataagaac gaggaaacgc tgaagaaaaa cttttcagag     22260
     ctcacagagc tgaaacatat tttacgaaag actcaaactt tcttcgaaga ggtgagaatt     22320
     tcatgttttc tcatcatttc caaattctct aacatttttt ttcacaaatt ctccttttct     22380
     ctctaattct ggcatgcttt tcgagaatag ttaaacaccc taacataatc aaaaaaaaaa     22440
     tggaacttga tcctataata ttttttattt tctagcagat gtagtatgtt ttgtgcctca     22500
     cctatttata gctataatat tagtatagtt gctctcctca ctattcggtt cgtcacacag     22560
     gttgatcatg atcggtggcg aattctggaa ggcggaagtg gacgacgagg acgttctaca     22620
     gaacgtgaag aaacgcgacc ccttattgat attggagata tggacgacga ttcagctgca     22680
     cggatgtcag ctcaagctgc gatgctacgt cttgggtatg tggtcctagg caagatggac     22740
     agaccagaaa gcgccaccat cgcgaaacga gacctagttt atgttgtctt gttcgtatcc     22800
     ttctcctttt gcatcccgtt ggtgtttttt cctgattctt ttctggtaat ttaattaatt     22860
     ggtgctttta agcactagga aaatttaaaa tgactcctaa tctaatatct tcccacatct     22920
     ttctctctcc ttaaatcctc ccctaaccga ctttccttat ccttctatgt tccttttccg     22980
     taaaatctcc ttcactaaca caggccggga ctggagaaat gttgccacct gctgcagtcg     23040
     aatctgaaga aggccttgaa ctgactcaac atgccgccgc tggcggagcc acaatgttcg     23100
     ccaattttgg gtgagacttc tgctcctact cgtcgttgta tcgttcattg tcgcacggtt     23160
     ttgctttcga ttgcttacac ttctttcctt ttctatcagt atctcatgtc tctatcctgt     23220
     agcttgtcgt ggtgtgccag agtttaggtg aatcggtcac tacatcccca acataacttt     23280
     ggaaagaatt tattgaaaaa agccaagggt aatctaaatg tagtattgtg tttgtttgat     23340
     tctgcagcac gaagacatga ttgcctcatc agcggaaagt tcgggaattg gtgaagtgct     23400
     cagtgccgac gaagaagagc tttcaggaag attcagcgat gcaatgtcgc cactcaaact     23460
     gcaattacgg taggatcagg cttattttgt tgtctttttg tcttttcata tcattatgta     23520
     ttgtgatggt ggtgtctttt caaagcgagc gcgttaaaag atgtgtccgg cttggtttct     23580
     tagtttttag aacatgaaaa tcatcattta cttaaatttt tgattttaga tttgttgctg     23640
     gtgtaattca acgggaacgt cttcccgcat ttgagcgact tctttggaga gcgtgtcgtg     23700
     gtaatgtctt cttgcgaaca agcgagattg atgatgtact caatgatacg gtcactggag     23760
     atccagtcaa caagtgcgtc ttcatcatct tcttccaagg agatcatctt aaaacgaaag     23820
     ttaagaaaat ttgtgaaggg tgagtttccg taatttctaa aatcagaatt ttattcaaaa     23880
     cataattttt cagattccgc gcaacgcttt acccctgtcc tgatactcca caagaaagac     23940
     gagaaatgtc aattggtgtg atgactcgta ttgaagatct caaaactgtt ctcggacaga     24000
     cacaggatca tcgtcatcgt gttcttgtcg ctgcatcgaa gaatgttcga atgtggctca     24060
     caaaagtacg gaaaatcaag tcgatctacc atacactaaa ccttttcaat atcgatgtta     24120
     cacaaaagtg cttgatcgcc gaggtttggt gtccgattgc tgagcttgat cgtatcaaga     24180
     tggcgctgaa acgtggaaca gatgagagtg gaagtcaagt tccgtcaatt ttgaatcgaa     24240
     tggagacaaa tgaagctcct ccgacataca ataagacgaa caagttcaca aaaggattcc     24300
     aaaacattgt tgatgcatat ggaattgcaa catatcgaga aataaatcca gctccataca     24360
     caatgatctc gttccctttc ctttttgctg tgatgttcgg tgatatgggg cacggagcca     24420
     tcatgttact tgctgctctt ttctttattc tcaaagagaa acaactcgaa gcggcacgaa     24480
     tcaaagatga gatcttccaa acattctttg gaggtcgtta tgtgatcttt ttgatgggag     24540
     ctttctcaat atacactgga ttcatgtaca atgatgtctt ctcgaaaagt atcaacacat     24600
     ttgggtcatc atggcagaat acaattcctg aaagtgttat tgattattac ctggacgacg     24660
     agaaacgatc agaatctcag cttattcttc caccagagac agcttttgat ggaaatccgt     24720
     atccaattgg agtggatcca gtttggaatc ttgccgaagg aaacaaattg tcattcctca     24780
     actcgatgaa aatgaaaatg tccgtattat tcggaattgc tcaaatgaca ttcggagttc     24840
     tcctctcata tcaaaatttc atatatttca aatctgatct tgatattaag tacatgttca     24900
     ttccacaaat gatattcttg tcatcgatat tcatttatct gtgcatccaa atcctttcaa     24960
     aatggctatt cttcggtgct gttggtggaa ctgttcttgg ctacaagtat cctggttcga     25020
     attgtgctcc atcccttctc atcggtctca tcaacatgtt catgatgaaa agtcgtaatg     25080
     ctggatttgt ggatgacagt ggtgaaacat atccacagtg ttatttgagc acttggtatc     25140
     ctggacaggt aagcttaatc ctccccatgt ctttcaggtg tttggatgac tgatgttgat     25200
     gaaattgaag agaaacgatg tttgacatga cgatgaataa aaacaaaagc aataattttt     25260
     ctatttaagt cgttcttcga aacaattttc gtcctggtag cgatcgcgtg cgttcccgtt     25320
     atgctattcg gaaagcctta cttcttgtgg aaagaggaaa aagaacggcg cgaggggggc     25380
     catagacaat tggtgagcta ttataataag aaaattgttt aaattagcac gcacccgcct     25440
     tctactgtcc cgttactttt tgttgtgttg tattgttttt attttgtgag aagatcgact     25500
     ttttaaaaat aattttggag aacattttgc ttcattcaaa attttaattt tcacgaaagt     25560
     tttgaatcgc aaaggccatc aacatctgaa aatgctcctc gtcaaaatat accagattat     25620
     attaacccag acgcgaaatt tttgctccaa aagtatggta accggtctcg acacgacatt     25680
     ttttgttaaa tgcaaacgtt aaagagtact gtagcttcaa aatttcagaa ttcacatttt     25740
     tattttttaa aactaccata aaacatctat aacataaatt ctaccaaaac aaaactacag     25800
     tactctttaa tggcgcacac atttttggat tttacacaaa tttgtcgcgt cgagaccggg     25860
     taccgtattt ttagcgcaaa ttttgtgact gggtcaatat cacgtcaata ttattaataa     25920
     cacatcaata attaattaat actgtgggaa tattggttgg tgatagttgt atatcctatg     25980
     cgcttgtctt attcggcatg ttgtaaatat tcgtcgttgt gtcatgatca tcatctcttc     26040
     gatcttcatc aacaccgtct tcaacaccgg atcggctgaa accaacgaat cataaaaatg     26100
     cagcaagcat gttccaggca acaatcgaaa taatacttgt ggtgttggcg ttggtgcagg     26160
     ttccgattat gttgtttgcg aaaccatatt ttctgtatcg ccgagacaag caacaatcga     26220
     gatatagcac tttgacagca gagtcaaatc aacatcaggt aaacaattgg tgatgggtag     26280
     tttttgcatg attgtattag ttttattctg cactttttcc aatattattg aatcgacacc     26340
     aattttatag gctaatgttt ttgaattcag agtgttcgtg ctgatatcaa ccaggatgac     26400
     gcagaagttg ttcacgcgcc agagcaaact ccaaaaccaa gtggtcacgg acatgggcat     26460
     ggtgatgggc cacttgagat gggggatgtg atggtgtacc aggctattca cacaatcgag     26520
     tttgttcttg gatgtgtgtc acatactgct tcataccttc gtctttgggc tctttcattg     26580
     gctcatgctc gtaagtaaag aaaataatag aaaatctcaa agaagaactg atacgttaaa     26640
     aagtaaaaaa tttttgattg tttaaaagcc taaataataa ttatagaata gaaaacccta     26700
     aaattatttt accgtaaaaa cgaaacaatt atcgaaataa attttatttt ctagagctct     26760
     ctgatgttct ctggacaatg gttttccgta atgcattcgt tttggatgga tacactggag     26820
     ctattgccac ttacattctc ttcttcatct ttggatcgtt gtcagtgttc attttggtac     26880
     tcatggaagg tctttccgca ttccttcacg ctcttcgtct tcattggttc gttttctaat     26940
     tcaaaattag acattattaa gaaaccatga gttcatgaga atgcctactt gccggcgcga     27000
     aacaagcggc agcagtgaga gcatgcggcg acgagagatt taggtgcctt cgctacgaga     27060
     tatttccgcg ccaaaacggt agccattctc atgaactcat gatttcttaa tacacagtca     27120
     tttactgata ttcaataatt ttcagggtcg agttccaatc aaagttctat ggagggcttg     27180
     gatatgagtt cgctccattc tcattcgaaa aaatccttgc tgaagagcgt gaagctgagg     27240
     agaatctcta agatcacctc ggccacttca aacagtgtga catcgacgtt cgacaaatct     27300
     ttaattattt atttctagta gatatatact tctatttgaa tattgtgtcg tgttgtgctt     27360
     ttttcttctt gtgtttgtgc atagagtttc ccctcatccc ccagccatct cctttctcta     27420
     aaattgttcc attttccttt cggtgaccag aatctgaatt ttcttcttct cgcattttta     27480
     aaattcatct tattttcttc taaattcttg cttcctgtct ctatttcttt tcatatttca     27540
     gtctagttct cttctattgt gatgacttta tgtatttctt cttaatttat tccttttctt     27600
     gaaagtaccg atcgctcggg atttccattt tcgccaatat tttgtatttc ggtattgcaa     27660
     gctttctaat catttagtaa atcatatttt tattttaagt tttttctttt cgtaaattta     27720
     gtttgtctcg aattttcgat tgccgatcgt catcgccact aaccgttgaa taaataagtt     27780
     gattgcaaac aaagtggaat cgctagctcc atgacaagac agtaaatttc tgaaggctat     27840
     agtactatta cacagacgcg aaatttggac tatttttgct ccaaaaatac gattccccgg     27900
     tctcggcacg aaaatgtttt gtaattgtaa actaatgtga gccttcaaag agtacagtag     27960
     cggaatgttc acaatttttg gctatgtatt tttttaacaa ttgaagcaat caaaacatat     28020
     tttaacaaaa aatacgggaa aaattaaatt cgcacacatt tttgtcttta acgaaagatt     28080
     cttgcgtcaa aaatcgcaag tttttgcctc agagtaataa taagctaaac attttaaccc     28140
     ctcatcacaa gtggaagctt acaaaaaata aaaattttgc agagaaatgt caaagaaatt     28200
     gaagccattc gaaattttag aggattcgtg tgcatcagta tgtatttggc ttaacggtga     28260
     acctacggca atcagcaatc gcgctgaaaa tttatggaat aaggccaaat atcgagttgc     28320
     aactgatgga gctgttaatg agattcttaa aaggtgatct aggatccaga aattgaaaat     28380
     tatcgtaaac cgagttttgg atttcagaaa gagtttcgtc gaatggcctc atattatctg     28440
     cggagatttc gattcaataa ataaacagat tgatacaaaa aatgcaaagt tagtttaaat     28500
     tctactgaaa ttaaaaatta atataggcat tactcaactt cattgtaatc gtgtttcatg     28560
     tttgataaca tcttctatta atgagcaatg atagaattac tgtagggtta ctgtagtgat     28620
     cacaaagaat tattactgta gcggctgttg aatattagct aaaagaatat ataggcgtga     28680
     acgttgaaaa taaaattaaa atattattga gttgtgtttt taatactgga agactgaaag     28740
     ctacaattcg ttgagaagag tgtattgacc aggtcataat aatgattttg cacttttttt     28800
     ggtatttctg gcttgccaac taaatgttat tcattctgtg ttcaggacta aaaaaataaa     28860
     aatattttgt cgaaaattgt tcttaatgtt gttttagagt cgtccatctg cctgatcaag     28920
     actacacaga tctctcgaag agcgttcagt ggtgcttaga gcagaaaaca ctaacaagct     28980
     gggaattcga gaatatcgtt gttctaggag gtctcaatgg acgatttgat cacaccatgt     29040
     caacgttatc atctttaata agattcgttg attctcaaac tcctgtgatc gttttggatt     29100
     ctagaaattt ggttctcgct gttcctacag taatccttgg caggcctatg tgaacattaa     29160
     gagttaaatt cagggggatt caaatcttga tgtcaatctt gaaatgacaa caaaaatgtg     29220
     tggaatcatt ccaattgttc aaaaggagac aatcgtcagt tcaattggac taaaatatga     29280
     aatgggtata atccaatgtt tcaacatcat ttctattaaa cgtttccatt tcagaaaacc     29340
     ttgctcttga atttggaaaa cttatcagca cgtcgaatga agttaccacg agccaagtat     29400
     ttttgaaatc ttcgtcgtct ctgatttttt caattgaact tgaaaattgg gtctacaaac     29460
     ttgattctct atagtatcac attttatggt ccctcttaat tcacaacttt tcattccttt     29520
     gctattcaac tgttctattt tctttttatt ccatttttcc tagttttcac cggtactata     29580
     taattatcta caatattata atacacttta ttccctgtac cattttgtgt tgaaaacgaa     29640
     ttaataaaaa taaaaacgaa ttaatagtat gagattaaaa ttttcatttt aaaagcaatg     29700
     ttatttgttt aaaaaatatc caattctaat gaattatctg cgaatatccg atagcgattt     29760
     caaaaatcta atgaaaattg aaattcaact ttaaatcatt tgtagatcaa ttttctgatg     29820
     cttctatcca ctttcaaacg acatctacca atcaggcgtc tcttctcatc aaataaattt     29880
     gatctgattg taattggagc aggatctgga ggactttctt gttctaaaag agcagctgat     29940
     cttggagcaa acgtggcatt aattgatgca gttgagccaa ctccacatgg acattcatgg     30000
     ggaatcggag gaacttgtgc aaatgtcgga tgcattccta aaaagttaat gcaccaagca     30060
     gcaatcgtcg ggaaagaggc aggaataata ttataaatat ttagagcact aaattcaaaa     30120
     ttccagctaa aacacgcaga caaatatggc tggaatggca tagatcaaga gaaaatcaaa     30180
     catgattgga atgtgttgtc aaagaatgtg aatgatcgag taaaagcaaa caattggatt     30240
     tatagagttc aattaaatca gaagtatttt ttttaatttt gtggaaattt ttatttttat     30300
     gaaatttaga aaaatcaatt acttcaatgc ctatgccgag tttgtggata aagacaagat     30360
     tgtgataact ggtacagaca aaaataaaac caaggtacgt ttggaaaaat gaaaaaagaa     30420
     gttttaaaaa atttgttccg tatacccaaa agttttgcgg cttttcggag gagaatacgg     30480
     tatcaggtct cgacacgaca atatagtttt ccgaaaaaac ataatttatt ctaacaagtt     30540
     gtgataaaat ctataaaaat aatctataaa aattccgtag caacaaatgt ttgagatgac     30600
     agtactcgtt aaaggcacaa cttttcgcat ttgacaaaaa tttgtcgcgt cgagacctgg     30660
     taccgcattt ttggcgcaaa ctttaggtaa taataatatt gctaggaaac ggaaaattaa     30720
     aaaatttcat cctagatttt cagaattttc tttccgcacc gaatgtagtc atctcaacag     30780
     gactccgtcc caaatatcca aatattcctg gtgctgaact tggaatcact tcagacgatc     30840
     tttttacact ggcatcagtt cccggaaaaa ctttgattgt tggtggagga tatgttgcat     30900
     tggaatgtgc tggatttctt tctgcattca atcaaaatgt tgaagttctt gtgagatcaa     30960
     ttcctttgaa gggttttgat agagattgtg tgcattttgt catggagcat ctgaaaacaa     31020
     ctggagtgaa agttaaggaa cacgtggaag tagaacgtgt agaagcagtt ggcagtaaga     31080
     agaaggttac attcactgga aatggtggtg ttgaagaata tgatacagtt atttgggcgg     31140
     ctggtagagt tccaaatttg aaaagtttga atttggataa tgctggagtg aggactgata     31200
     agagatctgg gaagattcta gcagatgaat ttgatagagc ttcctgtaat ggtgtatatg     31260
     ccgttggaga tattgttcag gtacgataaa aaaagtaaca tttttttaaa ataaaaatga     31320
     tagtattcag gatcgccaag agctcacgcc acttgctatt caatccggaa aacttctagc     31380
     tgatcgtctt ttttcaaatt ccaaacaaat agttcgattc gatggagttg ccactacagt     31440
     attcacgcct cttgaactct caaccgtcgg gttaactgag gaagaagcca ttcagaaaca     31500
     tggagaagat tcgatcgaag tgtttcattc tcattttact ccgtttgagt atgttgtgcc     31560
     acagaataag gatagcggtt tttgttatgt gaaagccgtg tgtacaagag atgaatcgca     31620
     gaaaattctt ggtcttcatt ttgttggacc aaatgccgca gaagtaattc aaggtaattg     31680
     attcaaaaag agaaatagtc cgccccgccc gtcacgaaaa tgttttctga acaccttcaa     31740
     ttttggaaca atgttcgaaa aaccataatc tgttcgcaaa aacttacgtg ctaaatctgt     31800
     tattttgaat tttttatctt tttctttatt gaatgaataa tattacacat acgcaaaatt     31860
     ctgctatttt tgcgccaaaa atacggcttg atacgacaat ttttaatgca aagaaagtgt     31920
     gcacctttaa ataatactga aaatttaaac tttcgctgct gtagaatttt tatcgatttt     31980
     ttaaagattt aatcacaact tgagacaatt aataaatttt ttatcaaaaa gctttaaaaa     32040
     tctacaaaat ttctgcagaa tcgagagtct gaaactacag tattctttac aggcgcgaaa     32100
     aaattttatc gtgtcaagtt caggtaccgt acttttggca atcaactcac aatattctgc     32160
     gggtaggtaa tactaacaac ctcgataatc gatcaagata cgaaaacttt aaaagctaac     32220
     cgattgcact aaattatttc aggctacgca gtagcattcc gtgttggaat ttcaatgtct     32280
     gatcttcaaa acacaattgc cattcatcca tgttcttctg aagagttcgt gaagcttcac     32340
     attacaaaac gatctggaca agacccaaga actcagggat gctgtggata attcaaaaag     32400
     tttattgaca aatcattcag tttatttatc aaagttaatt tacatcctat tatcctggat     32460
     actagtaatt ataattaaac ataataaata gtacaaaata tttgattatc ctttttaaaa     32520
     gataccggga actacatatt cttaatgcgc atcgtgctca tggatgggat cacatgtctg     32580
     acgaagtgtc gaaatacgag ttccagaagt tgttagaata gatatcacag atgttgttga     32640
     actccatttc ttcattggct tcgaaacatt cttcttatgg aactggtgct tccgaagctc     32700
     agccttataa cgatcatcaa acatgattac ataattatct ggctcacaga gttgtactct     32760
     ttgttccttc tctaatcccc gcgtgaaagc gtaaaagttt ttataacctc cttccaacaa     32820
     ataaatctcc tcataatcac atctcggata gatatttgaa ttcagttttc tgtccacttc     32880
     ccgaaggttg ttcgccatgg ttggtccacg tttttgactg tattcacagt agaaaatggg     32940
     tatccggttg attttcttgg aaccatcttt gttgaagaag aagtctgcag cagtttctgg     33000
     attgaacagg ctttgagctc cctgaaaaga tttgcagttt taactttctg gtattttttc     33060
     aaaacagtta ttataattct tttttctgaa acgcacactt aaaggcgcat gatttggttt     33120
     ggaagggtct tgccacgaag gaaagtagat tttttattaa ttctaaaatt aaatgtgttt     33180
     tctgtttttg acagaaccca ttagaacgga ctcatgattc tttaagtacg agttttaaga     33240
     agtacagtat cccattctca tatggcattt tctctcgaaa gagtctattt attgaaaaac     33300
     taaaatgata cacggacacg aagagagaat ataaattacg agggttactg taaacttaaa     33360
     ggtacacact aagactttgg agtctggaaa cgtagtacaa acggcaaaaa ctaaccttaa     33420
     tatgccctcc attatattca taatcatatc ggcaatcaat tagaatatat ttctgcataa     33480
     actcaatttg cgatagcttc tgcatgattt caattaacgt ttcagaagtg attttttggt     33540
     atacggtaga acagctaggc gtcacggttt ccaaatgata atccacttga agatgggcat     33600
     tccatgtctc aatttccgaa gttgaatggc tcttttttga gaaagttagt cttttcttta     33660
     tcacaatttc agaagtattc gcagaatccg ttccagatgt atatcctcca tcaatgcttc     33720
     gtttccgagt gggtggcgat gagttggaga tgtggctgat cgcagaagag tgttgacggt     33780
     tttgtctgta aattatggat ttattgatat cgaacacaaa taatcaacta accttgggaa     33840
     tagcttcgag gatccttcag cacattcaga acatttcagc cggagcccgt cattgcgaac     33900
     aatgcagttt tcacatggaa cgtcaacgca catcaggaga cttggagcta gactgaacta     33960
     ggtatacctg aatgaaagaa tgcaatagaa tggatttgaa gactaaatga aaaaagagag     34020
     actgactagt ctagtttaat atgaattgga atgggatcag tagaaaaccc taatgaacac     34080
     tcaataaaat aaaacattat tttagcgcgc aatgatcatg gaccctcccc ttttatatgg     34140
     tccccctcga gatcgatata acctatataa aatggggcgg gccgttctcc tgggaagaca     34200
     attgatctcg caattgtgtg ccaaggtgtc gtgttagtgt ggcgatgtgc acctatttcc     34260
     gggagtgaga atttgaccta cgattgtttt cacctttaga gcgggaatta gacaaagaga     34320
     atatgagtag attcgactgg gaagttttga ttctgggaag aaacggtgag aattgtctct     34380
     aattgtattt aactttgaac aattttaaat aaaatttttg gtataaggtg tagaatatgg     34440
     cttgtgggca aaacaattga aaatcattaa tttgatggat accataataa tttttaaaaa     34500
     attggaaaag aaaaaattgg aaaaagaaaa tttccaccta taaaaggaaa cgaaaccggc     34560
     ttccaggttc ttgactgact cttaacatat ctagatcaga aagaaccatt ggtatttcaa     34620
     gagtgaaatt ttttataacc attcctttgg tgaaaaatac attctatgaa actattgaaa     34680
     gctcctaaat ttttgataaa cttttaaaat caaaatcact tcaacaaggt gttcgttctt     34740
     ccaacagctt tctacgttta ttgtacaaaa tacactttca taaaaacgaa tagtcaaact     34800
     ttcaattagt atttttcaat caatgtcgac ttgataaatt gacaaaaatc aaaatgccga     34860
     gttatttttt gagaaactta aatcttctgt tgtcaaatta tacgcgacaa actattaaaa     34920
     taacagtagt gatactagtt tagggtattt catatttggc tacagtattc tacagtgttc     34980
     ctactgggat aacggaacct aaggttctta gaaattaatg tcaaatatgc gggtaatcca     35040
     gcaaaatttc catttttcac tgtctcatta atattttgta aagttttatt tggatggttc     35100
     aggcaccatt tggcccatgt aaaggggtgc ttcttttttg aaaactattt tccaactgtc     35160
     gctactctac ttctaaaaca gtttttatat tattcttcga gtcatttgaa tttcgaatca     35220
     ctgtttaata caattgaaaa taagatttat tcaaactacc tacagaacaa aaaaatcaat     35280
     agagcaacaa tgattttgaa gattagagaa cacttttaca attttcccac atttacaact     35340
     aactcttttc cggtatacag ctctgtacat tctcatccag atatagattt aagatgtcta     35400
     aggtgtagtg tagtcttctc atattttctc ccatctccac actcgtctca ttgtgggtat     35460
     actctctttc ttttcagtct ttcttctttt attaattcag aagatgcgag cccattacca     35520
     accacctgcg aatcaaaaac tggcagtggt tattctggat tttggcactc tgccaaatcg     35580
     ggatcccgtt gtgcagtgca tatttgaatg ttattgcgaa taatcattgg gattttccat     35640
     gaataatcct tagttcttgt ttttgcgact ttgacggtct gtaaattgat aaacaacaat     35700
     aatggcagta gttttcgagt ggcagacgaa gtggagaaaa tagtaaattg gggttgtgtg     35760
     aggatggaaa ctcaaaaatc aaaatatttt gacatttatt actgaaaatt aatcattata     35820
     tttttttgga aatttttata ttttttgtaa attctctcaa aacgaacaag aaaatcggcc     35880
     ttttccaaaa agtttctaga atattctaag tttttaaaag ctttaaaagt ctttcttcag     35940
     acccaaatat tccagacatt atcacttttt ggacatttcg caaaaatttt aactcaaata     36000
     attaatactt cataaatgga aagtttattg aacatttaaa cgtgtagcct aattttttaa     36060
     aagttgaatg aaaaaaaatc aaaacaacaa ttcaaaacca gaaatcaatt attccttacc     36120
     tttcaaaatt cgaagcaagc gaaaaggatg gaatgcgtga attgcgattg tacagtcaaa     36180
     acgatggaca atttggatca agcgattcgg gcactgctgc aacgtggcaa acacgtgaat     36240
     cgaatgatgg acaacgagaa gctgattaga gaggctcgac gtatggagga cgtccagcag     36300
     ttgaaggtat gaaaattaat gggacctttc tctggtaaat cggttctgat cgacgaagaa     36360
     gatagtacaa tcgacgttgg tacacccagc tttggtatac ttcgatgtct agcagaatcg     36420
     atttaccaga gaatttagag caattgacag tttcgaatta tgattttcag atgcaaatcc     36480
     ccaagccggt tgacaagaaa ccccgtccac cgccttcgga aaataacctg aagctgattt     36540
     cgtgcgagga aacatgcatg gatgagacac tgaaaaactc gtcgaagcca cgtatgatct     36600
     acaataagca actcggacgc gccgaatcga ttgatttcga tgttccgtcc ctgtcttacg     36660
     agagttcggt ggatatctgc tgctacgttt ccacctagaa tgaaagcatt tttttatggg     36720
     aaaagtgcgc cggcgaaacg agtccgtata cttcggcgtc ggtgtcgaat tctaaaaagg     36780
     cgacgtcttc ctcgaagttc accaagtcgg agatcactac aattaccgag ttgacaactt     36840
     ctgtaagccg gaaagccgtc caactcatca ataattactg tttcagacgt tcaaaaaatc     36900
     taataattca tcaggtggcg ctcttgttct ggacaatcat tacttgatta ataatgacga     36960
     tggaactgtg aagaaattgc caatgaaggt agtatgcctg accaccatct aataattaat     37020
     tcattaaaaa tgttgcaggt ctatgtgaaa caacgtctcg aagatggatc tcttgatgtt     37080
     caacttgtat ttttcgacga aaactcgcaa aaagtgatgg atatctccat gcttgtgaat     37140
     ggaaaaaaga ttagaaacgt tcaattttgt ggaaaagacg gcaagcttgt gaactagaac     37200
     ttcttattgt atttttgtca agtaaaagga atgaggcgtt ttgctctatc tgttctattc     37260
     tattttcagc aattcccata gcgtctgtcc tcttcactca tgtagaatca ctcatgtaga     37320
     aaagagaaac ccatgataat ccctactaaa tcaggcaaat tgtttcgatt tgtttgttgt     37380
     ggcagaggtt tggtttttaa cgaatataaa aaacaaaagg tgtaaaaata tttttaaaag     37440
     taattaaaac atctgcaaat ctcgtatgcc taaagttaag aagtttataa gtgatctgaa     37500
     aaaggtggag tatgagtatt tggaaaatag ttaaaactac gggctgaaat gtccaaatat     37560
     catagttaaa attttcaaag aatgtttgaa ttttaaatac tatagcactc gaatccctaa     37620
     agtgtctgaa tattcttatt tgaaacatga gtcggccata aaatttgaaa aaaaatactt     37680
     atgttttgcc cgccaacttc caaaaagagt gacaaaacct gacatttttt caattttcaa     37740
     aataatcaaa taaaattgac atttttttat ttgttttaca atgatatttg gccattggaa     37800
     tgccatagga atatttcaaa gcaatttcct actggcgcca cttcattttt aaacaaacca     37860
     aaacaattgg tctattcatg tgatgtttca aaatagtaag ttgtttttgt tgattttttt     37920
     tctgtatttt tttacatcac aagagtacct ttattagttt gtaagttctg attgttttat     37980
     agcatcccaa aaatttcgtt aatgtattat ttaatgtgga aaactataat cattgcattt     38040
     tgttcagtcg aatccagtcg aatcaaatga tatgtattcc aagcttgttt ggtgccgcaa     38100
     acttattccg tgcttcataa tattcacaac atttacggaa gctttaatgt aattcaagca     38160
     attcaagtgt acacaaaatg aggaaaaagt gtaaaacgct agtgtacgtg ccatgttgtt     38220
     ggtctctatt cacacgtgtt ggcaggcaat tcgaaaacga aaagatcaaa acatcagaag     38280
     tcagttcgag agatattcgg ttctttggtt catggtgaat taaaaacaag ataaatattt     38340
     tgatggcatg caatgtgacg gctgcatcat ggaaatggac aataaattga agttccaaag     38400
     tgttgccaag tacgtattaa ttttctgtga actatgtcaa aatactttgt ttattttgta     38460
     caaaaacgtt tccaagagag ataatcatta taatactcaa agctcattca aatacaatat     38520
     aaaggctcaa aacattcaga tctattaaac atgtggaaga ttggaattct tgagatgtgt     38580
     ctgactctca gcattgaatt cctttccaag tgccatccat gcggcctttt gttgatcatt     38640
     gagacatcca acagattcaa gatatccagt gaatacagtg aagaatgcca tccacagagc     38700
     tggatccatt ttgtagatac gatgacggtt gatggtttca cggacgtatc ccttgaagac     38760
     ttcttcattg gtgtagacgt tggcaaggag atggcacgca agaagaatac gttggccttg     38820
     tttgtcaaat ctggaattgg aattatttag ttttgttttg ctgataattt ccattagtca     38880
     gacacgctac aatatagcac cccgttgttt aattttaaca gctttaaaaa aattgttacc     38940
     tggaaaaatg ttttttattt cttttcctat tgttgtgcag ttaattattt attggtatct     39000
     tcaaaattga actagttatt accttcaaaa gcgaagtagt ggggtgcatt actattagag     39060
     gaaacacgtc aaattttgct aactaaaatc gaaaccaata tcaaaaagtt tacagtgtta     39120
     atactaacct ctcactcttc ttcacatcat ctgcagtgta cttctcggct cccttgaaat     39180
     agacacgaag atccgggaag ttggtgaaga aataacggta gaaggcgttt ccattctcaa     39240
     tgttttgagc ctcagttcca accattcgtc cttcaaggga cttcacacag agatcactaa     39300
     tttcttgacg gttcatcgac atttttctct gaaaaatatt tagttaaatt gggagtttgt     39360
     aaaatcttat ataaatcttt aaaaaataaa aattaaaaaa gaattagaaa taaccatagt     39420
     aaagttagaa agaaaagaga ctctagtgaa tgttttccat ctagtctctc tttctctttc     39480
     caaaatgcct caaaccgccg aaaaataacg acttttgacc agtccgcacg gctccgccca     39540
     tttcccttcc cgcctccaaa tgatgacaaa cattatgatc ttttggatgc tctgcgtttc     39600
     tgcatttcca atgttatcta acattttgga acggaaagga gtgaggcggg atttttgcga     39660
     ctctgaaggt cagtaaattg gtaaacaaca tccaaataac ggaggtaatt ttcaagtggc     39720
     agacgaggtg gagaaaagag taaattaggg ttgggtaaag atggaaactc aaaaatcaaa     39780
     acatttggaa attactgaaa atttagtatt gagttttaaa aatcataaat tctatctaaa     39840
     ctacaaaaaa taagttatag gaaaatgtat taagattaaa acggcaaagc ttcatgctca     39900
     acccctgaaa cttcaatctg taactttttc agtgcagttt tcactactct cgagacatgt     39960
     acaattgctt taaaatctat attttgcaga cttttgataa ttttgcgttg tttaagagaa     40020
     gttaaacctt tggaaacaat ttggaaattt ttgaaatcta aacctcaaaa ggttcaattc     40080
     gggtttccct tattcctaat attcgaacca tattatcact tttttgacat tttacaactg     40140
     caccattctc atttcacata tgttcttaca attaattttt aacgttaact ttccaatgga     40200
     aaatttattg aacatttaaa cgtgtagcct aatttgtttg aaaagttgaa tgaaaaaaat     40260
     caaaacaaca attcaaaacc agaaatcaat tattccttaa ctttcaaaat tcgaagcaag     40320
     cgaaaaggat ggaatgcgtg aattgcgatt gtacagtcaa aacgatggac aatttggatc     40380
     aagcgattcg ggcactgctg caacgtggca aacacgtgaa tcgaatgatg gacaacgaga     40440
     agctgattag agaggctcga cgcatggagg aggtccagca gttgaaggta tgaaaattaa     40500
     aagaggataa cctctaaagc aattaacaaa tttgaattaa atgacgtgac aactgactgg     40560
     ggaattttca gatgcaaatc cccaagccgg ttgacaagaa gccccgtcca ccgccttcgg     40620
     aaaataacct gaagctgatt tcgtgcgagg aaacatgcat ggatgagaca ctgaaaaact     40680
     cgtcgaagcc acgtatgatc                                                 40700
//
ID   X07797; SV 1; linear; mRNA; STD; INV; 1675 BP.
XX
AC   X07797;
XX
DT   01-AUG-1988 (Rel. 17, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 5)
XX
DE   Octopus mRNA for rhodopsin
XX
KW   rhodopsin.
XX
OS   Enteroctopus dofleini
OC   Eukaryota; Metazoa; Mollusca; Cephalopoda; Coleoidea; Neocoleoidea;
OC   Octopodiformes; Octopoda; Incirrata; Octopodidae; Enteroctopus.
XX
RN   [1]
RP   1-1675
RX   DOI; 10.1016/0014-5793(88)80388-0.
RX   PUBMED; 3366250.
RA   Ovchinnikov Y.A., Abdulaev N.G., Zolotarev A.S., Artamonov I.D.,
RA   Bespalov I.A., Dergachev A.E., Tsuda M.;
RT   "Octopus rhodopsin - Amino acid sequence deduced from cDNA";
RL   FEBS Lett. 232(1):69-72(1988).
XX
RN   [2]
RP   1-1675
RA   Abdulaev N.G.;
RT   ;
RL   Submitted (25-OCT-1988) to the INSDC.
XX
CC   Data kindly reviewed (25-OCT-1988) by Abdulaev N.G.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1675
FT                   /organism="Enteroctopus dofleini"
FT                   /mol_type="mRNA"
FT                   /clone="pORh462"
FT                   /db_xref="taxon:267067"
FT   CDS             75..1442
FT                   /product="rhodopsin"
FT                   /db_xref="GOA:P09241"
FT                   /db_xref="InterPro:IPR000276"
FT                   /db_xref="InterPro:IPR001760"
FT                   /db_xref="InterPro:IPR006031"
FT                   /db_xref="InterPro:IPR017452"
FT                   /db_xref="PDB:2AUL"
FT                   /db_xref="UniProtKB/Swiss-Prot:P09241"
FT                   /protein_id="CAA30644.1"
FT                   /translation="MVESTTLVNQTWWYNPTVDIHPHWAKFDPIPDAVYYSVGIFIGVV
FT                   GIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAFMKKWIF
FT                   GKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFLMIIFVWMW
FT                   SIVWSVGPVFNWGAYVPEGILTSCSFDYLSTDPSTRSFILCMYFCGFMLPIIIIAFCYF
FT                   NIVMSVSNHEKEMAAMAKRLNAKELRKAQAGASAEMKLAKISMVIITQFMLSWSPYAII
FT                   ALLAQFGPAEWVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQF
FT                   DEKECEDANDAEEEVVASERGGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGYPPQ
FT                   GYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA"
FT   old_sequence    1270
FT                   /replace="c"
FT                   /citation=[1]
FT   polyA_site      1675..1675
FT                   /note="polyA site"
XX
SQ   Sequence 1675 BP; 479 A; 406 C; 330 G; 460 T; 0 other;
     attgggttgt actctagagg ggtagaatac ctagtattcc ctaaaaagca caagcgttaa        60
     cccaagcatt aaaaatggtg gaatcaacaa cgttagtaaa ccagacatgg tggtataatc       120
     caaccgtaga catccatcct cattgggcca agttcgatcc catcccagat gcagtctact       180
     attctgtagg tatcttcatc ggtgttgttg gaattatcgg aatcctaggc aatggtgtcg       240
     tcatctacct tttctccaaa acgaaatctc tacagacccc ggctaacatg tttatcatca       300
     atctcgctat gtctgacttg agtttctcag ctattaatgg atttccgctt aaaacaatat       360
     cagcgtttat gaaaaagtgg attttcggta aagttgcttg tcaactttat ggtttgctgg       420
     gcggtatctt cggattcatg tcaatcaaca ccatggccat gatctccatc gatcgttata       480
     acgtcattgg aagacctatg gcagcgtcca aaaaaatgtc ccatagaaga gctttcctca       540
     tgattatctt tgtgtggatg tggtccattg tttggtcagt cggacccgtc ttcaactggg       600
     gagcatacgt ccccgaaggt attctcacat cctgctcttt cgattacctc tccactgatc       660
     ctagtaccag atctttcatc ttgtgcatgt acttctgtgg tttcatgctg cccataatta       720
     tcatcgcttt ctgttatttc aacattgtca tgtctgtatc caaccacgaa aaggaaatgg       780
     ctgccatggc aaagaggttg aatgccaaag aattgcgtaa agcacaggct ggtgcgagcg       840
     ctgaaatgaa acttgccaaa atttcaatgg taattattac ccaattcatg ctttcctggt       900
     ctccatacgc catcatcgct cttcttgcac agtttgggcc agctgaatgg gttactccat       960
     acgcagccga attgcctgta ctgtttgcta aagcttcagc tatccacaac ccaattgtct      1020
     actctgtttc ccatccaaag ttcagagagg ccatccaaac cacattccca tggttgctga      1080
     catgttgtca attcgatgag aaagaatgcg aagatgctaa tgatgccgaa gaagaagtcg      1140
     tagcttccga acgcggcggt gaatcccgtg atgccgcaca aatgaaagaa atgatggcaa      1200
     tgatgcagaa aatgcaagca caacaagctg cctaccaacc accaccacca cctcagggct      1260
     acccaccaca aggctaccca ccccaaggcg cctatccacc acctcagggc tacccaccac      1320
     aaggctaccc accacaaggc tacccacctc aaggctaccc accccaggga gcaccacccc      1380
     aagtagaggc accccaagga gcaccacccc aaggagtcga caaccaggcc tatcaagctt      1440
     gagaagcagg tcttttaaga attacttaga attctgtcgt agaaactgca agaaagtgtt      1500
     atcactggaa aagactcttg aacaaggaaa aacaaaaaat aacatgttca aatttttttg      1560
     tgctctttta tgaatttttt ttcttcaaat ttttatttta aatattgagg caaaatggtt      1620
     tgtcggaata gaataaaagt attttctatt tggttgttta ttttcgaaag agatg           1675
//
ID   M96661; SV 1; linear; genomic DNA; STD; INV; 4712 BP.
XX
AC   M96661;
XX
DT   09-SEP-1992 (Rel. 33, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 7)
XX
DE   Anopheles albimanus heat shock protein 70 (hsp70) gene (clone p70b),
DE   complete cds.
XX
KW   heat shock protein 70.
XX
OS   Anopheles albimanus
OC   Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera;
OC   Endopterygota; Diptera; Nematocera; Culicoidea; Culicidae; Anophelinae;
OC   Anopheles.
XX
RN   [1]
RP   1-4712
RX   DOI; 10.1111/j.1365-2583.1993.tb00130.x.
RX   PUBMED; 9087548.
RA   Benedict M.Q., Cockburn A.F., Seawright J.A.;
RT   "The Hsp70 heat-shock gene family of the mosquito Anopheles albimanus";
RL   Insect Mol Biol 2(2):93-102(1993).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4712
FT                   /organism="Anopheles albimanus"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:7167"
FT   CDS             complement(1..1506)
FT                   /partial
FT                   /codon_start=1
FT                   /gene="hsp70"
FT                   /product="heat shock protein 70, hsp70A2"
FT                   /note="carboxy terminus truncated in clone isolated"
FT                   /db_xref="GOA:P41827"
FT                   /db_xref="InterPro:IPR001023"
FT                   /db_xref="InterPro:IPR013126"
FT                   /db_xref="InterPro:IPR018181"
FT                   /db_xref="UniProtKB/Swiss-Prot:P41827"
FT                   /protein_id="AAC41542.1"
FT                   /translation="MPSAIGIDLGTTYSCVGVFQHGKVEIIANDQGNRTTPSYVAFSDT
FT                   ERLIGDAAKNQVAMNPTNTVFDAKRLIGRKFDDPKIQADMKHWPFTVVNDGGKPKIRVE
FT                   FKGERKTFAPEEISSMVLTKMKETAEAYLGQSVKNAVITVPAYFNDSQRQATKDAGAIA
FT                   GLNVMRIINEPTAAALAYGLDKNLKGERNVLIFDLGGGTFDVSILTIDEGSLFEVRSTA
FT                   GDTHLGGEDFDNRMVGHFVEEFKRKHKKDLSKNARALRRLRTACERAKRTLSSSTEATI
FT                   EIDALMDGIDYYTKISRARFEELCSDLFRSTLQPVEKALSDAKMDKSSIHDIVLVGGST
FT                   RIPKVQSLLQNFFAGKSLNLSINPDEAVAYGAAVQAAILSGDKDDKIQDVLLVDVAPLS
FT                   LGIETAGGVMTKLIERNSRIPCKQTQIFSTYADNQPGVSIQVFEGERAMTKDNNLLGQF
FT                   DLSGIPPAPRGVPQIEVTFDLDANGILNVAAKEKSTGKEKNITI"
FT   5'UTR           complement(1507..>1687)
FT                   /gene="hsp70"
FT                   /note="Location changed from
FT                   'complement(1507..(1687.1690))' to
FT                   'complement(1507..>1687)'"
FT   TATA_signal     complement(1712..1719)
FT                   /gene="hsp70"
FT                   /note="tandem overlapping TATA boxes"
FT   TATA_signal     2493..2500
FT                   /gene="hsp70"
FT                   /note="tandem overlapping TATA boxes"
FT   5'UTR           <2525..2705
FT                   /gene="hsp70"
FT                   /note="Location changed from '(2522.2525)..2705' to
FT                   '<2525..2705'"
FT   CDS             2706..4628
FT                   /codon_start=1
FT                   /gene="hsp70"
FT                   /product="heat shock protein 70, hsp70A2"
FT                   /note="single base deletion between nucleotides 3418 and
FT                   3419 predicts premature termination in this clone.
FT                   Insertion of 'N' restores reading frame and is silent"
FT                   /db_xref="GOA:P41827"
FT                   /db_xref="InterPro:IPR001023"
FT                   /db_xref="InterPro:IPR013126"
FT                   /db_xref="InterPro:IPR018181"
FT                   /db_xref="UniProtKB/Swiss-Prot:P41827"
FT                   /protein_id="AAC41543.1"
FT                   /translation="MPSAIGIDLGTTYSCVGVFQHGKVEIIANDQGNRTTPSYVAFSDT
FT                   ERLIGDAAKNQVAMNPTNTVFDAKRLIGRKFDDPKIQADMKHWPFTVVNDGGKPKIRVE
FT                   FKGERKTFAPEEISSMVLTKMKETAEAYLGQSVKNAVITVPAYFNDSQRQATKDAGAIA
FT                   GLNVMRIINEPTAAALAYGLDKNLKGERNVLIFDLGGGTFDVSILTIDEGSLFEVRSTA
FT                   GDTHLGGEDFDNRMVGHFVEEFKRKHKKDLSKNARALRRLRTACERAKRTLSSSTEATI
FT                   EIDALMDGIDYYTKISRARFEELCSDLFRSTLQPVEKALSDAKMDKSSIHDIVLVGGST
FT                   RIPKVQSLLQNFFAGKSLNLSINPDEAVAYGAAVQAAILSGDKDDKIQDVLLVDVAPLS
FT                   LGIETAGGVMTKLIERNSRIPCKQTQIFSTYADNQPGVSIQVFEGERAMTKDNNLLGQF
FT                   DLSGIPPAPRGVPQIEVTFDLDANGILNVAAKEKSTGKEKNITIKNDKGRLSQADIDRM
FT                   VSEAEKFREEDEKQRERISARNQLEAYCFNLKQSLDGEGASKLSDADRKTVQDRCEETL
FT                   RWIDGNTMADKEEFEHKMQELTKACSPIMTKLHQQAAGGPSPSSCAQQAGGFGGRTGPT
FT                   VEEVD"
XX
SQ   Sequence 4712 BP; 1191 A; 1163 C; 1225 G; 1132 T; 1 other;
     gatcgtgata ttcttctcct ttccggtgct cttctcctta gctgccacgt tcaggattcc        60
     gttggcatcc agatcgaagg tcacctcgat ctgtggcaca ccacgtggag ccgggggaat       120
     gcccgagagg tcaaactgtc ccagaagatt gttgtccttg gtcatggctc gttctccctc       180
     gaacacctgg atcgaaacgc cgggctggtt gtcggcgtat gtcgagaaga tctgcgtctg       240
     tttgcacgga atgcgcgagt tgcgctcaat cagcttcgtc atcacacctc cggccgtctc       300
     aattccaagc gacaatggag cgacatccac tagcagtacg tcttgaatct tatcgtcctt       360
     gtctccgctg aggatggccg cctgtaccgc tgcaccgtaa gccacggcct catccggatt       420
     gatcgaaagg ttcagagact ttccagcgaa aaagttctgc agcaaggact gcaccttcgg       480
     gatgcgtgtg gagcctccta ccaggacgat atcgtgaatg gagctcttat ccatcttcgc       540
     atcggacaga gccttttcca ctggctgcag cgtcgaacgg aacaagtcag aacacagctc       600
     ctcgaatcgt gcccggctga tcttcgtgta ataatcgatg ccatccatca gggcgtcaat       660
     ctcgatcgtt gcctccgtgc tcgaggacag tgtgcgcttc gccctctcgc atgccgttct       720
     caaacgacgc agagcgcgag cgttcttcga cagatccttc ttgtgctttc gtttgaattc       780
     ttccacgaag tggcccacca ttcggttatc gaagtcttcg cctcccaaat gagtatctcc       840
     ggccgtggat cgtacctcaa acagtgatcc ctcgtcgatc gtcagaatgg acacgtcgaa       900
     ggtgccgcct cccagatcga agatcagaac attgcgttct ccctttaggt tcttatccaa       960
     gccatacgcc agagctgctg ccgtcggttc gttgatgatg cgcatcacat tcagtccagc      1020
     gatggctcca gcatcctttg tggcctgtcg ctggctgtcg ttgaagtagg ctggtactgt      1080
     gatgactgca ttttttactg actggcccag gtaggcttcg gcggtttcct tcatcttcgt      1140
     cagcaccatc gaactgattt cctccggggc aaaggttttg cgctcgccct tgaactcgac      1200
     gcggatcttg ggcttaccac cgtcatttac caccgtgaat ggccagtgct tcatatcggc      1260
     ttggatcttc ggatcgtcga atttgcgtcc aatcagtcgc ttggcatcga acaccgtgtt      1320
     agtcggattc atggccactt ggttcttggc tgcatctccg atgagtcgct cagtgtccga      1380
     gaacgcaacg tagctcggtg tcgttcggtt gccctggtcg tttgcgatga tctccacctt      1440
     tccatgctgg aacacaccaa cgcaggagta cgtggtgccc agatcgattc cgattgccga      1500
     aggcattctg tgtctctgtg gttcaacttc gatgaatatg ctttctcaaa tcactcaaac      1560
     tggtgtgcac aattatacgc tttctgatgc aacaattgat tcactctggt cactgcttgt      1620
     tactttgaaa cactttattt ttcacgtgtt tgcacttgtt actctcagct cgctcagatt      1680
     caaattgacg acagctgctc gaacggaccg gtttatatac cacaccactc gatttctaga      1740
     aggttcgagc actttccaca gctctccgct aggctactcg aacgcgatga gggagattgt      1800
     atgccgcgtt ctggaaattt ctcgcgtacg aatcatcaaa gcggacccgg ctatttttag      1860
     ccaatcgcgt gcgtgatgat ggaaaacgca agaatgtgcg agaggagaga gagtgaggtg      1920
     gacaaaaaat gtgtttgctt ttgaaagtgt ttattcctct taacttttaa caacattaaa      1980
     agaatgctgg atttaattta acagaataca ttttcaacaa agcagcttgt aggtcacaat      2040
     gcgtttatta ttatgataaa gtgcatatag ttaaggaaag ctattagaaa ggaatattaa      2100
     ttttattgca cctcaagttt gcgtaggcta acaattgtta gaattattta aatttgattt      2160
     taataatatt ttgttcacaa cttgccctga aaaattgatt tgaatgatcg taaaatttat      2220
     aaaactgtta ttgaataatc cgttacgagt tatgcggaat aaattaataa atcaacattc      2280
     agttatgtcc ctcctcgctc gctctcctct cgcacattct tgcgttttcc atcatcacgc      2340
     acgcgattgg cttaaaaata gccgggtccg ctttgatgat tcgtacgcga gagatttcca      2400
     gaatgcggca tacaatctcc ctcatcgcgt tcgagtagcc tagcggagag ctgtggaaag      2460
     tgctcgaacc ttctagaaat cgagtggtgt ggtatataaa ccggtccgtt cgagcagctg      2520
     tcgtcaattt gaatctgagc gagctgagag taacaagtgc aaacacgtga aaaataaagt      2580
     gtttcaaagt aacaagcagt gaccagagtg aatcaattgt tgcatcagaa agcgtataat      2640
     tgtgcacacc agtttgagtg atttgagaaa gcatattcat cgaagttgaa ccacagagac      2700
     acagaatgcc ttcggcaatc ggaatcgatc tgggcaccac gtactcctgc gttggtgtgt      2760
     tccagcatgg aaaggtggag atcatcgcaa acgaccaggg caaccgaacg acaccgagct      2820
     acgttgcgtt ctcggacact gagcgactca tcggagatgc agccaagaac caagtggcca      2880
     tgaatccgac taacacggtg ttcgatgcca agcgactgat tggacgcaaa ttcgacgatc      2940
     cgaagatcca agccgatatg aagcactggc cattcacggt ggtaaatgac ggtggtaagc      3000
     ccaagatccg cgtcgagttc aagggcgagc gcaaaacctt tgccccggag gaaatcagtt      3060
     cgatggtgct gacgaagatg aaggaaaccg ccgaagccta cctgggccag tcagtaaaaa      3120
     atgcagtcat cacagtacca gcctacttca acgacagcca gcgacaggcc acaaaggatg      3180
     ctggagccat cgctggactg aatgtgatgc gcatcatcaa cgaaccgacg gcagcagctc      3240
     tggcgtatgg cttggataag aacctaaagg gagaacgcaa tgttctgatc ttcgatctgg      3300
     gaggcggcac cttcgacgtg tccattctga cgatcgacga gggatcactg tttgaggtac      3360
     gatccacggc cggagatact catttgggag gcgaagactt cgataaccga atggtgggnc      3420
     acttcgtgga agaattcaaa cgaaagcaca agaaggatct gtcgaagaac gctcgcgctc      3480
     tgcgtcgttt gagaacggca tgcgagaggg cgaagcgcac actgtcctcg agcacggagg      3540
     caacgatcga aattgacgcc ctgatggatg gcatcgatta ttacacgaag atcagccggg      3600
     cacgattcga ggagctgtgt tctgacttgt tccgttcgac gctgcagcca gtggaaaagg      3660
     ctctgtccga tgcgaagatg gataagagct ccattcacga tatcgtcctg gtaggagggt      3720
     ccacacgcat cccgaaggtg cagtccttgc tgcagaactt tttcgctgga aagtctctga      3780
     acctttcgat caatccggat gaggccgtgg cttacggtgc agcggtacag gcggccatcc      3840
     tcagcggaga caaggacgat aagattcaag acgtactgct agtggatgtc gctccattgt      3900
     cgcttggaat tgagacggcc ggaggtgtga tgacgaagct gattgagcgc aactcgcgca      3960
     ttccgtgcaa acagacgcag atcttctcga catacgccga caaccagccc ggcgtttcga      4020
     tccaggtgtt cgagggagaa cgagccatga ccaaggacaa caatcttctg ggacagtttg      4080
     acctctcggg cattcccccg gctccacgtg gtgtgccaca gatcgaggtg accttcgatc      4140
     tggatgccaa cggaatcctg aacgtggcag ctaaggagaa gagcaccgga aaggagaaga      4200
     atatcacgat caagaacgac aagggtcgcc tatcgcaggc cgatatcgat cgaatggtgt      4260
     cggaagctga gaagttccgc gaggaggatg agaagcaacg cgaacgcatc tctgcccgca      4320
     atcagctcga ggcttactgc ttcaacctga aacagtcgct ggacggcgaa ggagcgagta      4380
     aactcagcga tgccgatcgc aagacagtgc aggatcgatg cgaagagact ctgcgatgga      4440
     tcgacggcaa cacaatggcc gataaggagg agttcgagca caagatgcaa gagctaacga      4500
     aggcatgcag ccccatcatg acgaaactgc accagcaggc agctggcggg ccctcgccaa      4560
     gcagttgcgc acagcaagct ggaggatttg gaggaaggac gggtccgaca gtggaagaag      4620
     tggattaagg agtagaaata acggagattt ataattgatt cgaagaggat ggcattgact      4680
     gaatatgatt actcatatag tatgttccta tg                                    4712
//