Helicobacter pylori 26695
complement (3042..4202) / product = "tetracycline resistance protein TetA(P), putative;
identity: 26.96; identified by sequence similarity"


ID   AE000622   standard; DNA; PRO; 10099 BP.
XX
AC   AE000622; AE000511;
XX
SV   AE000622.1
XX
NI   g2314317
XX
DT   25-AUG-1997 (Rel. 52, Created)
DT   12-APR-1999 (Rel. 59, Last updated, Version 4)
XX
DE   Helicobacter pylori 26695 section 100 of 134 of the complete
DE   genome.
XX
KW   .
XX
OS   Helicobacter pylori 26695
OC   Bacteria; Proteobacteria; epsilon subdivision; Helicobacter group;
OC   Helicobacter; Helicobacter pylori.
XX
RN   [1]
RC   Erratum:[[published erratum appears in Nature 1997 Sep
RC   25;389(6649):412]]
RP   1-10099
RX   MEDLINE; 97394467.
RA   Tomb J.-F., White O., Kerlavage A.R., Clayton R.A., Sutton G.G.,
RA   Fleischmann R.D., Ketchum K.A., Klenk H.P., Gill S., Dougherty B.A.,
RA   Nelson K., Quackenbush J., Zhou L., Kirkness E.F., Peterson S.,
RA   Loftus B., Richardson D., Dodson R., Khalak H.G., Glodek A.,
RA   McKenney K., Fitzegerald L.M., Lee N., Adams M.D., Hickey E.K.,
RA   Berg D.E., Gocayne J.D., Utterback T.R., Peterson J.D., Kelley J.M.,
RA   Karp P.D., Smith H.O., Fraser C.M., Venter J.C.;
RT   "The complete genome sequence of the gastric pathogen Helicobacter
RT   pylori";
RL   Nature 388(6642):539-547(1997).
XX
RN   [2]
RP   1-10099
RA   Tomb J.-F., White O., Kerlavage A.R., Clayton R.A., Sutton G.G.,
RA   Fleischmann R.D., Ketchum K.A., Klenk H.P., Gill S., Dougherty B.A.,
RA   Nelson K., Quackenbush J., Zhou L., Kirkness E.F., Peterson S.,
RA   Loftus B., Richardson D., Dodson R., Khalak H.G., Glodek A.,
RA   McKenney K., Fitzegerald L.M., Lee N., Adams M.D., Hickey E.K.,
RA   Berg D.E., Gocayne J.D., Utterback T.R., Peterson J.D., Kelley J.M.,
RA   Cotton M.D., Weidman J.M., Fujii C., Bowman C., Watthey L., Wallin E.,
RA   Hayes W.S., Borodovsky M., Karp P.D., Smith H.O., Fraser C.M.,
RA   Venter J.C.;
RT   ;
RL   Submitted (06-AUG-1997) to the EMBL/GenBank/DDBJ databases.
RL   The Institute for Genomic Research, 9712 Medical Center Dr, Rockville,
RL   MD 20850, USA
XX
RN   [3]
RP   1-10099
RA   White O.;
RT   ;
RL   Submitted (17-MAR-1999) to the EMBL/GenBank/DDBJ databases.
RL   The Institute for Genomic Research, 9712 Medical Center Dr, Rockville,
RL   MD 20850, USA
XX
DR   SPTREMBL; O25775; O25775.
DR   SPTREMBL; O25777; O25777.
DR   SPTREMBL; O25778; O25778.
DR   SPTREMBL; O25779; O25779.
DR   SPTREMBL; O25780; O25780.
DR   SPTREMBL; O25782; O25782.
DR   SWISS-PROT; O25776; FLAV_HELPY.
DR   SWISS-PROT; O25781; G6PI_HELPY.
DR   SWISS-PROT; P56190; CSTA_HELPY.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..10099
FT                   /db_xref="taxon:85962"
FT                   /organism="Helicobacter pylori 26695"
FT                   /strain="26695"
FT   CDS             complement(76..498)
FT                   /codon_start=1
FT                   /db_xref="PID:g2314318"
FT                   /db_xref="SPTREMBL:O25775"
FT                   /note="similar to GB:L42023 PID:1004109 PID:1221906
FT                   PID:1204263 SP:P71335 percent identity: 29.79; identified
FT                   by sequence similarity; putative"
FT                   /transl_table=11
FT                   /gene="HP1160"
FT                   /product="conserved hypothetical protein"
FT                   /protein_id="AAD08206.1"
FT                   /translation="MLEIDNQTPLESDFLLLEKIANVLAPTQIIELVLVSDETIREINK
FT                   DLRGCDYATDVLSFPLEAIPHTPLGSVVINAPLAQTNALKLGHSLENEIALLFIHGVLH
FT                   LLGYDHEKDKGEQRQKESELIKAFNLPLSLIERTQD"
FT   CDS             complement(553..1047)
FT                   /codon_start=1
FT                   /db_xref="PID:g2314319"
FT                   /db_xref="SWISS-PROT:O25776"
FT                   /note="similar to SP:P31158 GB:M88253 PID:154528 percent
FT                   identity: 46.99; identified by sequence similarity;
FT                   putative"
FT                   /transl_table=11
FT                   /gene="HP1161"
FT                   /product="flavodoxin (fldA)"
FT                   /protein_id="AAD08207.1"
FT                   /translation="MGKIGIFFGTDSGNAEAIAEKISKAIGNAEVVDVAKASKEQFNSF
FT                   TKVILVAPTAGAGDLQTDWEDFLGTLEASDFATKTIGLVGLGDQDTYSETFAEGIFHIY
FT                   EKAKAGKVVGQTPTDGYHFEASKAVEGGKFVGLVIDEDNQDDLTDERISKWVEQVKGSF
FT                   A"
FT   CDS             complement(1137..1751)
FT                   /codon_start=1
FT                   /db_xref="PID:g2314320"
FT                   /db_xref="SPTREMBL:O25777"
FT                   /note="similar to SP:P33366 PID:405866 GB:U00096
FT                   PID:1788458 percent identity: 27.62; identified by sequence
FT                   similarity; putative"
FT                   /transl_table=11
FT                   /gene="HP1162"
FT                   /product="conserved hypothetical integral membrane protein"
FT                   /protein_id="AAD08208.1"
FT                   /translation="MKIKTNQKRVFMQEALLRFQEGFKEWGYLILFLYSLGGGYVGIVI
FT                   ASILSATTHALDIKITIFVAFLGNMVGSGALVVFARYQKRDFLQYFHKHRRKLALASLW
FT                   VKRYALLMIFVNKYLYGIKSVVPLAVGFSKYPLKKFLWLNVFSSFLWALIVGSVSFQAS
FT                   DWVKTLYERLSHYTSFFIISFVLIALLIWFLLKRYSRKMGF"
FT   CDS             1845..2036
FT                   /codon_start=1
FT                   /db_xref="PID:g2314326"
FT                   /db_xref="SPTREMBL:O25778"
FT                   /note="hypothetical protein; identified by GeneMark;
FT                   putative"
FT                   /transl_table=11
FT                   /gene="HP1163"
FT                   /product="H. pylori predicted coding region HP1163"
FT                   /protein_id="AAD08214.1"
FT                   /translation="MNTEILTIMLVVSVLMGLVGLIAFLWGVKSGQFDDEKRMLESVLY
FT                   DSASDLNEAILQEKRQKN"
FT   CDS             2061..3035
FT                   /codon_start=1
FT                   /db_xref="PID:g2314321"
FT                   /db_xref="SPTREMBL:O25779"
FT                   /note="similar to GP:886900 percent identity: 27.82;
FT                   identified by sequence similarity; putative"
FT                   /transl_table=11
FT                   /gene="HP1164"
FT                   /product="thioredoxin reductase (trxB)"
FT                   /protein_id="AAD08209.1"
FT                   /translation="MNQEILDVLIVGAGPGGIATAVECEIAGVKKVLLCEKTESHSGML
FT                   EKFYKAGKRIDKDYKKQVVELKGHIPFKDSFKEETLENFTNLLKEHHITPSYKTDIESV
FT                   KKEGEYFKITTTSNTTYHAKFVVVAIGKMGQPNRPTAYKIPVALSKQVVFSINDCKENE
FT                   KTLVIGGGNSAVEYAIALCKTTPTTLNYRKKEFSRINEDNAKNLQEVLNNNTLKSKLGV
FT                   DIESLEEDNTQIKVNFTDNTSESFDRLLYAIGGSTPLEFFKRCSLELDPSTNIPVVKEN
FT                   LESNNIPNLFIVGDILFKSGASIATALNHGYDVAIEIAKRLHS"
FT   CDS             complement(3042..4202)
FT                   /codon_start=1
FT                   /db_xref="PID:g2314322"
FT                   /db_xref="SPTREMBL:O25780"
FT                   /note="similar to GB:L20800 PID:456034 PID:1845540 percent
FT                   identity: 26.96; identified by sequence similarity;
FT                   putative"
FT                   /transl_table=11
FT                   /gene="HP1165"
FT                   /product="tetracycline resistance protein tetA(P),
FT                   putative"
FT                   /protein_id="AAD08210.1"
FT                   /translation="MLRKNILAYYGANFLLIIAQSLPHAILTPLLLSKGLSLSEILLVQ
FT                   TFFSFCVLVAEYPSGVLADLMSRKNLFLVSNAFLIASFSFVLFFDSFIFMLLAWGLYGL
FT                   YSACSSGTIEASLITDIKENKKDLSKFLAKNNQITYLGMIIGSSLGSFLYLKVHAMLYI
FT                   VGIFLIMLCVLTIIFYFKEKEGDFKSQKSLKLLKEQVKGSLKELKDNPKLKILLVGHLI
FT                   TPVFFMSHFQMWQAYFLKQGVKEQYLFVFYIAFQVISILIHFLKASSYSQKIALSSLVV
FT                   LLGVSPLLLSNIPYCFIGVYALMVAFFTYMSYCLNYQFSKFVSKNNISSLSSLLSSCVR
FT                   VVSVLILSLSSLELRYFSPLTIITMHFALTLIILFFFLYKAKPFDE"
FT   CDS             4266..5903
FT                   /codon_start=1
FT                   /db_xref="PID:g2314323"
FT                   /db_xref="SWISS-PROT:O25781"
FT                   /note="similar to SP:P11537 GB:X15196 PID:396360 PID:42377
FT                   GB:U00096 percent identity: 53.32; identified by sequence
FT                   similarity; putative"
FT                   /transl_table=11
FT                   /gene="HP1166"
FT                   /product="glucose-6-phosphate isomerase (pgi)"
FT                   /protein_id="AAD08211.1"
FT                   /translation="MLTQLKTYPKLLKHYEEIKEVHMRDWFFKDKERASRYFLQFESLS
FT                   LDYSKNRLNDTTLKLLFELANDCSLKEKIEAMFKGEKINTTEKRAVLHTALRSLNDTEI
FT                   LLDNMEVLKSIRSVLKRMRAFSDSVRSGKRLGYTNQVITDIVNIGIGGSDLGALMVCTA
FT                   LKRYAHPRLKMHFVSNVDGTQILDVLEKLNPASTLFIVASKTFSTQETLTNALTARKWF
FT                   VERSGDEKHIAKHFVAVSTNKEAVQQFGIDEHNMFEFWDFVGGRYSLWSAIGLSIMIYL
FT                   GKKNFNALLKGAYLMDEHFRNAPFESNLPVLMGLIGVWYINFFQSKSHLIAPYDQYLRH
FT                   FPKFIQQLDMESNGKRISKKGEIIPYDTCPVVWGDMGINAQHAFFQLLHQGTHLIPIDF
FT                   IASLDKKPNAKGHHEILFSNVLAQAQAFMKGKSYEEALGELLFKGLDKDEAKDLAHHRV
FT                   FFGNRPSNILLLEKISPSNIGALVALYEHKVFVQGVIWDINSFDQWGVELGKELAVPIL
FT                   QELEGHKSNAYFDSSTKHLIELYKNYNQ"
FT   CDS             6209..7624
FT                   /codon_start=1
FT                   /db_xref="PID:g2314325"
FT                   /db_xref="SPTREMBL:O25782"
FT                   /note="hypothetical protein; identified by GeneMark;
FT                   putative"
FT                   /transl_table=11
FT                   /gene="HP1167"
FT                   /product="H. pylori predicted coding region HP1167"
FT                   /protein_id="AAD08213.1"
FT                   /translation="MKKASQVLFFGAFLSSSLQGFEAKLNGFVDQSSTIGFNQHKINKE
FT                   RGIYPMQQFATIAGYLGLGFSLLPKKVSDHVLKGKIGGMVGSIFYDGTKKFEDSSVAYN
FT                   LFGYYDGFMGGYTNILQSDDLATQNMKYNKNVRNYVFSDAYLEYAYKNYFEIKAGRYLS
FT                   TMPYKSGQTQGFQISGQYKKARLTWFSSFGRAFAYGSFLMDWFAARTTYSGGFTKNDKG
FT                   GYDSHGRKVLYGTHAVQLTYKPHRFLIEGFYYLSPQIFNAPGVKIGWDSNPNFSGTGFR
FT                   SDTAIIGFFPIYYPWMIVKSNGSPVYKYDTPATQNGQNLIILQRFDINNYNVSIAFYKV
FT                   FQNANGWIGNMGNPSGVIMGSNSVYAGFTGTALKRDAATIFLSCGGTHFAKKFTWKFAT
FT                   QYSNSVVSWEARAMISLGYKFTEYLSGSVDLAYYGVYTNKGFKPGENGPVPKDFPALYS
FT                   DRSALYTALVASF"
FT   CDS             complement(7902..9965)
FT                   /codon_start=1
FT                   /db_xref="PID:g2314324"
FT                   /db_xref="SWISS-PROT:P56190"
FT                   /note="similar to SP:P15078 GB:X52904 PID:41081 GB:U00096
FT                   PID:1651245 percent identity: 55.51; identified by sequence
FT                   similarity; putative"
FT                   /transl_table=11
FT                   /gene="HP1168"
FT                   /product="carbon starvation protein (cstA)"
FT                   /protein_id="AAD08212.1"
FT                   /translation="MQKSLVSLAWVFVAILGAICLGVLALHKGESINTLWLVVASACIY
FT                   SIGYRFYSHFIAYKVLKLDDSRATPACVRNDGKDFVPTDKAITFGHHFAAIAGAGPLVG
FT                   PILAAQMGYLPSILWILIGSVLGGCVHDFVVLFASIRRDGKSLGEMIKLEMGQFVGMIA
FT                   SLGILGIMLIIIAILAMVVVKALAHSPWGFFTIAMTIPIAILMGLYMRFFRPHKILEVS
FT                   VIGFILLIIAIYAGKYVSLDPKLASIFTFEASSLAWMIMGYGFVASILPVWFLLAPRDY
FT                   LSTFLKIGVIGVLVVAIIFVAPPLQIPKITPFVDGSGPVFAGSVFPFLFITVACGTISG
FT                   FHALISSGTTPKMLAKESDARLVGYGSMVMESVVALMALVCAGILHPGLYFAINSPEVS
FT                   IGKDIADAASVISSWGFNISAEEIREMTKNIGESSILSRTGGAPTFAIGLAMIVYHILG
FT                   DPSVMAFWYHFAILFEALFILTAVDAGTRTARFMIQDLLGNVYKPLGDLSSYKAGIFAT
FT                   LLCVAGWGYFLYQGTIDPKGGIYTLWPLFGVSNQMLAGMALLLVTVVLFKMGRFKGAMI
FT                   SALPAVLILSITFYSGILKVVPKSDNSVLNNVSHVAQMQIIKEKMATTTDEKALKTLQK
FT                   SFFNHAIDAILCVFFMLVALLVLIVSVRICSNAYFKNKIYPPLAETPYIKAS"
XX
SQ   Sequence 10099 BP; 3290 A; 2134 C; 1919 G; 2756 T; 0 other;
     ATTTTTTCAA ATCTTAAAAA TTCCATTCTT AAAAATTAAA AGCTTTATTT GTCAGCATTA        60
     GTAGAGTATC TAAACCTAAT CCTGTGTGCG TTCAATCAAA CTCAAAGGCA AGTTAAACGC       120
     TTTAATGAGT TCGCTCTCTT TTTGGCGTTG TTCGCCCTTA TCTTTTTCAT GGTCATAGCC       180
     CAACAAATGC AACACCCCAT GAATGAATAA AAGAGCGATC TCATTTTCTA AGCTATGTCC       240
     TAATTTCAGA GCGTTAGTTT GAGCTAATGG CGCATTAATC ACCACGCTCC CTAAAGGGGT       300
     GTGAGGAATG GCTTCTAAAG GGAAGCTCAA AACATCGGTA GCGTAATCGC AACCCCTTAA       360
     ATCCTTGTTG ATTTCTCGAA TGGTTTCATC GCTCACCAAA ACAAGCTCAA TGATTTGAGT       420
     GGGGGCTAAA ACATTTGCGA TTTTTTCTAA TAATAAAAAG TCTGATTCTA GCGGGGTTTG       480
     GTTGTCTATT TCTAGCATTA AAGATATAAG AAGAAGTTTA AAAAAGCCCT AAAATTTAGG       540
     GCTTATAAAA AATTAAGCGA AAGAACCTTT AACTTGTTCT ACCCATTTTG AAATCCTCTC       600
     ATCAGTGAGA TCGTCTTGAT TGTCTTCATC AATCACAAGA CCCACGAATT TACCGCCTTC       660
     TACCGCTTTA GAAGCTTCAA AATGATAACC ATCAGTGGGA GTTTGCCCTA CCACTTTGCC       720
     GGCTTTAGCT TTTTCATAAA TGTGGAAAAT GCCTTCCGCA AAAGTTTCGC TGTAAGTGTC       780
     TTGATCGCCC AAGCCTACAA GCCCAATGGT TTTAGTCGCA AAATCGCTCG CTTCTAGTGT       840
     GCCTAAAAAG TCTTCCCAAT CTGTTTGCAA ATCACCCGCA CCAGCTGTTG GAGCGACTAA       900
     AATAACCTTT GTAAAGCTAT TAAATTGCTC TTTAGAAGCC TTAGCCACAT CAACCACTTC       960
     GGCATTACCA ATAGCCTTGC TGATTTTTTC AGCGATAGCT TCAGCGTTCC CGCTGTCTGT      1020
     CCCAAAAAAG ATACCAATTT TTCCCATATC CAATCCTTGT GTTTAAAGAT ATTAACGCAC      1080
     CCGCTTTTAG CGAATGCTTG TGGGCGTAGT CTAGCGCATT TAATTAAACA TCTTGCTTAA      1140
     AAACCCATTT TGCGCGAATA TCGTTTCAAT AAAAACCATA TTAAAAGCGC TATAAGAACA      1200
     AAACTTATGA TAAAAAACGA AGTGTAATGA GAAAGCCTTT CATACAGCGT TTTCACCCAA      1260
     TCGCTCGCTT GAAAAGAAAC GCTCCCCACG ATGAGCGCCC ACAAAAAACT GGAAAAAACA      1320
     TTAAGCCATA AAAACTTTTT TAAAGGGTAT TTGCTAAAAC CAACCGCCAA AGGCACAACG      1380
     CTTTTAATCC CATAGAGATA TTTATTGACA AAAATCATGA GCAAGGCGTA GCGTTTCACC      1440
     CACAAACTCG CTAAAGCAAG CTTTCTTCGG TGCTTATGAA AATATTGCAA AAAATCTCTT      1500
     TTTTGATAGC GGGCAAAGAC TACAAGAGCC CCACTCCCTA CCATATTCCC TAAAAAAGCG      1560
     ACAAAAATGG TTATTTTTAT ATCTAAAGCG TGCGTGGTAG CGCTCAAAAT AGAGGCGATG      1620
     ACAATCCCCA CATACCCGCC CCCTAAAGAA TATAAAAACA AAATAAGATA ACCCCACTCC      1680
     TTAAAACCCT CTTGAAAACG CAACAACGCT TCTTGCATAA AAACCCTCTT TTGATTCGTT      1740
     TTTATTTTCA TGTTATCCAA ACTTATTCAA CCTATTGGTG ATTTAAACGC TATCTTTTAG      1800
     TATAATAATC AGTTCATGCA ATCCTAATCA TAAAGATTAA AGAGATGAAT ACAGAAATTT      1860
     TAACCATCAT GTTAGTTGTC TCAGTGCTTA TGGGATTGGT AGGCTTAATA GCGTTTTTAT      1920
     GGGGGGTTAA AAGCGGTCAG TTTGACGATG AAAAACGCAT GCTTGAAAGC GTGTTGTATG      1980
     ACAGCGCGAG CGATTTGAAC GAAGCGATTT TACAAGAAAA ACGCCAAAAG AATTAAAAAA      2040
     TTAAAATAAA AAGGATAGAA ATGAATCAAG AAATTTTAGA CGTGTTGATA GTGGGTGCAG      2100
     GGCCTGGGGG CATTGCCACG GCCGTAGAAT GCGAAATAGC CGGCGTTAAA AAAGTGCTTT      2160
     TATGCGAAAA AACCGAAAGC CATTCAGGCA TGTTAGAGAA GTTTTATAAA GCCGGTAAAA      2220
     GGATTGATAA AGATTATAAA AAGCAAGTCG TAGAGCTTAA AGGGCATATC CCTTTTAAAG      2280
     ACAGCTTTAA AGAAGAAACT TTAGAGAATT TCACTAACCT TTTAAAAGAG CATCACATCA      2340
     CGCCAAGCTA TAAAACCGAT ATTGAGAGCG TGAAAAAAGA GGGCGAATAC TTTAAAATCA      2400
     CCACCACTTC TAACACAACC TATCATGCTA AATTCGTGGT GGTTGCGATC GGGAAAATGG      2460
     GCCAGCCAAA CCGCCCTACT GCTTATAAAA TCCCTGTTGC GCTCTCTAAA CAAGTGGTTT      2520
     TTAGCATCAA TGATTGTAAG GAAAATGAAA AAACCCTTGT GATCGGCGGA GGCAACTCAG      2580
     CGGTGGAATA CGCCATTGCT TTGTGCAAAA CCACCCCTAC CACCCTCAAT TACCGCAAAA      2640
     AAGAATTCAG CCGCATCAAT GAAGACAACG CTAAAAACTT GCAAGAAGTC CTAAACAATA      2700
     ACACGCTTAA AAGCAAGCTT GGAGTGGATA TTGAAAGCCT AGAAGAAGAT AACACTCAGA      2760
     TTAAGGTTAA CTTCACCGAT AACACGAGCG AAAGTTTTGA TCGTTTGCTG TATGCGATCG      2820
     GCGGCTCTAC CCCTTTAGAG TTTTTTAAAC GCTGTTCTTT AGAGCTGGAT CCTAGCACCA      2880
     ATATCCCTGT GGTGAAAGAA AATTTAGAGA GCAACAATAT CCCTAATTTG TTCATCGTGG      2940
     GCGATATTTT ATTCAAATCA GGGGCGAGCA TCGCTACCGC TTTAAACCAT GGCTATGATG      3000
     TTGCTATAGA AATCGCTAAA AGGTTGCACT CTTAAAGCCG CTCACTCATC AAACGGCTTA      3060
     GCCTTATACA AAAAGAAAAA GAGGATGATA AGCGTCAAGG CAAAATGCAT GGTTATGATA      3120
     GTTAGGGGTG AGAAGTAACG CAGTTCCAGA CTGCTGAGCG ATAAGATTAG CACAGAGACC      3180
     ACGCGCACAC AGCTTGATAA AAGCGATGAG AGCGAGGAAA TGTTGTTTTT AGAAACGAAT      3240
     TTGGAGAATT GATAGTTTAA GCAATAGCTC ATGTAAGTGA AAAACGCCAC CATGAGCGCA      3300
     TACACCCCTA TGAAACAATA AGGGATATTG CTAAGCAATA AGGGGCTAAC GCCTAACAAC      3360
     ACCACAAGCG AACTCAAGGC GATTTTTTGG CTATAACTAG AGGCTTTTAA AAAATGAATG      3420
     AGAATAGAAA TCACTTGAAA AGCGATATAA AACACAAAAA GGTATTGCTC TTTAACGCCT      3480
     TGTTTTAAAA AATACGCTTG CCACATTTGA AAATGGCTCA TAAAAAAGAC GGGCGTAATC      3540
     AAATGCCCCA CTAACAGAAT TTTAAGTTTG GGGTTATCTT TAAGCTCTTT AAGACTGCCT      3600
     TTGACTTGCT CTTTAAGGAG TTTCAGGCTT TTTTGGCTTT TAAAATCCCC TTCTTTCTCT      3660
     TTAAAATAAA AAATGATCGT TAGCACACAG AGCATGATTA AAAAAATCCC CACAATATAC      3720
     AGCATCGCAT GGACTTTGAG ATACAAAAAC GATCCCAAAG AACTCCCTAT AATCATGCCT      3780
     AAATAAGTAA TTTGATTGTT TTTGGCTAAA AACTTGGATA AATCTTTTTT GTTTTCCTTA      3840
     ATGTCTGTGA TGAGTGAAGC TTCAATCGTG CCGCTAGAGC ATGCGCTATA CAAACCATAC      3900
     AACCCCCACG CTAAAAGCAT GAAAATAAAG CTATCAAAAA ACAGCACAAA CGAAAAACTA      3960
     GCGATTAAAA AGGCATTAGA AACCAGGAAT AAATTTTTTC GGCTCATCAA ATCCGCTAAA      4020
     ACGCCGCTTG GGTATTCAGC CACTAGCACG CAAAAGCTAA AAAAGGTTTG CACGAGCAAG      4080
     ATTTCACTCA AACTAAGCCC TTTAGAAAGC AACAAGGGGG TTAAAATCGC ATGGGGTAAG      4140
     CTTTGAGCGA TGATTAAGAG AAAATTCGCC CCATAGTAAG CTAAAATGTT TTTCCTTAAC      4200
     ATTTGAAAAT TGTAATTAAA ACTAGCTTAT AATACAGCAT TATATCTTTT ATTTAAGGGG      4260
     TATTGATGCT AACCCAATTA AAAACTTATC CAAAATTACT CAAACATTAT GAAGAAATCA      4320
     AAGAAGTGCA TATGCGCGAT TGGTTTTTTA AAGACAAAGA GCGAGCGAGC CGTTATTTTT      4380
     TGCAATTTGA AAGCTTGAGC TTGGATTATT CCAAAAACCG CCTGAACGAT ACCACTTTAA      4440
     AGCTTCTTTT TGAATTAGCG AATGACTGCT CTTTAAAAGA AAAGATTGAA GCGATGTTTA      4500
     AGGGCGAAAA AATCAACACC ACCGAAAAAA GGGCCGTTTT ACACACCGCC TTAAGAAGCT      4560
     TGAATGACAC TGAAATTTTA CTAGACAACA TGGAAGTGTT AAAAAGTATT AGGAGCGTTT      4620
     TAAAACGCAT GCGAGCCTTT AGCGATAGCG TGAGAAGCGG TAAAAGATTA GGCTATACCA      4680
     ATCAAGTGAT CACCGATATT GTCAATATCG GCATTGGGGG GTCAGATTTA GGCGCTTTAA      4740
     TGGTTTGCAC CGCCTTAAAA CGCTACGCCC ACCCGAGATT AAAGATGCAT TTTGTGTCTA      4800
     ATGTGGATGG CACACAGATT TTAGATGTTT TAGAAAAACT CAATCCAGCC AGCACGCTTT      4860
     TTATCGTGGC TTCTAAGACT TTTTCCACTC AAGAAACCTT AACCAACGCC CTAACCGCTA      4920
     GAAAATGGTT TGTAGAAAGG AGTGGCGATG AAAAGCATAT CGCTAAGCAC TTTGTAGCGG      4980
     TATCCACCAA TAAAGAAGCC GTGCAACAAT TTGGCATTGA CGAGCATAAC ATGTTTGAAT      5040
     TTTGGGATTT TGTAGGGGGG CGCTATAGCT TGTGGTCGGC TATTGGCTTA TCCATTATGA      5100
     TCTATTTAGG GAAGAAAAAT TTTAACGCTC TTTTGAAAGG AGCGTATCTG ATGGATGAGC      5160
     ATTTTAGAAA CGCCCCTTTT GAAAGCAATT TACCCGTTTT AATGGGGCTA ATTGGCGTGT      5220
     GGTATATCAA TTTTTTCCAA TCCAAAAGCC ATTTAATCGC TCCTTACGAT CAGTATTTAA      5280
     GGCATTTCCC TAAATTCATC CAGCAATTAG ATATGGAAAG CAATGGCAAA CGCATCAGCA      5340
     AAAAAGGCGA AATTATCCCC TATGACACAT GCCCTGTTGT TTGGGGCGAT ATGGGCATTA      5400
     ACGCTCAGCA CGCCTTTTTC CAGCTCTTGC ATCAAGGCAC GCATTTAATA CCCATTGATT      5460
     TTATCGCTTC CTTAGATAAA AAGCCTAACG CTAAAGGCCA CCATGAGATT TTATTCAGCA      5520
     ATGTTTTAGC GCAAGCGCAA GCCTTCATGA AAGGCAAGAG TTATGAAGAA GCGCTTGGGG      5580
     AATTGCTCTT TAAAGGATTA GACAAAGATG AAGCCAAAGA TTTAGCCCAC CACAGGGTGT      5640
     TTTTTGGCAA CCGCCCCTCT AATATCCTTT TATTAGAAAA GATTTCACCA AGCAATATTG      5700
     GAGCATTAGT GGCTCTTTAT GAGCATAAAG TCTTTGTGCA AGGGGTCATT TGGGATATTA      5760
     ACAGCTTTGA TCAATGGGGC GTGGAGCTTG GGAAAGAATT GGCCGTGCCG ATTTTACAAG      5820
     AATTAGAGGG GCATAAAAGC AACGCTTATT TTGACAGCTC CACTAAGCAC TTAATAGAAT      5880
     TGTATAAAAA TTACAACCAA TAGGCTTTGT TTTATAACAA GATAAAACCT AAAAACAATC      5940
     AAGCAAAGCT TAACCCCATT CTCAAGCAAT CCGTTCAAAA TCATCCGTTA ATCATAACGG      6000
     ATTTTAGCGC CATATATTAG CCATTTGAAT TTAAAGAGAG TAAATTTTCC ACAAAGTAAT      6060
     CGTTTTTAGC TTTTAAAAGC TTAACTTTCT CATTATATGC ATTATTTTAC ATATTATAAT      6120
     TATTTCAAAG CTAAGAATAA TAAAAACTAA AGAATAGATT TATCTTTAAA AGTATTTGCA      6180
     TTTATCAATC TCATTTTAGG AGGCATGCAT GAAAAAGGCA AGTCAGGTTT TATTCTTTGG      6240
     GGCATTTTTA AGCTCTTCTT TGCAAGGTTT TGAAGCTAAG CTCAACGGCT TTGTGGATCA      6300
     ATCCAGCACT ATCGGTTTTA ACCAGCATAA AATCAATAAA GAAAGAGGTA TCTACCCTAT      6360
     GCAGCAATTC GCAACGATTG CGGGCTATTT AGGGCTTGGT TTTAGCCTGT TACCCAAAAA      6420
     GGTTTCAGAC CATGTTCTAA AAGGCAAAAT AGGAGGCATG GTGGGATCTA TTTTCTATGA      6480
     TGGCACGAAG AAGTTTGAAG ACAGCTCTGT AGCTTACAAC CTCTTTGGTT ATTATGATGG      6540
     GTTCATGGGG GGTTATACAA ACATCTTACA AAGCGATGAT TTAGCGACAC AAAACATGAA      6600
     ATACAATAAA AATGTCCGCA ACTATGTCTT TAGCGACGCG TATTTAGAAT ACGCTTATAA      6660
     GAATTATTTT GAAATAAAAG CCGGGCGCTA TTTATCCACT ATGCCTTATA AAAGCGGTCA      6720
     AACGCAAGGC TTTCAAATTT CTGGGCAATA CAAGAAAGCG CGCTTGACTT GGTTTAGCTC      6780
     TTTTGGGAGG GCGTTCGCTT ACGGCTCGTT TTTGATGGAT TGGTTTGCCG CTAGGACCAC      6840
     TTATAGCGGA GGTTTTACCA AAAACGATAA GGGAGGTTAT GATAGCCATG GGCGAAAGGT      6900
     GCTTTATGGC ACGCATGCGG TGCAACTCAC CTATAAACCT CATCGTTTCC TCATAGAAGG      6960
     CTTTTATTAC CTTTCGCCTC AAATCTTTAA CGCTCCGGGC GTTAAGATTG GTTGGGATTC      7020
     TAACCCTAAT TTTAGCGGCA CAGGCTTTCG CTCTGATACA GCTATCATAG GGTTTTTCCC      7080
     CATTTACTAC CCTTGGATGA TCGTTAAATC CAATGGAAGC CCGGTCTATA AATACGACAC      7140
     GCCTGCCACT CAAAATGGGC AAAACCTCAT TATCCTCCAA CGCTTTGACA TCAACAATTA      7200
     CAATGTTTCC ATCGCTTTTT ATAAAGTCTT TCAAAACGCT AATGGTTGGA TAGGCAACAT      7260
     GGGGAATCCA AGCGGTGTGA TCATGGGGAG TAACAGCGTC TATGCGGGTT TTACAGGCAC      7320
     AGCCCTTAAA AGAGATGCCG CTACCATTTT CCTTTCTTGT GGCGGCACTC ATTTTGCCAA      7380
     AAAATTCACA TGGAAATTCG CCACGCAATA CTCCAATTCA GTGGTTTCTT GGGAAGCGAG      7440
     AGCGATGATC TCTTTAGGTT ATAAATTCAC TGAATACTTG AGCGGTAGCG TGGATCTTGC      7500
     ATATTATGGC GTGTATACTA ACAAAGGATT TAAACCGGGT GAAAACGGGC CTGTGCCTAA      7560
     AGACTTCCCC GCCCTTTATT CTGACAGGAG CGCGTTATAC ACGGCTCTAG TAGCATCTTT      7620
     TTGATGCTAC CCTATGATTA TGGTGGGCGT CTTTTGATGC TGTTTCTCTA GTCTTATATA      7680
     TAAAATTTCT TTTCAAGCAA AAGCCCTTTT TTAAATCATA CCCACTAAGC AAAATACCCA      7740
     TCATCTTTAA ATCATCTTTA AAATTGAGCC TTTAAAAAAT CAAGCGATAG CCTTTTAAAA      7800
     ACCCAAGCAG AAACCCCAAG CATCTTTAGT GTTTGCACGC TTCACAAACA GGGTCAAACT      7860
     TTTTTCTATG GATTTAAAGG GGGTTAAAAC CCCTTTTTTA TTCAAGAGGC TTTGATGTAG      7920
     GGCGTTTCAG CCAGCGGTGG GTAAATTTTG TTTTTAAAAT AAGCGTTTGA GCAAATCCTA      7980
     ACGCTCACGA TTAAAACCAA TAGCGCCACA AGCATGAAAA ACACGCACAA AATCGCATCA      8040
     ATAGCGTGGT TAAAAAAGGA TTTTTGGAGC GTTTTGAGCG CTTTTTCATC GGTAGTGGTA      8100
     GCCATTTTTT CTTTGATGAT TTGCATTTGC GCCACATGGG AAACATTATT CAGCACGCTG      8160
     TTATCGCTCT TTGGCACCAC CTTTAAAATA CCGCTATAAA AAGTGATGGA TAAAATCAAA      8220
     ACTGCCGGTA AGGCGCTTAT CATCGCCCCC TTAAAACGCC CCATTTTAAA CAACACCACC      8280
     GTGACCAACA ACAACGCCAT GCCCGCTAAC ATCTGATTGC TCACGCCAAA TAAAGGCCAT      8340
     AGCGTATAAA TCCCCCCTTT AGGATCAATC GTGCCTTGAT ACAAGAAATA CCCCCACCCT      8400
     GCCACGCACA AAAGAGTGGC AAAAATCCCA GCCTTATAAG AGCTAAGATC GCCCAAAGGC      8460
     TTATAAACAT TACCGAGCAA ATCTTGAATC ATGAAACGAG CGGTTCGTGT GCCAGCATCC      8520
     ACAGCGGTTA AAATGAACAA AGCTTCAAAC AAAATCGCAA AATGATACCA AAACGCCATC      8580
     ACGCTTGGAT CCCCTAAAAT GTGATACACA ATCATCGCTA AACCGATCGC AAAAGTGGGC      8640
     GCCCCACCGG TGCGGCTCAA AATGGAGCTT TCGCCGATGT TTTTAGTCAT CTCACGAATT      8700
     TCTTCAGCGC TGATATTAAA CCCCCATGAG CTAATCACTG AAGCCGCATC AGCTATATCT      8760
     TTACCGATGC TCACTTCTGG CGAATTGATA GCGAAATAAA GCCCTGGGTG CAAGATCCCT      8820
     GCGCACACCA ACGCCATAAG AGCCACAACG CTCTCCATCA CCATAGAGCC ATAGCCCACT      8880
     AGCCTTGCGT CGCTTTCTTT AGCGAGCATT TTAGGGGTCG TGCCTGAAGA AATTAAAGCA      8940
     TGGAATCCGC TAATCGTCCC GCAAGCCACC GTGATAAACA AGAAAGGGAA CACGCTTCCT      9000
     GCAAACACAG GCCCACTGCC ATCTACAAAG GGCGTGATTT TAGGGATTTG TAAAGGCGGA      9060
     GCGACAAAAA TAATGGCCAC AACCAACACC CCTATAACGC CAATTTTTAA AAAAGTGCTT      9120
     AGATAATCTC GTGGAGCGAG TAAAAACCAT ACCGGTAAAA TAGAAGCCAC AAACCCATAG      9180
     CCCATGATCA TCCACGCTAA AGAACTGGCC TCAAAAGTGA ATATTGACGC TAATTTAGGA      9240
     TCTAAAGAAA CGTATTTACC CGCATAAATC GCTATAATCA ATAGGATAAA GCCAATAACA      9300
     GAAACCTCTA AAATCTTGTG TGGCCTGAAA AACCGCATGT AAAGCCCCAT AAGAATCGCA      9360
     ATGGGAATAG TCATTGCGAT CGTAAAAAAG CCCCAAGGCG AATGCGCTAA AGCCTTCACC      9420
     ACCACCATCG CTAAAATCGC AATGATAATG AGCATGATCC CTAAAATGCC CAGACTTGCG      9480
     ATCATGCCTA CAAATTGGCC CATTTCAAGT TTGATCATTT CGCCTAAAGA CTTGCCATCG      9540
     CGCCTAATAG AAGCAAAAAG CACCACAAAA TCATGCACGC AACCCCCTAA AACCGAGCCT      9600
     ATCAAAATCC ATAAGATAGA GGGCAAGTAA CCCATTTGAG CGGCTAGTAT CGGGCCTACT      9660
     AAAGGGCCAG CCCCAGCAAT AGCGGCGAAA TGGTGCCCAA AAGTGATCGC TTTATCGGTT      9720
     GGCACAAAAT CCTTGCCATC ATTCCTTACG CATGCGGGCG TGGCTCTGCT ATCATCTAGC      9780
     TTTAACACCT TATAAGCGAT AAAATGGCTA TAAAAACGAT AGCCTATGCT ATAAATACAA      9840
     GCGCTCGCTA CTACAAGCCA TAGCGTGTTA ATGCTCTCAC CCTTGTGTAA GGCTAACACC      9900
     CCTAAACAGA TCGCCCCTAA AATAGCTACA AAAACCCAAG CCAAAGAAAC TAAACTTTTT      9960
     TGCATGTCCT CTCCATTTAA TGATTGTTTA ATCATTGTTG TTAATTTCAG CCAGTTTTTT     10020
     TATTATAATC CAAAATTTCT TTGAATAGTG GCAAAACGGC TCATAAACTT CCCATAATAA     10080
     GGGCTTGGGT TTTCCAAAC                                                  10099
//