JAL-1260 refactored GenBank (and EMBL) flat file parser
[jalview.git] / test / jalview / io / J03321.gb
1 LOCUS       CH1L1CG                 7502 bp    DNA     circular BCT 06-APR-2020
2 DEFINITION  Chlamydia trachomatis plasmid pCHL1, complete sequence.
3 ACCESSION   J03321
4 VERSION     J03321.1
5 DBLINK      BioSample: SAMN14225621
6 KEYWORDS    .
7 SOURCE      Chlamydia trachomatis
8   ORGANISM  Chlamydia trachomatis
9             Bacteria; Chlamydiae; Chlamydiales; Chlamydiaceae;
10             Chlamydia/Chlamydophila group; Chlamydia.
11 REFERENCE   1  (bases 1 to 7502)
12   AUTHORS   Comanducci,M., Ricci,S., Cevenini,R. and Ratti,G.
13   TITLE     Diversity of the Chlamydia trachomatis common plasmid in biovars
14             with different pathogenicity
15   JOURNAL   Plasmid 23 (2), 149-154 (1990)
16    PUBMED   2194229
17 REFERENCE   2  (bases 1 to 7502)
18   AUTHORS   Comanducci,M., Ricci,S., Cevenini,R. and Ratti,G.
19   TITLE     Direct Submission
20   JOURNAL   Submitted (23-JUN-2010) Sclavo Research Centre, Siena, Italy
21 COMMENT     Draft entry and computer-readable sequence kindly submitted by
22             G.Ratti, 28-MAR-1990.
23             ! CDS location split below (and this line added), for Jalview test purposes !
24 FEATURES             Location/Qualifiers
25      source          1..7502
26                      /organism="Chlamydia trachomatis"
27                      /mol_type="genomic DNA"
28                      /serotype="D"
29                      /isolate="G0/86"
30                      /isolation_source="trachoma"
31                      /db_xref="taxon:813"
32                      /plasmid="pCHL1"
33      CDS             join(7022..7502,
34                      1..437)
35                      /note="pGP7-D"
36                      /codon_start=1
37                      /transl_table=11
38                      /product="hypothetical protein"
39                      /protein_id="AAA91567.1"
40                      /translation="MGSMAFHKSRLFLTFGDASEIWLSTLSYLTRKNYASGINFLVSL
41                      EILDLSETLIKAISLDHSESLFKIKSLDVFNGKVVSEASKQARAACYISFTKFLYRLT
42                      KGYIKPAIPLKDFGNTTFFKIRDKIKTESISKQEWTVFFEALRIVNYRDYLIGKLIVQ
43                      GIRKLDEILSLRTDDLFFASNQISFRIKKRQNKETKILITFPISLMEELQKYTCGRNG
44                      RVFVSKIGIPVTTSQVAHNFRLAEFHSAMKIKITPRVLRASALIHLKQIGLKDEEIMR
45                      ISCLSSRQSVCSYCSGEEVIPLVQTPTIL"
46      CDS             complement(488..1480)
47                      /note="pGP8-D"
48                      /codon_start=1
49                      /transl_table=11
50                      /product="hypothetical protein"
51                      /protein_id="AAA91568.1"
52                      /translation="MGKGILSLQQEMSLEYSEKSYQEVLKIRQESYWKRMKSFSLFEV
53                      IMHWTASLNKHTCRSYRGSFLSLEKIGLLSLDMNLQEFSLLNHNLILDAIKKVSSAKT
54                      SWTEGTKQVRAASYISLTRFLNRMTQGIVAIAQPSKQENSRTFFKTREIVKTDAMNSL
55                      QTASFLKELKKINARDWLIAQTMLQGGKRSSEVLSLEISQICFQQATISFSQLKNRQT
56                      EKRIIITYPQKFMHFLQEYIGQRRGFVFVTRSGKMVGLRQIARTFSQAGLQAAIPFKI
57                      TPHVLRATAVTEYKRLGCSDSDIMKVTGHATAKMIFAYDKSSREDNASKKMALI"
58      CDS             1579..2934
59                      /note="pGP1-D"
60                      /codon_start=1
61                      /transl_table=11
62                      /product="hypothetical protein"
63                      /protein_id="AAA91569.1"
64                      /translation="MKTRSEIENRMQDIEYALLGKALIFEDSTEYILRQLANYEFKCS
65                      HHKNIFIVFKHLKDNGLPITVDSAWEELLRRRIKDMDKSYLGLMLHDALSNDKLRSVS
66                      HTVFLDDLSVCSAEENLSNFIFRSFNEYNENPLRRSPFLLLERIKGRLDSAIAKTFSI
67                      RSARGRSIYDIFSQSEIGVLARIKKRRVAFSENQNSFFDGFPTGYKDIDDKGVILAKG
68                      NFVIIAARPSIGKTALAIDMAINLAVTQQRRVGFLSLEMSAGQIVERIIANLTGISGE
69                      KLQRGDLSKEELFRVEEAGETVRESHFYICSDSQYKLNLIANQIRLLRKEDRVDVIFI
70                      DYLQLINSSVGENRQNEIADISRTLRGLASELNIPIVCLSQLSRKVEDRANKVPMLSD
71                      LRDSGQIEQDADVILFINRKESSSNCEITVGKNRHGSVFSSVLHFDPKISKFSAIKKV
72                      W"
73      CDS             2928..3992
74                      /note="pGP2-D"
75                      /codon_start=1
76                      /transl_table=11
77                      /product="hypothetical protein"
78                      /protein_id="AAA91570.1"
79                      /translation="MVNYSNCHFIKSPIHLENQKFGRRPGQSIKISPKLAQNGMVEVI
80                      GLDFLSSHYHALAAIQRLLTATNYKGNTKGVVLSRESNSFQFEGWIPRIRFTKTEFLE
81                      AYGVKRYKTSRNKYEFSGKEAETALEALYHLGHQPFLIVATRTRWTNGTQIVDRYQTL
82                      SPIIRIYEGWEGLTDEENIDIDLTPFNSPPTRKHKGFVVEPCPILVDQIESYFVIKPA
83                      NVYQEIKMRFPNASKYAYTFIDWVITAAAKKRRKLTKDNSWPENLLLNVNVKSLAYIL
84                      RMNRYICTRNWKKIELAIDKCIEIAIQLGWLSRRKRIEFLDSSKLSKKEILYLNKERF
85                      EEITKKSKEQMEQLEQESIN"
86      CDS             4054..4848
87                      /note="pGP3-D"
88                      /codon_start=1
89                      /transl_table=11
90                      /product="hypothetical protein"
91                      /protein_id="AAA91571.1"
92                      /translation="MGNSGFYLYNTENCVFADNIKVGQMTEPLKDQQIILGTTSTPVA
93                      AKMTASDGISLTVSNNSSTNASITIGLDAEKAYQLILEKLGDQILDGIADTIVDSTVQ
94                      DILDKIKTDPSLGLLKAFNNFPITNKIQCNGLFTPSNIETLLGGTEIGKFTVTPKSSG
95                      SMFLVSADIIASRMEGGVVLALVREGDSKPCAISYGYSSGIPNLCSLRTSITNTGLTP
96                      TTYSLRVGGLESGVVWVNALSNGNDILGITNTSNVSFLEVIPQTNA"
97      CDS             4918..5226
98                      /note="pGP4-D"
99                      /codon_start=1
100                      /transl_table=11
101                      /product="hypothetical protein"
102                      /protein_id="AAA91572.1"
103                      /translation="MQNKRKVRDDFIKIVKDVKKDFPELDLKIRVNKEKVTFLNSPLE
104                      LYHKSVSLILGLLQQIENSLGLFPDSPVLEKLEDNSLKLKKALIMLILSRKDMFSKAE
105                      "
106      CDS             5317..6048
107                      /note="pGP5-D (gtg start codon)"
108                      /codon_start=1
109                      /transl_table=11
110                      /product="hypothetical protein"
111                      /protein_id="AAA91573.1"
112                      /translation="MGCNLAQFLGKKVLLADLDPQSNLSSGLGASVRSDQKGLHDIVY
113                      TSNDLKSIICETKKDSVDLIPASFSSEQFRELDIHRGPSNNLKLFLNEYCAPFYDICI
114                      IDTPPSLGGLTKEAFVAGDKLIACLTPEPFSILGLQKIREFLSSVGKPEEEHILGIAL
115                      SFWDDRNSTNQMYIDIIESIYKNKLFSTKIRRDISLSRSLLKEDSVANVYPNSRAAED
116                      ILKLTHEIANILHIEYERDYSQRTT"
117      CDS             6045..6788
118                      /note="pGP6-D (gtg start codon)"
119                      /codon_start=1
120                      /transl_table=11
121                      /product="hypothetical protein"
122                      /protein_id="AAA91574.1"
123                      /translation="MNKLKKEADVFFKKNQTAASLDFKKTLPSIELFSATLNSEESQS
124                      LDRLFLSESQNYSDEEFYQEDILAVKLLTGQIKSIQKQHVLLLGEKIYNARKILSKDH
125                      FSSTTFSSWIELVFRTKSSAYNALAYYELFINLPNQTLQKEFQSIPYKSAYILAARKG
126                      DLKTKVDVIGKVCGMSNSSAIRVLDQFLPSSRNKDVRETIDKSDSEKNRQLSDFLIEI
127                      LRIMCSGVSLSSYNENLLQQLFELFKQKS"
128      repeat_region   6857..6945
129                      /note="four tandem 22bp repeats"
130 ORIGIN      
131         1 ggatccgtaa gttagacgaa attttgtctt tgcgcacaga cgatctattt tttgcatcca
132        61 atcagatttc ctttcgcatt aaaaaaagac agaataaaga aaccaaaatt ctaatcacat
133       121 ttcctatcag cttaatggaa gagttgcaaa aatacacttg tgggagaaat gggagagtat
134       181 ttgtttctaa aatagggatt cctgtaacaa caagtcaggt tgcgcataat tttaggcttg
135       241 cagagttcca tagtgctatg aaaataaaaa ttactcccag agtacttcgt gcaagcgctt
136       301 tgattcattt aaagcaaata ggattaaaag atgaggaaat catgcgtatt tcctgtcttt
137       361 catcgagaca aagtgtgtgt tcttattgtt ctggggaaga ggtaattcct ctagtacaaa
138       421 cacccacaat attgtgatat aattaaaatt atattcatat tctgttgcca gaaaaaacac
139       481 ctttaggcta tattagagcc atcttctttg aagcgttgtc ttctcgagaa gatttatcgt
140       541 acgcaaatat catctttgcg gttgcgtgtc ctgtgacctt cattatgtcg gagtctgagc
141       601 accctaggcg tttgtactcc gtcacagcgg ttgctcgaag cacgtgcggg gttattttaa
142       661 aagggattgc agcttgtagt cctgcttgag agaacgtgcg ggcgatttgc cttaacccca
143       721 ccatttttcc ggagcgagtt acgaagacaa aacctcttcg ttgaccgatg tactcttgta
144       781 gaaagtgcat aaacttctga ggataagtta taataatcct cttttctgtc tgacggttct
145       841 taagctggga gaaagaaatg gtagcttgtt ggaaacaaat ctgactaatc tccaagctta
146       901 agacttcaga ggagcgttta cctccttgga gcattgtctg ggcgatcaac caatcccggg
147       961 cattgatttt ttttagctct tttaggaagg atgctgtttg caaactgttc atcgcatccg
148      1021 tttttactat ttccctggtt ttaaaaaatg ttcgactatt ttcttgttta gaaggttgcg
149      1081 ctatagcgac tattccttga gtcatcctgt ttaggaatct tgttaaggaa atatagcttg
150      1141 ctgctcgaac ttgtttagta ccttcggtcc aagaagtctt ggcagaggaa acttttttaa
151      1201 tcgcatctag gattagatta tgatttaaaa gggaaaactc ttgcagattc atatccaagg
152      1261 acaatagacc aatcttttct aaagacaaaa aagatcctcg atatgatcta caagtatgtt
153      1321 tgttgagtga tgcggtccaa tgcataataa cttcgaataa ggagaagctt ttcatgcgtt
154      1381 tccaatagga ttcttggcga atttttaaaa cttcctgata agacttttca ctatattcta
155      1441 acgacatttc ttgctgcaaa gataaaatcc ctttacccat gaaatccctc gtgatataac
156      1501 ctatccgtaa aatgtcctga ttagtgaaat aatcaggttg ttaacaggat agcacgctcg
157      1561 gtattttttt atataaacat gaaaactcgt tccgaaatag aaaatcgcat gcaagatatc
158      1621 gagtatgcgt tgttaggtaa agctctgata tttgaagact ctactgagta tattctgagg
159      1681 cagcttgcta attatgagtt taagtgttct catcataaaa acatattcat agtatttaaa
160      1741 cacttaaaag acaatggatt acctataact gtagactcgg cttgggaaga gcttttgcgg
161      1801 cgtcgtatca aagatatgga caaatcgtat ctcgggttaa tgttgcatga tgctttatca
162      1861 aatgacaagc ttagatccgt ttctcatacg gttttcctcg atgatttgag cgtgtgtagc
163      1921 gctgaagaaa atttgagtaa tttcattttc cgctcgttta atgagtacaa tgaaaatcca
164      1981 ttgcgtagat ctccgtttct attgcttgag cgtataaagg gaaggcttga tagtgctata
165      2041 gcaaagactt tttctattcg cagcgctaga ggccggtcta tttatgatat attctcacag
166      2101 tcagaaattg gagtgctggc tcgtataaaa aaaagacgag tagcgttctc tgagaatcaa
167      2161 aattctttct ttgatggctt cccaacagga tacaaggata ttgatgataa aggagttatc
168      2221 ttagctaaag gtaatttcgt gattatagca gctagaccat ctatagggaa aacagcttta
169      2281 gctatagaca tggcgataaa tcttgcggtt actcaacagc gtagagttgg tttcctatct
170      2341 ctagaaatga gcgcaggtca aattgttgag cggattattg ctaatttaac aggaatatct
171      2401 ggtgaaaaat tacaaagagg ggatctctct aaagaagaat tattccgagt agaagaagct
172      2461 ggagaaacgg ttagagaatc acatttttat atctgcagtg atagtcagta taagcttaac
173      2521 ttaatcgcga atcagatccg gttgctgaga aaagaagatc gagtagacgt aatatttatc
174      2581 gattacttgc agttgatcaa ctcatcggtt ggagaaaatc gtcaaaatga aatagcagat
175      2641 atatctagaa ccttaagagg tttagcctca gagctaaaca ttcctatagt ttgtttatcc
176      2701 caactatcta gaaaagttga ggatagagca aataaagttc ccatgctttc agatttgcga
177      2761 gacagcggtc aaatagagca agacgcagat gtgattttgt ttatcaatag gaaggaatcg
178      2821 tcttctaatt gtgagataac tgttgggaaa aatagacatg gatcggtttt ctcttcggta
179      2881 ttacatttcg atccaaaaat tagtaaattc tccgctatta aaaaagtatg gtaaattata
180      2941 gtaactgcca cttcatcaaa agtcctatcc accttgaaaa tcagaagttt ggaagaagac
181      3001 ctggtcaatc tattaagata tctcccaaat tggctcaaaa tgggatggta gaagttatag
182      3061 gtcttgattt tctttcatct cattaccatg cattagcagc tatccaaaga ttactgaccg
183      3121 caacgaatta caaggggaac acaaaagggg ttgttttatc cagagaatca aatagttttc
184      3181 aatttgaagg atggatacca agaatccgtt ttacaaaaac tgaattctta gaggcttatg
185      3241 gagttaagcg gtataaaaca tccagaaata agtatgagtt tagtggaaaa gaagctgaaa
186      3301 ctgctttaga agccttatac catttaggac atcaaccgtt tttaatagtg gcaactagaa
187      3361 ctcgatggac taatggaaca caaatagtag accgttacca aactctttct ccgatcatta
188      3421 ggatttacga aggatgggaa ggtttaactg acgaagaaaa tatagatata gacttaacac
189      3481 cttttaattc accacctaca cggaaacata aagggttcgt tgtagagcca tgtcctatct
190      3541 tggtagatca aatagaatcc tactttgtaa tcaagcctgc aaatgtatac caagaaataa
191      3601 aaatgcgttt cccaaatgca tcaaagtatg cttacacatt tatcgactgg gtgattacag
192      3661 cagctgcgaa aaagagacga aaattaacta aggataattc ttggccagaa aacttgttat
193      3721 taaacgttaa cgttaaaagt cttgcatata ttttaaggat gaatcggtac atctgtacaa
194      3781 ggaactggaa aaaaatcgag ttagctatcg ataaatgtat agaaatcgcc attcagcttg
195      3841 gctggttatc tagaagaaaa cgcattgaat ttctggattc ttctaaactc tctaaaaaag
196      3901 aaattctata tctaaataaa gagcgctttg aagaaataac taagaaatct aaagaacaaa
197      3961 tggaacaatt agaacaagaa tctattaatt aatagcaagc ttgaaactaa aaacctaatt
198      4021 tatttaaagc tcaaaataaa aaagagtttt aaaatgggaa attctggttt ttatttgtat
199      4081 aacactgaaa actgcgtctt tgctgataat atcaaagttg ggcaaatgac agagccgctc
200      4141 aaggaccagc aaataatcct tgggacaaca tcaacacctg tcgcagccaa aatgacagct
201      4201 tctgatggaa tatctttaac agtctccaat aattcatcaa ccaatgcttc tattacaatt
202      4261 ggtttggatg cggaaaaagc ttaccagctt attctagaaa agttgggaga tcaaattctt
203      4321 gatggaattg ctgatactat tgttgatagt acagtccaag atattttaga caaaatcaaa
204      4381 acagaccctt ctctaggttt gttgaaagct tttaacaact ttccaatcac taataaaatt
205      4441 caatgcaacg ggttattcac tcccagtaac attgaaactt tattaggagg aactgaaata
206      4501 ggaaaattca cagtcacacc caaaagctct gggagcatgt tcttagtctc agcagatatt
207      4561 attgcatcaa gaatggaagg cggcgttgtt ctagctttgg tacgagaagg tgattctaag
208      4621 ccctgcgcga ttagttatgg atactcatca ggcattccta atttatgtag tctaagaacc
209      4681 agtattacta atacaggatt gactccgaca acgtattcat tacgtgtagg cggtttagaa
210      4741 agcggtgtgg tatgggttaa tgccctttct aatggcaatg atattttagg aataacaaat
211      4801 acttctaatg tatctttttt agaggtaata cctcaaacaa acgcttaaac aatttttatt
212      4861 ggatttttct tataggtttt atatttagag aaaacagttc gaattacggg gtttgttatg
213      4921 caaaataaaa gaaaagtgag ggacgatttt attaaaattg ttaaagatgt gaaaaaagat
214      4981 ttccccgaat tagacctaaa aatacgagta aacaaggaaa aagtaacttt cttaaattct
215      5041 cccttagaac tctaccataa aagtgtctca ctaattctag gactgcttca acaaatagaa
216      5101 aactctttag gattattccc agactctcct gttcttgaaa aattagagga taacagttta
217      5161 aagctaaaaa aggctttgat tatgcttatc ttgtctagaa aagacatgtt ttccaaggct
218      5221 gaatagacaa cttactctaa cgttggagtt gatttgcaca ccttagtttt ttgctctttt
219      5281 aagggaggaa ctggaaaaac aacactttct ctaaacgtgg gatgcaactt ggcccaattt
220      5341 ttagggaaaa aagtgttact tgctgaccta gacccgcaat ccaatttatc ttctggattg
221      5401 ggggctagtg tcagaagtga ccaaaaaggc ttgcacgaca tagtatacac atcaaacgat
222      5461 ttaaaatcaa tcatttgcga aacaaaaaaa gatagtgtgg acctaattcc tgcatcattt
223      5521 tcatccgaac agtttagaga attggatatt catagaggac ctagtaacaa cttaaagtta
224      5581 tttctgaatg agtactgcgc tcctttttat gacatctgca taatagacac tccacctagc
225      5641 ctaggagggt taacgaaaga agcttttgtt gcaggagaca aattaattgc ttgtttaact
226      5701 ccagaacctt tttctattct agggttacaa aagatacgtg aattcttaag ttcggtcgga
227      5761 aaacctgaag aagaacacat tcttggaata gctttgtctt tttgggatga tcgtaactcg
228      5821 actaaccaaa tgtatataga cattatcgag tctatttaca aaaacaagct tttttcaaca
229      5881 aaaattcgtc gagatatttc tctcagccgt tctcttctta aagaagattc tgtagctaat
230      5941 gtctatccaa attctagggc cgcagaagat attctgaagt taacgcatga aatagcaaat
231      6001 attttgcata tcgaatatga acgagattac tctcagagga caacgtgaac aaactaaaaa
232      6061 aagaagcgga tgtctttttt aaaaaaaatc aaactgccgc ttctctagat tttaagaaga
233      6121 cgcttccctc cattgaacta ttctcagcaa ctttgaattc tgaggaaagt cagagtttgg
234      6181 atcgattatt tttatcagag tcccaaaact attcggatga agaattttat caagaagaca
235      6241 tcctagcggt aaaactgctt actggtcaga taaaatccat acagaagcaa cacgtacttc
236      6301 ttttaggaga aaaaatctat aatgctagaa aaatcctgag taaggatcac ttctcctcaa
237      6361 caactttttc atcttggata gagttagttt ttagaactaa gtcttctgct tacaatgctc
238      6421 ttgcatatta cgagcttttt ataaacctcc ccaaccaaac tctacaaaaa gagtttcaat
239      6481 cgatccccta taaatccgca tatattttgg ccgctagaaa aggcgattta aaaaccaagg
240      6541 tcgatgtgat agggaaagta tgtggaatgt cgaactcatc ggcgataagg gtgttggatc
241      6601 aatttcttcc ttcatctaga aacaaagacg ttagagaaac gatagataag tctgattcag
242      6661 agaagaatcg ccaattatct gatttcttaa tagagatact tcgcatcatg tgttccggag
243      6721 tttctttgtc ctcctataac gaaaatcttc tacaacagct ttttgaactt tttaagcaaa
244      6781 agagctgatc ctccgtcagc tcatatatat atatctatta tatatatata tttagggatt
245      6841 tgatttcacg agagagattt gcaactcttg gtggtagact ttgcaactct tggtggtaga
246      6901 ctttgcaact cttggtggta gactttgcaa ctcttggtgg tagacttggt cataatggac
247      6961 ttttgttaaa aaatttatta aaatcttaga gctccgattt tgaatagctt tggttaagaa
248      7021 aatgggctcg atggctttcc ataaaagtag attgttttta acttttgggg acgcgtcgga
249      7081 aatttggtta tctactttat cttatctaac tagaaaaaat tatgcgtctg ggattaactt
250      7141 tcttgtttct ttagagattc tggatttatc ggaaaccttg ataaaggcta tttctcttga
251      7201 ccacagcgaa tctttgttta aaatcaagtc tctagatgtt tttaatggaa aagttgtttc
252      7261 agaggcatct aaacaggcta gagcggcatg ctacatatct ttcacaaagt ttttgtatag
253      7321 attgaccaag ggatatatta aacccgctat tccattgaaa gattttggaa acactacatt
254      7381 ttttaaaatc cgagacaaaa tcaaaacaga atcgatttct aagcaggaat ggacagtttt
255      7441 ttttgaagcg ctccggatag tgaattatag agactattta atcggtaaat tgattgtaca
256      7501 ag
257 //
258