1LOCUS       NC_004718              29751 bp ss-RNA     linear   VRL 06-FEB-2004
2DEFINITION  SARS coronavirus, complete genome.
3ACCESSION   NC_004718
4VERSION     NC_004718.3  GI:30271926
5KEYWORDS    .
6SOURCE      SARS coronavirus
7  ORGANISM  SARS coronavirus
8            Viruses; ssRNA positive-strand viruses, no DNA stage; Nidovirales;
9            Coronaviridae; Coronavirus.
10REFERENCE   1  (bases 1 to 29751)
11  AUTHORS   Snijder,E.J., Bredenbeek,P.J., Dobbe,J.C., Thiel,V., Ziebuhr,J.,
12            Poon,L.L., Guan,Y., Rozanov,M., Spaan,W.J. and Gorbalenya,A.E.
13  TITLE     Unique and conserved features of genome and proteome of
14            SARS-coronavirus, an early split-off from the coronavirus group 2
15            lineage
16  JOURNAL   J. Mol. Biol. 331 (5), 991-1004 (2003)
17  MEDLINE   22809466
18   PUBMED   12927536
19REFERENCE   2  (bases 1 to 29751)
20  AUTHORS   Marra,M.A., Jones,S.J., Astell,C.R., Holt,R.A., Brooks-Wilson,A.,
21            Butterfield,Y.S., Khattra,J., Asano,J.K., Barber,S.A., Chan,S.Y.,
22            Cloutier,A., Coughlin,S.M., Freeman,D., Girn,N., Griffith,O.L.,
23            Leach,S.R., Mayo,M., McDonald,H., Montgomery,S.B., Pandoh,P.K.,
24            Petrescu,A.S., Robertson,A.G., Schein,J.E., Siddiqui,A.,
25            Smailus,D.E., Stott,J.M., Yang,G.S., Plummer,F., Andonov,A.,
26            Artsob,H., Bastien,N., Bernard,K., Booth,T.F., Bowness,D., Czub,M.,
27            Drebot,M., Fernando,L., Flick,R., Garbutt,M., Gray,M., Grolla,A.,
28            Jones,S., Feldmann,H., Meyers,A., Kabani,A., Li,Y., Normand,S.,
29            Stroher,U., Tipples,G.A., Tyler,S., Vogrig,R., Ward,D., Watson,B.,
30            Brunham,R.C., Krajden,M., Petric,M., Skowronski,D.M., Upton,C. and
31            Roper,R.L.
32  TITLE     The Genome sequence of the SARS-associated coronavirus
33  JOURNAL   Science 300 (5624), 1399-1404 (2003)
34  MEDLINE   22660725
35   PUBMED   12730501
36REFERENCE   3  (bases 1 to 29751)
37  AUTHORS   .
38  CONSRTM   BCCA Genome Sciences Centre, British Columbia Centre for Disease
39            Control and National Microbiology Laboratory Canada
40  TITLE     Direct Submission
41  JOURNAL   Submitted (30-APR-2003) Genome Sciences Centre, British Columbia
42            Cancer Research Centre, 600 West 10th Avenue, Vancouver, BC V5Z
43            4E6, Canada
44  REMARK    Sequence update by submitter
45REFERENCE   4  (bases 1 to 29751)
46  AUTHORS   .
47  CONSRTM   BCCA Genome Sciences Centre, British Columbia Centre for Disease
48            Control and National Microbiology Laboratory Canada
49  TITLE     Direct Submission
50  JOURNAL   Submitted (23-APR-2003) Genome Sciences Centre, British Columbia
51            Cancer Research Centre, 600 West 10th Avenue, Vancouver, BC V5Z
52            4E6, Canada
53  REMARK    Sequence update by submitter
54REFERENCE   5  (bases 1 to 29751)
55  AUTHORS   .
56  CONSRTM   BCCA Genome Sciences Centre, British Columbia Centre for Disease
57            Control and National Microbiology Laboratory Canada
58  TITLE     Direct Submission
59  JOURNAL   Submitted (13-APR-2003) Genome Sciences Centre, British Columbia
60            Cancer Research Centre, 600 West 10th Avenue, Vancouver, BC V5Z
61            4E6, Canada
62COMMENT     REVIEWED REFSEQ: This record has been curated by NCBI staff. The
63            reference sequence was derived from AY274119.
64            On May 1, 2003 this sequence version replaced gi:30124072.
65            The annotation is based mainly on the sequence analysis described
66            by Snijder et al. (2003). Annotation of transcription regulatory
67            sequences was copied from virtually identical (except the very 3'
68            end) AY291315 (Frankfurt 1).  Designations of the 3'-adjacent genes
69            do not coincide with those provided by Marra et al. (2003).
70FEATURES             Location/Qualifiers
71     source          1..29751
72                     /organism="SARS coronavirus"
73                     /mol_type="genomic RNA"
74                     /isolate="Tor2"
75                     /isolation_source="patient #2 with severe acute
76                     respiratory syndrome (SARS)"
77                     /db_xref="taxon:227859"
78                     /country="Canada: Toronto"
79     5'UTR           1..264
80                     /evidence=not_experimental
81     misc_feature    67..72
82                     /note="transcription regulatory sequence leader TRS"
83     gene            265..21485
84                     /gene="orf1ab"
85                     /locus_tag="sars1"
86                     /db_xref="GeneID:1489680"
87     CDS             join(265..13398,13398..21485)
88                     /gene="orf1ab"
89                     /locus_tag="sars1"
90                     /note="It was assumed that the SARS orf1ab polyprotein
91                     processing map should be similar to that of murine
92                     hepatitis virus; however, of the two MHV papain-like
93                     proteinases, only PL2-PRO is well conserved for SARS
94                     coronavirus. The mature peptides located downstream from
95                     nsp4-pp1a/pp1ab are cleaved from the polyprotein by the
96                     nsp5-pp1a/pp1ab proteinase 3CL-PRO. The orf1a/orf1b
97                     translational frameshift, the predicted processing map,
98                     and both proteinase activities have been supported by in
99                     vitro expression and mutagenesis experiments (Thiel et
100                     al., 2003); -1 frameshift"
101                     /codon_start=1
102                     /product="orf1ab polyprotein (pp1ab)"
103                     /protein_id="NP_828849.2"
104                     /db_xref="GI:30124074"
105                     /db_xref="GeneID:1489680"
106                     /translation="MESLVLGVNEKTHVQLSLPVLQVRDVLVRGFGDSVEEALSEARE
107                     HLKNGTCGLVELEKGVLPQLEQPYVFIKRSDALSTNHGHKVVELVAEMDGIQYGRSGI
108                     TLGVLVPHVGETPIAYRNVLLRKNGNKGAGGHSYGIDLKSYDLGDELGTDPIEDYEQN
109                     WNTKHGSGALRELTRELNGGAVTRYVDNNFCGPDGYPLDCIKDFLARAGKSMCTLSEQ
110                     LDYIESKRGVYCCRDHEHEIAWFTERSDKSYEHQTPFEIKSAKKFDTFKGECPKFVFP
111                     LNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASPQECNNMHLSTLMKCNHCDEVSWQTC
112                     DFLKATCEHCGTENLVIEGPTTCGYLPTNAVVKMPCPACQDPEIGPEHSVADYHNHSN
113                     IETRLRKGGRTRCFGGCVFAYVGCYNKRAYWVPRASADIGSGHTGITGDNVETLNEDL
114                     LEILSRERVNINIVGDFHLNEEVAIILASFSASTSAFIDTIKSLDYKSFKTIVESCGN
115                     YKVTKGKPVKGAWNIGQQRSVLTPLCGFPSQAAGVIRSIFARTLDAANHSIPDLQRAA
116                     VTILDGISEQSLRLVDAMVYTSDLLTNSVIIMAYVTGGLVQQTSQWLSNLLGTTVEKL
117                     RPIFEWIEAKLSAGVEFLKDAWEILKFLITGVFDIVKGQIQVASDNIKDCVKCFIDVV
118                     NKALEMCIDQVTIAGAKLRSLNLGEVFIAQSKGLYRQCIRGKEQLQLLMPLKAPKEVT
119                     FLEGDSHDTVLTSEEVVLKNGELEALETPVDSFTNGAIVGTPVCVNGLMLLEIKDKEQ
120                     YCALSPGLLATNNVFRLKGGAPIKGVTFGEDTVWEVQGYKNVRITFELDERVDKVLNE
121                     KCSVYTVESGTEVTEFACVVAEAVVKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGE
122                     ENFSSRMYCSFYPPDEEEEDDAECEEEEIDETCEHEYGTEDDYQGLPLEFGASAETVR
123                     VEEEEEEDWLDDTTEQSEIEPEPEPTPEEPVNQFTGYLKLTDNVAIKCVDIVKEAQSA
124                     NPMVIVNAANIHLKHGGGVAGALNKATNGAMQKESDDYIKLNGPLTVGGSCLLSGHNL
125                     AKKCLHVVGPNLNAGEDIQLLKAAYENFNSQDILLAPLLSAGIFGAKPLQSLQVCVQT
126                     VRTQVYIAVNDKALYEQVVMDYLDNLKPRVEAPKQEEPPNTEDSKTEEKSVVQKPVDV
127                     KPKIKACIDEVTTTLEETKFLTNKLLLFADINGKLYHDSQNMLRGEDMSFLEKDAPYM
128                     VGDVITSGDITCVVIPSKKAGGTTEMLSRALKKVPVDEYITTYPGQGCAGYTLEEAKT
129                     ALKKCKSAFYVLPSEAPNAKEEILGTVSWNLREMLAHAEETRKLMPICMDVRAIMATI
130                     QRKYKGIKIQEGIVDYGVRFFFYTSKEPVASIITKLNSLNEPLVTMPIGYVTHGFNLE
131                     EAARCMRSLKAPAVVSVSSPDAVTTYNGYLTSSSKTSEEHFVETVSLAGSYRDWSYSG
132                     QRTELGVEFLKRGDKIVYHTLESPVEFHLDGEVLSLDKLKSLLSLREVKTIKVFTTVD
133                     NTNLHTQLVDMSMTYGQQFGPTYLDGADVTKIKPHVNHEGKTFFVLPSDDTLRSEAFE
134                     YYHTLDESFLGRYMSALNHTKKWKFPQVGGLTSIKWADNNCYLSSVLLALQQLEVKFN
135                     APALQEAYYRARAGDAANFCALILAYSNKTVGELGDVRETMTHLLQHANLESAKRVLN
136                     VVCKHCGQKTTTLTGVEAVMYMGTLSYDNLKTGVSIPCVCGRDATQYLVQQESSFVMM
137                     SAPPAEYKLQQGTFLCANEYTGNYQCGHYTHITAKETLYRIDGAHLTKMSEYKGPVTD
138                     VFYKETSYTTTIKPVSYKLDGVTYTEIEPKLDGYYKKDNAYYTEQPIDLVPTQPLPNA
139                     SFDNFKLTCSNTKFADDLNQMTGFTKPASRELSVTFFPDLNGDVVAIDYRHYSASFKK
140                     GAKLLHKPIVWHINQATTKTTFKPNTWCLRCLWSTKPVDTSNSFEVLAVEDTQGMDNL
141                     ACESQQPTSEEVVENPTIQKEVIECDVKTTEVVGNVILKPSDEGVKVTQELGHEDLMA
142                     AYVENTSITIKKPNELSLALGLKTIATHGIAAINSVPWSKILAYVKPFLGQAAITTSN
143                     CAKRLAQRVFNNYMPYVFTLLFQLCTFTKSTNSRIRASLPTTIAKNSVKSVAKLCLDA
144                     GINYVKSPKFSKLFTIAMWLLLLSICLGSLICVTAAFGVLLSNFGAPSYCNGVRELYL
145                     NSSNVTTMDFCEGSFPCSICLSGLDSLDSYPALETIQVTISSYKLDLTILGLAAEWVL
146                     AYMLFTKFFYLLGLSAIMQVFFGYFASHFISNSWLMWFIISIVQMAPVSAMVRMYIFF
147                     ASFYYIWKSYVHIMDGCTSSTCMMCYKRNRATRVECTTIVNGMKRSFYVYANGGRGFC
148                     KTHNWNCLNCDTFCTGSTFISDEVARDLSLQFKRPINPTDQSSYIVDSVAVKNGALHL
149                     YFDKAGQKTYERHPLSHFVNLDNLRANNTKGSLPINVIVFDGKSKCDESASKSASVYY
150                     SQLMCQPILLLDQALVSDVGDSTEVSVKMFDAYVDTFSATFSVPMEKLKALVATAHSE
151                     LAKGVALDGVLSTFVSAARQGVVDTDVDTKDVIECLKLSHHSDLEVTGDSCNNFMLTY
152                     NKVENMTPRDLGACIDCNARHINAQVAKSHNVSLIWNVKDYMSLSEQLRKQIRSAAKK
153                     NNIPFRLTCATTRQVVNVITTKISLKGGKIVSTCFKLMLKATLLCVLAALVCYIVMPV
154                     HTLSIHDGYTNEIIGYKAIQDGVTRDIISTDDCFANKHAGFDAWFSQRGGSYKNDKSC
155                     PVVAAIITREIGFIVPGLPGTVLRAINGDFLHFLPRVFSAVGNICYTPSKLIEYSDFA
156                     TSACVLAAECTIFKDAMGKPVPYCYDTNLLEGSISYSELRPDTRYVLMDGSIIQFPNT
157                     YLEGSVRVVTTFDAEYCRHGTCERSEVGICLSTSGRWVLNNEHYRALSGVFCGVDAMN
158                     LIANIFTPLVQPVGALDVSASVVAGGIIAILVTCAAYYFMKFRRVFGEYNHVVAANAL
159                     LFLMSFTILCLVPAYSFLPGVYSVFYLYLTFYFTNDVSFLAHLQWFAMFSPIVPFWIT
160                     AIYVFCISLKHCHWFFNNYLRKRVMFNGVTFSTFEEAALCTFLLNKEMYLKLRSETLL
161                     PLTQYNRYLALYNKYKYFSGALDTTSYREAACCHLAKALNDFSNSGADVLYQPPQTSI
162                     TSAVLQSGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDTVYCPRHVICTAEDMLNP
163                     NYEDLLIRKSNHSFLVQAGNVQLRVIGHSMQNCLLRLKVDTSNPKTPKYKFVRIQPGQ
164                     TFSVLACYNGSPSGVYQCAMRPNHTIKGSFLNGSCGSVGFNIDYDCVSFCYMHHMELP
165                     TGVHAGTDLEGKFYGPFVDRQTAQAAGTDTTITLNVLAWLYAAVINGDRWFLNRFTTT
166                     LNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCAALKELLQNGMNGRTILGS
167                     TILEDEFTPFDVVRQCSGVTFQGKFKKIVKGTHHWMLLTFLTSLLILVQSTQWSLFFF
168                     VYENAFLPFTLGIMAIAACAMLLVKHKHAFLCLFLLPSLATVAYFNMVYMPASWVMRI
169                     MTWLELADTSLSGYRLKDCVMYASALVLLILMTARTVYDDAARRVWTLMNVITLVYKV
170                     YYGNALDQAISMWALVISVTSNYSGVVTTIMFLARAIVFVCVEYYPLLFITGNTLQCI
171                     MLVYCFLGYCCCCYFGLFCLLNRYFRLTLGVYDYLVSTQEFRYMNSQGLLPPKSSIDA
172                     FKLNIKLLGIGGKPCIKVATVQSKMSDVKCTSVVLLSVLQQLRVESSSKLWAQCVQLH
173                     NDILLAKDTTEAFEKMVSLLSVLLSMQGAVDINRLCEEMLDNRATLQAIASEFSSLPS
174                     YAAYATAQEAYEQAVANGDSEVVLKKLKKSLNVAKSEFDRDAAMQRKLEKMADQAMTQ
175                     MYKQARSEDKRAKVTSAMQTMLFTMLRKLDNDALNNIINNARDGCVPLNIIPLTTAAK
176                     LMVVVPDYGTYKNTCDGNTFTYASALWEIQQVVDADSKIVQLSEINMDNSPNLAWPLI
177                     VTALRANSAVKLQNNELSPVALRQMSCAAGTTQTACTDDNALAYYNNSKGGRFVLALL
178                     SDHQDLKWARFPKSDGTGTIYTELEPPCRFVTDTPKGPKVKYLYFIKGLNNLNRGMVL
179                     GSLAATVRLQAGNATEVPANSTVLSFCAFAVDPAKAYKDYLASGGQPITNCVKMLCTH
180                     TGTGQAITVTPEANMDQESFGGASCCLYCRCHIDHPNPKGFCDLKGKYVQIPTTCAND
181                     PVGFTLRNTVCTVCGMWKGYGCSCDQLREPLMQSADASTFLNRVCGVSAARLTPCGTG
182                     TSTDVVYRAFDIYNEKVAGFAKFLKTNCCRFQEKDEEGNLLDSYFVVKRHTMSNYQHE
183                     ETIYNLVKDCPAVAVHDFFKFRVDGDMVPHISRQRLTKYTMADLVYALRHFDEGNCDT
184                     LKEILVTYNCCDDDYFNKKDWYDFVENPDILRVYANLGERVRQSLLKTVQFCDAMRDA
185                     GIVGVLTLDNQDLNGNWYDFGDFVQVAPGCGVPIVDSYYSLLMPILTLTRALAAESHM
186                     DADLAKPLIKWDLLKYDFTEERLCLFDRYFKYWDQTYHPNCINCLDDRCILHCANFNV
187                     LFSTVFPPTSFGPLVRKIFVDGVPFVVSTGYHFRELGVVHNQDVNLHSSRLSFKELLV
188                     YAADPAMHAASGNLLLDKRTTCFSVAALTNNVAFQTVKPGNFNKDFYDFAVSKGFFKE
189                     GSSVELKHFFFAQDGNAAISDYDYYRYNLPTMCDIRQLLFVVEVVDKYFDCYDGGCIN
190                     ANQVIVNNLDKSAGFPFNKWGKARLYYDSMSYEDQDALFAYTKRNVIPTITQMNLKYA
191                     ISAKNRARTVAGVSICSTMTNRQFHQKLLKSIAATRGATVVIGTSKFYGGWHNMLKTV
192                     YSDVETPHLMGWDYPKCDRAMPNMLRIMASLVLARKHNTCCNLSHRFYRLANECAQVL
193                     SEMVMCGGSLYVKPGGTSSGDATTAYANSVFNICQAVTANVNALLSTDGNKIADKYVR
194                     NLQHRLYECLYRNRDVDHEFVDEFYAYLRKHFSMMILSDDAVVCYNSNYAAQGLVASI
195                     KNFKAVLYYQNNVFMSEAKCWTETDLTKGPHEFCSQHTMLVKQGDDYVYLPYPDPSRI
196                     LGAGCFVDDIVKTDGTLMIERFVSLAIDAYPLTKHPNQEYADVFHLYLQYIRKLHDEL
197                     TGHMLDMYSVMLTNDNTSRYWEPEFYEAMYTPHTVLQAVGACVLCNSQTSLRCGACIR
198                     RPFLCCKCCYDHVISTSHKLVLSVNPYVCNAPGCDVTDVTQLYLGGMSYYCKSHKPPI
199                     SFPLCANGQVFGLYKNTCVGSDNVTDFNAIATCDWTNAGDYILANTCTERLKLFAAET
200                     LKATEETFKLSYGIATVREVLSDRELHLSWEVGKPRPPLNRNYVFTGYRVTKNSKVQI
201                     GEYTFEKGDYGDAVVYRGTTTYKLNVGDYFVLTSHTVMPLSAPTLVPQEHYVRITGLY
202                     PTLNISDEFSSNVANYQKVGMQKYSTLQGPPGTGKSHFAIGLALYYPSARIVYTACSH
203                     AAVDALCEKALKYLPIDKCSRIIPARARVECFDKFKVNSTLEQYVFCTVNALPETTAD
204                     IVVFDEISMATNYDLSVVNARLRAKHYVYIGDPAQLPAPRTLLTKGTLEPEYFNSVCR
205                     LMKTIGPDMFLGTCRRCPAEIVDTVSALVYDNKLKAHKDKSAQCFKMFYKGVITHDVS
206                     SAINRPQIGVVREFLTRNPAWRKAVFISPYNSQNAVASKILGLPTQTVDSSQGSEYDY
207                     VIFTQTTETAHSCNVNRFNVAITRAKIGILCIMSDRDLYDKLQFTSLEIPRRNVATLQ
208                     AENVTGLFKDCSKIITGLHPTQAPTHLSVDIKFKTEGLCVDIPGIPKDMTYRRLISMM
209                     GFKMNYQVNGYPNMFITREEAIRHVRAWIGFDVEGCHATRDAVGTNLPLQLGFSTGVN
210                     LVAVPTGYVDTENNTEFTRVNAKPPPGDQFKHLIPLMYKGLPWNVVRIKIVQMLSDTL
211                     KGLSDRVVFVLWAHGFELTSMKYFVKIGPERTCCLCDKRATCFSTSSDTYACWNHSVG
212                     FDYVYNPFMIDVQQWGFTGNLQSNHDQHCQVHGNAHVASCDAIMTRCLAVHECFVKRV
213                     DWSVEYPIIGDELRVNSACRKVQHMVVKSALLADKFPVLHDIGNPKAIKCVPQAEVEW
214                     KFYDAQPCSDKAYKIEELFYSYATHHDKFTDGVCLFWNCNVDRYPANAIVCRFDTRVL
215                     SNLNLPGCDGGSLYVNKHAFHTPAFDKSAFTNLKQLPFFYYSDSPCESHGKQVVSDID
216                     YVPLKSATCITRCNLGGAVCRHHANEYRQYLDAYNMMISAGFSLWIYKQFDTYNLWNT
217                     FTRLQSLENVAYNVVNKGHFDGHAGEAPVSIINNAVYTKVDGIDVEIFENKTTLPVNV
218                     AFELWAKRNIKPVPEIKILNNLGVDIAANTVIWDYKREAPAHVSTIGVCTMTDIAKKP
219                     TESACSSLTVLFDGRVEGQVDLFRNARNGVLITEGSVKGLTPSKGPAQASVNGVTLIG
220                     ESVKTQFNYFKKVDGIIQQLPETYFTQSRDLEDFKPRSQMETDFLELAMDEFIQRYKL
221                     EGYAFEHIVYGDFSHGQLGGLHLMIGLAKRSQDSPLKLEDFIPMDSTVKNYFITDAQT
222                     GSSKCVCSVIDLLLDDFVEIIKSQDLSVISKVVKVTIDYAEISFMLWCKDGHVETFYP
223                     KLQASQAWQPGVAMPNLYKMQRMLLEKCDLQNYGENAVIPKGIMMNVAKYTQLCQYLN
224                     TLTLAVPYNMRVIHFGAGSDKGVAPGTAVLRQWLPTGTLLVDSDLNDFVSDADSTLIG
225                     DCATVHTANKWDLIISDMYDPRTKHVTKENDSKEGFFTYLCGFIKQKLALGGSIAVKI
226                     TEHSWNADLYKLMGHFSWWTAFVTNVNASSSEAFLIGANYLGKPKEQIDGYTMHANYI
227                     FWRNTNPIQLSSYSLFDMSKFPLKLRGTAVMSLKENQINDMIYSLLEKGRLIIRENNR
228                     VVVSSDILVNN"
229     mat_peptide     265..804
230                     /gene="orf1ab"
231                     /locus_tag="sars1"
232                     /product="nsp1-pp1a/pp1ab"
233                     /note="PL2-PRO cleavage product; leader protein"
234                     /evidence=not_experimental
235                     /protein_id="NP_828860.2"
236                     /db_xref="GI:34555774"
237     mat_peptide     805..2718
238                     /gene="orf1ab"
239                     /locus_tag="sars1"
240                     /product="nsp2-pp1a/pp1ab"
241                     /note="PL2-PRO cleavage product; counterpart of MHV p65"
242                     /evidence=not_experimental
243                     /protein_id="NP_828861.2"
244                     /db_xref="GI:34555775"
245     mat_peptide     2719..8484
246                     /gene="orf1ab"
247                     /locus_tag="sars1"
248                     /product="nsp3-pp1a/pp1ab"
249                     /note="PL2-PRO cleavage product; former nsp1; conserved
250                     domains are: N-terminal acidic (Ac), predicted
251                     phosphoesterase (similar to the Appr-1'-p
252                     processing enzyme) formerly known as 'X-domain',
253                     papain-like proteinase similar to that of MHV PL2-PRO,
254                     Y-domain; transmembrane domain 1 (TM1); adenosine
255                     diphosphate-ribose 1''-phosphatase (ADPR)"
256                     /protein_id="NP_828862.2"
257                     /db_xref="GI:34555776"
258     mat_peptide     8485..9984
259                     /gene="orf1ab"
260                     /locus_tag="sars1"
261                     /product="nsp4-pp1a/pp1ab"
262                     /note="cleaved from polyprotein by the PL2-PRO at the
263                     N-terminus and by 3CL-PRO at the C-terminus; contains
264                     transmembrane domain 2 (TM2)"
265                     /evidence=not_experimental
266                     /protein_id="NP_904322.1"
267                     /db_xref="GI:34555778"
268     mat_peptide     9985..10902
269                     /gene="orf1ab"
270                     /locus_tag="sars1"
271                     /product="nsp5-pp1a/pp1ab  (3CL-PRO)"
272                     /note="mediates cleavages downstream from nsp4-pp1a/pp1ab.
273                     3D structure has been determined (Yang et al., 2003);
274                     3C-like proteinase; main proteinase (Mpro)"
275                     /evidence=experimental
276                     /protein_id="NP_828863.1"
277                     /db_xref="GI:29837498"
278     mat_peptide     10903..11772
279                     /gene="orf1ab"
280                     /locus_tag="sars1"
281                     /product="nsp6-pp1a/pp1ab (TM3)"
282                     /note="putative transmembrane domain"
283                     /evidence=not_experimental
284                     /protein_id="NP_828864.1"
285                     /db_xref="GI:29837499"
286     mat_peptide     11773..12021
287                     /gene="orf1ab"
288                     /locus_tag="sars1"
289                     /product="nsp7-pp1a/pp1ab"
290                     /evidence=not_experimental
291                     /protein_id="NP_828865.1"
292                     /db_xref="GI:29837500"
293     mat_peptide     12022..12615
294                     /gene="orf1ab"
295                     /locus_tag="sars1"
296                     /product="nsp8-pp1a/pp1ab"
297                     /evidence=not_experimental
298                     /protein_id="NP_828866.1"
299                     /db_xref="GI:29837501"
300     mat_peptide     12616..12954
301                     /gene="orf1ab"
302                     /locus_tag="sars1"
303                     /product="nsp9-pp1a/pp1ab"
304                     /evidence=not_experimental
305                     /protein_id="NP_828867.1"
306                     /db_xref="GI:29837502"
307     mat_peptide     12955..13371
308                     /gene="orf1ab"
309                     /locus_tag="sars1"
310                     /product="nsp10-pp1a/pp1ab"
311                     /note="formerly known as growth-factor-like protein (GFL)"
312                     /evidence=not_experimental
313                     /protein_id="NP_828868.1"
314                     /db_xref="GI:29837503"
315     mat_peptide     join(13372..13398,13398..16166)
316                     /gene="orf1ab"
317                     /locus_tag="sars1"
318                     /product="nsp12-pp1ab (RdRp)"
319                     /note="RNA-dependent  RNA polymerase"
320                     /evidence=not_experimental
321                     /protein_id="NP_828869.1"
322                     /db_xref="GI:29837504"
323     mat_peptide     16167..17969
324                     /gene="orf1ab"
325                     /locus_tag="sars1"
326                     /product="nsp13-pp1ab (ZD, NTPase/HEL)"
327                     /note="zinc-binding domain (ZD), NTPase/helicase domain.
328                     RNA-stimulated ATPase and dsDNA helicase activities have
329                     been confirmed (Thiel et al., 2003)"
330                     /evidence=experimental
331                     /protein_id="NP_828870.1"
332                     /db_xref="GI:29837505"
333     mat_peptide     17970..19550
334                     /gene="orf1ab"
335                     /locus_tag="sars1"
336                     /product="nsp14-pp1ab (nuclease ExoN homolog)"
337                     /note="exonuclease"
338                     /evidence=not_experimental
339                     /protein_id="NP_828871.1"
340                     /db_xref="GI:29837506"
341     mat_peptide     19551..20588
342                     /gene="orf1ab"
343                     /locus_tag="sars1"
344                     /product="nsp15-pp1ab (endoRNAse)"
345                     /note="the C-terminal domain is a homolog of endoRNase
346                     XendoU and is conserved through the order Nidovirales"
347                     /evidence=not_experimental
348                     /protein_id="NP_828872.1"
349                     /db_xref="GI:29837507"
350     mat_peptide     20589..21482
351                     /gene="orf1ab"
352                     /locus_tag="sars1"
353                     /product="nsp16-pp1ab (2'-o-MT)"
354                     /note="putative ribose 2'-O-methyltransferase"
355                     /evidence=not_experimental
356                     /protein_id="NP_828873.2"
357                     /db_xref="GI:30133975"
358     CDS             265..13413
359                     /gene="orf1ab"
360                     /locus_tag="sars1"
361                     /codon_start=1
362                     /evidence=not_experimental
363                     /product="orf1a polyprotein (pp1a)"
364                     /protein_id="NP_828850.1"
365                     /db_xref="GI:29836495"
366                     /db_xref="GeneID:1489680"
367                     /translation="MESLVLGVNEKTHVQLSLPVLQVRDVLVRGFGDSVEEALSEARE
368                     HLKNGTCGLVELEKGVLPQLEQPYVFIKRSDALSTNHGHKVVELVAEMDGIQYGRSGI
369                     TLGVLVPHVGETPIAYRNVLLRKNGNKGAGGHSYGIDLKSYDLGDELGTDPIEDYEQN
370                     WNTKHGSGALRELTRELNGGAVTRYVDNNFCGPDGYPLDCIKDFLARAGKSMCTLSEQ
371                     LDYIESKRGVYCCRDHEHEIAWFTERSDKSYEHQTPFEIKSAKKFDTFKGECPKFVFP
372                     LNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASPQECNNMHLSTLMKCNHCDEVSWQTC
373                     DFLKATCEHCGTENLVIEGPTTCGYLPTNAVVKMPCPACQDPEIGPEHSVADYHNHSN
374                     IETRLRKGGRTRCFGGCVFAYVGCYNKRAYWVPRASADIGSGHTGITGDNVETLNEDL
375                     LEILSRERVNINIVGDFHLNEEVAIILASFSASTSAFIDTIKSLDYKSFKTIVESCGN
376                     YKVTKGKPVKGAWNIGQQRSVLTPLCGFPSQAAGVIRSIFARTLDAANHSIPDLQRAA
377                     VTILDGISEQSLRLVDAMVYTSDLLTNSVIIMAYVTGGLVQQTSQWLSNLLGTTVEKL
378                     RPIFEWIEAKLSAGVEFLKDAWEILKFLITGVFDIVKGQIQVASDNIKDCVKCFIDVV
379                     NKALEMCIDQVTIAGAKLRSLNLGEVFIAQSKGLYRQCIRGKEQLQLLMPLKAPKEVT
380                     FLEGDSHDTVLTSEEVVLKNGELEALETPVDSFTNGAIVGTPVCVNGLMLLEIKDKEQ
381                     YCALSPGLLATNNVFRLKGGAPIKGVTFGEDTVWEVQGYKNVRITFELDERVDKVLNE
382                     KCSVYTVESGTEVTEFACVVAEAVVKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGE
383                     ENFSSRMYCSFYPPDEEEEDDAECEEEEIDETCEHEYGTEDDYQGLPLEFGASAETVR
384                     VEEEEEEDWLDDTTEQSEIEPEPEPTPEEPVNQFTGYLKLTDNVAIKCVDIVKEAQSA
385                     NPMVIVNAANIHLKHGGGVAGALNKATNGAMQKESDDYIKLNGPLTVGGSCLLSGHNL
386                     AKKCLHVVGPNLNAGEDIQLLKAAYENFNSQDILLAPLLSAGIFGAKPLQSLQVCVQT
387                     VRTQVYIAVNDKALYEQVVMDYLDNLKPRVEAPKQEEPPNTEDSKTEEKSVVQKPVDV
388                     KPKIKACIDEVTTTLEETKFLTNKLLLFADINGKLYHDSQNMLRGEDMSFLEKDAPYM
389                     VGDVITSGDITCVVIPSKKAGGTTEMLSRALKKVPVDEYITTYPGQGCAGYTLEEAKT
390                     ALKKCKSAFYVLPSEAPNAKEEILGTVSWNLREMLAHAEETRKLMPICMDVRAIMATI
391                     QRKYKGIKIQEGIVDYGVRFFFYTSKEPVASIITKLNSLNEPLVTMPIGYVTHGFNLE
392                     EAARCMRSLKAPAVVSVSSPDAVTTYNGYLTSSSKTSEEHFVETVSLAGSYRDWSYSG
393                     QRTELGVEFLKRGDKIVYHTLESPVEFHLDGEVLSLDKLKSLLSLREVKTIKVFTTVD
394                     NTNLHTQLVDMSMTYGQQFGPTYLDGADVTKIKPHVNHEGKTFFVLPSDDTLRSEAFE
395                     YYHTLDESFLGRYMSALNHTKKWKFPQVGGLTSIKWADNNCYLSSVLLALQQLEVKFN
396                     APALQEAYYRARAGDAANFCALILAYSNKTVGELGDVRETMTHLLQHANLESAKRVLN
397                     VVCKHCGQKTTTLTGVEAVMYMGTLSYDNLKTGVSIPCVCGRDATQYLVQQESSFVMM
398                     SAPPAEYKLQQGTFLCANEYTGNYQCGHYTHITAKETLYRIDGAHLTKMSEYKGPVTD
399                     VFYKETSYTTTIKPVSYKLDGVTYTEIEPKLDGYYKKDNAYYTEQPIDLVPTQPLPNA
400                     SFDNFKLTCSNTKFADDLNQMTGFTKPASRELSVTFFPDLNGDVVAIDYRHYSASFKK
401                     GAKLLHKPIVWHINQATTKTTFKPNTWCLRCLWSTKPVDTSNSFEVLAVEDTQGMDNL
402                     ACESQQPTSEEVVENPTIQKEVIECDVKTTEVVGNVILKPSDEGVKVTQELGHEDLMA
403                     AYVENTSITIKKPNELSLALGLKTIATHGIAAINSVPWSKILAYVKPFLGQAAITTSN
404                     CAKRLAQRVFNNYMPYVFTLLFQLCTFTKSTNSRIRASLPTTIAKNSVKSVAKLCLDA
405                     GINYVKSPKFSKLFTIAMWLLLLSICLGSLICVTAAFGVLLSNFGAPSYCNGVRELYL
406                     NSSNVTTMDFCEGSFPCSICLSGLDSLDSYPALETIQVTISSYKLDLTILGLAAEWVL
407                     AYMLFTKFFYLLGLSAIMQVFFGYFASHFISNSWLMWFIISIVQMAPVSAMVRMYIFF
408                     ASFYYIWKSYVHIMDGCTSSTCMMCYKRNRATRVECTTIVNGMKRSFYVYANGGRGFC
409                     KTHNWNCLNCDTFCTGSTFISDEVARDLSLQFKRPINPTDQSSYIVDSVAVKNGALHL
410                     YFDKAGQKTYERHPLSHFVNLDNLRANNTKGSLPINVIVFDGKSKCDESASKSASVYY
411                     SQLMCQPILLLDQALVSDVGDSTEVSVKMFDAYVDTFSATFSVPMEKLKALVATAHSE
412                     LAKGVALDGVLSTFVSAARQGVVDTDVDTKDVIECLKLSHHSDLEVTGDSCNNFMLTY
413                     NKVENMTPRDLGACIDCNARHINAQVAKSHNVSLIWNVKDYMSLSEQLRKQIRSAAKK
414                     NNIPFRLTCATTRQVVNVITTKISLKGGKIVSTCFKLMLKATLLCVLAALVCYIVMPV
415                     HTLSIHDGYTNEIIGYKAIQDGVTRDIISTDDCFANKHAGFDAWFSQRGGSYKNDKSC
416                     PVVAAIITREIGFIVPGLPGTVLRAINGDFLHFLPRVFSAVGNICYTPSKLIEYSDFA
417                     TSACVLAAECTIFKDAMGKPVPYCYDTNLLEGSISYSELRPDTRYVLMDGSIIQFPNT
418                     YLEGSVRVVTTFDAEYCRHGTCERSEVGICLSTSGRWVLNNEHYRALSGVFCGVDAMN
419                     LIANIFTPLVQPVGALDVSASVVAGGIIAILVTCAAYYFMKFRRVFGEYNHVVAANAL
420                     LFLMSFTILCLVPAYSFLPGVYSVFYLYLTFYFTNDVSFLAHLQWFAMFSPIVPFWIT
421                     AIYVFCISLKHCHWFFNNYLRKRVMFNGVTFSTFEEAALCTFLLNKEMYLKLRSETLL
422                     PLTQYNRYLALYNKYKYFSGALDTTSYREAACCHLAKALNDFSNSGADVLYQPPQTSI
423                     TSAVLQSGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDTVYCPRHVICTAEDMLNP
424                     NYEDLLIRKSNHSFLVQAGNVQLRVIGHSMQNCLLRLKVDTSNPKTPKYKFVRIQPGQ
425                     TFSVLACYNGSPSGVYQCAMRPNHTIKGSFLNGSCGSVGFNIDYDCVSFCYMHHMELP
426                     TGVHAGTDLEGKFYGPFVDRQTAQAAGTDTTITLNVLAWLYAAVINGDRWFLNRFTTT
427                     LNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCAALKELLQNGMNGRTILGS
428                     TILEDEFTPFDVVRQCSGVTFQGKFKKIVKGTHHWMLLTFLTSLLILVQSTQWSLFFF
429                     VYENAFLPFTLGIMAIAACAMLLVKHKHAFLCLFLLPSLATVAYFNMVYMPASWVMRI
430                     MTWLELADTSLSGYRLKDCVMYASALVLLILMTARTVYDDAARRVWTLMNVITLVYKV
431                     YYGNALDQAISMWALVISVTSNYSGVVTTIMFLARAIVFVCVEYYPLLFITGNTLQCI
432                     MLVYCFLGYCCCCYFGLFCLLNRYFRLTLGVYDYLVSTQEFRYMNSQGLLPPKSSIDA
433                     FKLNIKLLGIGGKPCIKVATVQSKMSDVKCTSVVLLSVLQQLRVESSSKLWAQCVQLH
434                     NDILLAKDTTEAFEKMVSLLSVLLSMQGAVDINRLCEEMLDNRATLQAIASEFSSLPS
435                     YAAYATAQEAYEQAVANGDSEVVLKKLKKSLNVAKSEFDRDAAMQRKLEKMADQAMTQ
436                     MYKQARSEDKRAKVTSAMQTMLFTMLRKLDNDALNNIINNARDGCVPLNIIPLTTAAK
437                     LMVVVPDYGTYKNTCDGNTFTYASALWEIQQVVDADSKIVQLSEINMDNSPNLAWPLI
438                     VTALRANSAVKLQNNELSPVALRQMSCAAGTTQTACTDDNALAYYNNSKGGRFVLALL
439                     SDHQDLKWARFPKSDGTGTIYTELEPPCRFVTDTPKGPKVKYLYFIKGLNNLNRGMVL
440                     GSLAATVRLQAGNATEVPANSTVLSFCAFAVDPAKAYKDYLASGGQPITNCVKMLCTH
441                     TGTGQAITVTPEANMDQESFGGASCCLYCRCHIDHPNPKGFCDLKGKYVQIPTTCAND
442                     PVGFTLRNTVCTVCGMWKGYGCSCDQLREPLMQSADASTFLNGFAV"
443     mat_peptide     13372..13410
444                     /gene="orf1ab"
445                     /locus_tag="sars1"
446                     /product="nsp11-pp1a"
447                     /note="putative C-terminal cleavage product of pp1a"
448                     /protein_id="NP_904321.1"
449                     /db_xref="GI:34555777"
450     misc_feature    13392..13472
451                     /gene="orf1ab"
452                     /locus_tag="sars1"
453                     /note="Region: potential ribosome slippery sequence
454                     followed by stimulatory RNA pseudoknot"
455     misc_feature    21486..21491
456                     /note="transcription regulatory sequence for mRNA2"
457     gene            21492..25259
458                     /gene="S"
459                     /locus_tag="sars2"
460                     /note="synonym: E2"
461                     /db_xref="GeneID:1489668"
462     CDS             21492..25259
463                     /gene="S"
464                     /locus_tag="sars2"
465                     /note="As established by Krokhin et al. (2003), the
466                     glycosylated spike protein (as well as the nucleocapsid
467                     protein) can be detected in infected cell culture
468                     supernatants with antisera from SARS patients; putative
469                     spike glycoprotein"
470                     /codon_start=1
471                     /evidence=experimental
472                     /product="E2 glycoprotein precursor"
473                     /protein_id="NP_828851.1"
474                     /db_xref="GI:29836496"
475                     /db_xref="GeneID:1489668"
476                     /translation="MFIFLLFLTLTSGSDLDRCTTFDDVQAPNYTQHTSSMRGVYYPD
477                     EIFRSDTLYLTQDLFLPFYSNVTGFHTINHTFGNPVIPFKDGIYFAATEKSNVVRGWV
478                     FGSTMNNKSQSVIIINNSTNVVIRACNFELCDNPFFAVSKPMGTQTHTMIFDNAFNCT
479                     FEYISDAFSLDVSEKSGNFKHLREFVFKNKDGFLYVYKGYQPIDVVRDLPSGFNTLKP
480                     IFKLPLGINITNFRAILTAFSPAQDIWGTSAAAYFVGYLKPTTFMLKYDENGTITDAV
481                     DCSQNPLAELKCSVKSFEIDKGIYQTSNFRVVPSGDVVRFPNITNLCPFGEVFNATKF
482                     PSVYAWERKKISNCVADYSVLYNSTFFSTFKCYGVSATKLNDLCFSNVYADSFVVKGD
483                     DVRQIAPGQTGVIADYNYKLPDDFMGCVLAWNTRNIDATSTGNYNYKYRYLRHGKLRP
484                     FERDISNVPFSPDGKPCTPPALNCYWPLNDYGFYTTTGIGYQPYRVVVLSFELLNAPA
485                     TVCGPKLSTDLIKNQCVNFNFNGLTGTGVLTPSSKRFQPFQQFGRDVSDFTDSVRDPK
486                     TSEILDISPCAFGGVSVITPGTNASSEVAVLYQDVNCTDVSTAIHADQLTPAWRIYST
487                     GNNVFQTQAGCLIGAEHVDTSYECDIPIGAGICASYHTVSLLRSTSQKSIVAYTMSLG
488                     ADSSIAYSNNTIAIPTNFSISITTEVMPVSMAKTSVDCNMYICGDSTECANLLLQYGS
489                     FCTQLNRALSGIAAEQDRNTREVFAQVKQMYKTPTLKYFGGFNFSQILPDPLKPTKRS
490                     FIEDLLFNKVTLADAGFMKQYGECLGDINARDLICAQKFNGLTVLPPLLTDDMIAAYT
491                     AALVSGTATAGWTFGAGAALQIPFAMQMAYRFNGIGVTQNVLYENQKQIANQFNKAIS
492                     QIQESLTTTSTALGKLQDVVNQNAQALNTLVKQLSSNFGAISSVLNDILSRLDKVEAE
493                     VQIDRLITGRLQSLQTYVTQQLIRAAEIRASANLAATKMSECVLGQSKRVDFCGKGYH
494                     LMSFPQAAPHGVVFLHVTYVPSQERNFTTAPAICHEGKAYFPREGVFVFNGTSWFITQ
495                     RNFFSPQIITTDNTFVSGNCDVVIGIINNTVYDPLQPELDSFKEELDKYFKNHTSPDV
496                     DLGDISGINASVVNIQKEIDRLNEVAKNLNESLIDLQELGKYEQYIKWPWYVWLGFIA
497                     GLIAIVMVTILLCCMTSCCSCLKGACSCGSCCKFDEDDSEPVLKGVKLHYT"
498     misc_feature    21843..21845
499                     /gene="S"
500                     /locus_tag="sars2"
501                     /note="second glycosylation site"
502                     /evidence=experimental
503     misc_feature    21846..21848
504                     /gene="S"
505                     /locus_tag="sars2"
506                     /note="first glycosylation site"
507                     /evidence=experimental
508     misc_feature    22170..22172
509                     /gene="S"
510                     /locus_tag="sars2"
511                     /note="glycosylation site"
512                     /evidence=experimental
513     misc_feature    22296..22298
514                     /gene="S"
515                     /locus_tag="sars2"
516                     /note="glycosylation site"
517                     /evidence=experimental
518     misc_feature    23838..23840
519                     /gene="S"
520                     /locus_tag="sars2"
521                     /note="glycosylation site"
522                     /evidence=experimental
523     misc_feature    25260..25265
524                     /note="transcription regulatory sequence for mRNA3"
525     gene            25268..26092
526                     /locus_tag="sars3a"
527                     /db_xref="GeneID:1489669"
528     CDS             25268..26092
529                     /locus_tag="sars3a"
530                     /codon_start=1
531                     /evidence=not_experimental
532                     /product="hypothetical protein sars3a"
533                     /protein_id="NP_828852.2"
534                     /db_xref="GI:30124073"
535                     /db_xref="GeneID:1489669"
536                     /translation="MDLFMRFFTLRSITAQPVKIDNASPASTVHATATIPLQASLPFG
537                     WLVIGVAFLAVFQSATKIIALNKRWQLALYKGFQFICNLLLLFVTIYSHLLLVAAGME
538                     AQFLYLYALIYFLQCINACRIIMRCWLCWKCKSKNPLLYDANYFVCWHTHNYDYCIPY
539                     NSVTDTIVVTEGDGISTPKLKEDYQIGGYSEDRHSGVKDYVVVHGYFTEVYYQLESTQ
540                     ITTDTGIENATFFIFNKLVKDPPNVQIHTIDGSSGVANPAMDPIYDEPTTTTSVPL"
541     gene            25689..26153
542                     /locus_tag="sars3b"
543                     /db_xref="GeneID:1489670"
544     CDS             25689..26153
545                     /locus_tag="sars3b"
546                     /codon_start=1
547                     /evidence=not_experimental
548                     /product="hypothetical protein sars3b"
549                     /protein_id="NP_828853.1"
550                     /db_xref="GI:29836498"
551                     /db_xref="GeneID:1489670"
552                     /translation="MMPTTLFAGTHITMTTVYHITVSQIQLSLLKVTAFQHQNSKKTT
553                     KLVVILRIGTQVLKTMSLYMAISPKFTTSLSLHKLLQTLVLKMLHSSSLTSLLKTHRM
554                     CKYTQSTALQELLIQQWIQFMMSRRRLLACLCKHKKVSTNLCTHSFRKKQVR"
555     misc_feature    26109..26114
556                     /locus_tag="sars3b"
557                     /note="transcription regulatory sequence for mRNA4"
558     gene            26117..26347
559                     /gene="E"
560                     /locus_tag="sars4"
561                     /db_xref="GeneID:1489671"
562     CDS             26117..26347
563                     /gene="E"
564                     /locus_tag="sars4"
565                     /note="E. coli expression reported by Shen et al. (2003);
566                     protein sM; protein E"
567                     /codon_start=1
568                     /evidence=experimental
569                     /product="small envelope protein"
570                     /protein_id="NP_828854.1"
571                     /db_xref="GI:29836499"
572                     /db_xref="GeneID:1489671"
573                     /translation="MYSFVSEETGTLIVNSVLLFLAFVVFLLVTLAILTALRLCAYCC
574                     NIVNVSLVKPTVYVYSRVKNLNSSEGVPDLLV"
575     misc_feature    26348..26353
576                     /note="transcription regulatory sequence for mRNA5"
577     gene            26398..27063
578                     /gene="M"
579                     /locus_tag="sars5"
580                     /db_xref="GeneID:1489672"
581     CDS             26398..27063
582                     /gene="M"
583                     /locus_tag="sars5"
584                     /note="E. coli expression reported by Zhang et al. (2003)"
585                     /codon_start=1
586                     /product="matrix protein"
587                     /protein_id="NP_828855.1"
588                     /db_xref="GI:29836504"
589                     /db_xref="GeneID:1489672"
590                     /translation="MADNGTITVEELKQLLEQWNLVIGFLFLAWIMLLQFAYSNRNRF
591                     LYIIKLVFLWLLWPVTLACFVLAAVYRINWVTGGIAIAMACIVGLMWLSYFVASFRLF
592                     ARTRSMWSFNPETNILLNVPLRGTIVTRPLMESELVIGAVIIRGHLRMAGHSLGRCDI
593                     KDLPKEITVATSRTLSYYKLGASQRVGTDSGFAAYNRYRIGNYKLNTDHAGSNDNIAL
594                     LVQ"
595     gene            26913..27265
596                     /locus_tag="sars6"
597                     /db_xref="GeneID:1489673"
598     misc_feature    26913..26918
599                     /locus_tag="sars6"
600                     /note="transcription regulatory sequence for mRNA6"
601     CDS             27074..27265
602                     /locus_tag="sars6"
603                     /codon_start=1
604                     /evidence=not_experimental
605                     /product="hypothetical protein sars6"
606                     /protein_id="NP_828856.1"
607                     /db_xref="GI:29836500"
608                     /db_xref="GeneID:1489673"
609                     /translation="MFHLVDFQVTIAEILIIIMRTFRIAIWNLDVIISSIVRQLFKPL
610                     TKKNYSELDDEEPMELDYP"
611     misc_feature    27267..27272
612                     /note="transcription regulatory sequence for mRNA7"
613     gene            27273..27641
614                     /locus_tag="sars7a"
615                     /db_xref="GeneID:1489674"
616     CDS             27273..27641
617                     /locus_tag="sars7a"
618                     /codon_start=1
619                     /evidence=not_experimental
620                     /product="hypothetical protein sars7a"
621                     /protein_id="NP_828857.1"
622                     /db_xref="GI:29836501"
623                     /db_xref="GeneID:1489674"
624                     /translation="MKIILFLTLIVFTSCELYHYQECVRGTTVLLKEPCPSGTYEGNS
625                     PFHPLADNKFALTCTSTHFAFACADGTRHTYQLRARSVSPKLFIRQEEVQQELYSPLF
626                     LIVAALVFLILCFTIKRKTE"
627     gene            27638..27772
628                     /locus_tag="sars7b"
629                     /db_xref="GeneID:1489675"
630     CDS             27638..27772
631                     /locus_tag="sars7b"
632                     /codon_start=1
633                     /evidence=not_experimental
634                     /product="hypothetical protein sars7b"
635                     /protein_id="NP_849175.1"
636                     /db_xref="GI:30524940"
637                     /db_xref="GeneID:1489675"
638                     /translation="MNELTLIDFYLCFLAFLLFLVLIMLIIFWFSLEIQDLEEPCTKV
639                     "
640     misc_feature    27773..27778
641                     /note="transcription regulatory sequence for mRNA8"
642     gene            27779..27898
643                     /locus_tag="sars8a"
644                     /db_xref="GeneID:1489676"
645     CDS             27779..27898
646                     /locus_tag="sars8a"
647                     /codon_start=1
648                     /evidence=not_experimental
649                     /product="hypothetical protein sars8a"
650                     /protein_id="NP_849176.1"
651                     /db_xref="GI:30524941"
652                     /db_xref="GeneID:1489676"
653                     /translation="MKLLIVLTCISLCSCICTVVQRCASNKPHVLEDPCKVQH"
654     gene            27864..28118
655                     /locus_tag="sars8b"
656                     /db_xref="GeneID:1489677"
657     CDS             27864..28118
658                     /locus_tag="sars8b"
659                     /codon_start=1
660                     /evidence=not_experimental
661                     /product="hypothetical protein sars8b"
662                     /protein_id="NP_849177.1"
663                     /db_xref="GI:30524942"
664                     /db_xref="GeneID:1489677"
665                     /translation="MCLKILVRYNTRGNTYSTAWLCALGKVLPFHRWHTMVQTCTPNV
666                     TINCQDPAGGALIARCWYLHEGHQTAAFRDVLVVLNKRTN"
667     misc_feature    28106..28111
668                     /locus_tag="sars8b"
669                     /note="transcription regulatory sequence for mRNA9"
670     gene            28120..29388
671                     /gene="N"
672                     /locus_tag="sars9a"
673                     /db_xref="GeneID:1489678"
674     CDS             28120..29388
675                     /gene="N"
676                     /locus_tag="sars9a"
677                     /note="As established by Krokhin et al. (2003), the
678                     N-terminal methionine is removed, all other methionines
679                     are oxidized, and the resulting N-terminal serine is
680                     acetylated"
681                     /codon_start=1
682                     /evidence=experimental
683                     /product="nucleocapsid protein"
684                     /protein_id="NP_828858.1"
685                     /db_xref="GI:29836503"
686                     /db_xref="GeneID:1489678"
687                     /translation="MSDNGPQSNQRSAPRITFGGPTDSTDNNQNGGRNGARPKQRRPQ
688                     GLPNNTASWFTALTQHGKEELRFPRGQGVPINTNSGPDDQIGYYRRATRRVRGGDGKM
689                     KELSPRWYFYYLGTGPEASLPYGANKEGIVWVATEGALNTPKDHIGTRNPNNNAATVL
690                     QLPQGTTLPKGFYAEGSRGGSQASSRSSSRSRGNSRNSTPGSSRGNSPARMASGGGET
691                     ALALLLLDRLNQLESKVSGKGQQQQGQTVTKKSAAEASKKPRQKRTATKQYNVTQAFG
692                     RRGPEQTQGNFGDQDLIRQGTDYKHWPQIAQFAPSASAFFGMSRIGMEVTPSGTWLTY
693                     HGAIKLDDKDPQFKDNVILLNKHIDAYKTFPPTEPKKDKKKKTDEAQPLPQRQKKQPT
694                     VTLLPAADMDDFSRQLQNSMSGASADSTQA"
695     misc_feature    28123..28125
696                     /gene="N"
697                     /locus_tag="sars9a"
698                     /note="acetylation site"
699                     /evidence=experimental
700     gene            28130..28426
701                     /locus_tag="sars9b"
702                     /db_xref="GeneID:1489679"
703     CDS             28130..28426
704                     /locus_tag="sars9b"
705                     /codon_start=1
706                     /evidence=not_experimental
707                     /product="hypothetical protein sars9b"
708                     /protein_id="NP_828859.1"
709                     /db_xref="GI:29836502"
710                     /db_xref="GeneID:1489679"
711                     /translation="MDPNQTNVVPPALHLVDPQIQLTITRMEDAMGQGQNSADPKVYP
712                     IILRLGSQLSLSMARRNLDSLEARAFQSTPIVVQMTKLATTEELPDEFVVVTAK"
713     3'UTR           29389..29751
714ORIGIN
715        1 atattaggtt tttacctacc caggaaaagc caaccaacct cgatctcttg tagatctgtt
716       61 ctctaaacga actttaaaat ctgtgtagct gtcgctcggc tgcatgccta gtgcacctac
717      121 gcagtataaa caataataaa ttttactgtc gttgacaaga aacgagtaac tcgtccctct
718      181 tctgcagact gcttacggtt tcgtccgtgt tgcagtcgat catcagcata cctaggtttc
719      241 gtccgggtgt gaccgaaagg taagatggag agccttgttc ttggtgtcaa cgagaaaaca
720      301 cacgtccaac tcagtttgcc tgtccttcag gttagagacg tgctagtgcg tggcttcggg
721      361 gactctgtgg aagaggccct atcggaggca cgtgaacacc tcaaaaatgg cacttgtggt
722      421 ctagtagagc tggaaaaagg cgtactgccc cagcttgaac agccctatgt gttcattaaa
723      481 cgttctgatg ccttaagcac caatcacggc cacaaggtcg ttgagctggt tgcagaaatg
724      541 gacggcattc agtacggtcg tagcggtata acactgggag tactcgtgcc acatgtgggc
725      601 gaaaccccaa ttgcataccg caatgttctt cttcgtaaga acggtaataa gggagccggt
726      661 ggtcatagct atggcatcga tctaaagtct tatgacttag gtgacgagct tggcactgat
727      721 cccattgaag attatgaaca aaactggaac actaagcatg gcagtggtgc actccgtgaa
728      781 ctcactcgtg agctcaatgg aggtgcagtc actcgctatg tcgacaacaa tttctgtggc
729      841 ccagatgggt accctcttga ttgcatcaaa gattttctcg cacgcgcggg caagtcaatg
730      901 tgcactcttt ccgaacaact tgattacatc gagtcgaaga gaggtgtcta ctgctgccgt
731      961 gaccatgagc atgaaattgc ctggttcact gagcgctctg ataagagcta cgagcaccag
732     1021 acacccttcg aaattaagag tgccaagaaa tttgacactt tcaaagggga atgcccaaag
733     1081 tttgtgtttc ctcttaactc aaaagtcaaa gtcattcaac cacgtgttga aaagaaaaag
734     1141 actgagggtt tcatggggcg tatacgctct gtgtaccctg ttgcatctcc acaggagtgt
735     1201 aacaatatgc acttgtctac cttgatgaaa tgtaatcatt gcgatgaagt ttcatggcag
736     1261 acgtgcgact ttctgaaagc cacttgtgaa cattgtggca ctgaaaattt agttattgaa
737     1321 ggacctacta catgtgggta cctacctact aatgctgtag tgaaaatgcc atgtcctgcc
738     1381 tgtcaagacc cagagattgg acctgagcat agtgttgcag attatcacaa ccactcaaac
739     1441 attgaaactc gactccgcaa gggaggtagg actagatgtt ttggaggctg tgtgtttgcc
740     1501 tatgttggct gctataataa gcgtgcctac tgggttcctc gtgctagtgc tgatattggc
741     1561 tcaggccata ctggcattac tggtgacaat gtggagacct tgaatgagga tctccttgag
742     1621 atactgagtc gtgaacgtgt taacattaac attgttggcg attttcattt gaatgaagag
743     1681 gttgccatca ttttggcatc tttctctgct tctacaagtg cctttattga cactataaag
744     1741 agtcttgatt acaagtcttt caaaaccatt gttgagtcct gcggtaacta taaagttacc
745     1801 aagggaaagc ccgtaaaagg tgcttggaac attggacaac agagatcagt tttaacacca
746     1861 ctgtgtggtt ttccctcaca ggctgctggt gttatcagat caatttttgc gcgcacactt
747     1921 gatgcagcaa accactcaat tcctgatttg caaagagcag ctgtcaccat acttgatggt
748     1981 atttctgaac agtcattacg tcttgtcgac gccatggttt atacttcaga cctgctcacc
749     2041 aacagtgtca ttattatggc atatgtaact ggtggtcttg tacaacagac ttctcagtgg
750     2101 ttgtctaatc ttttgggcac tactgttgaa aaactcaggc ctatctttga atggattgag
751     2161 gcgaaactta gtgcaggagt tgaatttctc aaggatgctt gggagattct caaatttctc
752     2221 attacaggtg tttttgacat cgtcaagggt caaatacagg ttgcttcaga taacatcaag
753     2281 gattgtgtaa aatgcttcat tgatgttgtt aacaaggcac tcgaaatgtg cattgatcaa
754     2341 gtcactatcg ctggcgcaaa gttgcgatca ctcaacttag gtgaagtctt catcgctcaa
755     2401 agcaagggac tttaccgtca gtgtatacgt ggcaaggagc agctgcaact actcatgcct
756     2461 cttaaggcac caaaagaagt aacctttctt gaaggtgatt cacatgacac agtacttacc
757     2521 tctgaggagg ttgttctcaa gaacggtgaa ctcgaagcac tcgagacgcc cgttgatagc
758     2581 ttcacaaatg gagctatcgt tggcacacca gtctgtgtaa atggcctcat gctcttagag
759     2641 attaaggaca aagaacaata ctgcgcattg tctcctggtt tactggctac aaacaatgtc
760     2701 tttcgcttaa aagggggtgc accaattaaa ggtgtaacct ttggagaaga tactgtttgg
761     2761 gaagttcaag gttacaagaa tgtgagaatc acatttgagc ttgatgaacg tgttgacaaa
762     2821 gtgcttaatg aaaagtgctc tgtctacact gttgaatccg gtaccgaagt tactgagttt
763     2881 gcatgtgttg tagcagaggc tgttgtgaag actttacaac cagtttctga tctccttacc
764     2941 aacatgggta ttgatcttga tgagtggagt gtagctacat tctacttatt tgatgatgct
765     3001 ggtgaagaaa acttttcatc acgtatgtat tgttcctttt accctccaga tgaggaagaa
766     3061 gaggacgatg cagagtgtga ggaagaagaa attgatgaaa cctgtgaaca tgagtacggt
767     3121 acagaggatg attatcaagg tctccctctg gaatttggtg cctcagctga aacagttcga
768     3181 gttgaggaag aagaagagga agactggctg gatgatacta ctgagcaatc agagattgag
769     3241 ccagaaccag aacctacacc tgaagaacca gttaatcagt ttactggtta tttaaaactt
770     3301 actgacaatg ttgccattaa atgtgttgac atcgttaagg aggcacaaag tgctaatcct
771     3361 atggtgattg taaatgctgc taacatacac ctgaaacatg gtggtggtgt agcaggtgca
772     3421 ctcaacaagg caaccaatgg tgccatgcaa aaggagagtg atgattacat taagctaaat
773     3481 ggccctctta cagtaggagg gtcttgtttg ctttctggac ataatcttgc taagaagtgt
774     3541 ctgcatgttg ttggacctaa cctaaatgca ggtgaggaca tccagcttct taaggcagca
775     3601 tatgaaaatt tcaattcaca ggacatctta cttgcaccat tgttgtcagc aggcatattt
776     3661 ggtgctaaac cacttcagtc tttacaagtg tgcgtgcaga cggttcgtac acaggtttat
777     3721 attgcagtca atgacaaagc tctttatgag caggttgtca tggattatct tgataacctg
778     3781 aagcctagag tggaagcacc taaacaagag gagccaccaa acacagaaga ttccaaaact
779     3841 gaggagaaat ctgtcgtaca gaagcctgtc gatgtgaagc caaaaattaa ggcctgcatt
780     3901 gatgaggtta ccacaacact ggaagaaact aagtttctta ccaataagtt actcttgttt
781     3961 gctgatatca atggtaagct ttaccatgat tctcagaaca tgcttagagg tgaagatatg
782     4021 tctttccttg agaaggatgc accttacatg gtaggtgatg ttatcactag tggtgatatc
783     4081 acttgtgttg taataccctc caaaaaggct ggtggcacta ctgagatgct ctcaagagct
784     4141 ttgaagaaag tgccagttga tgagtatata accacgtacc ctggacaagg atgtgctggt
785     4201 tatacacttg aggaagctaa gactgctctt aagaaatgca aatctgcatt ttatgtacta
786     4261 ccttcagaag cacctaatgc taaggaagag attctaggaa ctgtatcctg gaatttgaga
787     4321 gaaatgcttg ctcatgctga agagacaaga aaattaatgc ctatatgcat ggatgttaga
788     4381 gccataatgg caaccatcca acgtaagtat aaaggaatta aaattcaaga gggcatcgtt
789     4441 gactatggtg tccgattctt cttttatact agtaaagagc ctgtagcttc tattattacg
790     4501 aagctgaact ctctaaatga gccgcttgtc acaatgccaa ttggttatgt gacacatggt
791     4561 tttaatcttg aagaggctgc gcgctgtatg cgttctctta aagctcctgc cgtagtgtca
792     4621 gtatcatcac cagatgctgt tactacatat aatggatacc tcacttcgtc atcaaagaca
793     4681 tctgaggagc actttgtaga aacagtttct ttggctggct cttacagaga ttggtcctat
794     4741 tcaggacagc gtacagagtt aggtgttgaa tttcttaagc gtggtgacaa aattgtgtac
795     4801 cacactctgg agagccccgt cgagtttcat cttgacggtg aggttctttc acttgacaaa
796     4861 ctaaagagtc tcttatccct gcgggaggtt aagactataa aagtgttcac aactgtggac
797     4921 aacactaatc tccacacaca gcttgtggat atgtctatga catatggaca gcagtttggt
798     4981 ccaacatact tggatggtgc tgatgttaca aaaattaaac ctcatgtaaa tcatgagggt
799     5041 aagactttct ttgtactacc tagtgatgac acactacgta gtgaagcttt cgagtactac
800     5101 catactcttg atgagagttt tcttggtagg tacatgtctg ctttaaacca cacaaagaaa
801     5161 tggaaatttc ctcaagttgg tggtttaact tcaattaaat gggctgataa caattgttat
802     5221 ttgtctagtg ttttattagc acttcaacag cttgaagtca aattcaatgc accagcactt
803     5281 caagaggctt attatagagc ccgtgctggt gatgctgcta acttttgtgc actcatactc
804     5341 gcttacagta ataaaactgt tggcgagctt ggtgatgtca gagaaactat gacccatctt
805     5401 ctacagcatg ctaatttgga atctgcaaag cgagttctta atgtggtgtg taaacattgt
806     5461 ggtcagaaaa ctactacctt aacgggtgta gaagctgtga tgtatatggg tactctatct
807     5521 tatgataatc ttaagacagg tgtttccatt ccatgtgtgt gtggtcgtga tgctacacaa
808     5581 tatctagtac aacaagagtc ttcttttgtt atgatgtctg caccacctgc tgagtataaa
809     5641 ttacagcaag gtacattctt atgtgcgaat gagtacactg gtaactatca gtgtggtcat
810     5701 tacactcata taactgctaa ggagaccctc tatcgtattg acggagctca ccttacaaag
811     5761 atgtcagagt acaaaggacc agtgactgat gttttctaca aggaaacatc ttacactaca
812     5821 accatcaagc ctgtgtcgta taaactcgat ggagttactt acacagagat tgaaccaaaa
813     5881 ttggatgggt attataaaaa ggataatgct tactatacag agcagcctat agaccttgta
814     5941 ccaactcaac cattaccaaa tgcgagtttt gataatttca aactcacatg ttctaacaca
815     6001 aaatttgctg atgatttaaa tcaaatgaca ggcttcacaa agccagcttc acgagagcta
816     6061 tctgtcacat tcttcccaga cttgaatggc gatgtagtgg ctattgacta tagacactat
817     6121 tcagcgagtt tcaagaaagg tgctaaatta ctgcataagc caattgtttg gcacattaac
818     6181 caggctacaa ccaagacaac gttcaaacca aacacttggt gtttacgttg tctttggagt
819     6241 acaaagccag tagatacttc aaattcattt gaagttctgg cagtagaaga cacacaagga
820     6301 atggacaatc ttgcttgtga aagtcaacaa cccacctctg aagaagtagt ggaaaatcct
821     6361 accatacaga aggaagtcat agagtgtgac gtgaaaacta ccgaagttgt aggcaatgtc
822     6421 atacttaaac catcagatga aggtgttaaa gtaacacaag agttaggtca tgaggatctt
823     6481 atggctgctt atgtggaaaa cacaagcatt accattaaga aacctaatga gctttcacta
824     6541 gccttaggtt taaaaacaat tgccactcat ggtattgctg caattaatag tgttccttgg
825     6601 agtaaaattt tggcttatgt caaaccattc ttaggacaag cagcaattac aacatcaaat
826     6661 tgcgctaaga gattagcaca acgtgtgttt aacaattata tgccttatgt gtttacatta
827     6721 ttgttccaat tgtgtacttt tactaaaagt accaattcta gaattagagc ttcactacct
828     6781 acaactattg ctaaaaatag tgttaagagt gttgctaaat tatgtttgga tgccggcatt
829     6841 aattatgtga agtcacccaa attttctaaa ttgttcacaa tcgctatgtg gctattgttg
830     6901 ttaagtattt gcttaggttc tctaatctgt gtaactgctg cttttggtgt actcttatct
831     6961 aattttggtg ctccttctta ttgtaatggc gttagagaat tgtatcttaa ttcgtctaac
832     7021 gttactacta tggatttctg tgaaggttct tttccttgca gcatttgttt aagtggatta
833     7081 gactcccttg attcttatcc agctcttgaa accattcagg tgacgatttc atcgtacaag
834     7141 ctagacttga caattttagg tctggccgct gagtgggttt tggcatatat gttgttcaca
835     7201 aaattctttt atttattagg tctttcagct ataatgcagg tgttctttgg ctattttgct
836     7261 agtcatttca tcagcaattc ttggctcatg tggtttatca ttagtattgt acaaatggca
837     7321 cccgtttctg caatggttag gatgtacatc ttctttgctt ctttctacta catatggaag
838     7381 agctatgttc atatcatgga tggttgcacc tcttcgactt gcatgatgtg ctataagcgc
839     7441 aatcgtgcca cacgcgttga gtgtacaact attgttaatg gcatgaagag atctttctat
840     7501 gtctatgcaa atggaggccg tggcttctgc aagactcaca attggaattg tctcaattgt
841     7561 gacacatttt gcactggtag tacattcatt agtgatgaag ttgctcgtga tttgtcactc
842     7621 cagtttaaaa gaccaatcaa ccctactgac cagtcatcgt atattgttga tagtgttgct
843     7681 gtgaaaaatg gcgcgcttca cctctacttt gacaaggctg gtcaaaagac ctatgagaga
844     7741 catccgctct cccattttgt caatttagac aatttgagag ctaacaacac taaaggttca
845     7801 ctgcctatta atgtcatagt ttttgatggc aagtccaaat gcgacgagtc tgcttctaag
846     7861 tctgcttctg tgtactacag tcagctgatg tgccaaccta ttctgttgct tgaccaagct
847     7921 cttgtatcag acgttggaga tagtactgaa gtttccgtta agatgtttga tgcttatgtc
848     7981 gacacctttt cagcaacttt tagtgttcct atggaaaaac ttaaggcact tgttgctaca
849     8041 gctcacagcg agttagcaaa gggtgtagct ttagatggtg tcctttctac attcgtgtca
850     8101 gctgcccgac aaggtgttgt tgataccgat gttgacacaa aggatgttat tgaatgtctc
851     8161 aaactttcac atcactctga cttagaagtg acaggtgaca gttgtaacaa tttcatgctc
852     8221 acctataata aggttgaaaa catgacgccc agagatcttg gcgcatgtat tgactgtaat
853     8281 gcaaggcata tcaatgccca agtagcaaaa agtcacaatg tttcactcat ctggaatgta
854     8341 aaagactaca tgtctttatc tgaacagctg cgtaaacaaa ttcgtagtgc tgccaagaag
855     8401 aacaacatac cttttagact aacttgtgct acaactagac aggttgtcaa tgtcataact
856     8461 actaaaatct cactcaaggg tggtaagatt gttagtactt gttttaaact tatgcttaag
857     8521 gccacattat tgtgcgttct tgctgcattg gtttgttata tcgttatgcc agtacataca
858     8581 ttgtcaatcc atgatggtta cacaaatgaa atcattggtt acaaagccat tcaggatggt
859     8641 gtcactcgtg acatcatttc tactgatgat tgttttgcaa ataaacatgc tggttttgac
860     8701 gcatggttta gccagcgtgg tggttcatac aaaaatgaca aaagctgccc tgtagtagct
861     8761 gctatcatta caagagagat tggtttcata gtgcctggct taccgggtac tgtgctgaga
862     8821 gcaatcaatg gtgacttctt gcattttcta cctcgtgttt ttagtgctgt tggcaacatt
863     8881 tgctacacac cttccaaact cattgagtat agtgattttg ctacctctgc ttgcgttctt
864     8941 gctgctgagt gtacaatttt taaggatgct atgggcaaac ctgtgccata ttgttatgac
865     9001 actaatttgc tagagggttc tatttcttat agtgagcttc gtccagacac tcgttatgtg
866     9061 cttatggatg gttccatcat acagtttcct aacacttacc tggagggttc tgttagagta
867     9121 gtaacaactt ttgatgctga gtactgtaga catggtacat gcgaaaggtc agaagtaggt
868     9181 atttgcctat ctaccagtgg tagatgggtt cttaataatg agcattacag agctctatca
869     9241 ggagttttct gtggtgttga tgcgatgaat ctcatagcta acatctttac tcctcttgtg
870     9301 caacctgtgg gtgctttaga tgtgtctgct tcagtagtgg ctggtggtat tattgccata
871     9361 ttggtgactt gtgctgccta ctactttatg aaattcagac gtgtttttgg tgagtacaac
872     9421 catgttgttg ctgctaatgc acttttgttt ttgatgtctt tcactatact ctgtctggta
873     9481 ccagcttaca gctttctgcc gggagtctac tcagtctttt acttgtactt gacattctat
874     9541 ttcaccaatg atgtttcatt cttggctcac cttcaatggt ttgccatgtt ttctcctatt
875     9601 gtgccttttt ggataacagc aatctatgta ttctgtattt ctctgaagca ctgccattgg
876     9661 ttctttaaca actatcttag gaaaagagtc atgtttaatg gagttacatt tagtaccttc
877     9721 gaggaggctg ctttgtgtac ctttttgctc aacaaggaaa tgtacctaaa attgcgtagc
878     9781 gagacactgt tgccacttac acagtataac aggtatcttg ctctatataa caagtacaag
879     9841 tatttcagtg gagccttaga tactaccagc tatcgtgaag cagcttgctg ccacttagca
880     9901 aaggctctaa atgactttag caactcaggt gctgatgttc tctaccaacc accacagaca
881     9961 tcaatcactt ctgctgttct gcagagtggt tttaggaaaa tggcattccc gtcaggcaaa
882    10021 gttgaagggt gcatggtaca agtaacctgt ggaactacaa ctcttaatgg attgtggttg
883    10081 gatgacacag tatactgtcc aagacatgtc atttgcacag cagaagacat gcttaatcct
884    10141 aactatgaag atctgctcat tcgcaaatcc aaccatagct ttcttgttca ggctggcaat
885    10201 gttcaacttc gtgttattgg ccattctatg caaaattgtc tgcttaggct taaagttgat
886    10261 acttctaacc ctaagacacc caagtataaa tttgtccgta tccaacctgg tcaaacattt
887    10321 tcagttctag catgctacaa tggttcacca tctggtgttt atcagtgtgc catgagacct
888    10381 aatcatacca ttaaaggttc tttccttaat ggatcatgtg gtagtgttgg ttttaacatt
889    10441 gattatgatt gcgtgtcttt ctgctatatg catcatatgg agcttccaac aggagtacac
890    10501 gctggtactg acttagaagg taaattctat ggtccatttg ttgacagaca aactgcacag
891    10561 gctgcaggta cagacacaac cataacatta aatgttttgg catggctgta tgctgctgtt
892    10621 atcaatggtg ataggtggtt tcttaataga ttcaccacta ctttgaatga ctttaacctt
893    10681 gtggcaatga agtacaacta tgaacctttg acacaagatc atgttgacat attgggacct
894    10741 ctttctgctc aaacaggaat tgccgtctta gatatgtgtg ctgctttgaa agagctgctg
895    10801 cagaatggta tgaatggtcg tactatcctt ggtagcacta ttttagaaga tgagtttaca
896    10861 ccatttgatg ttgttagaca atgctctggt gttaccttcc aaggtaagtt caagaaaatt
897    10921 gttaagggca ctcatcattg gatgctttta actttcttga catcactatt gattcttgtt
898    10981 caaagtacac agtggtcact gtttttcttt gtttacgaga atgctttctt gccatttact
899    11041 cttggtatta tggcaattgc tgcatgtgct atgctgcttg ttaagcataa gcacgcattc
900    11101 ttgtgcttgt ttctgttacc ttctcttgca acagttgctt actttaatat ggtctacatg
901    11161 cctgctagct gggtgatgcg tatcatgaca tggcttgaat tggctgacac tagcttgtct
902    11221 ggttataggc ttaaggattg tgttatgtat gcttcagctt tagttttgct tattctcatg
903    11281 acagctcgca ctgtttatga tgatgctgct agacgtgttt ggacactgat gaatgtcatt
904    11341 acacttgttt acaaagtcta ctatggtaat gctttagatc aagctatttc catgtgggcc
905    11401 ttagttattt ctgtaacctc taactattct ggtgtcgtta cgactatcat gtttttagct
906    11461 agagctatag tgtttgtgtg tgttgagtat tacccattgt tatttattac tggcaacacc
907    11521 ttacagtgta tcatgcttgt ttattgtttc ttaggctatt gttgctgctg ctactttggc
908    11581 cttttctgtt tactcaaccg ttacttcagg cttactcttg gtgtttatga ctacttggtc
909    11641 tctacacaag aatttaggta tatgaactcc caggggcttt tgcctcctaa gagtagtatt
910    11701 gatgctttca agcttaacat taagttgttg ggtattggag gtaaaccatg tatcaaggtt
911    11761 gctactgtac agtctaaaat gtctgacgta aagtgcacat ctgtggtact gctctcggtt
912    11821 cttcaacaac ttagagtaga gtcatcttct aaattgtggg cacaatgtgt acaactccac
913    11881 aatgatattc ttcttgcaaa agacacaact gaagctttcg agaagatggt ttctcttttg
914    11941 tctgttttgc tatccatgca gggtgctgta gacattaata ggttgtgcga ggaaatgctc
915    12001 gataaccgtg ctactcttca ggctattgct tcagaattta gttctttacc atcatatgcc
916    12061 gcttatgcca ctgcccagga ggcctatgag caggctgtag ctaatggtga ttctgaagtc
917    12121 gttctcaaaa agttaaagaa atctttgaat gtggctaaat ctgagtttga ccgtgatgct
918    12181 gccatgcaac gcaagttgga aaagatggca gatcaggcta tgacccaaat gtacaaacag
919    12241 gcaagatctg aggacaagag ggcaaaagta actagtgcta tgcaaacaat gctcttcact
920    12301 atgcttagga agcttgataa tgatgcactt aacaacatta tcaacaatgc gcgtgatggt
921    12361 tgtgttccac tcaacatcat accattgact acagcagcca aactcatggt tgttgtccct
922    12421 gattatggta cctacaagaa cacttgtgat ggtaacacct ttacatatgc atctgcactc
923    12481 tgggaaatcc agcaagttgt tgatgcggat agcaagattg ttcaacttag tgaaattaac
924    12541 atggacaatt caccaaattt ggcttggcct cttattgtta cagctctaag agccaactca
925    12601 gctgttaaac tacagaataa tgaactgagt ccagtagcac tacgacagat gtcctgtgcg
926    12661 gctggtacca cacaaacagc ttgtactgat gacaatgcac ttgcctacta taacaattcg
927    12721 aagggaggta ggtttgtgct ggcattacta tcagaccacc aagatctcaa atgggctaga
928    12781 ttccctaaga gtgatggtac aggtacaatt tacacagaac tggaaccacc ttgtaggttt
929    12841 gttacagaca caccaaaagg gcctaaagtg aaatacttgt acttcatcaa aggcttaaac
930    12901 aacctaaata gaggtatggt gctgggcagt ttagctgcta cagtacgtct tcaggctgga
931    12961 aatgctacag aagtacctgc caattcaact gtgctttcct tctgtgcttt tgcagtagac
932    13021 cctgctaaag catataagga ttacctagca agtggaggac aaccaatcac caactgtgtg
933    13081 aagatgttgt gtacacacac tggtacagga caggcaatta ctgtaacacc agaagctaac
934    13141 atggaccaag agtcctttgg tggtgcttca tgttgtctgt attgtagatg ccacattgac
935    13201 catccaaatc ctaaaggatt ctgtgacttg aaaggtaagt acgtccaaat acctaccact
936    13261 tgtgctaatg acccagtggg ttttacactt agaaacacag tctgtaccgt ctgcggaatg
937    13321 tggaaaggtt atggctgtag ttgtgaccaa ctccgcgaac ccttgatgca gtctgcggat
938    13381 gcatcaacgt ttttaaacgg gtttgcggtg taagtgcagc ccgtcttaca ccgtgcggca
939    13441 caggcactag tactgatgtc gtctacaggg cttttgatat ttacaacgaa aaagttgctg
940    13501 gttttgcaaa gttcctaaaa actaattgct gtcgcttcca ggagaaggat gaggaaggca
941    13561 atttattaga ctcttacttt gtagttaaga ggcatactat gtctaactac caacatgaag
942    13621 agactattta taacttggtt aaagattgtc cagcggttgc tgtccatgac tttttcaagt
943    13681 ttagagtaga tggtgacatg gtaccacata tatcacgtca gcgtctaact aaatacacaa
944    13741 tggctgattt agtctatgct ctacgtcatt ttgatgaggg taattgtgat acattaaaag
945    13801 aaatactcgt cacatacaat tgctgtgatg atgattattt caataagaag gattggtatg
946    13861 acttcgtaga gaatcctgac atcttacgcg tatatgctaa cttaggtgag cgtgtacgcc
947    13921 aatcattatt aaagactgta caattctgcg atgctatgcg tgatgcaggc attgtaggcg
948    13981 tactgacatt agataatcag gatcttaatg ggaactggta cgatttcggt gatttcgtac
949    14041 aagtagcacc aggctgcgga gttcctattg tggattcata ttactcattg ctgatgccca
950    14101 tcctcacttt gactagggca ttggctgctg agtcccatat ggatgctgat ctcgcaaaac
951    14161 cacttattaa gtgggatttg ctgaaatatg attttacgga agagagactt tgtctcttcg
952    14221 accgttattt taaatattgg gaccagacat accatcccaa ttgtattaac tgtttggatg
953    14281 ataggtgtat ccttcattgt gcaaacttta atgtgttatt ttctactgtg tttccaccta
954    14341 caagttttgg accactagta agaaaaatat ttgtagatgg tgttcctttt gttgtttcaa
955    14401 ctggatacca ttttcgtgag ttaggagtcg tacataatca ggatgtaaac ttacatagct
956    14461 cgcgtctcag tttcaaggaa cttttagtgt atgctgctga tccagctatg catgcagctt
957    14521 ctggcaattt attgctagat aaacgcacta catgcttttc agtagctgca ctaacaaaca
958    14581 atgttgcttt tcaaactgtc aaacccggta attttaataa agacttttat gactttgctg
959    14641 tgtctaaagg tttctttaag gaaggaagtt ctgttgaact aaaacacttc ttctttgctc
960    14701 aggatggcaa cgctgctatc agtgattatg actattatcg ttataatctg ccaacaatgt
961    14761 gtgatatcag acaactccta ttcgtagttg aagttgttga taaatacttt gattgttacg
962    14821 atggtggctg tattaatgcc aaccaagtaa tcgttaacaa tctggataaa tcagctggtt
963    14881 tcccatttaa taaatggggt aaggctagac tttattatga ctcaatgagt tatgaggatc
964    14941 aagatgcact tttcgcgtat actaagcgta atgtcatccc tactataact caaatgaatc
965    15001 ttaagtatgc cattagtgca aagaatagag ctcgcaccgt agctggtgtc tctatctgta
966    15061 gtactatgac aaatagacag tttcatcaga aattattgaa gtcaatagcc gccactagag
967    15121 gagctactgt ggtaattgga acaagcaagt tttacggtgg ctggcataat atgttaaaaa
968    15181 ctgtttacag tgatgtagaa actccacacc ttatgggttg ggattatcca aaatgtgaca
969    15241 gagccatgcc taacatgctt aggataatgg cctctcttgt tcttgctcgc aaacataaca
970    15301 cttgctgtaa cttatcacac cgtttctaca ggttagctaa cgagtgtgcg caagtattaa
971    15361 gtgagatggt catgtgtggc ggctcactat atgttaaacc aggtggaaca tcatccggtg
972    15421 atgctacaac tgcttatgct aatagtgtct ttaacatttg tcaagctgtt acagccaatg
973    15481 taaatgcact tctttcaact gatggtaata agatagctga caagtatgtc cgcaatctac
974    15541 aacacaggct ctatgagtgt ctctatagaa atagggatgt tgatcatgaa ttcgtggatg
975    15601 agttttacgc ttacctgcgt aaacatttct ccatgatgat tctttctgat gatgccgttg
976    15661 tgtgctataa cagtaactat gcggctcaag gtttagtagc tagcattaag aactttaagg
977    15721 cagttcttta ttatcaaaat aatgtgttca tgtctgaggc aaaatgttgg actgagactg
978    15781 accttactaa aggacctcac gaattttgct cacagcatac aatgctagtt aaacaaggag
979    15841 atgattacgt gtacctgcct tacccagatc catcaagaat attaggcgca ggctgttttg
980    15901 tcgatgatat tgtcaaaaca gatggtacac ttatgattga aaggttcgtg tcactggcta
981    15961 ttgatgctta cccacttaca aaacatccta atcaggagta tgctgatgtc tttcacttgt
982    16021 atttacaata cattagaaag ttacatgatg agcttactgg ccacatgttg gacatgtatt
983    16081 ccgtaatgct aactaatgat aacacctcac ggtactggga acctgagttt tatgaggcta
984    16141 tgtacacacc acatacagtc ttgcaggctg taggtgcttg tgtattgtgc aattcacaga
985    16201 cttcacttcg ttgcggtgcc tgtattagga gaccattcct atgttgcaag tgctgctatg
986    16261 accatgtcat ttcaacatca cacaaattag tgttgtctgt taatccctat gtttgcaatg
987    16321 ccccaggttg tgatgtcact gatgtgacac aactgtatct aggaggtatg agctattatt
988    16381 gcaagtcaca taagcctccc attagttttc cattatgtgc taatggtcag gtttttggtt
989    16441 tatacaaaaa cacatgtgta ggcagtgaca atgtcactga cttcaatgcg atagcaacat
990    16501 gtgattggac taatgctggc gattacatac ttgccaacac ttgtactgag agactcaagc
991    16561 ttttcgcagc agaaacgctc aaagccactg aggaaacatt taagctgtca tatggtattg
992    16621 ccactgtacg cgaagtactc tctgacagag aattgcatct ttcatgggag gttggaaaac
993    16681 ctagaccacc attgaacaga aactatgtct ttactggtta ccgtgtaact aaaaatagta
994    16741 aagtacagat tggagagtac acctttgaaa aaggtgacta tggtgatgct gttgtgtaca
995    16801 gaggtactac gacatacaag ttgaatgttg gtgattactt tgtgttgaca tctcacactg
996    16861 taatgccact tagtgcacct actctagtgc cacaagagca ctatgtgaga attactggct
997    16921 tgtacccaac actcaacatc tcagatgagt tttctagcaa tgttgcaaat tatcaaaagg
998    16981 tcggcatgca aaagtactct acactccaag gaccacctgg tactggtaag agtcattttg
999    17041 ccatcggact tgctctctat tacccatctg ctcgcatagt gtatacggca tgctctcatg
1000    17101 cagctgttga tgccctatgt gaaaaggcat taaaatattt gcccatagat aaatgtagta
1001    17161 gaatcatacc tgcgcgtgcg cgcgtagagt gttttgataa attcaaagtg aattcaacac
1002    17221 tagaacagta tgttttctgc actgtaaatg cattgccaga aacaactgct gacattgtag
1003    17281 tctttgatga aatctctatg gctactaatt atgacttgag tgttgtcaat gctagacttc
1004    17341 gtgcaaaaca ctacgtctat attggcgatc ctgctcaatt accagccccc cgcacattgc
1005    17401 tgactaaagg cacactagaa ccagaatatt ttaattcagt gtgcagactt atgaaaacaa
1006    17461 taggtccaga catgttcctt ggaacttgtc gccgttgtcc tgctgaaatt gttgacactg
1007    17521 tgagtgcttt agtttatgac aataagctaa aagcacacaa ggataagtca gctcaatgct
1008    17581 tcaaaatgtt ctacaaaggt gttattacac atgatgtttc atctgcaatc aacagacctc
1009    17641 aaataggcgt tgtaagagaa tttcttacac gcaatcctgc ttggagaaaa gctgttttta
1010    17701 tctcacctta taattcacag aacgctgtag cttcaaaaat cttaggattg cctacgcaga
1011    17761 ctgttgattc atcacagggt tctgaatatg actatgtcat attcacacaa actactgaaa
1012    17821 cagcacactc ttgtaatgtc aaccgcttca atgtggctat cacaagggca aaaattggca
1013    17881 ttttgtgcat aatgtctgat agagatcttt atgacaaact gcaatttaca agtctagaaa
1014    17941 taccacgtcg caatgtggct acattacaag cagaaaatgt aactggactt tttaaggact
1015    18001 gtagtaagat cattactggt cttcatccta cacaggcacc tacacacctc agcgttgata
1016    18061 taaagttcaa gactgaagga ttatgtgttg acataccagg cataccaaag gacatgacct
1017    18121 accgtagact catctctatg atgggtttca aaatgaatta ccaagtcaat ggttacccta
1018    18181 atatgtttat cacccgcgaa gaagctattc gtcacgttcg tgcgtggatt ggctttgatg
1019    18241 tagagggctg tcatgcaact agagatgctg tgggtactaa cctacctctc cagctaggat
1020    18301 tttctacagg tgttaactta gtagctgtac cgactggtta tgttgacact gaaaataaca
1021    18361 cagaattcac cagagttaat gcaaaacctc caccaggtga ccagtttaaa catcttatac
1022    18421 cactcatgta taaaggcttg ccctggaatg tagtgcgtat taagatagta caaatgctca
1023    18481 gtgatacact gaaaggattg tcagacagag tcgtgttcgt cctttgggcg catggctttg
1024    18541 agcttacatc aatgaagtac tttgtcaaga ttggacctga aagaacgtgt tgtctgtgtg
1025    18601 acaaacgtgc aacttgcttt tctacttcat cagatactta tgcctgctgg aatcattctg
1026    18661 tgggttttga ctatgtctat aacccattta tgattgatgt tcagcagtgg ggctttacgg
1027    18721 gtaaccttca gagtaaccat gaccaacatt gccaggtaca tggaaatgca catgtggcta
1028    18781 gttgtgatgc tatcatgact agatgtttag cagtccatga gtgctttgtt aagcgcgttg
1029    18841 attggtctgt tgaataccct attataggag atgaactgag ggttaattct gcttgcagaa
1030    18901 aagtacaaca catggttgtg aagtctgcat tgcttgctga taagtttcca gttcttcatg
1031    18961 acattggaaa tccaaaggct atcaagtgtg tgcctcaggc tgaagtagaa tggaagttct
1032    19021 acgatgctca gccatgtagt gacaaagctt acaaaataga ggaactcttc tattcttatg
1033    19081 ctacacatca cgataaattc actgatggtg tttgtttgtt ttggaattgt aacgttgatc
1034    19141 gttacccagc caatgcaatt gtgtgtaggt ttgacacaag agtcttgtca aacttgaact
1035    19201 taccaggctg tgatggtggt agtttgtatg tgaataagca tgcattccac actccagctt
1036    19261 tcgataaaag tgcatttact aatttaaagc aattgccttt cttttactat tctgatagtc
1037    19321 cttgtgagtc tcatggcaaa caagtagtgt cggatattga ttatgttcca ctcaaatctg
1038    19381 ctacgtgtat tacacgatgc aatttaggtg gtgctgtttg cagacaccat gcaaatgagt
1039    19441 accgacagta cttggatgca tataatatga tgatttctgc tggatttagc ctatggattt
1040    19501 acaaacaatt tgatacttat aacctgtgga atacatttac caggttacag agtttagaaa
1041    19561 atgtggctta taatgttgtt aataaaggac actttgatgg acacgccggc gaagcacctg
1042    19621 tttccatcat taataatgct gtttacacaa aggtagatgg tattgatgtg gagatctttg
1043    19681 aaaataagac aacacttcct gttaatgttg catttgagct ttgggctaag cgtaacatta
1044    19741 aaccagtgcc agagattaag atactcaata atttgggtgt tgatatcgct gctaatactg
1045    19801 taatctggga ctacaaaaga gaagccccag cacatgtatc tacaataggt gtctgcacaa
1046    19861 tgactgacat tgccaagaaa cctactgaga gtgcttgttc ttcacttact gtcttgtttg
1047    19921 atggtagagt ggaaggacag gtagaccttt ttagaaacgc ccgtaatggt gttttaataa
1048    19981 cagaaggttc agtcaaaggt ctaacacctt caaagggacc agcacaagct agcgtcaatg
1049    20041 gagtcacatt aattggagaa tcagtaaaaa cacagtttaa ctactttaag aaagtagacg
1050    20101 gcattattca acagttgcct gaaacctact ttactcagag cagagactta gaggatttta
1051    20161 agcccagatc acaaatggaa actgactttc tcgagctcgc tatggatgaa ttcatacagc
1052    20221 gatataagct cgagggctat gccttcgaac acatcgttta tggagatttc agtcatggac
1053    20281 aacttggcgg tcttcattta atgataggct tagccaagcg ctcacaagat tcaccactta
1054    20341 aattagagga ttttatccct atggacagca cagtgaaaaa ttacttcata acagatgcgc
1055    20401 aaacaggttc atcaaaatgt gtgtgttctg tgattgatct tttacttgat gactttgtcg
1056    20461 agataataaa gtcacaagat ttgtcagtga tttcaaaagt ggtcaaggtt acaattgact
1057    20521 atgctgaaat ttcattcatg ctttggtgta aggatggaca tgttgaaacc ttctacccaa
1058    20581 aactacaagc aagtcaagcg tggcaaccag gtgttgcgat gcctaacttg tacaagatgc
1059    20641 aaagaatgct tcttgaaaag tgtgaccttc agaattatgg tgaaaatgct gttataccaa
1060    20701 aaggaataat gatgaatgtc gcaaagtata ctcaactgtg tcaatactta aatacactta
1061    20761 ctttagctgt accctacaac atgagagtta ttcactttgg tgctggctct gataaaggag
1062    20821 ttgcaccagg tacagctgtg ctcagacaat ggttgccaac tggcacacta cttgtcgatt
1063    20881 cagatcttaa tgacttcgtc tccgacgcag attctacttt aattggagac tgtgcaacag
1064    20941 tacatacggc taataaatgg gaccttatta ttagcgatat gtatgaccct aggaccaaac
1065    21001 atgtgacaaa agagaatgac tctaaagaag ggtttttcac ttatctgtgt ggatttataa
1066    21061 agcaaaaact agccctgggt ggttctatag ctgtaaagat aacagagcat tcttggaatg
1067    21121 ctgaccttta caagcttatg ggccatttct catggtggac agcttttgtt acaaatgtaa
1068    21181 atgcatcatc atcggaagca tttttaattg gggctaacta tcttggcaag ccgaaggaac
1069    21241 aaattgatgg ctataccatg catgctaact acattttctg gaggaacaca aatcctatcc
1070    21301 agttgtcttc ctattcactc tttgacatga gcaaatttcc tcttaaatta agaggaactg
1071    21361 ctgtaatgtc tcttaaggag aatcaaatca atgatatgat ttattctctt ctggaaaaag
1072    21421 gtaggcttat cattagagaa aacaacagag ttgtggtttc aagtgatatt cttgttaaca
1073    21481 actaaacgaa catgtttatt ttcttattat ttcttactct cactagtggt agtgaccttg
1074    21541 accggtgcac cacttttgat gatgttcaag ctcctaatta cactcaacat acttcatcta
1075    21601 tgaggggggt ttactatcct gatgaaattt ttagatcaga cactctttat ttaactcagg
1076    21661 atttatttct tccattttat tctaatgtta cagggtttca tactattaat catacgtttg
1077    21721 gcaaccctgt catacctttt aaggatggta tttattttgc tgccacagag aaatcaaatg
1078    21781 ttgtccgtgg ttgggttttt ggttctacca tgaacaacaa gtcacagtcg gtgattatta
1079    21841 ttaacaattc tactaatgtt gttatacgag catgtaactt tgaattgtgt gacaaccctt
1080    21901 tctttgctgt ttctaaaccc atgggtacac agacacatac tatgatattc gataatgcat
1081    21961 ttaattgcac tttcgagtac atatctgatg ccttttcgct tgatgtttca gaaaagtcag
1082    22021 gtaattttaa acacttacga gagtttgtgt ttaaaaataa agatgggttt ctctatgttt
1083    22081 ataagggcta tcaacctata gatgtagttc gtgatctacc ttctggtttt aacactttga
1084    22141 aacctatttt taagttgcct cttggtatta acattacaaa ttttagagcc attcttacag
1085    22201 ccttttcacc tgctcaagac atttggggca cgtcagctgc agcctatttt gttggctatt
1086    22261 taaagccaac tacatttatg ctcaagtatg atgaaaatgg tacaatcaca gatgctgttg
1087    22321 attgttctca aaatccactt gctgaactca aatgctctgt taagagcttt gagattgaca
1088    22381 aaggaattta ccagacctct aatttcaggg ttgttccctc aggagatgtt gtgagattcc
1089    22441 ctaatattac aaacttgtgt ccttttggag aggtttttaa tgctactaaa ttcccttctg
1090    22501 tctatgcatg ggagagaaaa aaaatttcta attgtgttgc tgattactct gtgctctaca
1091    22561 actcaacatt tttttcaacc tttaagtgct atggcgtttc tgccactaag ttgaatgatc
1092    22621 tttgcttctc caatgtctat gcagattctt ttgtagtcaa gggagatgat gtaagacaaa
1093    22681 tagcgccagg acaaactggt gttattgctg attataatta taaattgcca gatgatttca
1094    22741 tgggttgtgt ccttgcttgg aatactagga acattgatgc tacttcaact ggtaattata
1095    22801 attataaata taggtatctt agacatggca agcttaggcc ctttgagaga gacatatcta
1096    22861 atgtgccttt ctcccctgat ggcaaacctt gcaccccacc tgctcttaat tgttattggc
1097    22921 cattaaatga ttatggtttt tacaccacta ctggcattgg ctaccaacct tacagagttg
1098    22981 tagtactttc ttttgaactt ttaaatgcac cggccacggt ttgtggacca aaattatcca
1099    23041 ctgaccttat taagaaccag tgtgtcaatt ttaattttaa tggactcact ggtactggtg
1100    23101 tgttaactcc ttcttcaaag agatttcaac catttcaaca atttggccgt gatgtttctg
1101    23161 atttcactga ttccgttcga gatcctaaaa catctgaaat attagacatt tcaccttgcg
1102    23221 cttttggggg tgtaagtgta attacacctg gaacaaatgc ttcatctgaa gttgctgttc
1103    23281 tatatcaaga tgttaactgc actgatgttt ctacagcaat tcatgcagat caactcacac
1104    23341 cagcttggcg catatattct actggaaaca atgtattcca gactcaagca ggctgtctta
1105    23401 taggagctga gcatgtcgac acttcttatg agtgcgacat tcctattgga gctggcattt
1106    23461 gtgctagtta ccatacagtt tctttattac gtagtactag ccaaaaatct attgtggctt
1107    23521 atactatgtc tttaggtgct gatagttcaa ttgcttactc taataacacc attgctatac
1108    23581 ctactaactt ttcaattagc attactacag aagtaatgcc tgtttctatg gctaaaacct
1109    23641 ccgtagattg taatatgtac atctgcggag attctactga atgtgctaat ttgcttctcc
1110    23701 aatatggtag cttttgcaca caactaaatc gtgcactctc aggtattgct gctgaacagg
1111    23761 atcgcaacac acgtgaagtg ttcgctcaag tcaaacaaat gtacaaaacc ccaactttga
1112    23821 aatattttgg tggttttaat ttttcacaaa tattacctga ccctctaaag ccaactaaga
1113    23881 ggtcttttat tgaggacttg ctctttaata aggtgacact cgctgatgct ggcttcatga
1114    23941 agcaatatgg cgaatgccta ggtgatatta atgctagaga tctcatttgt gcgcagaagt
1115    24001 tcaatggact tacagtgttg ccacctctgc tcactgatga tatgattgct gcctacactg
1116    24061 ctgctctagt tagtggtact gccactgctg gatggacatt tggtgctggc gctgctcttc
1117    24121 aaataccttt tgctatgcaa atggcatata ggttcaatgg cattggagtt acccaaaatg
1118    24181 ttctctatga gaaccaaaaa caaatcgcca accaatttaa caaggcgatt agtcaaattc
1119    24241 aagaatcact tacaacaaca tcaactgcat tgggcaagct gcaagacgtt gttaaccaga
1120    24301 atgctcaagc attaaacaca cttgttaaac aacttagctc taattttggt gcaatttcaa
1121    24361 gtgtgctaaa tgatatcctt tcgcgacttg ataaagtcga ggcggaggta caaattgaca
1122    24421 ggttaattac aggcagactt caaagccttc aaacctatgt aacacaacaa ctaatcaggg
1123    24481 ctgctgaaat cagggcttct gctaatcttg ctgctactaa aatgtctgag tgtgttcttg
1124    24541 gacaatcaaa aagagttgac ttttgtggaa agggctacca ccttatgtcc ttcccacaag
1125    24601 cagccccgca tggtgttgtc ttcctacatg tcacgtatgt gccatcccag gagaggaact
1126    24661 tcaccacagc gccagcaatt tgtcatgaag gcaaagcata cttccctcgt gaaggtgttt
1127    24721 ttgtgtttaa tggcacttct tggtttatta cacagaggaa cttcttttct ccacaaataa
1128    24781 ttactacaga caatacattt gtctcaggaa attgtgatgt cgttattggc atcattaaca
1129    24841 acacagttta tgatcctctg caacctgagc ttgactcatt caaagaagag ctggacaagt
1130    24901 acttcaaaaa tcatacatca ccagatgttg atcttggcga catttcaggc attaacgctt
1131    24961 ctgtcgtcaa cattcaaaaa gaaattgacc gcctcaatga ggtcgctaaa aatttaaatg
1132    25021 aatcactcat tgaccttcaa gaattgggaa aatatgagca atatattaaa tggccttggt
1133    25081 atgtttggct cggcttcatt gctggactaa ttgccatcgt catggttaca atcttgcttt
1134    25141 gttgcatgac tagttgttgc agttgcctca agggtgcatg ctcttgtggt tcttgctgca
1135    25201 agtttgatga ggatgactct gagccagttc tcaagggtgt caaattacat tacacataaa
1136    25261 cgaacttatg gatttgttta tgagattttt tactcttaga tcaattactg cacagccagt
1137    25321 aaaaattgac aatgcttctc ctgcaagtac tgttcatgct acagcaacga taccgctaca
1138    25381 agcctcactc cctttcggat ggcttgttat tggcgttgca tttcttgctg tttttcagag
1139    25441 cgctaccaaa ataattgcgc tcaataaaag atggcagcta gccctttata agggcttcca
1140    25501 gttcatttgc aatttactgc tgctatttgt taccatctat tcacatcttt tgcttgtcgc
1141    25561 tgcaggtatg gaggcgcaat ttttgtacct ctatgccttg atatattttc tacaatgcat
1142    25621 caacgcatgt agaattatta tgagatgttg gctttgttgg aagtgcaaat ccaagaaccc
1143    25681 attactttat gatgccaact actttgtttg ctggcacaca cataactatg actactgtat
1144    25741 accatataac agtgtcacag atacaattgt cgttactgaa ggtgacggca tttcaacacc
1145    25801 aaaactcaaa gaagactacc aaattggtgg ttattctgag gataggcact caggtgttaa
1146    25861 agactatgtc gttgtacatg gctatttcac cgaagtttac taccagcttg agtctacaca
1147    25921 aattactaca gacactggta ttgaaaatgc tacattcttc atctttaaca agcttgttaa
1148    25981 agacccaccg aatgtgcaaa tacacacaat cgacggctct tcaggagttg ctaatccagc
1149    26041 aatggatcca atttatgatg agccgacgac gactactagc gtgcctttgt aagcacaaga
1150    26101 aagtgagtac gaacttatgt actcattcgt ttcggaagaa acaggtacgt taatagttaa
1151    26161 tagcgtactt ctttttcttg ctttcgtggt attcttgcta gtcacactag ccatccttac
1152    26221 tgcgcttcga ttgtgtgcgt actgctgcaa tattgttaac gtgagtttag taaaaccaac
1153    26281 ggtttacgtc tactcgcgtg ttaaaaatct gaactcttct gaaggagttc ctgatcttct
1154    26341 ggtctaaacg aactaactat tattattatt ctgtttggaa ctttaacatt gcttatcatg
1155    26401 gcagacaacg gtactattac cgttgaggag cttaaacaac tcctggaaca atggaaccta
1156    26461 gtaataggtt tcctattcct agcctggatt atgttactac aatttgccta ttctaatcgg
1157    26521 aacaggtttt tgtacataat aaagcttgtt ttcctctggc tcttgtggcc agtaacactt
1158    26581 gcttgttttg tgcttgctgc tgtctacaga attaattggg tgactggcgg gattgcgatt
1159    26641 gcaatggctt gtattgtagg cttgatgtgg cttagctact tcgttgcttc cttcaggctg
1160    26701 tttgctcgta cccgctcaat gtggtcattc aacccagaaa caaacattct tctcaatgtg
1161    26761 cctctccggg ggacaattgt gaccagaccg ctcatggaaa gtgaacttgt cattggtgct
1162    26821 gtgatcattc gtggtcactt gcgaatggcc ggacactccc tagggcgctg tgacattaag
1163    26881 gacctgccaa aagagatcac tgtggctaca tcacgaacgc tttcttatta caaattagga
1164    26941 gcgtcgcagc gtgtaggcac tgattcaggt tttgctgcat acaaccgcta ccgtattgga
1165    27001 aactataaat taaatacaga ccacgccggt agcaacgaca atattgcttt gctagtacag
1166    27061 taagtgacaa cagatgtttc atcttgttga cttccaggtt acaatagcag agatattgat
1167    27121 tatcattatg aggactttca ggattgctat ttggaatctt gacgttataa taagttcaat
1168    27181 agtgagacaa ttatttaagc ctctaactaa gaagaattat tcggagttag atgatgaaga
1169    27241 acctatggag ttagattatc cataaaacga acatgaaaat tattctcttc ctgacattga
1170    27301 ttgtatttac atcttgcgag ctatatcact atcaggagtg tgttagaggt acgactgtac
1171    27361 tactaaaaga accttgccca tcaggaacat acgagggcaa ttcaccattt caccctcttg
1172    27421 ctgacaataa atttgcacta acttgcacta gcacacactt tgcttttgct tgtgctgacg
1173    27481 gtactcgaca tacctatcag ctgcgtgcaa gatcagtttc accaaaactt ttcatcagac
1174    27541 aagaggaggt tcaacaagag ctctactcgc cactttttct cattgttgct gctctagtat
1175    27601 ttttaatact ttgcttcacc attaagagaa agacagaatg aatgagctca ctttaattga
1176    27661 cttctatttg tgctttttag cctttctgct attccttgtt ttaataatgc ttattatatt
1177    27721 ttggttttca ctcgaaatcc aggatctaga agaaccttgt accaaagtct aaacgaacat
1178    27781 gaaacttctc attgttttga cttgtatttc tctatgcagt tgcatatgca ctgtagtaca
1179    27841 gcgctgtgca tctaataaac ctcatgtgct tgaagatcct tgtaaggtac aacactaggg
1180    27901 gtaatactta tagcactgct tggctttgtg ctctaggaaa ggttttacct tttcatagat
1181    27961 ggcacactat ggttcaaaca tgcacaccta atgttactat caactgtcaa gatccagctg
1182    28021 gtggtgcgct tatagctagg tgttggtacc ttcatgaagg tcaccaaact gctgcattta
1183    28081 gagacgtact tgttgtttta aataaacgaa caaattaaaa tgtctgataa tggaccccaa
1184    28141 tcaaaccaac gtagtgcccc ccgcattaca tttggtggac ccacagattc aactgacaat
1185    28201 aaccagaatg gaggacgcaa tggggcaagg ccaaaacagc gccgacccca aggtttaccc
1186    28261 aataatactg cgtcttggtt cacagctctc actcagcatg gcaaggagga acttagattc
1187    28321 cctcgaggcc agggcgttcc aatcaacacc aatagtggtc cagatgacca aattggctac
1188    28381 taccgaagag ctacccgacg agttcgtggt ggtgacggca aaatgaaaga gctcagcccc
1189    28441 agatggtact tctattacct aggaactggc ccagaagctt cacttcccta cggcgctaac
1190    28501 aaagaaggca tcgtatgggt tgcaactgag ggagccttga atacacccaa agaccacatt
1191    28561 ggcacccgca atcctaataa caatgctgcc accgtgctac aacttcctca aggaacaaca
1192    28621 ttgccaaaag gcttctacgc agagggaagc agaggcggca gtcaagcctc ttctcgctcc
1193    28681 tcatcacgta gtcgcggtaa ttcaagaaat tcaactcctg gcagcagtag gggaaattct
1194    28741 cctgctcgaa tggctagcgg aggtggtgaa actgccctcg cgctattgct gctagacaga
1195    28801 ttgaaccagc ttgagagcaa agtttctggt aaaggccaac aacaacaagg ccaaactgtc
1196    28861 actaagaaat ctgctgctga ggcatctaaa aagcctcgcc aaaaacgtac tgccacaaaa
1197    28921 cagtacaacg tcactcaagc atttgggaga cgtggtccag aacaaaccca aggaaatttc
1198    28981 ggggaccaag acctaatcag acaaggaact gattacaaac attggccgca aattgcacaa
1199    29041 tttgctccaa gtgcctctgc attctttgga atgtcacgca ttggcatgga agtcacacct
1200    29101 tcgggaacat ggctgactta tcatggagcc attaaattgg atgacaaaga tccacaattc
1201    29161 aaagacaacg tcatactgct gaacaagcac attgacgcat acaaaacatt cccaccaaca
1202    29221 gagcctaaaa aggacaaaaa gaaaaagact gatgaagctc agcctttgcc gcagagacaa
1203    29281 aagaagcagc ccactgtgac tcttcttcct gcggctgaca tggatgattt ctccagacaa
1204    29341 cttcaaaatt ccatgagtgg agcttctgct gattcaactc aggcataaac actcatgatg
1205    29401 accacacaag gcagatgggc tatgtaaacg ttttcgcaat tccgtttacg atacatagtc
1206    29461 tactcttgtg cagaatgaat tctcgtaact aaacagcaca agtaggttta gttaacttta
1207    29521 atctcacata gcaatcttta atcaatgtgt aacattaggg aggacttgaa agagccacca
1208    29581 cattttcatc gaggccacgc ggagtacgat cgagggtaca gtgaataatg ctagggagag
1209    29641 ctgcctatat ggaagagccc taatgtgtaa aattaatttt agtagtgcta tccccatgtg
1210    29701 attttaatag cttcttagga gaatgacaaa aaaaaaaaaa aaaaaaaaaa a
1211//
1212
1213