diff --git a/etc/af063097.embl b/etc/af063097.embl
new file mode 100644
index 0000000000000000000000000000000000000000..99cf9f44ad205661aa8beda925336eed44ce9783
--- /dev/null
+++ b/etc/af063097.embl
@@ -0,0 +1,1903 @@
+ID   AF063097   standard; DNA; PHG; 33593 BP.
+XX
+AC   AF063097; J02474; L29304; M12772; M13202; M27131; M27836; M34756; M58023;
+AC   M59752; M64677; U02597; X02300; X02301; X05655; X61229; X87173; X99627;
+AC   X99628; Z11483;
+XX
+SV   AF063097.1
+XX
+DT   21-MAY-1998 (Rel. 55, Created)
+DT   07-JAN-1999 (Rel. 58, Last updated, Version 2)
+XX
+DE   Bacteriophage P2, complete genome.
+XX
+KW   .
+XX
+OS   Enterobacteria phage P2
+OC   Viruses; dsDNA viruses, no RNA stage; Caudovirales; Myoviridae;
+OC   P2-like Viruses.
+XX
+RN   [1]
+RP   1-9, 33582-33593
+RX   MEDLINE; 73220701.
+RA   Murray K., Murray N.E.;
+RT   "Terminal nucleotide sequences of DNA from temperate coliphages";
+RL   Nature New Biol. 243(126):134-139(1973).
+XX
+RN   [2]
+RP   1-26, 33568-33593
+RX   MEDLINE; 77209985.
+RA   Murray K., Isaksson-Forsen A.G., Challberg M., Englund P.T.;
+RT   "Symmetrical nucleotide sequences in the recognition sites for the ter
+RT   function of bacteriophages P2, 299 and 186";
+RL   J. Mol. Biol. 112(3):471-489(1977).
+XX
+RN   [3]
+RP   1-26, 33568-33593
+RX   MEDLINE; 82051282.
+RA   Lindqvist B.H.;
+RT   "Recombination between satellite phage P4 and its helper P2. I. In vivo and
+RT   in vitro construction of P4: :P2 hybrid satellite phage";
+RL   Gene 14(4):231-241(1981).
+XX
+RN   [4]
+RP   2929-3589
+RX   MEDLINE; 83268689.
+RA   Christie G.E., Calendar R.;
+RT   "Bacteriophage P2 late promoters. Transcription initiation sites for two
+RT   late mRNAs";
+RL   J. Mol. Biol. 167(4):773-790(1983).
+XX
+RN   [5]
+RP   25456-25995
+RX   MEDLINE; 84248044.
+RA   Ljungquist E., Kockum K., Bertani E.L.;
+RT   "DNA sequence of the repressor gene and operator region of bacteriophage
+RT   P2";
+RL   Proc. Natl. Acad. Sci. U.S.A. 81:3988-3992(1984).
+XX
+RN   [6]
+RP   10188-10518, 17510-17996
+RX   MEDLINE; 85160858.
+RA   Christie G.E., Calender R.;
+RT   "Bacteriophage P2 late promoters - comparison of the four late promoter
+RT   sequences";
+RL   J. Mol. Biol. 181:373-382(1985).
+XX
+RN   [7]
+RP   23909-24339
+RX   MEDLINE; 86281704.
+RA   Birkeland N.K., Lindquist B.H.;
+RT   "Coliphage P2 late control gene ogr. DNA sequence and product
+RT   identification";
+RL   J. Mol. Biol. 188(3):487-490(1986).
+XX
+RN   [8]
+RP   23889-24333
+RX   MEDLINE; 86205872.
+RA   Christie G.E., Haggard-Ljungquist E., Feiwell R., Calendar R.;
+RT   "Regulation of bacteriophage P2 late-gene expression: the ogr gene";
+RL   Proc. Natl. Acad. Sci. U.S.A. 83(10):3238-3242(1986).
+XX
+RN   [9]
+RP   25849-27048
+RX   MEDLINE; 87286423.
+RA   Haggard-Ljungquist E., Kockum K., Bertani L.E.;
+RT   "DNA sequences of bacteriophage P2 early genes cox and B and their
+RT   regulatory sites";
+RL   Mol. Gen. Genet. 208(1-2):52-56(1987).
+XX
+RN   [10]
+RP   25849-27048
+RX   MEDLINE; 88082694.
+RA   Saha S., Haggard-Ljungquist E., Nordstrom K.;
+RT   "The cox protein of bacteriophage P2 inhibits the formation of the
+RT   repressor protein and autoregulates the early operon";
+RL   EMBO J. 6(10):3191-3199(1987).
+XX
+RN   [11]
+RP   24252-25595
+RX   MEDLINE; 90006769.
+RA   Yu A., Bertani L.E., Haggard-Ljungquist E.;
+RT   "Control of prophage integration and excision in bacteriophage P2:
+RT   nucleotide sequences of the int gene and att sites";
+RL   Gene 80(1):1-11(1989).
+XX
+RN   [12]
+RP   31590-33593
+RX   MEDLINE; 90152373.
+RA   Haggard-Ljungquist E., Barreiro V., Calendar R., Kurnit D.M., Cheng H.;
+RT   "The P2 phage old gene: sequence, transcription and translational control";
+RL   Gene 85(1):25-33(1989).
+XX
+RN   [13]
+RP   1-266, 33200-33593
+RX   MEDLINE; 91092507.
+RA   Ziermann R., Calendar R.;
+RT   "Characterization of the cos sites of bacteriophages P2 and P4";
+RL   Gene 96(1):9-15(1990).
+XX
+RN   [14]
+RP   17627-19373
+RX   MEDLINE; 91135001.
+RA   Temple L.M., Forsburg S.L., Calendar R., Christie G.E.;
+RT   "Nucleotide sequence of the genes encoding the major tail sheath and tail
+RT   tube proteins of bacteriophage P2";
+RL   Virology 181(1):353-358(1991).
+XX
+RN   [15]
+RP   4050-5178
+RX   MEDLINE; 91220668.
+RA   Six E.W., Sunshine M.G., Williams J., Haggard-Ljungquist E.,
+RA   Lindqvist B.H.;
+RT   "Morphopoietic switch mutations of bacteriophage P2";
+RL   Virology 182(1):34-46(1991).
+XX
+RN   [16]
+RP   1-6551
+RX   MEDLINE; 92115571.
+RA   Linderoth N.A., Ziermann R., Haggard-Ljungquist E., Christie G.E.,
+RA   Calendar R.;
+RT   "Nucleotide sequence of the DNA packaging and capsid synthesis genes of
+RT   bacteriophage P2";
+RL   Nucleic Acids Res. 19(25):7207-7214(1991).
+XX
+RN   [17]
+RP   12173-15684
+RX   MEDLINE; 92165720.
+RA   Haggard-Ljungquist E., Halling C., Calendar R.;
+RT   "DNA sequence of two tail genes of bacteriophage P2: Further evidence for
+RT   horizontal transfer of tail fiber genes among unrelated bacteriophages";
+RL   J. Bacteriol. 174:1462-1477(1992).
+XX
+RN   [18]
+RP   26923-30721
+RX   MEDLINE; 93287108.
+RA   Liu Y., Saha S., Haggard-Ljungquist E.;
+RT   "Studies of bacteriophage P2 DNA replication. The DNA sequence of the
+RT   cis-acting gene A and ori region and construction of a P2 mini-chromosome";
+RL   J. Mol. Biol. 231(2):361-374(1993).
+XX
+RN   [19]
+RP   6288-8381
+RX   MEDLINE; 94327465.
+RA   Ziermann R., Bartlett B., Calendar R., Christie G.E.;
+RT   "Functions involved in bacteriophage P2-induced host cell lysis and
+RT   identification of a new tail gene";
+RL   J. Bacteriol. 176:4974-4984(1994).
+XX
+RN   [20]
+RP   8376-10381
+RX   MEDLINE; 94233699.
+RA   Linderoth N.A., Julien B., Flick K.E., Calendar R., Christie G.E.;
+RT   "Molecular cloning and characterization of bacteriophage P2 genes R and S
+RT   involved in tail completion";
+RL   Virology 200:347-359(1994).
+XX
+RN   [21]
+RP   10276-12739
+RX   MEDLINE; 96036485.
+RA   Haggard-Liungquist E., Jacobsen E., Rishovd S., Six W.S., Nilssen O.,
+RA   Sunshine M.G., Lindqvist B.H., Kim K.J., Barreiro V., Koonin E.V.,
+RA   Calendar R.;
+RT   "Bacteriophage P2: genes involved in baseplate assembly";
+RL   Virology 213(1):109-121(1995).
+XX
+RN   [22]
+RP   15627-17626, 30643-31622
+RA   Calendar R., Yu S., Myung H., Barreiro V., Odegrip R., Bertani L.E.,
+RA   Carlson K., Davenport L., Mosig G., Christie G.E., Haggard-Ljungquist E.;
+RT   "The lysogenic conversion genes of coliphage P2 have unusually high AT
+RT   content";
+RL   (in) Syvanen M., Kado C. (eds.);
+RL   HORIZONTAL GENE TRANSFER:1-1;
+RL   Chapman and Hall, London (1998)
+XX
+RN   [23]
+RP   19374-23954
+RA   Christie G.E., Temple L.M., Bartlett B.A., Goodwin T.S.;
+RT   "Bacteriophage P2 tail assembly genes: Gene organization and a programmed
+RT   translational frameshift parallel those of bacteriophage lambda";
+RL   Unpublished.
+XX
+RN   [24]
+RP   1-33593
+RA   Christie G.E., Haggard-Ljungquist E., Calendar R.;
+RT   "The complete genome of bacteriophage P2";
+RL   Unpublished.
+XX
+RN   [25]
+RP   24351-25595
+RA   Haggard-Ljungquist E.;
+RT   ;
+RL   Submitted (15-SEP-1989) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Microbial Genetics, Karolinska Institutet, Stockholm, Sweden
+XX
+RN   [26]
+RP   1-6551
+RA   Linderoth N.A.;
+RT   ;
+RL   Submitted (13-AUG-1991) to the EMBL/GenBank/DDBJ databases.
+RL   Dept of Mol and Cell Biology, Div of Biochemistry and Molecular Biology,
+RL   University of California, 401 Barker Hall, Berkeley, CA 94720, USA
+XX
+RN   [27]
+RP   26923-30721
+RA   Haggard-Ljungquist E.;
+RT   ;
+RL   Submitted (12-NOV-1991) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Microbial Genetics, Karolinska Institutet, S-10401,
+RL   Stockholm, Sweden
+XX
+RN   [28]
+RP   8376-10381
+RA   Linderoth N.A.;
+RT   ;
+RL   Submitted (18-OCT-1993) to the EMBL/GenBank/DDBJ databases.
+RL   Nora A. Linderoth, Laboratory of Genetics, The Rockefeller University, 1230
+RL   York Avenue, New York, NY 10021, USA
+XX
+RN   [29]
+RP   10276-12739
+RA   Haggard E.B.;
+RT   ;
+RL   Submitted (12-MAY-1995) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Genetics, Stockholm University, S-10691, Stockholm, Sweden
+XX
+RN   [30]
+RP   15627-17626, 30643-31622
+RA   Haggard-Ljungquist E.;
+RT   ;
+RL   Submitted (30-JUL-1996) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Genetics, Stockholm University, S-106 91, Stockholm, Sweden
+XX
+RN   [31]
+RP   17510-23954
+RA   Christie G.E.;
+RT   ;
+RL   Submitted (21-NOV-1996) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Microbiology and Immunology, Virginia Commonwealth
+RL   University, Box 980678, Richmond, VA 23298-0678, USA
+XX
+RN   [32]
+RP   1-33593
+RA   Christie G.E.;
+RT   ;
+RL   Submitted (05-MAY-1998) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Microbiology and Immunology, Virginia Commonwealth
+RL   University, Richmond, VA 23298-0678, USA
+XX
+DR   SPTREMBL; O64312; O64312.
+DR   SPTREMBL; O64313; O64313.
+DR   SPTREMBL; O64314; O64314.
+DR   SPTREMBL; O64315; O64315.
+DR   SPTREMBL; P79669; P79669.
+DR   SPTREMBL; P79670; P79670.
+DR   SPTREMBL; Q38498; Q38498.
+DR   SWISS-PROT; P04132; RPC_BPP2.
+DR   SWISS-PROT; P07695; VCOX_BPP2.
+DR   SWISS-PROT; P07696; VPB_BPP2.
+DR   SWISS-PROT; P08762; VOGR_BPP2.
+DR   SWISS-PROT; P10312; VPD_BPP2.
+DR   SWISS-PROT; P13520; VOLD_BPP2.
+DR   SWISS-PROT; P22501; VPF1_BPP2.
+DR   SWISS-PROT; P22502; VPF2_BPP2.
+DR   SWISS-PROT; P25475; VPL_BPP2.
+DR   SWISS-PROT; P25476; VPM_BPP2.
+DR   SWISS-PROT; P25477; VPN_BPP2.
+DR   SWISS-PROT; P25478; VPO_BPP2.
+DR   SWISS-PROT; P25479; VPP_BPP2.
+DR   SWISS-PROT; P25480; VPQ_BPP2.
+DR   SWISS-PROT; P26699; TFA_BPP2.
+DR   SWISS-PROT; P26700; VPH_BPP2.
+DR   SWISS-PROT; P26701; VPI_BPP2.
+DR   SWISS-PROT; P31340; VPV_BPP2.
+DR   SWISS-PROT; P36932; VINT_BPP2.
+DR   SWISS-PROT; P36933; VPR_BPP2.
+DR   SWISS-PROT; P36934; VPS_BPP2.
+DR   SWISS-PROT; P36935; YSV_BPP2.
+DR   SWISS-PROT; P51767; VPJ_BPP2.
+DR   SWISS-PROT; P51768; VPW_BPP2.
+DR   SWISS-PROT; P51769; LYSA_BPP2.
+DR   SWISS-PROT; P51770; LYSB_BPP2.
+DR   SWISS-PROT; P51771; LYCV_BPP2.
+DR   SWISS-PROT; P51772; VPX_BPP2.
+DR   SWISS-PROT; P51773; HOLI_BPP2.
+DR   SWISS-PROT; Q06419; VPA_BPP2.
+DR   SWISS-PROT; Q06422; YO80_BPP2.
+DR   SWISS-PROT; Q06423; YO81_BPP2.
+DR   SWISS-PROT; Q06424; YO82_BPP2.
+DR   SWISS-PROT; Q06425; YO83_BPP2.
+DR   SWISS-PROT; Q06426; YO91_BPP2.
+XX
+CC   On May 20, 1998 this sequence version replaced gi:506838 gi:15821
+CC   gi:1806573 gi:215666 gi:506836 gi:508561 gi:1061043 gi:215669
+CC   gi:1769975 gi:494974 gi:215664 gi:15620 gi:393451 gi:1769977
+CC   gi:215681 gi:215675 gi:215676 gi:15141 gi:414530.
+XX
+FH   Key             Location/Qualifiers
+FH
+FT   source          1..33593
+FT                   /db_xref="taxon:10679"
+FT                   /organism="Enterobacteria phage P2"
+FT                   /lab_host="Escherichia coli"
+FT   misc_feature    1..19
+FT                   /note="cosL; left cohesive end"
+FT   terminator      complement(160..181)
+FT                   /note="tQ; putative rho-independent terminator for P
+FT                   operon"
+FT   CDS             complement(187..1221)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25480"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="Q"
+FT                   /function="presumed portal protein"
+FT                   /product="gpQ"
+FT                   /protein_id="AAD03268.1"
+FT                   /translation="MSKKKGKTPQPAAKTMTASGPKMEAFTFGEPVPVLDRRDILDYVE
+FT                   CISNGRWYEPPVSFTGLAKSLRAAVHHSSPIYVKRNILASTFIPHPWLSQQDFSRFVLD
+FT                   FLVFGNAFLEKRYSTTGKVIRLETSPAKYTRRGVEEDVYWWVPSFNEPTAFAPGSVFHL
+FT                   LEPDINQELYGLPEYLSALNSAWLNESATLFRRKYYENGAHAGYIMYVTDAVQDRNDIE
+FT                   MLRENMVKSKGRNNFKNLFLYAPQGKADGIKIIPLSEVATKDDFFNIKKASAADLLDAH
+FT                   RIPFQLMGGKPENVGSLGDIEKVAKVFVRNELIPLQDRIREINGWLGQEVIRFKNYSLD
+FT                   TDND"
+FT   variation       complement(653)
+FT                   /note="Qam34 mutation"
+FT                   /replace="t"
+FT                   /gene="Q"
+FT   CDS             complement(1221..2993)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25479"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="P"
+FT                   /function="terminase; DNA-dependent ATPase"
+FT                   /product="gpP"
+FT                   /protein_id="AAD03269.1"
+FT                   /translation="MTITTDTTLLHDPRRQAALLYWQGFSVPQIAAMLQMKRPTVQSWK
+FT                   QRDGWDSVAPISRVEMSLEARLTQLIIKPQKTGGDFKEIDLLGRQIERLARVNRYSQTG
+FT                   NEADLNPNVANRNKGGRRKPKKNFFSDEAIEKLEQIFFEQSFDYQLHWYRAGLEHRIRD
+FT                   ILKSRQIGATFYFSREALLRALKTGHNQIFLSASKTQAYVFREYIIAFARLVDVDLTGD
+FT                   PIVLGNNGAKLIFLGTNSNTAQSHNGDLYVDEIFWIPNFQVLRKVASGMASQSHLRSTY
+FT                   FSTPSTLAHDAYPFWSGELFNRGRASAAERVEIDVSHNALAGGLLCADGQWRQIVTIED
+FT                   ALKGGCTLFDIEQLKRENSADDFKNLFMCEFVDDKASVFPFEELQRCMVDTLEEWEDYA
+FT                   PFAANPFGSRPVWIGYDPSHRGDSAGCVVLAPPVVAGGKFRILERHQWKGMDFATQAES
+FT                   IRKLTEKYNVEYIGIDATGLGVGVFQLVRSFYPAARDIRYTPEMKTAMVLKAKDVIRRG
+FT                   CLEYDVSATDITSSFMAIRKTMTSSGRSATYEASRSEEASHADLAWATMHALLNEPLTA
+FT                   GISTPLTSTILEFY"
+FT   variation       complement(2210)
+FT                   /note="Pam24 and Pam137 mutations"
+FT                   /replace="a"
+FT                   /gene="P"
+FT   variation       complement(2948)
+FT                   /note="Pam253 mutation"
+FT                   /replace="a"
+FT                   /gene="P"
+FT   misc_feature    complement(3016)
+FT                   /note="transcription start site for P operon; encodes P,Q"
+FT                   /gene="P"
+FT   misc_feature    3057..3087
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="activator binding site; pO, pP promoters"
+FT   misc_feature    3127
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="transcription start site for O operon; encodes O, N,
+FT                   M, L, X, Y, K, lysA, lysB, R, S"
+FT   CDS             3167..4021
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25478"
+FT                   /transl_table=11
+FT                   /gene="O"
+FT                   /function="presumed capsid scaffolding protein"
+FT                   /product="gpO"
+FT                   /protein_id="AAD03270.1"
+FT                   /translation="MAKKVSKFFRIGVEGDTCDGRVISAQDIQEMAETFDPRVYGCRIN
+FT                   LEHLRGILPDGIFKRYGDVAELKAEKIDDDSALKGKWALFAKITPTDDLIAMNKAAQKV
+FT                   YTSMEIQPNFANTGKCYLVGLAVTDDPASLGTEYLEFCRTAKHNPLNRFKLSPENLISV
+FT                   ATPVELEFEDLPETVFTALTEKVKSIFGRKQASDDARLNDVHEAVTAVAEHVQEKLSAT
+FT                   EQRLAEMETAFSALKQEVTDRADETSQAFTRLKNSLDHTESLTQQRRSKATGGGGDALM
+FT                   TNC"
+FT   variation       3206
+FT                   /note="Oam71 mutation"
+FT                   /replace="t"
+FT                   /gene="O"
+FT   variation       3411
+FT                   /note="Oam7 mutation"
+FT                   /replace="a"
+FT                   /gene="O"
+FT   variation       3878
+FT                   /note="Oam279 mutation"
+FT                   /replace="t"
+FT                   /gene="O"
+FT   CDS             4080..5153
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25477"
+FT                   /transl_table=11
+FT                   /gene="N"
+FT                   /function="major capsid precursor"
+FT                   /product="gpN"
+FT                   /protein_id="AAD03271.1"
+FT                   /translation="MRQETRFKFNAYLSRVAELNGIDAGDVSKKFTVEPSVTQTLMNTM
+FT                   QESSDFLTRINIVPVSEMKGEKIGIGVTGSIASTTDTAGGTERQPKDFSKLASNKYECD
+FT                   QINFDFYIRYKTLDLWARYQDFQLRIRNAIIKRQSLDFIMAGFNGVKRAETSDRSSNPM
+FT                   LQDVAVGWLQKYRNEAPARVMSKVTDEEGRTTSEVIRVGKGGDYASLDALVMDATNNLI
+FT                   EPWYQEDPDLVVIVGRQLLADKYFPIVNKEQDNSEMLAADVIISQKRIGNLPAVRVPYF
+FT                   PADAMLITKLENLSIYYMDDSHRRVIEENPKLDRVENYESMNIDYVVEDYAAGCLVEKI
+FT                   KVGDFSTPAKATAEPGA"
+FT   variation       4349..4350
+FT                   /note="Nam209 mutation"
+FT                   /replace="at"
+FT                   /gene="N"
+FT   variation       4630
+FT                   /note="sir3 mutation; defective for choice of small capsids
+FT                   by satellite phage P4"
+FT                   /replace="c"
+FT                   /gene="N"
+FT   variation       4695
+FT                   /note="sir5 mutation; defective for choice of small capsids
+FT                   by satellite phage P4"
+FT                   /replace="t"
+FT                   /gene="N"
+FT   variation       4695..4697
+FT                   /note="sir9 mutation; defective for choice of small capsids
+FT                   by satellite phage P4"
+FT                   /replace=""
+FT                   /gene="N"
+FT   variation       4699
+FT                   /note="sir2, sir6 and sir8 mutations; defective for choice
+FT                   of small capsids by satellite phage P4"
+FT                   /replace="t"
+FT                   /gene="N"
+FT   variation       4740
+FT                   /note="sir1 mutation; defective for choice of small capsids
+FT                   by satellite phage P4"
+FT                   /replace="g"
+FT                   /gene="N"
+FT   variation       4741
+FT                   /note="sir4 mutation; defective for choice of small capsids
+FT                   by satellite phage P4"
+FT                   /replace="a"
+FT                   /gene="N"
+FT   CDS             5157..5900
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25476"
+FT                   /transl_table=11
+FT                   /gene="M"
+FT                   /function="terminase"
+FT                   /product="gpM"
+FT                   /protein_id="AAD03272.1"
+FT                   /translation="MTSPAQRHMMRVSAAMTAQREAAPLRHATVYEQMLVKLAADQRTL
+FT                   KAIYSKELKAAKKRELLPFWLPWVNGVLELGKGAQDDILMTVMLWRLDTGDIAGALEIA
+FT                   RYALKYGLTMPGKHRRTPPYMFTEEVALAAMRAHAAGESVDTRLLTETLELTATADMPD
+FT                   EVRAKLHKITGLFLRDGGDAAGALAHLQRATQLDCQAGVKKEIERLERELKPKPEPQPK
+FT                   AATRAPRKTRSVTPAKRGRPKKKAS"
+FT   variation       5361
+FT                   /note="Mts52 mutation"
+FT                   /replace="a"
+FT                   /gene="M"
+FT   variation       5751
+FT                   /note="Mam32 mutation"
+FT                   /replace="t"
+FT                   /gene="M"
+FT   CDS             6000..6509
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P25475"
+FT                   /transl_table=11
+FT                   /gene="L"
+FT                   /function="capsid completion protein"
+FT                   /product="gpL"
+FT                   /protein_id="AAD03273.1"
+FT                   /translation="MMTLIIPRKEAPVSGEGTVVIPQPAGDEPVIKNTFFFPDIDPKRV
+FT                   RERMRLEQTVAPARLREAIKSGMAETNAELYEYREQKIAAGFTRLADVPADDIDGESIK
+FT                   VFYYERAVCAMATASLYERYRGVDASAKGDKKADSIDSTIDELWRDMRWAVARIQGKPR
+FT                   CIVSQI"
+FT   variation       6024
+FT                   /note="Lam79 mutation"
+FT                   /replace="t"
+FT                   /gene="L"
+FT   variation       6240
+FT                   /note="Lam9 mutation"
+FT                   /replace="t"
+FT                   /gene="L"
+FT   CDS             6509..6712
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51772"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="X"
+FT                   /function="essential tail gene"
+FT                   /product="gpX"
+FT                   /protein_id="AAD03274.1"
+FT                   /translation="MKTFALQGDTLDAICVRYYGRTEGVVETVLAANPGLAELGAVLPH
+FT                   GTAVELPDVQTAPVAETVNLWE"
+FT   variation       6562
+FT                   /note="Xam95 mutation"
+FT                   /replace="g"
+FT                   /gene="X"
+FT   CDS             6716..6997
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51773"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="Y"
+FT                   /function="holin; essential for host cell cell lysis"
+FT                   /product="gpY"
+FT                   /protein_id="AAD03275.1"
+FT                   /translation="MTAEEKSVLSLFMIGVLIVVGKVLAGGEPITPRLFIGRMLLGGFV
+FT                   SMVAGVVLVQFPDLSLPAVCGIGSMLGIAGYQVIEIAIQRRFKGRGKQ"
+FT   variation       6852
+FT                   /note="Yam94 mutation"
+FT                   /replace="a"
+FT                   /gene="Y"
+FT   CDS             6997..7494
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51771"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="K"
+FT                   /function="endolysin; essential for host cell lysis"
+FT                   /product="gpK"
+FT                   /protein_id="AAD03276.1"
+FT                   /translation="MPVINTHQNIAAFLDMLAVSEGTANHPLTKNRGYDVIVTGLDGKP
+FT                   EIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYLFWPHYRKQLALPDFSPLSQDR
+FT                   LAIQLIRERGALDDIRAGRIERAISRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGV
+FT                   PA"
+FT   variation       7114
+FT                   /note="Kts60 mutation"
+FT                   /replace="a"
+FT                   /gene="K"
+FT   variation       7126
+FT                   /note="Kam218 mutation"
+FT                   /replace="t"
+FT                   /gene="K"
+FT   variation       7318
+FT                   /note="Kam12 mutation"
+FT                   /replace="t"
+FT                   /gene="K"
+FT   variation       7322
+FT                   /note="Kam76 mutation"
+FT                   /replace="a"
+FT                   /gene="K"
+FT   CDS             7509..7934
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51769"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="lysA"
+FT                   /function="nonessential; affects timing of lysis"
+FT                   /product="LysA"
+FT                   /protein_id="AAD03277.1"
+FT                   /translation="MKKLSLSLMLNVSLALMLALSLIYPQSVAVNFVAAWAILATVICV
+FT                   VAGGVGVYATEYVLERYGRELPPESLAVKIVTSLFLQPVPWRRRAAALVVVVATFISLV
+FT                   AAGWIFTALIYLVVSLFFRLIRKACRQRLEGREPCQG"
+FT   variation       7694
+FT                   /note="lysAam96 mutation"
+FT                   /replace="g"
+FT                   /gene="lysA"
+FT   CDS             7922..8347
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51770"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="lysB"
+FT                   /function="nonessential; affects timing of lysis"
+FT                   /product="LysB"
+FT                   /protein_id="AAD03278.1"
+FT                   /translation="MSRLMIVLVVLLSLAVAGLFLVKHKNASLRASLDRANNVASGQQT
+FT                   TITMLKNQLHVALTRADKNELAQVALRQELENAAKREAQREKTITRLLNENEDFRRWYG
+FT                   ADLPDAVRRLHQRPACTDASDCPQRMPESEPLPDAGQ"
+FT   variation       8099..8100
+FT                   /note="lysBam97 mutation"
+FT                   /replace="ta"
+FT                   /gene="lysB"
+FT   attenuator      8399..8417
+FT                   /note="putative transcription attenuator; O operon"
+FT   CDS             8455..8922
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P36933"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="R"
+FT                   /function="essential tail gene; tail completion"
+FT                   /product="gpR"
+FT                   /protein_id="AAD03279.1"
+FT                   /translation="MLKPDSLRRALTDAVTVLKTNPDMLRIFVDNGSIASTLAASLSFE
+FT                   KRYTLNVIVTDFTGDFDLLIVPVLAWLRENQPDIMTTDEGQKKGFTFYADINNDSSFDI
+FT                   SISLMLTERTLVSEVDGALHVKNISEPPPPEPVTRPMELYINGELVSKWDE"
+FT   variation       8680
+FT                   /note="Ram3 mutation"
+FT                   /replace="t"
+FT                   /gene="R"
+FT   variation       8710
+FT                   /note="Ram42 mutation"
+FT                   /replace="t"
+FT                   /gene="R"
+FT   variation       8857
+FT                   /note="Ram23 mutation"
+FT                   /replace="t"
+FT                   /gene="R"
+FT   CDS             8915..9367
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P36934"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="S"
+FT                   /function="essential tail gene; tail completion"
+FT                   /product="gpS"
+FT                   /protein_id="AAD03280.1"
+FT                   /translation="MNEFKRFEDRLTGLIESLSPSGRRRLSAELAKRLRQSQQRRVMAQ
+FT                   KAPDGTPYAPRQQQSVRKKTGRVKRKMFAKLITSRFLHIRASPEQASMEFYGGKSPKIA
+FT                   SVHQFGLSEENRKDGKKIDYPARPLLGFTGEDVQMIEEIILAHLER"
+FT   variation       9209
+FT                   /note="Sam75 mutation"
+FT                   /replace="t"
+FT                   /gene="S"
+FT   variation       9213
+FT                   /note="Sam89 mutation"
+FT                   /replace="a"
+FT                   /gene="S"
+FT   terminator      9397..9433
+FT                   /note="putative rho-independent terminator for O operon"
+FT   CDS             complement(9439..10224)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P36935"
+FT                   /transl_table=11
+FT                   /gene="orf30"
+FT                   /function="nonessential"
+FT                   /product="Orf30"
+FT                   /protein_id="AAD03281.1"
+FT                   /translation="MVSYNVTNVWGLIVFFLCSFAVLAFFSFGKSNLMRLIAHYFNFGY
+FT                   SDKKLKRLDREWRDIQLFKIINGINVSGIENVRMIQQGLIDGKLKTSYFFLTRIWGDIT
+FT                   KPPHIIKTIIVILASIFYILLACYIHNEQSVIVRDATGIPYKNMMYYVYSDKVLLSFKN
+FT                   KAVEFNKTYSLADCKRLQNVFIKDTLPEIACNKLLQLNEEDSEWLSQEIKDNNSHKKAL
+FT                   LILSLVYFTSGLVIFLSYTKFFYANKKVLEYKASNKNHS"
+FT   misc_feature    10239..10266
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="activator binding site; activation of pV promoter"
+FT   CDS             10308..10943
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P31340"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="V"
+FT                   /function="baseplate assembly protein"
+FT                   /product="gpV"
+FT                   /protein_id="AAD03282.1"
+FT                   /translation="MNTLANIQELARALRNMIRTGIIVETDLNAGRCRVQTGGMCTDWL
+FT                   QWLTHRAGRSRTWWAPSVGEQVLILAVGGELDTAFVLPGIYSGDNPSPSVSADALHIRF
+FT                   PDGAVIEYEPETSALTVSGIKTASVTASGSVTATVPVVMVKASTRVTLDTPEVVCTNRL
+FT                   ITGTLEVQKGGTMRGNIEHTGGELSSNGKVLHTHKHPGDSGGTTGSPL"
+FT   misc_feature    10308
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="transcription start site for V operon; encodes V, W,
+FT                   J, I, H, G"
+FT                   /gene="V"
+FT   variation       10329
+FT                   /note="Vam42, Vam203 and Vam205 mutations"
+FT                   /replace="t"
+FT                   /gene="V"
+FT   variation       10498
+FT                   /note="Vts199 mutation"
+FT                   /replace="a"
+FT                   /gene="V"
+FT   CDS             10940..11287
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51768"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="W"
+FT                   /function="baseplate assembly protein"
+FT                   /product="gpW"
+FT                   /protein_id="AAD03283.1"
+FT                   /translation="MTARYLGMNRSDGLTVTDLEHISQSIGDILRTPVGSRVMRRDYGS
+FT                   LLASMIDQPQTPALELQIKVACYMAVLKWEPRVTLSSVTTARSFDGRMTVTLTGQHNDT
+FT                   GQPLSLTIPVS"
+FT   variation       11237
+FT                   /note="Wam50 mutation"
+FT                   /replace="t"
+FT                   /gene="W"
+FT   CDS             11292..12200
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P51767"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="J"
+FT                   /function="baseplate assembly protein"
+FT                   /product="gpJ"
+FT                   /protein_id="AAD03284.1"
+FT                   /translation="MPIIDLNQLPAPDVVEELDFESILAERKATLISLYPEDQQEAVAR
+FT                   TLTLESEPLVKLLEENAYRELIWRQRVNEAARAVMLACAAGNDLDVIGANYNTTRLTIT
+FT                   PADDSTIPPTPAVMESDTDYRLRIQQAFEGLSVAGSVGAYQYHGRSADGRVADISVTSP
+FT                   SPACVTISVLSRENNGVASEDLLAVVRNALNGEDVRPVADRVTVQSAAIVEYQINATLY
+FT                   LYPGPESEPIRAAAVKKLEAYITAQHRLGRDIRLSAIYAALHVEGVQRVELAAPLADIV
+FT                   LNSTQASFCTEYRVVTGGSDE"
+FT   variation       11937
+FT                   /note="Jam31 mutation"
+FT                   /replace="t"
+FT                   /gene="J"
+FT   CDS             12193..12723
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P26701"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="I"
+FT                   /function="baseplate assembly protein"
+FT                   /product="gpI"
+FT                   /protein_id="AAD03285.1"
+FT                   /translation="MSDSRLLPTGSSPLEVAAAKACAEIEKTPVSIRELWNPDTCPANL
+FT                   LPWLAWAFSVDRWDEKWPEATKRAVIRDAYFIHCHKGTIGAIRRVVEPLGYLINVTEWW
+FT                   ENSDPPGTFRLDIGVLESGITEAMYQEMERLIADAKPASRHLIGLNITRDIPGYLFAGG
+FT                   VAYDGDVITVYPG"
+FT   variation       12235
+FT                   /note="Iam78 mutation"
+FT                   /replace="t"
+FT                   /gene="I"
+FT   CDS             12734..14743
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P26700"
+FT                   /transl_table=11
+FT                   /gene="H"
+FT                   /function="probable tail fiber protein"
+FT                   /product="gpH"
+FT                   /protein_id="AAD03286.1"
+FT                   /translation="MSIKFRTVITTAGAAKLAAATAPGRRKVGITTMAVGDGGGKLPVP
+FT                   DAGQTGLIHEVWRHALNKISQDKRNSNYIIAELVIPPEVGGFWMRELGLYDDAGTLIAV
+FT                   ANMAESYKPALAEGSGRWQTCRMVIIVSSVASVELTIDTTTVMATQDYVDDKIAEHEQS
+FT                   RRHPDASLTAKGFTQLSSATNSTSETLAATPKAVKAAYDLANGKYTAQDATTARKGLVQ
+FT                   LSSATNSTSETLAATPKAVKTVMDETNKKAPLNSPALTGTPTTPTARQGTNNTQIANTA
+FT                   FVMAAIAALVDSSPDALNTLNELAAALGNDPNFATTMTNALAGKQPKDATLTALAGLAT
+FT                   AADRFPYFTGNDVASLATLTKVGRDILAKSTVAAVIEYLGLQETVNRAGNAVQKNGDTL
+FT                   SGGLTFENDSILAWIRNTDWAKIGFKNDADGDTDSYMWFETGDNGNEYFKWRSRQSTTT
+FT                   KDLMTLKWDALNILVNAVINGCFGVGTTNALGGSSIVLGDNDTGFKQNGDGILDVYANS
+FT                   QRVFRFQNGVAIAFKNIQAGDSKKFSLSSSNTSTKNITFNLWGASTRPVVAELGDEAGW
+FT                   HFYSQRNTDNSVIFAVNGQMQPSNWGNFDSRYVKDVRLGTRVVQLMARGGRYEKAGHTI
+FT                   TGLRIIGEVDGDDEAIFRPIQKYINGTWYNVAQV"
+FT   variation       13994
+FT                   /note="Ham72 mutation"
+FT                   /replace="t"
+FT                   /gene="H"
+FT   variation       14336
+FT                   /note="Ham59 mutation"
+FT                   /replace="t"
+FT                   /gene="H"
+FT   CDS             14747..15274
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P26699"
+FT                   /transl_table=11
+FT                   /gene="G"
+FT                   /function="probable tail fiber assembly protein"
+FT                   /product="gpG"
+FT                   /protein_id="AAD03287.1"
+FT                   /translation="MQHLKNIKSGNPKTKEQYQLTKNFDVIWLWSEDGKNWYEEVKNFQ
+FT                   PDTIKIVYDENNIIVAITRDASTLNPEGFSVVEVPDITSNRRADDSGKWMFKDGAVVKR
+FT                   IYTADEQQQQAESQKAALLSEAENVIQPLERAVRLNMATDEERARLESWERYSVLVSRV
+FT                   DPANPEWPEMPQ"
+FT   variation       14879
+FT                   /note="Gam1 mutation"
+FT                   /replace="t"
+FT                   /gene="G"
+FT   variation       15294..17233
+FT                   /note="del2 deletion"
+FT                   /replace=""
+FT   terminator      15639..15666
+FT                   /note="putative rho-independent terminator for V operon"
+FT   CDS             complement(15675..17261)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:P79669"
+FT                   /note="cloned gene blocks growth of T5"
+FT                   /transl_table=11
+FT                   /gene="fun(Z)"
+FT                   /function="nonessential; lysogenic conversion; confers
+FT                   sensitivity to FUdR"
+FT                   /product="Fun(Z)"
+FT                   /protein_id="AAD03288.1"
+FT                   /translation="MIPIKDLTLGYADAENYKRRENKELLNKVFIRDNHLSRLCEPNIS
+FT                   FLVGEKGTGKTAYSIYLSNNNINNTLATTKYIRETEYQKFITLKSEKHLNLSDFSGIWK
+FT                   VILYLLISKQVLDKEGKISKLLNYSKFSSLNDAIDEYYLKAFSPEIIQALSFVQESKVA
+FT                   AELLHKHATLKGEERESLSFSESRFQINLFYIQKKFEEAFSQIRLSQNHILFIDGIDIR
+FT                   PSSIPYDDYLECIKGLAHAVWEINNDFFPSIKGGKGRMKAVLLIRPDIFESIGLQNQNA
+FT                   KIRDNSVFLDWRTEYVNHRSSQLFEVLDHLLRTQQDMALKKGQAWDHYFPWDSPNVHDN
+FT                   YNHPTSFINFLRWSYYRPRDILRMLEIIKSHASGDDGKNQFSLDDFESPSMQRDYSNYL
+FT                   LGEIKDHLSFYYGSEHYEIFLKFFEFLSGKDTFDYAEYLLAYKQLETHISSISTTKPKF
+FT                   MTTANDFLQFLFGLNVICYIETTEDNNRFIRWCFRERSYANISPKIKTGMKYQIFYGLA
+FT                   KSLNVGKALKK"
+FT   variation       complement(15784)
+FT                   /note="Z81su3 mutation"
+FT                   /replace="a"
+FT                   /gene="fun(Z)"
+FT   variation       complement(15872)
+FT                   /note="Z20 mutation"
+FT                   /replace="t"
+FT                   /gene="fun(Z)"
+FT   variation       complement(15944)
+FT                   /note="Z81 mutation"
+FT                   /replace="t"
+FT                   /gene="fun(Z)"
+FT   variation       complement(15946)
+FT                   /note="fun1 mutation"
+FT                   /replace="t"
+FT                   /gene="fun(Z)"
+FT   variation       complement(16079)
+FT                   /note="csZ150 mutation"
+FT                   /replace="t"
+FT                   /gene="fun(Z)"
+FT   variation       complement(16266)
+FT                   /note="fun99 mutation"
+FT                   /replace="t"
+FT                   /gene="fun(Z)"
+FT   variation       16267..17299
+FT                   /note="del5 deletion"
+FT                   /replace=""
+FT   variation       complement(16638)
+FT                   /note="csZ150 mutation"
+FT                   /replace="a"
+FT                   /gene="fun(Z)"
+FT   misc_feature    17555..17583
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="activator binding site; activation of pF promoter"
+FT   misc_feature    17626..17628
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="transcription start site for F operon; encodes FI,
+FT                   FII, E, E', T, U, D"
+FT   CDS             17652..18842
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P22501"
+FT                   /transl_table=11
+FT                   /gene="FI"
+FT                   /function="essential tail protein; tail sheath"
+FT                   /product="gpFI"
+FT                   /protein_id="AAD03289.1"
+FT                   /translation="MSDYHHGVQVLEINEGTRVISTVSTAIVGMVCTASDADAETFPLN
+FT                   KPVLITNVQSAISKAGKKGTLAASLQAIADQSKPVTVVMRVEDGTGDDEETKLAQTVSN
+FT                   IIGTTDENGQYTGLKAMLAAESVTGVKPRILGVPGLDTKEVAVALASVCQKLRAFGYIS
+FT                   AWGCKTISEVKAYRQNFSQRELMVIWPDFLAWDTVTSTTATAYATARALGLRAKIDQEQ
+FT                   GWHKTLSNVGVNGVTGISASVFWDLQESGTDADLLNESGVTTLIRRDGFRFWGNRTCSD
+FT                   DPLFLFENYTRTAQVVADTMAEAHMWAVDKPITATLIRDIVDGINAKFRELKTNGYIVD
+FT                   ATCWFSEESNDAETLKAGKLYIDYDYTPVPPLENLTLRQRITDKYLANLVTSVNSN"
+FT   variation       18183
+FT                   /note="Fam4 mutation"
+FT                   /replace="t"
+FT                   /gene="FI"
+FT   CDS             18855..19373
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P22502"
+FT                   /transl_table=11
+FT                   /gene="FII"
+FT                   /function="essential tail protein; tail tube"
+FT                   /product="gpFII"
+FT                   /protein_id="AAD03290.1"
+FT                   /translation="MAMPRKLKLMNVFLNGYSYQGVAKSVTLPKLTRKLENYRGAGMNG
+FT                   SAPVDLGLDDDALSMEWSLGGFPDSVIWELYAATGVDAVPIRFAGSYQRDDTGETVAVE
+FT                   VVMRGRQKEIDTGEGKQGEDTESKISVVCTYFRLTMDGKELVEIDTINMIEKVNGVDRL
+FT                   EQHRRNIGL"
+FT   CDS             join(19430..19684,19684..19857)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O64312"
+FT                   /note="shares amino terminus with gpE; -1 frameshift"
+FT                   /transl_table=11
+FT                   /gene="E+E'"
+FT                   /function="essential tail protein"
+FT                   /product="gpE+E'"
+FT                   /protein_id="AAD03292.1"
+FT                   /translation="MNKENVITLDNPVKRGEQVIEQVTLMKPSAGTLRGVSLAAVANSE
+FT                   VDALIKVLPRMTAPMLTEQEVAALELPDLVALAGKVVGFLVAELGAVTFPKNLSVDDLM
+FT                   ADVAVIFHWPPSELYPMSLTELITWREKALRRSGNTNE"
+FT   CDS             19430..19705
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O64313"
+FT                   /transl_table=11
+FT                   /gene="E"
+FT                   /function="essential tail protein"
+FT                   /product="gpE"
+FT                   /protein_id="AAD03291.1"
+FT                   /translation="MNKENVITLDNPVKRGEQVIEQVTLMKPSAGTLRGVSLAAVANSE
+FT                   VDALIKVLPRMTAPMLTEQEVAALELPDLVALAGKVVGFLSPNSVQ"
+FT   variation       19473
+FT                   /note="Ets55 mutation"
+FT                   /replace="a"
+FT                   /gene="E"
+FT   variation       19619
+FT                   /note="Eam30 mutation"
+FT                   /replace="t"
+FT                   /gene="E"
+FT   misc_feature    19685
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="site of -1 translational frameshift"
+FT                   /gene="E+E'"
+FT   CDS             19850..22297
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O64314"
+FT                   /transl_table=11
+FT                   /gene="T"
+FT                   /function="essential tail protein; putative tail length
+FT                   determinator"
+FT                   /product="gpT"
+FT                   /protein_id="AAD03293.1"
+FT                   /translation="MSNNVKLQVLLRAVDQASRPFKSIRTASKSLSGDIRETQKSLREL
+FT                   NGHASRIEGFRKTSAQLAVTGHALEKARQEAEALATQFKNTERPTRAQAKVLESAKRAA
+FT                   EDLQAKYNRLTDSVKRQQRELAAVGINTRNLAHDEQGLKNRISETTAQLNRQRDALVRV
+FT                   SAQQAKLNAVKQRYQAGKELAGNMASVGAAGVGIAAAGTMAGVKLLMPGYEFAQKNSEL
+FT                   QAVIGVAKDSAEMAALRKQARQLGDNTAASADDAAGAQIIIAKAGGDVDAIQAATPVTL
+FT                   NMALANRRTMEENAALLMGMKSAFQLSNDKVAHIGDVLSMTMNKTAADFDGMSDALTYA
+FT                   APVAKNAGVSIEETAAMVGALHDAKITGSMAGTGSRAVLSRLQAPTGKAWDALKELGVK
+FT                   TSDSKGNTRPIFTILKEMQASFEKNRLGTAQQAEYMKTIFGEEASSAAAVLMTAASTGK
+FT                   LDKLTAAFKASDGKTAELVNIMQDNLGGDFKAFQSAYEAVGTDLFDQQEGALRKLTQTA
+FT                   TKYVLKLDGWIQKNKSLASTIGIIAGGALALTGIIGAIGLVAWPVITGINAIIAAAGAM
+FT                   GAVFTTVGSAVMTAIGAISWPVVAVVAAIVAGALLIRKYWEPVSAFFGGVVEGLKAAFA
+FT                   PVGELFTPLKPVFDWLGEKLQAAWQWFKNLIAPVKATQDTLNRCRDTGVMFGQALADAL
+FT                   MLPLNAFNKLRSGIDWVLEKLGVINKESDTLDQTAARTHTATYGTGDYIPATSSYAGYQ
+FT                   AYQPVTAPAGRSYVDQSKNEYHISLTGGTAPGTQLDRQLQDALEKYERDKRARARASMM
+FT                   HDG"
+FT   variation       20669
+FT                   /note="Tam215 mutation"
+FT                   /replace="t"
+FT                   /gene="T"
+FT   variation       21101
+FT                   /note="Tam5 mutation"
+FT                   /replace="t"
+FT                   /gene="T"
+FT   variation       21528
+FT                   /note="Tam64 mutation"
+FT                   /replace="a"
+FT                   /gene="T"
+FT   CDS             22312..22791
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O64315"
+FT                   /transl_table=11
+FT                   /gene="U"
+FT                   /function="essential tail protein"
+FT                   /product="gpU"
+FT                   /protein_id="AAD03294.1"
+FT                   /translation="MMLALGMFVFMRQTLPHQTMQRESDYRWPSNSRIGKRDAFQFLGV
+FT                   GEENITLAGVLYPELTGGKLTMTTLRLMAEEGRAWPLLDGTGMIYGMYVISRVSETGSI
+FT                   FFADGTPRKIDFTLSLTRVDESLAALYGDIGKQAESLIGKAGSMATRFTGMTGAG"
+FT   variation       22363
+FT                   /note="Uam25 mutation"
+FT                   /replace="t"
+FT                   /gene="U"
+FT   variation       22501
+FT                   /note="Uam77 and Uam92 mutations"
+FT                   /replace="t"
+FT                   /gene="U"
+FT   CDS             22791..23954
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P10312"
+FT                   /transl_table=11
+FT                   /gene="D"
+FT                   /function="essential tail protein"
+FT                   /product="gpD"
+FT                   /protein_id="AAD03295.1"
+FT                   /translation="MLDALTFDAGSTLTPDYMLMLDSRDITGNISDRLMSMTLTDNRGF
+FT                   EADQLDIELNDADGQVGLPVRGAVLTVYIGWKGFALVCKGKFTVDEVEHRGAPDVVTIR
+FT                   ARSADFRGTLNSRREGSWHDTTLGAIVKAIATRNRLEASVAPSLAGIKIPHIDQSQESD
+FT                   AKFLTRLAERNGGEVSVKMGKLLFLKAGQGVTASGKKIPQVTITRSDGDRHHFAIADRG
+FT                   AYTGVTAKWLHTKDPKPQKQKVKLKRKKKEKHLRALEHPKAKPVRQKKAPKVPEAREGE
+FT                   YMAGEADNVFALTTVYATKAQAMRAAQAKWDKLQRGVAEFSISLATGRADIYTETPVKV
+FT                   SGFKRVIDEQDWTITKVTHFLNNSGFTTSLELEVRLSDVEYETEDDE"
+FT   variation       23592
+FT                   /note="Dam6 mutation"
+FT                   /replace="t"
+FT                   /gene="D"
+FT   -35_signal      23973..23975
+FT   -10_signal      23996..24002
+FT   prim_transcript 24008..24288
+FT                   /note="putative"
+FT   CDS             24036..24254
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P08762"
+FT                   /transl_table=11
+FT                   /gene="ogr"
+FT                   /product="Ogr"
+FT                   /protein_id="AAD03296.1"
+FT                   /translation="MFHCPLCQHAAHARTSRYITDTTKERYHQCQNVNCSATFITYESV
+FT                   QRYIVKPGEVHAVRPHPLPSGQQIMWM"
+FT   variation       24148..25274
+FT                   /note="del15 deletion"
+FT                   /replace=""
+FT   variation       24160
+FT                   /note="ogr1 and ogr52 mutations"
+FT                   /replace="g"
+FT                   /gene="ogr"
+FT   terminator      24265..24288
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="rho-independent terminator for ogr transcript and F
+FT                   operon"
+FT   protein_bind    24293..24320
+FT                   /note="P arm"
+FT                   /bound_moiety="Int"
+FT   protein_bind    24324..24357
+FT                   /bound_moiety="IHF"
+FT   misc_feature    complement(24356..24382)
+FT                   /note="attP"
+FT   protein_bind    24356..24383
+FT                   /note="attP core"
+FT                   /bound_moiety="Int"
+FT   variation       24372
+FT                   /note="saf mutation; altered integration site specificity"
+FT                   /replace="g"
+FT   variation       24376
+FT                   /note="left end del3 deletion/insertion"
+FT   variation       24378..25927
+FT                   /note="vir22 deletion/insertion"
+FT   variation       24378..25065
+FT                   /note="del6 deletion"
+FT                   /replace=""
+FT   variation       24381..26340
+FT                   /note="vir94 deletion/insertion"
+FT   protein_bind    24399..24472
+FT                   /bound_moiety="Cox"
+FT   CDS             complement(24462..25475)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P36932"
+FT                   /transl_table=11
+FT                   /gene="int"
+FT                   /function="integrase"
+FT                   /product="Int"
+FT                   /protein_id="AAD03297.1"
+FT                   /translation="MAIKKLDDGRYEVDIRPTGRNGKRIRRKFDKKSEAVAFEKYTLYN
+FT                   HHNKEWLSKPTDKRRLSELTQIWWDLKGKHEEHGKSNLGKIEIFTKITNDPCAFQITKS
+FT                   LISQYCATRRSQGIKPSSINRDLTCISGMFTALIEAELFFGEHPIRGTKRLKEEKPETG
+FT                   YLTQEEIALLLAALDGDNKKIAILCLSTGARWGEAARLKAENIIHNRVTFVKTKTNKPR
+FT                   TVPISEAVAKMIADNKRGFLFPDADYPRFRRTMKAIKPDLPMGQATHALRHSFATHFMI
+FT                   NGGSIITLQRILGHTRIEQTMVYAHFAPEYLQDAISLNPLRGGTEAESVHTVSTVE"
+FT   protein_bind    24470..24496
+FT                   /note="P' arm"
+FT                   /gene="int"
+FT                   /bound_moiety="Int"
+FT   variation       complement(24539)
+FT                   /note="intam150 mutation"
+FT                   /replace="a"
+FT                   /gene="int"
+FT   variation       complement(25130)
+FT                   /note="intam239 mutation"
+FT                   /replace="a"
+FT                   /gene="int"
+FT   variation       complement(25454)
+FT                   /note="nip1 mutation"
+FT                   /replace="t"
+FT                   /gene="int"
+FT   variation       25492..25839
+FT                   /note="vir 79 deletion"
+FT                   /replace=""
+FT   CDS             complement(25591..25890)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P04132"
+FT                   /transl_table=11
+FT                   /gene="C"
+FT                   /function="immunity repressor"
+FT                   /product="gpC"
+FT                   /protein_id="AAD03298.1"
+FT                   /translation="MSNTISEKIVLMRKSEYLSRQQLADLTGVPYGTLSYYESGRSTPP
+FT                   TDVMMNILQTPQFTKYTLWFMTNQIAPESGQIAPALAHFGQNETTSPHSGQKTG"
+FT   variation       complement(25637)
+FT                   /note="sly1 mutation"
+FT                   /replace="t"
+FT                   /gene="C"
+FT   variation       complement(25682)
+FT                   /note="cts7 mutation"
+FT                   /replace="t"
+FT                   /gene="C"
+FT   variation       complement(25686..25702)
+FT                   /note="cam11 and cam13 mutations"
+FT                   /replace="a"
+FT                   /gene="C"
+FT   variation       complement(25702)
+FT                   /note="cts6 mutation"
+FT                   /replace="a"
+FT                   /gene="C"
+FT   variation       complement(25731)
+FT                   /note="cam10 and cam12 mutations"
+FT                   /replace="a"
+FT                   /gene="C"
+FT   variation       complement(25772)
+FT                   /note="cts9 mutation"
+FT                   /replace="t"
+FT                   /gene="C"
+FT   variation       complement(25802)
+FT                   /note="vir1 mutation"
+FT                   /replace="t"
+FT                   /gene="C"
+FT   variation       complement(25829)
+FT                   /note="cts8 mutation"
+FT                   /replace="g"
+FT                   /gene="C"
+FT   variation       complement(25844)
+FT                   /note="cts5 mutation"
+FT                   /replace="a"
+FT                   /gene="C"
+FT   -35_signal      25884..25889
+FT                   /note="early promoter Pe"
+FT   misc_feature    25894..25901
+FT                   /note="O1 repressor binding site"
+FT   variation       25899..25955
+FT                   /note="vir24 deletion"
+FT                   /replace=""
+FT   variation       25900..25916
+FT                   /note="vir3 deletion"
+FT                   /replace=""
+FT   variation       25904..25920
+FT                   /note="vir65 deletion"
+FT                   /replace=""
+FT   -10_signal      25907..25912
+FT                   /note="early promoter Pe"
+FT   variation       25909..25983
+FT                   /note="vir40 deletion"
+FT                   /replace=""
+FT   variation       25913
+FT                   /note="c1 mutation"
+FT                   /replace="c"
+FT   misc_feature    25916..25923
+FT                   /note="O2 repressor binding site"
+FT   variation       25922
+FT                   /note="vir6 mutation"
+FT                   /replace=""
+FT   -10_signal      complement(25962..25967)
+FT                   /note="Pc promoter"
+FT   -35_signal      complement(25982..25987)
+FT                   /note="Pc promoter"
+FT   CDS             26005..26280
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P07695"
+FT                   /transl_table=11
+FT                   /gene="cox"
+FT                   /function="repressor of Pc; required for prophage excision;
+FT                   inhibits integration; activates P11 promoter of satellite
+FT                   phage P4"
+FT                   /product="Cox"
+FT                   /protein_id="AAD03299.1"
+FT                   /translation="MSKQVTLMTDAIPYQEFAKLIGKSTGAVRRMIDKGKLPVIDMTDP
+FT                   QSASGRAGEYWVYLPAWNNGLKLAYESRPKEIRDGWLMWLGLGEPR"
+FT   variation       26069
+FT                   /note="cox3 mutation"
+FT                   /replace="a"
+FT                   /gene="cox"
+FT   variation       26129
+FT                   /note="cox2 mutation"
+FT                   /replace="c"
+FT                   /gene="cox"
+FT   variation       26164
+FT                   /note="cox4 mutation"
+FT                   /replace="a"
+FT                   /gene="cox"
+FT   CDS             26291..26461
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q38498"
+FT                   /transl_table=11
+FT                   /gene="orf78"
+FT                   /product="Orf78"
+FT                   /protein_id="AAD03300.1"
+FT                   /translation="MNEPRCIAQLLRNESPRAIDFTITHGKGRKGIIIRTKKQSPLKKA
+FT                   LTFLKSRRVWK"
+FT   CDS             26458..26958
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P07696"
+FT                   /transl_table=11
+FT                   /gene="B"
+FT                   /function="essential protein; DNA replication; required for
+FT                   lagging strand synthesis"
+FT                   /product="gpB"
+FT                   /protein_id="AAD03301.1"
+FT                   /translation="MTVMTLNLVEKQPAAMRRIIGKHLAVPRWQDTCDYYNQMMERERL
+FT                   TVCFHAQLKQRHATMCFEEMNDVERERLVCAIDELRGAFSKRRQVGASEYAYISFLTVS
+FT                   QRRTLFMHAGLTEKEFNQPYWRINEESCYWRDALFRALRELFSLFEYAPTILTSVKPEQ
+FT                   YLH"
+FT   variation       26525
+FT                   /note="rlb1 mutation"
+FT                   /replace="g"
+FT                   /gene="B"
+FT   variation       26611
+FT                   /note="Bam213 mutation"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   variation       26722
+FT                   /note="Bam116 mutation"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   variation       26762
+FT                   /note="Bts6 mutation"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   variation       26914
+FT                   /note="Bts40 mutation"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   terminator      26980..27007
+FT                   /note="putative rho-independent terminator"
+FT   CDS             27022..27246
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06422"
+FT                   /transl_table=11
+FT                   /gene="orf80"
+FT                   /product="Orf80"
+FT                   /protein_id="AAD03302.1"
+FT                   /translation="MHTVSENQCGIYALLLQQARTEAQADAATRFSSHLDAMIRHITKA
+FT                   ELSRVEIVELLSQESEKFHNIGLSRGEVL"
+FT   CDS             27246..27548
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06423"
+FT                   /transl_table=11
+FT                   /gene="orf81"
+FT                   /product="Orf81"
+FT                   /protein_id="AAD03303.1"
+FT                   /translation="MFCSRAVVLLNNALKIAVMKNGDLSLIQLGLDKEKREITESVIAI
+FT                   YQSELNLLSDVVNLLVKRAVFHKQISSVDELTKLTTEIASYCADEFKKLNDKRNW"
+FT   CDS             27548..27772
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06424"
+FT                   /transl_table=11
+FT                   /gene="orf82"
+FT                   /product="Orf82"
+FT                   /protein_id="AAD03304.1"
+FT                   /translation="MPDNVDFIQEQQAELLERQINAARVKHCGASALVCEECDAPIPAA
+FT                   RRAAYPSATRCVSCQSVFEAKNKHYRRTA"
+FT   CDS             27769..28044
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06425"
+FT                   /transl_table=11
+FT                   /gene="orf83"
+FT                   /product="Orf83"
+FT                   /protein_id="AAD03305.1"
+FT                   /translation="MSIRIEIGERYVVTSDSFQFILHEKKRAESGKNAGQEWLAVVGYY
+FT                   PKLSQLVSGLMHHDILTGSAKSFADLNVQVEQLSKRCSEAFGSYGR"
+FT   CDS             28034..30319
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06419"
+FT                   /transl_table=11
+FT                   /gene="A"
+FT                   /function="essential protein; DNA replication; makes
+FT                   site-specific nick at origin of replication"
+FT                   /product="gpA"
+FT                   /protein_id="AAD03306.1"
+FT                   /translation="MAVKASGRFVPPSAFAAGTGKMFTGAYAWNAPREAVGRERPLTRD
+FT                   EMRQMQGVLSTINRLPYFLRSLFTSRYDYIRRNKSPVHGFYFLTSTFQRRLWPRIERVN
+FT                   QRHEMNTDASLLFLAERDHYARLPGMNDKELKKFAARISSQLFMMYEELSDAWVDAHGE
+FT                   KESLFTDEAQAHLYGHVAGAARAFNISPLYWKKYRKGQMTTRQAYSAIARLFNDEWWTH
+FT                   QLKGQRMRWHETLLIAVGEVNKDRSPYASKHAIRDVRARRQANLEFLKSCDLENRETGE
+FT                   RIDLISKVMGSISNPEIRRMELMNTIAGIERYAAAEGDVGMFITLTAPSKYHPTRQVGK
+FT                   GESKTVQLNHGWNDEAFNPKDAQRYLCHIWSLMRTAFKDNDLQVYGLRVVEPHHDGTPH
+FT                   WHMMLFCNPRQRNQIIEIMRRYALKEDGDERGAARNRFQAKHLNQGGAAGYIAKYISKN
+FT                   IDGYALDGQLDNDTGRPLKDTAAAVTAWASTWRIPQFKTVGLPTMGAYRELRKLPRGVS
+FT                   IADEFDERVEAARAAADSGDFALYISAQGGANVPRDCQTVRVARSPSDEVNEYEEEVER
+FT                   VVGIYAPHLGARHIHITRTTDWRIVPKVPVVEPLTLKSGIAAPRSPVNNCGKLTGGDTS
+FT                   LPAPTPSEHAAAVLNLVDDGVIEWNEPEVVRALRGALKYDMRTPNRQQRNGSPLKPHEI
+FT                   APSARLTRSERLQITRIRVDLAQNGIRPQRWELEALARGATVNYDGKKFTYPVADEWPG
+FT                   FSTVMEWT"
+FT   variation       28649
+FT                   /note="Aam127 mutation"
+FT                   /replace="t"
+FT                   /gene="A"
+FT   variation       29528
+FT                   /note="Ats54 mutation"
+FT                   /replace="a"
+FT                   /gene="A"
+FT   rep_origin      29892
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="nick site at ori"
+FT   CDS             30316..30645
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:Q06426"
+FT                   /transl_table=11
+FT                   /gene="orf91"
+FT                   /product="Orf91"
+FT                   /protein_id="AAD03307.1"
+FT                   /translation="MMAKIHEVKLHAKYFDLVLEGKKRAEFRKKDRNYERGDTLILHEW
+FT                   VQGVFTGRKVEARITDVTDLSDWLEDYVLLHRILGEILPLTVKLAVSSTFFINLRRRTV
+FT                   AIYLL"
+FT   CDS             complement(30684..31445)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:P79670"
+FT                   /transl_table=11
+FT                   /gene="tin"
+FT                   /function="nonessential protein; lysogenic conversion;
+FT                   blocks growth of T-even phages"
+FT                   /product="Tin"
+FT                   /protein_id="AAD03308.1"
+FT                   /translation="MNNMDIVKAVKDGMKKSADATYLMDFRSGAKINTEYVATVSIGLS
+FT                   LLEIKSFRHGDYKVIFEYHTNKFINATVPLSKRSDPQKIFSKKTVRKNTNTTRSGRIDI
+FT                   AILDSRPFFDIPICAIEVKGNAPCKSLLFSDIRRNLEYFKHTGPTGNSSLGLALNCSFH
+FT                   SYNDSTKKNYCTTIHHKEDMIRKLKNKYKKYISELNEEIPDDISVTIDVFTAAEHLLSP
+FT                   DADQYEYESHIDDLHLTLGVMVIFERKSILN"
+FT   variation       30992..33334
+FT                   /note="del4 deletion"
+FT                   /replace=""
+FT   variation       31022..33454
+FT                   /note="del1 deletion"
+FT                   /replace=""
+FT   CDS             complement(31620..33380)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P13520"
+FT                   /transl_table=11
+FT                   /gene="old"
+FT                   /function="nonessential protein; lysogenic conversion;
+FT                   exonuclease; blocks growth of phage lambda"
+FT                   /product="Old"
+FT                   /protein_id="AAD03309.1"
+FT                   /translation="MTVRLASVSISNFRSCKSTSAILRPFTALVGYNNAGKSNIILAIK
+FT                   WLLDGSLISESDVYDPTHPVSVEGVIQGITDDTLSLLTEENQQKIAPFIIDGTLTFARR
+FT                   QEFNKETGKAKKSLDVYDGTTWKKNPGGIDGAISNIFPEPIHIPAMSDAVEDSTKCKNT
+FT                   TTIGKILSAIVSEIKQEHEEKFSKNISEIGKYLSHNGENRLESLNKIDSGVNKKVNQFF
+FT                   PDVSVKLHFPTPTLDEIFKSGTLKVFESREDEPVMRDISRFGHGTQRSIQMALIQYLAE
+FT                   IKKENSESKKSNTLIFIDEPELYLHPSAINSVRESLVTLSESGYQVIISTHSASMLSAK
+FT                   HAANAIQVCKDSNGTIARKTISEKIEELYKSSSPQLHSAFTLSNSSYLLFSEEVLLVEG
+FT                   KTETNVLYALYKKINGHELNPSKICIVAVDGKGSLFKMSQIINAIGIKTRILADCDFLS
+FT                   NILLTEHKDLLSTECDNLLTALIESINSGELSLNTKVTTFESFKSISSKDFIKICNHEK
+FT                   TQKHIHEIHQKLKDNGIYIWKSGDIEAVYGFGKKQTEWDSLLDCLCDESKDVRAVIKKY
+FT                   DEMEDFIKWI"
+FT   variation       complement(31991)
+FT                   /note="oldam11 mutation"
+FT                   /replace="a"
+FT                   /gene="old"
+FT   variation       complement(32576)
+FT                   /note="old1 mutation"
+FT                   /replace="t"
+FT                   /gene="old"
+FT   misc_feature    complement(33424)
+FT                   /note="transcript start 1; old-tin mRNA"
+FT   misc_feature    complement(33426)
+FT                   /note="transcript start 2; old-tin mRNA"
+FT   misc_feature    33575..33593
+FT                   /note="cosR; right cohesive end"
+XX
+SQ   Sequence 33593 BP; 8398 A; 7983 C; 8870 G; 8342 T; 0 other;
+     ggcgaggcgg ggaaagcact gcgcgctgac ggtggtgctg attgtatttt ttcagcgtct        60
+     cagcgcgtcg tgacggcact tagtctgccc gttgaggcgt tgtgtgtctg cggggtgttt       120
+     tgtgcggtgg tgagcgtgtg aggggggatg acggggtgta aaaaagccgc ccgcaggcgg       180
+     cgatgttcag tcgttgtcag tgtccagtga gtagttttta aagcggatga cctcctgacc       240
+     gagccagccg tttatctcgc ggatcctgtc ctgtaacggg ataagctcat tgcggacaaa       300
+     gacctttgcc actttctcaa tatcacccag cgacccgacg ttctccggct tgccacccat       360
+     caactgaaag gggatgcggt gcgcgtccag caggtcagcg gcgctggctt ttttgatatt       420
+     aaaaaaatcg tccttcgtcg ccacttcact gagggggata attttaatgc cgtcggcttt       480
+     cccctgtggg gcatagagaa acaggttttt aaagttgttg cggcctttcg acttgaccat       540
+     gttttcgcga agcatttcga tatcgttgcg atcctgcacg gcatcggtga catacatgat       600
+     gtatccggca tgtgcgccat tttcgtaata cttgcggcgg aacaacgtgg ccgactcatt       660
+     cagccaggca gagttaaggg cgctgagata ttccggcagg ccgtacagct cctgattaat       720
+     atccggctcc agcaggtgaa acacggagcc gggcgcgaag gctgtcggct cgttgaagga       780
+     cggcacccac cagtaaacat cctcttccac gccacggcgg gtatattttg ccggtgaggt       840
+     ttccagtctg atgaccttac cggtggtgct gtaacgcttt tccagaaacg cattaccgaa       900
+     caccagaaaa tccagcacaa agcggctgaa atcctgctgg gaaagccatg gatgcgggat       960
+     aaatgtcgag gccagaatat tgcgtttgac gtaaatcggc gagctgtgat gcacggcagc      1020
+     ccgcaggctt tttgccagac cggtaaagct gaccggtggc tcataccatc tgccgttact      1080
+     gatgcactcg acgtaatcca gaatgtcacg gcggtcgagt accggcaccg gctcaccaaa      1140
+     ggtgaatgcc tccattttcg ggccgctggc ggtcattgtt tttgccgcag gttgcggtgt      1200
+     tttccctttt ttcttgctca tcagtaaaac tccagaatgg tggatgtcag cggggtgctg      1260
+     ataccggcgg tgagtggctc atttaacagg gcgtgcatgg tcgcccaggc gaggtcggcg      1320
+     tggctggctt cctcgctgcg gctggcctca taggtggcgc tgcgtccgct gctggtcatg      1380
+     gtcttgcgga tagccataaa cgagctggtg atgtcggtgg cgctgacgtc gtattccaga      1440
+     cagccacggc ggataacgtc ttttgccttg agcaccattg cggttttcat ttccggcgtg      1500
+     tagcggatat cacgcgcggc gggatagaac gagcgcacga gctggaacac gccgacaccg      1560
+     aggccggtgg catcaatacc gatgtattcg acgttgtatt tttcggtgag tttgcggatg      1620
+     gattccgcct gggtggcaaa gtccatgcct ttccactggt gacgctcaag tattctgaat      1680
+     ttgccaccgg ccaccaccgg cggtgccagt accacgcatc cggcgctgtc gccacggtgt      1740
+     gacgggtcgt aaccaatcca taccgggcgg gagccgaacg gattggcggc aaacggcgca      1800
+     tagtcttccc attcttccag cgtgtcgacc atgcagcgtt gcagctcctc gaacgggaac      1860
+     accgatgcct tgtcgtcaac aaattcacac atgaacaggt ttttaaaatc gtcggcgctg      1920
+     ttttcgcgtt tgagctgctc aatgtcgaac agcgtgcagc cgcctttcag ggcgtcctca      1980
+     atggtgacaa tctgtcgcca ctggccgtcc gcacagagaa gcccaccggc aagggcgtta      2040
+     tgactgacgt cgatttccac gcgttcggcg gcgctggcgc gtccccggtt aaacagttca      2100
+     cccgaccaga acgggtaggc gtcgtgcgcc agcgtggacg gggtggagaa ataggtcgag      2160
+     cgcaggtgac tctgtgaggc catacctgat gccaccttac gcagtacctg aaaattcggg      2220
+     atccagaaaa tctcatcgac gtacaggtcg ccgttatgac tctgcgcggt gttggagttg      2280
+     gtgccgagaa aaatcagttt tgcgccgtta ttgcccagga caatcgggtc accggtcagg      2340
+     tcaacgtcaa ccagacgggc aaaggcgatg atgtattcgc ggaacacata cgcctgtgtt      2400
+     ttactggccg acagaaaaat ctggttatga ccggttttca gggcacgcag cagcgcctcg      2460
+     cgggaaaaat aaaacgtcgc gccaatctgg cgggatttca ggatatcgcg gatgcggtgc      2520
+     tcaagcccgg cacgatacca gtgcagctga tagtcgaaag actgctcaaa gaaaatctgc      2580
+     tccagctttt cgatggcctc gtcactgaaa aaattctttt tcggtttgcg ccgtccgcct      2640
+     ttgttacggt tagcgacgtt cggattaagg tctgcctcgt tgccggtctg gctgtagcgg      2700
+     ttgacccgtg ccagtcgttc aatctggcgt cccagcaggt caatttcctt gaagtcaccg      2760
+     ccggttttct gtggtttgat gatgagctgg gtcagccgcg cttccagact catttcgaca      2820
+     cggctgatgg gggcaacgct gtcccagccg tcgcgctgtt tccagctctg cactgtcggg      2880
+     cgtttcatct gcaacatggc ggcaatctgc ggcacggaaa acccctgcca gtacagcagc      2940
+     gccgcctgac gacgcgggtc gtgtaaaaga gtggtgtctg tggtgatggt catgaatacc      3000
+     tcgccgtgat gaatacacgg caaggctact gagtcgcgcc ccgcgattcg ctaaggtgct      3060
+     gttgtgtcag tgataagcca tccgggactg atggcggagg atgcgcatcg tcgggaaact      3120
+     gatgccgaca tgtgactcct ctaatcacta ttcaggactc ctgacaatgg caaaaaaagt      3180
+     ctcaaaattc tttcgtatcg gcgttgaggg tgacacctgt gacgggcgtg tcatcagtgc      3240
+     gcaggatatt caggaaatgg ccgaaacctt tgacccgcgt gtctatggtt gccgcattaa      3300
+     cctggaacat ctgcgcggca tcctgcctga cggtattttt aagcgttatg gcgatgtggc      3360
+     cgaactgaag gccgaaaaga ttgacgatga ttcggcgctg aaaggcaaat gggcgctgtt      3420
+     tgcgaaaatc accccgaccg atgaccttat cgcgatgaac aaggccgcgc agaaggtcta      3480
+     cacctcaatg gaaattcagc cgaactttgc caacaccggc aaatgttatc tggtgggtct      3540
+     ggccgtcacc gatgacccgg caagcctcgg cacggaatac ctggaattct gccgcacggc      3600
+     aaaacacaac cccctgaacc gcttcaaatt aagccctgaa aacctgattt cagtggcaac      3660
+     gcctgttgag ctggaatttg aagacctgcc tgaaaccgtg ttcaccgccc tgaccgaaaa      3720
+     ggtgaagtcc atttttggcc gcaaacaggc cagcgatgat gcccgtctga atgacgtgca      3780
+     tgaagcggtg accgctgttg ctgaacatgt gcaggaaaaa ctgagcgcca ctgagcagcg      3840
+     cctcgctgag atggaaaccg ccttttctgc acttaagcag gaggtgactg acagggcgga      3900
+     tgaaaccagc caggcattca cccgcctgaa aaacagtctc gaccacaccg aaagtctgac      3960
+     ccagcagcgc cgcagcaaag ccaccggcgg tggcggtgac gccctgatga cgaactgctg      4020
+     accggcgtca gtcagtccgg gaaaaccttc acgattaacc cttaatttca ggaaaaacta      4080
+     tgcgccagga aacccgcttt aaatttaatg cctacctgtc ccgtgttgcc gaactgaacg      4140
+     gcatcgacgc cggtgatgtg tcgaaaaaat tcaccgttga accgtcggtc acccagaccc      4200
+     tgatgaacac catgcaggag tcctctgact ttctgacccg catcaatatt gtgccggtca      4260
+     gcgaaatgaa aggggaaaaa attggtatcg gtgtcaccgg ctccatcgcc agcactaccg      4320
+     acactgccgg tggtaccgag cgtcagccga aggacttctc gaagctggcg tcaaacaagt      4380
+     acgaatgcga ccagattaac ttcgattttt atatccgcta caaaacgctg gacctgtggg      4440
+     cgcgttatca ggatttccag ctccgtatcc gtaacgccat tatcaaacgc cagtcccttg      4500
+     atttcatcat ggccggtttt aacggcgtga agcgtgccga aacctctgac cgcagcagca      4560
+     atccgatgtt gcaggatgtg gcggtcggct ggctgcagaa ataccgcaat gaagcaccgg      4620
+     cgcgcgtgat gagcaaggtc actgacgagg aaggccgcac cacctctgag gttatccgcg      4680
+     tgggtaaggg cggtgattat gccagccttg atgcactggt gatggatgcg accaacaacc      4740
+     tgattgaacc gtggtatcag gaagaccctg accttgtggt gattgtgggg cgtcagctac      4800
+     tggcggacaa gtatttcccc atcgtcaaca aggagcagga caacagcgaa atgctggccg      4860
+     ctgacgtcat catcagccag aaacgcatcg gtaacctacc agcggtacgc gtcccgtact      4920
+     tcccggcgga tgcgatgctc atcacgaagc tggaaaacct gtccatctac tacatggatg      4980
+     acagccatcg ccgcgtgatt gaggaaaacc cgaaactcga ccgcgtggag aactacgagt      5040
+     caatgaacat tgattacgtg gtggaagact acgccgccgg ttgtctggtg gaaaaaatca      5100
+     aggtcggtga cttctccaca ccggctaagg cgaccgcaga gccgggagcg taaccgatga      5160
+     cgagtcccgc acagcgccac atgatgcggg tctcggcagc gatgaccgcg cagcgggaag      5220
+     ccgccccgct gcgacatgca actgtctatg agcagatgct ggttaagctc gccgcagacc      5280
+     agcgcacact gaaagcgatt tactcaaaag agctgaaggc cgcaaaaaaa cgcgaactgc      5340
+     tgccgttctg gttgccgtgg gtgaacggcg tgctggagct gggcaaaggt gcacaggatg      5400
+     acattctgat gacggtcatg ctgtggcgtc tggataccgg cgatattgcc ggtgcgctgg      5460
+     agattgcccg ttatgccctg aagtacggtc tgaccatgcc gggtaaacac cgccgtaccc      5520
+     cgccgtacat gttcaccgag gaggtagcgc ttgcggccat gcgcgctcac gctgccggtg      5580
+     agtctgtgga tacccgcctg ctgacggaga cccttgaact gaccgccacg gctgacatgc      5640
+     ctgatgaagt gcgcgcaaag ctgcacaaaa tcaccggtct gtttctgcgt gacggtggtg      5700
+     atgccgccgg tgcgctggcg cacctgcaac gtgcgacaca gctcgactgt caggcaggcg      5760
+     tcaaaaaaga gattgaacga ctggagcggg agctgaaacc gaagccggag ccgcagccca      5820
+     aagcggccac ccgcgccccg cgtaagaccc ggagcgtgac accggcaaaa cgtggacgcc      5880
+     cgaaaaagaa agccagttaa caaccgaatg cgccccgcgc cagggcggca cgccggtcag      5940
+     tgacggtgaa tcacctgaca ctgcaccggc gtccaccgcc cgacttttca gaggtagtca      6000
+     tgatgacgct gattattccg cgaaaggagg ctcccgtgtc cggtgagggt acggtggtca      6060
+     tcccgcaacc ggcaggcgac gagccggtga ttaaaaacac gttctttttt cccgatatcg      6120
+     acccgaagcg cgtccgggaa cgtatgcgcc ttgagcagac cgtcgccccc gcccgtctgc      6180
+     gtgaggccat caagtcaggc atggctgaaa cgaatgcgga gctgtacgag taccgcgaac      6240
+     agaaaattgc cgccggtttt acgcgtctgg ctgacgtccc ggcggacgat atcgacggtg      6300
+     aaagcatcaa ggttttttac tacgagcgcg ccgtgtgtgc gatggcgacc gcgtcgcttt      6360
+     atgagcgtta tcgcggtgtg gatgccagtg cgaaaggcga caagaaggct gacagcattg      6420
+     acagcaccat tgatgagctg tggcgggata tgcgctgggc ggtggcgcgc atccagggca      6480
+     agccgcgctg catcgtgagt caaatctgat gaagaccttt gcgctacagg gcgacacgct      6540
+     cgacgccatt tgtgtccgct attacgggcg cactgagggc gtggttgaga ccgtgctcgc      6600
+     cgcaaatccg ggactggctg aactgggggc ggtgctgcca cacggcaccg ccgtcgaact      6660
+     gcccgacgtt cagaccgcgc ccgtggctga aactgtcaat ctgtgggagt aacgcatgac      6720
+     agcagaagaa aaaagcgtcc tgtcgctttt catgattggg gtgctgattg ttgtcggcaa      6780
+     ggtgcttgcc ggtggtgaac ctatcacccc gcgtctgttt atcgggcgca tgttgctcgg      6840
+     tggttttgtc tcgatggttg ccggtgttgt tctggtgcag tttcctgacc tgtcactgcc      6900
+     agcggtgtgc ggcatcggct ccatgctggg tatcgccggt tatcaggtga ttgagattgc      6960
+     cattcagcgc cgctttaagg gcagggggaa acagtaatgc cggtaattaa cacgcatcag      7020
+     aatatcgccg cctttctcga catgctggcc gtgtccgaag ggacggcgaa tcatccactg      7080
+     acgaaaaacc ggggctatga cgtgatagtc accggactgg acgggaagcc ggaaattttc      7140
+     accgactaca gtgaccaccc gttcgcacat ggccgaccgg cgaaggtgtt taaccgtcgc      7200
+     ggtgaaaaat ccacggcctc cggtcgctat cagcagcttt acctgttctg gccgcattac      7260
+     cgcaaacagc ttgccctgcc ggatttcagt ccgttgtcac aggacagact cgccattcag      7320
+     ttgatccgcg aacgcggagc actggatgac atccgggcgg gacgcattga gcgcgccatt      7380
+     tcacgctgtc gcaatatctg ggcgtccctg ccgggtgccg gttacggtca gcgtgagcat      7440
+     tcactggaaa aactggtcac cgtctggcgt accgctggcg gcgtaccggc ttaaacggag      7500
+     taaataccat gaagaaatta tccctttcac tgatgctgaa cgtgtcgctg gcgctgatgc      7560
+     tggcactgtc cctgatttac ccgcagagcg tggccgtcaa ttttgtcgct gcctgggcga      7620
+     ttctggcgac ggttatctgt gtggttgccg gtggtgtggg cgtgtatgcc actgagtatg      7680
+     tgctggaacg ctacgggcgg gagctgccgc cggaatcgct ggccgtgaag attgtcacgt      7740
+     cgctgttttt gcagccggtg ccgtggcgca gacgggcggc ggctctggta gtggtggtgg      7800
+     cgacgtttat ctcgctggtc gctgccgggt ggatttttac cgcgctgatt tatcttgtgg      7860
+     tgtcgctgtt tttccggctg atacgtaaag cctgtcgtca gcgtcttgag gggcgggaac      7920
+     catgtcaagg ctgatgattg tgctggtcgt gttgttatcg ctggcggtgg ccggtctgtt      7980
+     tctggtgaaa cacaaaaatg ccagcctgcg cgcctcgctg gacagggcga acaacgtcgc      8040
+     cagcggtcag cagacgacca tcaccatgct gaaaaatcag cttcatgttg cgctcaccag      8100
+     ggcagataaa aacgagctgg cgcaggtggc actgcgtcag gaactggaga acgccgcgaa      8160
+     acgtgaagca cagcgcgaga aaaccatcac gaggttactt aatgagaacg aagattttcg      8220
+     ccgctggtac ggtgctgacc tgcctgatgc tgtgcgccgg ttgcaccagc gccccgcctg      8280
+     caccgacgcc agtgattgtc cccaacgcat gcccgaaagt gagcctttgc ccgatgccgg      8340
+     gcagtgaccc gcagacgaac ggcgatttaa gtgccgatat ccggcagctt gagaacgcgc      8400
+     tggcacgctg tgccagccag gtaaaaatga ttaaacactg tcaggacgaa aacgatgctc      8460
+     aaacccgaca gcctgcgcag ggcgctgact gatgccgtca cggtgctgaa aactaacccc      8520
+     gatatgctgc ggatattcgt ggataacggg agtattgcct ccacactggc ggcgtcgctg      8580
+     tcattcgaaa agcgttacac gctcaatgtg attgtgaccg actttaccgg tgattttgac      8640
+     ctgctcattg tgccggtgct ggcgtggctg cgggaaaatc agcccgacat catgaccacc      8700
+     gacgaaggcc agaaaaaggg cttcacgttt tatgcagaca tcaacaatga cagcagcttt      8760
+     gatatcagta tcagcctgat gctgaccgag cgcacgctgg tcagtgaggt ggacggcgca      8820
+     ctgcatgtga agaatatctc ggaacccccg ccgccggagc cggtcacccg cccgatggag      8880
+     ctgtatatca atggcgaact ggtgagtaag tgggatgaat gagtttaagc gttttgaaga      8940
+     ccggctgacc ggactgattg aatcgctgtc accgtcaggg cgtcggcgac tgagtgccga      9000
+     actggcgaaa cgtctgcggc agagtcagca gcgtcgggtg atggcacaga aagccccgga      9060
+     cggcacaccc tacgcgccac gccagcagca gagcgtcaga aaaaagaccg gtcgcgttaa      9120
+     gcgaaaaatg tttgcgaaac ttattaccag tcgttttttg catatccgtg ccagcccgga      9180
+     gcaggcatca atggaatttt acggcgggaa gtcgccgaaa atcgccagtg tgcatcagtt      9240
+     tggtctgtcg gaagaaaacc ggaaagacgg taagaaaatt gattatccgg cgcgtcccct      9300
+     gctcggcttt accggtgagg atgtgcagat gattgaagag attatcctgg ctcaccttga      9360
+     gcgttagttt tatccaggca gaggctgatg cgcaattaaa cattgagcgg ccatgctggt      9420
+     cgctcaatgt ttagaggttt atgagtgatt tttatttgat gctttgtatt ctaaaacctt      9480
+     cttattggcg taaaagaatt ttgtatatga caggaatata accagacctg aagtgaaata      9540
+     gacgagggat agtattaata atgctttttt gtgactgtta ttatctttaa tctcctggct      9600
+     taaccattcg gagtcctcct cgtttagctg taagagctta ttgcaggcga tctcaggaag      9660
+     tgtgtctttt ataaatacgt tttgcagtct cttgcaatcg gcaaggctat aagttttatt      9720
+     aaattcaact gctttatttt tgaaggataa aagaactttg tcactataaa catagtacat      9780
+     catgttttta tatggtatgc ctgtggcatc ccttactata acggattgtt cgttgtgtat      9840
+     gtaacatgcg aggagaatgt aaaaaatact ggccagaatt acaattattg ttttaattat      9900
+     gtgtggtggt tttgttatgt caccccagat acgagtaagg aaaaaatacg atgtttttag      9960
+     ttttccatca atcagtccct gctgtatcat tctcacattt tcaatgcctg atacattgat     10020
+     tccgttaatt attttaaata gttgaatgtc gcgccactcg cggtcaagtc tttttaattt     10080
+     tttgtctgaa tatccaaaat tgaaataatg tgcaataagc ctcataaggt tacttttacc     10140
+     aaagctaaaa aatgctaata ctgcaaagct acaaaggaaa aaaacgatta gcccccacac     10200
+     attagtcaca ttatagctga ccattacgct ctccttgaat gttgtctggt agttctacaa     10260
+     atgaatccag atagcataac ttttatatat tgtgcaatct cacatgcatg aacactctcg     10320
+     caaatattca ggaactcgcg cgcgcactgc gcaacatgat tcgcactggc attatcgtcg     10380
+     aaaccgacct taacgccggt cgctgccgcg tgcagaccgg cggcatgtgc accgactggc     10440
+     ttcagtggct gacccatcgc gcaggacgtt cgcgcacatg gtgggcacct tccgtggggg     10500
+     aacaggtgct gattctggcc gtgggtggtg aactcgacac ggcgttcgtt ctgccgggga     10560
+     tttattccgg cgataacccc tcgccgtctg tgtcggcgga tgccctgcat atccgtttcc     10620
+     ctgacggggc ggtgattgaa tatgaacccg aaaccagtgc actcacggta agcggaatta     10680
+     aaacggccag cgtgacggct tccggttctg ttactgccac ggtgccggtg gtcatggtga     10740
+     aagcatcaac ccgcgtcacc ctggacaccc cggaggtggt ctgcaccaac aggctgatta     10800
+     ccggcacgct ggaagtgcag aaaggcggga cgatgcgcgg caacattgaa cacaccggcg     10860
+     gtgaactctc atcaaacggt aaggtactgc atacccataa acaccccggc gacagcggcg     10920
+     gcacaaccgg gagtccttta tgacagcgcg ttatctcgga atgaatcgca gtgatggcct     10980
+     gactgtcact gaccttgagc atatcagcca gagtatcggc gatatcctgc gcacaccggt     11040
+     cggctcacgg gtgatgcgtc gtgattacgg ctcgttgctg gcgtcaatga ttgaccagcc     11100
+     gcagaccccg gcgcttgagt tgcagattaa agtcgcctgt tacatggcag tgctgaaatg     11160
+     ggaaccccgc gtcaccctgt catccgtcac cacggcgcgc agttttgacg ggcgaatgac     11220
+     ggtcacgtta accggccagc acaacgacac cggccagcca ctttcattaa ccatccctgt     11280
+     gagttgaaac catgccgatt atcgacctga accagctacc cgcaccggat gtggtcgagg     11340
+     agctggactt tgaaagcatt ctcgctgaac gcaaggcgac actgatttcc ctttacccgg     11400
+     aagatcagca ggaggcggtc gcccgtaccc tgacactgga atctgagcct ctcgtcaaac     11460
+     tgctggaaga aaatgcttat cgtgagctta tctggcgtca gcgtgtgaat gaggccgcac     11520
+     gggcggtgat gctggcctgt gccgccggta atgaccttga tgtgattggt gccaattaca     11580
+     acaccacgcg cctgactatc accccggcag atgattcgac catcccgccg acaccggcag     11640
+     tgatggaatc tgacaccgat tatcgtctgc gtattcagca ggcttttgag ggcttaagcg     11700
+     tcgccgggtc agtgggagcc tatcagtatc atggtcgcag tgctgacggg cgtgtcgcgg     11760
+     atatttctgt caccagtccg tctccggcct gtgtcaccat ctctgtgctg tcacgtgaaa     11820
+     ataacggcgt cgcatccgaa gacctgctgg ctgtggtgcg taacgccctt aatggcgagg     11880
+     acgtcaggcc ggtggccgac cgcgtgaccg tgcagtctgc cgccatcgtt gaataccaga     11940
+     taaacgccac gctttacctt taccctggtc ccgaaagcga acccatccgc gctgccgctg     12000
+     tgaaaaagct ggaagcgtat atcacggcac agcaccggct ggggcgcgac atccgtctgt     12060
+     ctgccattta tgccgctttg catgtggaag gtgtgcagcg tgtcgaactg gctgcaccac     12120
+     tggccgacat cgtgctcaac agtacgcagg cgtctttctg taccgaatac cgcgtcgtga     12180
+     ccggaggctc ggatgagtga ttcgcgactg ctgccgaccg gctcatcacc gcttgaggtc     12240
+     gccgccgcaa aagcctgtgc ggaaattgaa aaaacgccgg tcagtattcg tgaactgtgg     12300
+     aacccggaca cctgtccggc aaatctgctg ccgtggctgg cgtgggcgtt ttcggtcgac     12360
+     aggtgggatg aaaagtggcc ggaagcgaca aaacgcgccg ttatccgcga tgcctatttc     12420
+     atccactgtc ataagggcac gataggtgca atccggcgtg tggtggagcc gctcggctat     12480
+     ctcatcaacg tgacggagtg gtgggaaaac agtgacccgc ccggcacctt ccggcttgat     12540
+     attggtgtac tggaaagcgg tatcacagag gcaatgtatc aggaaatgga acggctgatt     12600
+     gctgatgcca aacctgcaag ccgtcacctt attggcctga acattacccg ggacattccc     12660
+     ggctatctgt tcgccggtgg tgtggcttac gacggcgatg taattacggt ttaccccgga     12720
+     taagtgagga ataatgagca taaaattcag aaccgttatc accactgccg gtgcagcaaa     12780
+     gctggcagcg gcaaccgcgc cgggaaggcg gaaggtcggc attaccacga tggccgtcgg     12840
+     ggatggcggt ggtaaattgc ctgtcccgga tgccggacag accgggctta tccatgaagt     12900
+     ctggcgacat gcgctgaaca aaatcagcca ggacaaacga aacagtaatt atattatcgc     12960
+     cgagctggtt attccgccgg aggtgggcgg tttctggatg cgtgagcttg gcctgtacga     13020
+     tgatgcggga acgttaattg ccgtggcgaa catggccgaa agctataagc cagcccttgc     13080
+     cgaaggctca ggacgttggc agacctgtcg catggtcatc atcgtcagca gtgtggcctc     13140
+     agtggagctg accattgaca ccacaacggt gatggcgacg caggattacg ttgatgacaa     13200
+     aattgcagag cacgaacagt cacgacgtca cccggacgcc tcgctgacag caaaaggttt     13260
+     tactcagtta agcagtgcga ccaacagcac gtctgaaaca ctggccgcaa cgccgaaagc     13320
+     ggtaaaggcc gcgtatgacc tggctaacgg gaaatatacc gcacaggacg ccaccacagc     13380
+     gcgaaaaggc cttgtccagc ttagtagcgc caccaacagc acgtctgaaa cgctcgccgc     13440
+     aacaccaaaa gccgttaaga cggtaatgga tgaaacgaac aaaaaagcgc cattaaacag     13500
+     ccctgcactg accggaacgc caacgacgcc aactgcgcga cagggaacga ataatactca     13560
+     gatcgcaaac acggctttcg ttatggccgc gattgccgcc cttgtagact cgtcgcctga     13620
+     cgcactgaat acgctgaacg agctggcggc ggcgctgggc aatgacccga attttgctac     13680
+     caccatgact aatgcgcttg cgggtaagca accgaaagat gctaccctga cggcgctggc     13740
+     ggggcttgct actgcggcag acaggtttcc gtattttacg gggaatgatg ttgccagcct     13800
+     ggcgaccctg acaaaagtcg ggcgggatat tctggctaaa tcgaccgttg ccgccgttat     13860
+     cgaatatctc ggtttacagg aaacggtaaa ccgagccggg aacgccgtgc aaaaaaatgg     13920
+     cgataccttg tccggtggac ttacttttga aaacgactca atccttgcct ggattcgaaa     13980
+     tactgactgg gcgaagattg gatttaaaaa tgatgccgat ggtgacactg attcatacat     14040
+     gtggtttgaa acgggggata acggcaatga atatttcaaa tggagaagcc gccagagtac     14100
+     cacaacaaaa gacctgatga cgttgaaatg ggatgcacta aatattcttg ttaatgccgt     14160
+     cattaatggc tgttttggag ttggtacgac gaatgcacta ggtggtagct ctattgttct     14220
+     tggtgataat gataccggat ttaaacagaa tggagacggt attcttgatg tttatgctaa     14280
+     cagtcagcgt gtattccgtt ttcagaatgg agtggctatt gcttttaaaa atattcaggc     14340
+     aggtgatagt aaaaagttct cgctatccag ctctaataca tccacgaaga atattacctt     14400
+     taatttatgg ggtgcttcca cccgtccagt ggttgcagag ttaggcgatg aggccggatg     14460
+     gcatttctat agccagcgaa atacagataa ctcggtaata tttgctgtta acggtcagat     14520
+     gcaacccagc aactggggaa attttgattc ccgctatgtg aaagatgttc gcctgggtac     14580
+     gcgagttgtt caattgatgg cgcgaggtgg tcgttatgaa aaagccggac acacgattac     14640
+     cggattaaga atcattggtg aagtagatgg cgatgatgaa gccatcttca ggccgataca     14700
+     aaaatacatc aatggcacat ggtataacgt tgcgcaggtg taagttatgc agcatttaaa     14760
+     gaacattaag tcaggtaatc caaaaacaaa agagcaatat cagctaacaa agaattttga     14820
+     tgttatctgg ttatggtccg aagacggaaa aaactggtat gaggaagtga agaactttca     14880
+     gccagacaca ataaagattg tttacgatga aaataatatt attgtcgcta tcaccagaga     14940
+     tgcttcaacg cttaatcctg aaggttttag cgttgttgag gttcctgata ttacctccaa     15000
+     ccgacgtgct gacgactcag gtaaatggat gtttaaggat ggtgctgtgg ttaaacggat     15060
+     ttatacggca gatgaacagc aacaacaggc agaatcacaa aaggccgcgt tactttccga     15120
+     agcggaaaac gttattcagc cactggaacg cgctgtcagg ctgaatatgg cgacggatga     15180
+     ggaacgtgca cgactggagt catgggaacg ttacagcgtt ctggtcagcc gtgtggatcc     15240
+     tgcaaatcct gaatggccgg aaatgccgca ataagttgta tgacctctgt tgtgaactta     15300
+     catatctatg gcacagagta aagcctaatc tgaagtccac tctgtgccaa aagcggacct     15360
+     tataaacaag aacaatggtc atatcagtgt gttttgattg catagctaac gtgcgtcttc     15420
+     ctgtacagaa tcataagatg atagggcata ggagatgatt attatcgcgt gttttaaaaa     15480
+     tagctttctg catcaagtgt cacttgcgaa gaggtattgg cgctatgatt ggcatcactc     15540
+     agttcagata atattttaaa tatttggtaa atgttcagat tacacaattc ggtctgcgtc     15600
+     ccgttaaaat tatctactat tagttattac tatgaggtga atggcaagtg ttttccactc     15660
+     gccatttttg ttttttattt ttttaaagcc tttccgacgt ttaaggattt tgccaagcca     15720
+     taaaatattt gatatttcat tcctgttttt atttttggtg agatatttgc gtaacttctt     15780
+     tctctaaaac accaacgtat aaacctatta ttatcttcgg ttgtttctat atagcatatt     15840
+     acattgagac caaaaagaaa ctgaaggaag tcatttgcag ttgtcatgaa ttttggtttt     15900
+     gttgtggaaa tggaactaat atgagtttca agttgtttat atgctaagag gtattcagcg     15960
+     taatcaaaag tatcttttcc agagaggaat tcaaagaact ttaaaaaaat ctcataatgt     16020
+     tcacttccat aataaaatga taaatgatct tttatttctc caagtaaata gttagagtaa     16080
+     tctctttgca tgctaggact ttcaaagtca tctagactaa attgattttt cccatcatca     16140
+     ccgctggcgt gtgatttgat aatttcgagc atccgtaata tatctcttgg gcgataatat     16200
+     gaccagcgaa ggaaattaat aaatgatgtg gggtggttat aattatcatg gacgttgggt     16260
+     gaatcccaag ggaaataatg gtcccatgcc tgtccctttt taagggccat gtcttgctga     16320
+     gtcctaagca gatgatctaa tacctcaaat aattgagagc tacggtggtt aacatattct     16380
+     gtccgccagt ccaagaatac tgaattatct ctgatttttg cgttttgatt ttgtaatcct     16440
+     atggattcaa atatatctgg cctgatcaag agaacggcct tcattctccc ttttcctccc     16500
+     tttatacttg ggaagaaatc gttgttaatc tcccagactg cgtgagctaa tccttttata     16560
+     cattctagat aatcatcgta tggaattgag gaagggcgga tatcaatacc atcgataaat     16620
+     aaaatatgat tttgagataa acgtatttgg ctaaaggcct cttcaaattt tttttgtata     16680
+     taaaataaat ttatctgaaa tctgctctca gaaaaagata aagactctct ttcttcacct     16740
+     tttaaggttg catgcttatg aagtagttcg gctgcaactt ttgactcttg aacaaaactg     16800
+     agggcttgaa ttatttctgg tgaaaatgcc ttaagataat actcatctat tgcatcatta     16860
+     agtgatgaga attttgaata atttagtaac tttgaaattt tcccttcttt atctaatact     16920
+     tgttttgata ttaataaata tagaataact ttccatatgc cagagaagtc agacaaattt     16980
+     aaatgctttt cagatttaag agtgataaat ttttgatatt ctgtctctct tatatattta     17040
+     gttgtagcta gcgtattgtt aatattgtta tttgagagat agatagagta tgcggtttta     17100
+     ccagtacctt tctctcctac aagaaacgat atatttggtt cacataatct agataggtga     17160
+     ttatcacgta tgaacacttt gttaagtaat tctttattct cccttctctt ataattttca     17220
+     gcatcagcat agccaagagt tagatctttg attggtatca ttattacctc aactaaagca     17280
+     attgaaaaac atatggttat aaaaacatag cgctgctctg tcgcatattg tggatatcaa     17340
+     catatgaaat gtaaaggaac tatttgtgga tgaatgaacc gaatcgctgt agcttcggta     17400
+     gtcatctttc agacttgtat aaatgaacaa cttccgcttc tcgctcaaag gaaactgtca     17460
+     gatttgatag cttttgggct atgtaaactg tcagtcggaa aatgagtgag tacaaatcag     17520
+     ggcaggtgag cgaattgccc gccttttctt taccggtggt tgtgctgtcg attagccaac     17580
+     cgggacaaat agcctgacat ctccggcgca actgaaaata ccactcaccc attaaccacg     17640
+     gagttaaacg gatgagtgac tatcatcacg gcgtgcaggt gctggagatt aacgagggca     17700
+     cccgcgtcat ttccaccgta tccacggcca ttgtcggcat ggtctgcacg gccagcgatg     17760
+     cagatgcgga aaccttcccc ctcaataaac ctgtgctgat taccaatgtg cagagcgcaa     17820
+     tttcaaaggc cggtaaaaaa ggcacgctgg cggcatcgtt gcaggccatc gctgaccagt     17880
+     caaaaccggt caccgttgtc atgcgcgtgg aagacggcac cggtgatgac gaggaaacga     17940
+     aactcgcgca gaccgtttcc aatatcatcg gcaccaccga tgaaaacggt cagtacaccg     18000
+     gactaaaagc catgctggcg gcggagtcgg taaccggtgt taaaccgcgt attctcggcg     18060
+     tgccgggact ggataccaaa gaggtggctg ttgcactggc atcagtctgt cagaagctgc     18120
+     gtgctttcgg gtatatcagc gcatggggct gtaaaaccat ttccgaggtg aaagcctatc     18180
+     gtcagaattt cagccagcgt gagctgatgg tcatctggcc ggatttcctc gcatgggata     18240
+     cggtcaccag taccaccgcc accgcgtatg ccaccgcccg tgcgctgggg ctgcgcgcta     18300
+     aaatcgacca ggagcagggc tggcataaaa cgctgtccaa tgtcggggtg aacggtgtta     18360
+     ccggcatcag cgcatctgta ttctgggatt tgcaggagtc cggcaccgat gctgacctgc     18420
+     ttaacgagtc aggcgtcact acgctgattc gccgcgacgg tttccgcttc tggggtaacc     18480
+     gtacctgctc tgatgacccg ctgttcctct ttgaaaacta cacccgcacc gcgcaggtcg     18540
+     tggccgacac gatggctgag gcgcacatgt gggcggtgga caagcccatc actgcaacgc     18600
+     tgattcgcga catcgttgac ggcatcaatg ccaaattccg tgagctgaaa acaaacggct     18660
+     atatcgtgga tgcgacctgc tggttcagcg aagaatccaa cgatgcggaa accctcaagg     18720
+     ccggaaaact gtatatcgac tacgactata caccggtgcc tcctctcgaa aacctgaccc     18780
+     tgcgccagcg tattaccgat aaatacctgg caaatctggt cacctcggtt aacagcaatt     18840
+     aaggagcctg accgatggca atgccgcgca aactcaagtt aatgaacgtc tttctgaacg     18900
+     gctacagcta tcagggcgtt gcaaagtccg tcacgctgcc aaaactgacc cgtaagctcg     18960
+     aaaactatcg cggtgcgggg atgaacggca gcgcaccggt agacctcggc cttgatgacg     19020
+     atgcgctgtc aatggagtgg tcgctcggtg gcttcccgga ttcggttatc tgggagcttt     19080
+     acgccgcaac cggtgtggat gccgtgccga ttcgttttgc aggctcttac cagcgcgacg     19140
+     ataccggcga aacggtggcc gtcgaagtgg tcatgcgtgg acgtcagaaa gaaatcgaca     19200
+     ccggcgaggg taaacaggga gaagacactg agtcgaaaat ctccgtggtc tgcacctatt     19260
+     tccggctgac gatggacggt aaggagctgg tcgaaattga caccatcaac atgattgaga     19320
+     aggtgaacgg cgtcgatcgg ctggagcaac accgccgcaa tatcggcctg tgattttcat     19380
+     ccggtcagcc tggctggccg gttaaccctg attcagaagt gagaaaacca tgaacaaaga     19440
+     aaatgtcatt accctggaca atccggtcaa acgtggtgag caggttatcg aacaggtcac     19500
+     gctgatgaaa cccagtgccg ggacgctacg cggtgtcagt ctggctgcgg ttgcaaactc     19560
+     cgaagtcgat gcactgatta aggtgctgcc gcgcatgacg gcaccgatgc tgaccgagca     19620
+     ggaagtcgcc gcgctggaac tgcctgacct tgtggcgctg gccggtaagg tggtcggttt     19680
+     tttgtcgccg aactcggtgc agtgacgttt ccgaaaaatc tctcggtcga tgacctgatg     19740
+     gcggatgtgg cagtgatatt tcactggccg ccatcagaac tgtatcccat gagcctgacc     19800
+     gaactcatca catggcgcga aaaggcgctc cggcgaagcg gaaacacgaa tgagtaacaa     19860
+     tgtaaaatta caggtattgc tcagggctgt tgaccaggca tcccgcccgt ttaaatccat     19920
+     ccgcacagcg agcaagtcgc tgtcggggga tatccgggaa acacaaaaat cactgcgcga     19980
+     gctgaacggt cacgcatccc gtattgaggg attccgcaag accagtgcac agctcgccgt     20040
+     gactggtcat gcacttgaaa aggcacggca ggaggccgaa gcccttgcca cacagtttaa     20100
+     aaacaccgaa cgtccgaccc gtgctcaggc gaaagtcctg gaatccgcaa agcgtgcggc     20160
+     ggaggactta caggcgaaat ataaccgcct gacagattcc gttaaacgcc agcagcggga     20220
+     actggccgct gtgggaatta atacccgcaa tcttgcacat gatgagcagg gactgaaaaa     20280
+     ccgtatcagt gaaaccaccg cacagcttaa ccgtcagcgt gatgcgctgg tgcgtgtcag     20340
+     tgcgcaacag gcaaaactta acgcagtaaa acagcgttat caggccggaa aggaactggc     20400
+     cggaaatatg gcctcagtgg gcgctgccgg tgtggggatt gcggcggcgg gaacgatggc     20460
+     cggtgttaag ctactgatgc ccggttatga gtttgcgcag aaaaactcag aattacaggc     20520
+     tgtgatcgga gtggcaaaag actccgccga aatggccgca ctccgcaagc aggcgcgcca     20580
+     gctcggcgac aataccgccg cctcggcaga tgatgcagcc ggtgcgcaga ttattattgc     20640
+     gaaagccggt ggggatgttg atgccattca ggcggcaacg ccggtcacgc tgaacatggc     20700
+     gctggcgaac cgtcgcacaa tggaagaaaa cgccgccctg ctgatgggga tgaaatccgc     20760
+     ctttcagctt tcaaacgata aggtcgctca tatcggggat gttctctcca tgacgatgaa     20820
+     caaaaccgcc gccgattttg acggcatgag cgatgcgctg acctatgccg cacctgtggc     20880
+     aaaaaatgcc ggtgtcagca ttgaagaaac cgccgcaatg gtcggggcgc tgcatgatgc     20940
+     aaaaatcaca ggctcaatgg cggggacggg aagccgtgcc gtgttaagcc gcctgcaggc     21000
+     accgacggga aaagcatggg atgcactcaa agagcttgga gtgaaaacct cagacagcaa     21060
+     aggaaacacc cggccaatat ttaccattct gaaagaaatg caggccagtt ttgagaaaaa     21120
+     ccggctcggt actgcccagc aggctgaata catgaaaact attttcgggg aggaggccag     21180
+     ctcagccgct gccgtgctga tgactgccgc ctcaaccgga aagctggaca aactgaccgc     21240
+     tgcgtttaaa gcctcagacg ggaagaccgc cgagctggta aatatcatgc aggacaacct     21300
+     aggcggtgac tttaaagcgt ttcagtccgc ttatgaggcg gtggggactg acctgtttga     21360
+     ccagcaggaa ggcgcgctgc gtaagctcac gcagacggcc acaaagtatg tgttaaaact     21420
+     cgacggctgg atacagaaaa acaaatcact ggcgtcaacc atcggcatca ttgccggcgg     21480
+     tgcactggcg cttactggca tcatcggtgc cattggcctc gtagcctggc cggttatcac     21540
+     cggcatcaat gccatcatcg cggcagcagg cgcaatgggg gcagtcttca cgacggttgg     21600
+     cagtgctgtt atgaccgcca tcggggctat tagctggccg gttgtggccg tggtggctgc     21660
+     cattgtcgcc ggtgcgttgc ttatccgtaa atactgggag cctgtcagcg cattctttgg     21720
+     tggtgtggtt gaagggctga aagcggcatt tgcgccggtg ggggaactgt tcacgccact     21780
+     taaaccggtt tttgactggc tgggcgaaaa gttacaggcc gcgtggcagt ggtttaaaaa     21840
+     cctgattgcc ccggtcaaag ccacccagga caccctgaac cgttgccgtg acacgggcgt     21900
+     catgttcggg caggcactgg ctgacgcgtt gatgctgccg cttaatgcgt tcaacaaact     21960
+     gcgcagtggt attgactggg tactggaaaa actcggtgtt atcaacaaag agtcagacac     22020
+     acttgaccag accgccgcca gaactcatac cgccacgtat ggtaccggtg actatattcc     22080
+     ggcgaccagc tcttatgcag gctatcaggc ttatcagccg gtcacggcac cggctggccg     22140
+     ctcttatgta gaccagagta aaaacgaata tcacatcagc ctgacggggg ggactgcgcc     22200
+     ggggacacag cttgaccgcc agttacagga tgcgctcgaa aaatacgagc gggataaacg     22260
+     tgcgcgcgcc cgtgccagca tgatgcatga cggttaagga ggtgacgaaa aatgatgctc     22320
+     gcgttaggta tgtttgtttt tatgcgccag acgctgccac accagaccat gcagcgtgaa     22380
+     tcagattatc gctggccgtc aaattcccgt atcggtaaac gggatgcctt tcagtttctc     22440
+     ggtgtgggtg aggaaaacat cacgctggcc ggtgtgcttt atcccgaact gaccggcggc     22500
+     aagctgacga tgaccacgct caggctgatg gcagaggagg ggcgggcgtg gccgttgctg     22560
+     gatggcaccg gcatgattta cggcatgtat gtcatcagca gggtgagtga aacagggagt     22620
+     attttctttg cagacggcac accccggaaa attgatttta cgctgtcact cacccgcgtt     22680
+     gatgaatcac tggccgcgct ttatggcgat atcggtaaac aggcggaatc gctcatcggt     22740
+     aaggccggca gtatggcgac cagattcaca ggtatgacgg gggcgggata atgctggatg     22800
+     cgctgacatt tgatgcaggc agtacgctga cgccggatta catgctgatg ctcgacagca     22860
+     gggatattac cggcaatatc agcgaccgtc tgatgagcat gaccctgacg gataaccggg     22920
+     gctttgaggc tgaccagctt gatattgaac tgaacgatgc cgacgggcag gtcgggctgc     22980
+     cggttcgtgg cgctgtcctg acggtgtata tcggctggaa aggttttgcc ctggtatgca     23040
+     aagggaaatt taccgttgat gaggttgaac accggggcgc accggatgta gtcaccatcc     23100
+     gcgcccggag tgcagatttt cgcgggacgc tcaattcccg ccgggaaggc tcctggcatg     23160
+     acaccacgct cggtgcgatt gttaaggcga tagccacccg taacaggctg gaagccagtg     23220
+     tcgctccgtc actggccgga ataaaaattc cacacatcga ccagtcgcag gagtctgatg     23280
+     cgaaattcct gacccgtctt gcagaacgca acggcggtga ggtgtcggta aaaatgggaa     23340
+     aactgttgtt tctcaaagcg gggcagggag tgacggccag cggtaaaaaa atcccgcagg     23400
+     tcaccataac ccgcagcgac ggcgaccgcc atcattttgc gattgctgac cgtggagcct     23460
+     acaccggtgt aacggcaaaa tggctacaca ctaaagaccc gaagccgcaa aagcagaagg     23520
+     taaaactgaa acgcaaaaag aaagagaaac acctgcgcgc actggagcac ccgaaagcga     23580
+     aaccggtcag gcagaagaaa gcgcctaaag taccggaagc gcgtgaaggt gaatacatgg     23640
+     ccggtgaggc tgacaacgtt tttgccctga ccacggtata tgccacgaaa gcgcaggcca     23700
+     tgcgcgccgc tcaggcgaag tgggataaac tgcaacgggg cgttgcggag ttctctatca     23760
+     gcctggctac cggtcgggca gatatttaca cggaaacacc ggtcaaagtg tctggcttta     23820
+     agcgcgtcat agacgagcag gactggacaa tcactaaggt gacacatttt ctgaataata     23880
+     gcggcttcac gacgtcctta gagcttgagg tcaggctttc tgatgtggag tacgaaacag     23940
+     aagatgatga gtgatgtttt tgttttatct gtttgttttg taaggataaa ttaactaaaa     24000
+     tggcaccatc aacaaaaccg gaagaggtgc tcgcgatgtt tcattgtcct ttatgccagc     24060
+     atgccgcaca tgcgcgtaca agtcgctata tcactgacac gacaaaagag cgttatcatc     24120
+     agtgccagaa cgtgaattgc agcgccacgt tcatcactta tgagtcggta cagcgataca     24180
+     tcgtgaagcc gggagaagtc cacgccgtaa ggccgcaccc gttgccatca gggcagcaaa     24240
+     ttatgtggat gtaattacaa acagaaagcc cctcagtcga ggggcttttt tgtcgatgtg     24300
+     gtcaatgtgt ggacgtgacc agaaataaat ccttttattt caatttattg tacgtaaaaa     24360
+     ataagcccgt gtaagggaga tttagggtgt caccagtagg ggctttcaac ggtacaatgc     24420
+     gggtttgagc ggcataaatt accactgaaa gcccttaaac gttactctac tgtggacact     24480
+     gtgtggacac tctcggcctc agtaccacct cttagcggat taagagaaat ggcgtcctga     24540
+     aggtactctg gcgcaaaatg agcgtaaacc atagtttgct caatccgcgt gtgacctagt     24600
+     atccgttgta gcgtgataat acttcctcca ttaatcatga aatgagtggc aaagctgtgc     24660
+     cttagtgcat gtgtggcttg ccccattggc aaatccggtt ttattgcttt cattgttcgt     24720
+     ctgaagcgag ggtaatcagc atcagggaat aaaaaacctc gtttgttatc cgcgatcatt     24780
+     ttggcaacag cctctgagat cgggacggtg cgtggtttgt ttgttttcgt tttaacaaac     24840
+     gtgacgcggt tatggatgat attttctgct ttcaaacgag ctgcttctcc ccaacgtgct     24900
+     cctgtactca ggcaaagaat cgcaatcttt ttattgtcgc cgtcaagtgc tgcaagcagt     24960
+     aaggcaattt cttcctgtgt tagatagcct gtttctggtt tttcctcctt aagccttttt     25020
+     gtccctctga tagggtgctc accaaagaat aactccgctt caatcagggc tgtaaacatg     25080
+     ccgctaatac atgttaaatc acgattgata ctcgaaggtt taataccctg acttcttcgg     25140
+     gtggcgcagt actggctgat aagcgatttc gtaatttgaa atgcgcatgg gtcattcgtt     25200
+     atttttgtga agatttcaat ttttccaaga ttagatttcc catgctcttc gtgtttaccc     25260
+     tttaaatccc accagatctg tgtcagctcc gacagacgtc gcttgtctgt tggttttgat     25320
+     agccattctt tattgtggtg gttgtacaac gtgtatttct cgaaagcgac agcttcgctt     25380
+     ttcttatcaa acttcctacg gatgcgtttt ccattacgtc cagtagggcg gatgtccact     25440
+     tcatatcgac catcatcgag ttttttgatt gccatcagaa aaccctccga gtggtgtgtt     25500
+     tttttgcgac tactaatcgc ttttttcgtg gtggctgaaa tttagccacc aatagtaggc     25560
+     acttgtgatg aatatattca cgatgaattg ttaaccagtc ttttgaccgg agtggggcga     25620
+     cgttgtttcg ttttgcccaa agtgtgcgag agcgggcgca atttgcccgg actcaggagc     25680
+     gatctgattg gtcatgaacc ataaagtgta tttggtgaat tgtggggtct gcaggatgtt     25740
+     catcatgaca tctgttggag gtgttgaacg accactttca tagtaactca gcgtgccata     25800
+     cggaacccct gttaaatcag caagttgttg tctgctcaaa tactctgatt ttcgcattaa     25860
+     gactatcttc tcgcttatcg tgtttgacat ggtgtttaga tctcaatagt atttagttta     25920
+     gatgtagatt gtttagtgct tggatgtggg cactaaaagg cattataaga cattaaacgc     25980
+     aattcatgag ggctagagga cgacatgagc aagcaagtaa cactcatgac tgatgcgatt     26040
+     ccttatcagg agttcgcaaa actaatagga aaatcgacag gagcggttcg tcggatgatc     26100
+     gataaaggaa agctgcctgt aattgatatg accgatccac aatcagcttc aggtcgtgca     26160
+     ggtgaatatt gggtatacct tccggcatgg aataacggac taaaactggc ttatgaaagc     26220
+     cgccctaaag agattcgtga cggctggttg atgtggttag gtctcggtga accacgttaa     26280
+     ggagaaccgt atgaatgagc ctcgttgtat tgctcagtta ctgcgtaacg aaagccccag     26340
+     ggcgattgac ttcaccatca cccacggtaa ggggcgtaag ggaatcatta tccgcaccaa     26400
+     aaaacagagt ccgttaaaaa aggctctgac ctttctgaaa agccggaggg tatggaaatg     26460
+     acagtgatga cgctcaatct cgttgaaaaa cagccagcag ctatgcgccg gataattggt     26520
+     aagcatcttg ccgttcctcg ctggcaggat acatgtgatt attataatca gatgatggag     26580
+     cgcgaacggt taacggtttg cttccatgct cagttaaaac agcgtcacgc aacgatgtgt     26640
+     tttgaagaaa tgaacgacgt cgaacgtgaa cgactggtat gtgcaattga tgaattgcgt     26700
+     ggtgcattct caaaacgccg tcaggttggc gcaagtgagt atgcatatat tagtttttta     26760
+     acagtcagtc agcgtcgtac tttatttatg catgccggat tgactgaaaa agaattcaac     26820
+     cagccatact ggcgaattaa tgaagagtca tgttactggc gtgatgcttt attccgtgca     26880
+     ttacgtgaat tattcagtct gtttgagtat gcaccgacaa ttctgacgtc ggtaaaaccg     26940
+     gagcaatatc tgcattaagt aattaaccag agtttttaac gcacttaatt gtgcggggct     27000
+     tctttttgcc tggagaaagt tatgcataca gtttctgaaa atcagtgcgg tatatacgca     27060
+     ttactgctgc aacaggccag aaccgaagca caggccgacg ctgcgacgcg cttttcttct     27120
+     catcttgatg ccatgattcg ccacatcaca aaggcggagt tatcccgcgt ggagatagtc     27180
+     gagctgctca gtcaggagtc ggaaaaattt cacaatatcg gattgtctcg cggggaggtg     27240
+     ctttgatgtt ctgttctcgt gcagttgtat tactgaataa cgccttaaaa atcgccgtta     27300
+     tgaaaaatgg cgatttgtct cttattcaac ttggtcttga taaagaaaaa cgcgaaataa     27360
+     ctgaatctgt tatcgcgatt tatcagagtg aattaaacct cctgtctgat gtggtcaatt     27420
+     tacttgttaa acgcgctgta tttcacaagc aaatttcctc cgtggatgaa ctgacgaaat     27480
+     taacgacaga aatcgccagc tattgcgctg atgaatttaa aaaactgaac gacaaaagga     27540
+     actggtaatg ccggacaacg tagattttat tcaggaacaa caggctgaat tactggagcg     27600
+     ccagattaac gcggcaaggg taaaacattg cggtgcttct gcgctggttt gcgaagagtg     27660
+     tgacgcgcca atacctgctg cccgtcgtgc ggcttacccg tcagccacgc gttgtgtttc     27720
+     ctgtcagtca gtctttgaag caaaaaacaa acattaccgg agaacggcat gagtattcgt     27780
+     attgaaattg gcgaacgtta tgtcgttacc agtgacagct ttcagtttat tctccacgag     27840
+     aaaaagagag cggaaagcgg taaaaacgcc ggtcaggaat ggctggcggt ggttggttat     27900
+     tacccgaaat taagccagct cgtttcaggc ctgatgcatc acgatattct gaccggaagc     27960
+     gcaaagtctt ttgctgattt aaacgtgcag gttgagcaac tcagcaagcg ttgttcagag     28020
+     gcttttggct catatggccg ttaaagcctc cgggcgtttt gtccctccgt cagcatttgc     28080
+     cgcaggcacc ggtaagatgt ttaccggtgc ttatgcatgg aacgcgccac gcgaggccgt     28140
+     cgggcgcgaa agacccctta cacgtgacga gatgcgtcag atgcaaggtg ttttatccac     28200
+     gattaaccgc ctgccttact ttttgcgctc gctgtttact tcacgctatg actacatccg     28260
+     gcgcaataaa agcccggtgc acgggtttta tttcctcaca tccacttttc agcgtcgttt     28320
+     atggccgcgc attgagcgtg tgaatcagcg ccatgaaatg aacaccgacg cgtcgttgct     28380
+     gtttctggca gagcgtgacc actatgcgcg cctgccggga atgaatgaca aggagctgaa     28440
+     aaagtttgcc gcccgtatct catcgcagct tttcatgatg tatgaggaac tcagcgatgc     28500
+     ctgggtggat gcacatggcg aaaaagaatc gctgtttacg gatgaggcgc aggctcacct     28560
+     ctatggtcat gttgctggcg ctgcacgtgc tttcaatatt tccccgcttt actggaaaaa     28620
+     ataccgtaaa ggacagatga ccacgaggca ggcatattct gccattgccc gtctgtttaa     28680
+     cgatgagtgg tggactcatc agctcaaagg ccagcgtatg cgctggcatg agacgttact     28740
+     gattgctgtc ggggaggtga ataaagaccg ttctccttat gccagtaaac atgccattcg     28800
+     tgatgtgcgt gcacgccgcc aagcaaatct ggaatttctt aaatcgtgtg accttgaaaa     28860
+     cagggaaacc ggcgagcgca tcgaccttat cagtaaggtg atgggcagta tttctaatcc     28920
+     tgaaattcgc cggatggagc tgatgaacac cattgccggt attgagcgtt acgccgccgc     28980
+     agagggtgat gtggggatgt ttatcacgct taccgcgcct tcaaagtatc acccgacacg     29040
+     tcaggtcgga aaaggcgaaa gtaaaaccgt ccagctaaat cacggctgga acgatgaggc     29100
+     atttaatcca aaggatgcgc agcgttatct ctgccatatc tggagcctga tgcgcacggc     29160
+     attcaaagat aatgatttac aggtctacgg tttgcgtgtc gtcgagccac accacgacgg     29220
+     aacgccgcac tggcatatga tgcttttttg taatccacgc cagcgtaacc agattatcga     29280
+     aatcatgcgt cgctatgcgc tcaaagagga tggcgacgaa agaggagccg cgcgaaaccg     29340
+     ttttcaggca aaacacctta accagggcgg tgctgcgggg tatatcgcga aatacatctc     29400
+     aaaaaacatc gatggctatg cactggatgg tcagctcgat aacgataccg gcagaccgct     29460
+     gaaagacact gctgcggctg ttaccgcatg ggcgtcaacg tggcgcatcc cacaatttaa     29520
+     aacggttggt ctgccgacaa tgggggctta ccgtgaacta cgcaaattgc ctcgcggcgt     29580
+     cagcattgct gatgagtttg acgagcgcgt cgaggctgca cgcgccgccg cagacagtgg     29640
+     tgattttgcg ttgtatatca gcgcgcaggg tggggcaaat gtcccgcgcg attgtcagac     29700
+     tgtcagggtc gcccgtagtc cgtcggatga ggttaacgag tacgaggaag aagtcgagag     29760
+     agtggtcggc atttacgcgc cgcatctcgg cgcgcgtcat attcatatca ccagaacgac     29820
+     ggactggcgc attgtgccga aagttccggt cgttgagcct ctgactttaa aaagcggcat     29880
+     cgccgcgcct cggagtcctg tcaataactg tggaaagctc accggtggtg atacttcgtt     29940
+     accggctccc acaccttctg agcacgccgc agcagtgctt aatctggttg atgacggtgt     30000
+     tattgaatgg aatgaaccgg aggtcgtgag ggcgctcagg ggcgcattaa aatacgacat     30060
+     gagaacgcca aaccgtcagc aaagaaacgg aagcccgtta aaaccgcatg aaattgcacc     30120
+     atctgccaga ctgaccaggt ctgaacgatt gcagatcacc cgtatccgcg ttgaccttgc     30180
+     tcagaacggt atcaggcctc agcgatggga acttgaggcg ctggcgcgtg gagcaaccgt     30240
+     aaattatgac gggaaaaaat tcacgtatcc ggtcgctgat gagtggccgg gattctcaac     30300
+     agtaatggag tggacatgat ggcaaaaatt cacgaggtaa agctgcacgc aaaatatttc     30360
+     gaccttgtac tggaaggaaa gaaacgcgca gagtttcgga aaaaagatcg taattatgag     30420
+     cgcggggaca cgttgatttt gcatgaatgg gtgcagggtg tgtttacggg gcgaaaggtt     30480
+     gaagcccgga taacagatgt tactgacctg tcagactggc tggaagatta tgtcttgctg     30540
+     cacagaatac taggtgagat actgccgctg actgtcaagc tggcagtatc ctccacattt     30600
+     tttataaatc taaggcgaag aacggtggca atatatttgc tttaaattgt aaataagcaa     30660
+     attattctaa gccacaaatg atatcaattg agtatcgatt ttcgttcgaa tataaccata     30720
+     acgccaagcg tcaaatgtaa gtcatctata tgtgattcgt attcatattg gtcagcatca     30780
+     ggagatagta aatgctctgc tgctgtaaaa acatcaattg taacagatat atcgtctgga     30840
+     atttcttcat ttaattcgga tatgtatttt ttatatttgt tttttaattt ccttatcatg     30900
+     tcttccttat ggtggattgt agtgcagtaa ttttttttag ttgaatcatt gtatgaatgg     30960
+     aatgaacagt ttaatgctag gccaagactt gaatttcctg tagggcctgt gtgtttaaag     31020
+     tattcaagat ttcttcttat gtcagaaaat aaaagacttt tacagggggc atttccttta     31080
+     acttctattg cacatattgg aatgtcgaaa aatggtctgc tgtccaatat ggcaatatca     31140
+     attctgcctg atcttgttgt gtttgtgttt tttctgacag ttttttttga gaatattttt     31200
+     tgggggtcag accgtttcga taaaggaact gttgcattaa tgaatttatt tgtatggtac     31260
+     tcaaatataa ctttgtaatc accatggcga aaagatttta tttctaacaa cgatagacct     31320
+     atagatacgg tagctacata ttcagtgttt atttttgcac cagacctgaa atccattaaa     31380
+     taagttgcgt cggctgactt tttcattcca tcttttacag ctttcacaat atccatgtta     31440
+     ttcatatcaa caccttttat attccagaat tataaatctt aatgattgat ttgtttgtgt     31500
+     gtttaggtta ctagattgac gtacttatag cacattctga ttttgaaatc accatccttg     31560
+     ggtaaagcac agcctatcac tattggttta gtactgtgct gtaatagtat cagattaagt     31620
+     taaatccatt ttatgaaatc ttccatttca tcatattttt ttattactgc tctaacatct     31680
+     ttgctttcat cacataaaca atctaaaaga ctatcccatt cagtttgttt tttaccaaat     31740
+     ccataaacag cctctatatc accggatttc catatataga ttccgttatc tttcaatttt     31800
+     tgatgtattt catgtatatg cttttgtgtt ttttcatggt tacatatttt gatgaagtct     31860
+     ttgcttgaaa tgcttttgaa tgactcaaaa gtagtaactt ttgtatttaa actaagctct     31920
+     cctgagttga ttgattcaat caaagcagtc aatagattat cacattcagt actaagtaag     31980
+     tctttatgct ctgttaatag aatatttgat aagaaatcac aatcagctag aatccttgtt     32040
+     tttatgccga tggcattgat gatttgtgac atcttaaata aactaccctt accgtcaacg     32100
+     gcaacaatgc agattttact cgggttgagt tcatgtccgt taattttttt ataaagtgca     32160
+     tatagaacgt ttgtctctgt tttcccttca acaagcaaaa cttcttcaga aaataaaagg     32220
+     tatgatgaat tagaaagcgt gaatgctgag tgcaattgcg gtgatgaaga tttatataat     32280
+     tcttcgattt tttcagatat agtcttcctt gctatggttc cattagaatc cttacaaacc     32340
+     tgaatcgcat ttgctgcatg ctttgcagaa agcatactgg ctgagtgagt tgatattata     32400
+     acctgatacc ctgattcact taatgtgaca agtgattctc tgacagaatt aatggctgaa     32460
+     gggtgtaaat ataactcagg ttcatcaatg aaaatcaaag tgtttgattt ttttgattcg     32520
+     ctgttttctt tttttatttc ggccaggtat tgaattaatg ccatttgaat ggaacgttgt     32580
+     gttccgtgac caaatcggct gatatctctc attaccggtt catcttcccg agactcaaaa     32640
+     actttcagag tgccggattt aaatatctca tctaatgtcg gtgtgggaaa gtgtaacttt     32700
+     acacttacgt caggaaaaaa ttggtttact tttttattta cacctgagtc tattttatta     32760
+     aggctttcta atctgttctc accgttgtga gaaagatatt tacctatttc tgatatgttt     32820
+     tttgaaaatt tttcttcgtg ttcttgtttt atttcagaaa caattgcgga aagtatcttt     32880
+     cctattgtgg tcgtgttttt gcattttgtt gagtcttcga cagcgtcaga cattgcaggg     32940
+     atatgaattg gttccggaaa tatattggag attgcaccat ctatgccgcc agggtttttc     33000
+     ttccacgtgg taccgtcata tacatccaga ctttttttgg cttttcctgt ttccttatta     33060
+     aattcctgtc ttcttgcaaa ggtaagagtc ccgtcaatta taaacggagc tattttttgt     33120
+     tgattctctt ctgttaacaa agacagagta tcatctgtta taccttgaat aacgccttca     33180
+     acggatacgg ggtgtgtagg atcgtacaca tctgattctg aaatcaaaga gccatctaac     33240
+     agccacttaa ttgctaagat aatatttgat tttcctgcgt tattataacc aactaaagca     33300
+     gtgaaggggc gcaaaatagc cgatgttgac ttacaagaac gaaagttgct aattgaaact     33360
+     gaagcaagac gtacagtcat tatttttcct taaatgtgct atttgtatgc aatgagttca     33420
+     tacgaaacgc ttttttacat tttatagtcg ttgcattcaa gggtgcatga gattgcatta     33480
+     agggaaactg tgatatggct tggcttttga ctggaaatac tgatggctca ttagttttat     33540
+     taaggtgcat taaaaccgcc ccgtgaagcg ggcgggcgag gcggggaaag cac            33593
+//
diff --git a/etc/af063097.fasta b/etc/af063097.fasta
new file mode 100644
index 0000000000000000000000000000000000000000..8ed33789edf8bdca99328c641c5b29fc75ec7e2d
--- /dev/null
+++ b/etc/af063097.fasta
@@ -0,0 +1,561 @@
+>AF063097 AF063097 Bacteriophage P2, complete genome.
+ggcgaggcggggaaagcactgcgcgctgacggtggtgctgattgtattttttcagcgtct
+cagcgcgtcgtgacggcacttagtctgcccgttgaggcgttgtgtgtctgcggggtgttt
+tgtgcggtggtgagcgtgtgaggggggatgacggggtgtaaaaaagccgcccgcaggcgg
+cgatgttcagtcgttgtcagtgtccagtgagtagtttttaaagcggatgacctcctgacc
+gagccagccgtttatctcgcggatcctgtcctgtaacgggataagctcattgcggacaaa
+gacctttgccactttctcaatatcacccagcgacccgacgttctccggcttgccacccat
+caactgaaaggggatgcggtgcgcgtccagcaggtcagcggcgctggcttttttgatatt
+aaaaaaatcgtccttcgtcgccacttcactgagggggataattttaatgccgtcggcttt
+cccctgtggggcatagagaaacaggtttttaaagttgttgcggcctttcgacttgaccat
+gttttcgcgaagcatttcgatatcgttgcgatcctgcacggcatcggtgacatacatgat
+gtatccggcatgtgcgccattttcgtaatacttgcggcggaacaacgtggccgactcatt
+cagccaggcagagttaagggcgctgagatattccggcaggccgtacagctcctgattaat
+atccggctccagcaggtgaaacacggagccgggcgcgaaggctgtcggctcgttgaagga
+cggcacccaccagtaaacatcctcttccacgccacggcgggtatattttgccggtgaggt
+ttccagtctgatgaccttaccggtggtgctgtaacgcttttccagaaacgcattaccgaa
+caccagaaaatccagcacaaagcggctgaaatcctgctgggaaagccatggatgcgggat
+aaatgtcgaggccagaatattgcgtttgacgtaaatcggcgagctgtgatgcacggcagc
+ccgcaggctttttgccagaccggtaaagctgaccggtggctcataccatctgccgttact
+gatgcactcgacgtaatccagaatgtcacggcggtcgagtaccggcaccggctcaccaaa
+ggtgaatgcctccattttcgggccgctggcggtcattgtttttgccgcaggttgcggtgt
+tttcccttttttcttgctcatcagtaaaactccagaatggtggatgtcagcggggtgctg
+ataccggcggtgagtggctcatttaacagggcgtgcatggtcgcccaggcgaggtcggcg
+tggctggcttcctcgctgcggctggcctcataggtggcgctgcgtccgctgctggtcatg
+gtcttgcggatagccataaacgagctggtgatgtcggtggcgctgacgtcgtattccaga
+cagccacggcggataacgtcttttgccttgagcaccattgcggttttcatttccggcgtg
+tagcggatatcacgcgcggcgggatagaacgagcgcacgagctggaacacgccgacaccg
+aggccggtggcatcaataccgatgtattcgacgttgtatttttcggtgagtttgcggatg
+gattccgcctgggtggcaaagtccatgcctttccactggtgacgctcaagtattctgaat
+ttgccaccggccaccaccggcggtgccagtaccacgcatccggcgctgtcgccacggtgt
+gacgggtcgtaaccaatccataccgggcgggagccgaacggattggcggcaaacggcgca
+tagtcttcccattcttccagcgtgtcgaccatgcagcgttgcagctcctcgaacgggaac
+accgatgccttgtcgtcaacaaattcacacatgaacaggtttttaaaatcgtcggcgctg
+ttttcgcgtttgagctgctcaatgtcgaacagcgtgcagccgcctttcagggcgtcctca
+atggtgacaatctgtcgccactggccgtccgcacagagaagcccaccggcaagggcgtta
+tgactgacgtcgatttccacgcgttcggcggcgctggcgcgtccccggttaaacagttca
+cccgaccagaacgggtaggcgtcgtgcgccagcgtggacggggtggagaaataggtcgag
+cgcaggtgactctgtgaggccatacctgatgccaccttacgcagtacctgaaaattcggg
+atccagaaaatctcatcgacgtacaggtcgccgttatgactctgcgcggtgttggagttg
+gtgccgagaaaaatcagttttgcgccgttattgcccaggacaatcgggtcaccggtcagg
+tcaacgtcaaccagacgggcaaaggcgatgatgtattcgcggaacacatacgcctgtgtt
+ttactggccgacagaaaaatctggttatgaccggttttcagggcacgcagcagcgcctcg
+cgggaaaaataaaacgtcgcgccaatctggcgggatttcaggatatcgcggatgcggtgc
+tcaagcccggcacgataccagtgcagctgatagtcgaaagactgctcaaagaaaatctgc
+tccagcttttcgatggcctcgtcactgaaaaaattctttttcggtttgcgccgtccgcct
+ttgttacggttagcgacgttcggattaaggtctgcctcgttgccggtctggctgtagcgg
+ttgacccgtgccagtcgttcaatctggcgtcccagcaggtcaatttccttgaagtcaccg
+ccggttttctgtggtttgatgatgagctgggtcagccgcgcttccagactcatttcgaca
+cggctgatgggggcaacgctgtcccagccgtcgcgctgtttccagctctgcactgtcggg
+cgtttcatctgcaacatggcggcaatctgcggcacggaaaacccctgccagtacagcagc
+gccgcctgacgacgcgggtcgtgtaaaagagtggtgtctgtggtgatggtcatgaatacc
+tcgccgtgatgaatacacggcaaggctactgagtcgcgccccgcgattcgctaaggtgct
+gttgtgtcagtgataagccatccgggactgatggcggaggatgcgcatcgtcgggaaact
+gatgccgacatgtgactcctctaatcactattcaggactcctgacaatggcaaaaaaagt
+ctcaaaattctttcgtatcggcgttgagggtgacacctgtgacgggcgtgtcatcagtgc
+gcaggatattcaggaaatggccgaaacctttgacccgcgtgtctatggttgccgcattaa
+cctggaacatctgcgcggcatcctgcctgacggtatttttaagcgttatggcgatgtggc
+cgaactgaaggccgaaaagattgacgatgattcggcgctgaaaggcaaatgggcgctgtt
+tgcgaaaatcaccccgaccgatgaccttatcgcgatgaacaaggccgcgcagaaggtcta
+cacctcaatggaaattcagccgaactttgccaacaccggcaaatgttatctggtgggtct
+ggccgtcaccgatgacccggcaagcctcggcacggaatacctggaattctgccgcacggc
+aaaacacaaccccctgaaccgcttcaaattaagccctgaaaacctgatttcagtggcaac
+gcctgttgagctggaatttgaagacctgcctgaaaccgtgttcaccgccctgaccgaaaa
+ggtgaagtccatttttggccgcaaacaggccagcgatgatgcccgtctgaatgacgtgca
+tgaagcggtgaccgctgttgctgaacatgtgcaggaaaaactgagcgccactgagcagcg
+cctcgctgagatggaaaccgccttttctgcacttaagcaggaggtgactgacagggcgga
+tgaaaccagccaggcattcacccgcctgaaaaacagtctcgaccacaccgaaagtctgac
+ccagcagcgccgcagcaaagccaccggcggtggcggtgacgccctgatgacgaactgctg
+accggcgtcagtcagtccgggaaaaccttcacgattaacccttaatttcaggaaaaacta
+tgcgccaggaaacccgctttaaatttaatgcctacctgtcccgtgttgccgaactgaacg
+gcatcgacgccggtgatgtgtcgaaaaaattcaccgttgaaccgtcggtcacccagaccc
+tgatgaacaccatgcaggagtcctctgactttctgacccgcatcaatattgtgccggtca
+gcgaaatgaaaggggaaaaaattggtatcggtgtcaccggctccatcgccagcactaccg
+acactgccggtggtaccgagcgtcagccgaaggacttctcgaagctggcgtcaaacaagt
+acgaatgcgaccagattaacttcgatttttatatccgctacaaaacgctggacctgtggg
+cgcgttatcaggatttccagctccgtatccgtaacgccattatcaaacgccagtcccttg
+atttcatcatggccggttttaacggcgtgaagcgtgccgaaacctctgaccgcagcagca
+atccgatgttgcaggatgtggcggtcggctggctgcagaaataccgcaatgaagcaccgg
+cgcgcgtgatgagcaaggtcactgacgaggaaggccgcaccacctctgaggttatccgcg
+tgggtaagggcggtgattatgccagccttgatgcactggtgatggatgcgaccaacaacc
+tgattgaaccgtggtatcaggaagaccctgaccttgtggtgattgtggggcgtcagctac
+tggcggacaagtatttccccatcgtcaacaaggagcaggacaacagcgaaatgctggccg
+ctgacgtcatcatcagccagaaacgcatcggtaacctaccagcggtacgcgtcccgtact
+tcccggcggatgcgatgctcatcacgaagctggaaaacctgtccatctactacatggatg
+acagccatcgccgcgtgattgaggaaaacccgaaactcgaccgcgtggagaactacgagt
+caatgaacattgattacgtggtggaagactacgccgccggttgtctggtggaaaaaatca
+aggtcggtgacttctccacaccggctaaggcgaccgcagagccgggagcgtaaccgatga
+cgagtcccgcacagcgccacatgatgcgggtctcggcagcgatgaccgcgcagcgggaag
+ccgccccgctgcgacatgcaactgtctatgagcagatgctggttaagctcgccgcagacc
+agcgcacactgaaagcgatttactcaaaagagctgaaggccgcaaaaaaacgcgaactgc
+tgccgttctggttgccgtgggtgaacggcgtgctggagctgggcaaaggtgcacaggatg
+acattctgatgacggtcatgctgtggcgtctggataccggcgatattgccggtgcgctgg
+agattgcccgttatgccctgaagtacggtctgaccatgccgggtaaacaccgccgtaccc
+cgccgtacatgttcaccgaggaggtagcgcttgcggccatgcgcgctcacgctgccggtg
+agtctgtggatacccgcctgctgacggagacccttgaactgaccgccacggctgacatgc
+ctgatgaagtgcgcgcaaagctgcacaaaatcaccggtctgtttctgcgtgacggtggtg
+atgccgccggtgcgctggcgcacctgcaacgtgcgacacagctcgactgtcaggcaggcg
+tcaaaaaagagattgaacgactggagcgggagctgaaaccgaagccggagccgcagccca
+aagcggccacccgcgccccgcgtaagacccggagcgtgacaccggcaaaacgtggacgcc
+cgaaaaagaaagccagttaacaaccgaatgcgccccgcgccagggcggcacgccggtcag
+tgacggtgaatcacctgacactgcaccggcgtccaccgcccgacttttcagaggtagtca
+tgatgacgctgattattccgcgaaaggaggctcccgtgtccggtgagggtacggtggtca
+tcccgcaaccggcaggcgacgagccggtgattaaaaacacgttcttttttcccgatatcg
+acccgaagcgcgtccgggaacgtatgcgccttgagcagaccgtcgcccccgcccgtctgc
+gtgaggccatcaagtcaggcatggctgaaacgaatgcggagctgtacgagtaccgcgaac
+agaaaattgccgccggttttacgcgtctggctgacgtcccggcggacgatatcgacggtg
+aaagcatcaaggttttttactacgagcgcgccgtgtgtgcgatggcgaccgcgtcgcttt
+atgagcgttatcgcggtgtggatgccagtgcgaaaggcgacaagaaggctgacagcattg
+acagcaccattgatgagctgtggcgggatatgcgctgggcggtggcgcgcatccagggca
+agccgcgctgcatcgtgagtcaaatctgatgaagacctttgcgctacagggcgacacgct
+cgacgccatttgtgtccgctattacgggcgcactgagggcgtggttgagaccgtgctcgc
+cgcaaatccgggactggctgaactgggggcggtgctgccacacggcaccgccgtcgaact
+gcccgacgttcagaccgcgcccgtggctgaaactgtcaatctgtgggagtaacgcatgac
+agcagaagaaaaaagcgtcctgtcgcttttcatgattggggtgctgattgttgtcggcaa
+ggtgcttgccggtggtgaacctatcaccccgcgtctgtttatcgggcgcatgttgctcgg
+tggttttgtctcgatggttgccggtgttgttctggtgcagtttcctgacctgtcactgcc
+agcggtgtgcggcatcggctccatgctgggtatcgccggttatcaggtgattgagattgc
+cattcagcgccgctttaagggcagggggaaacagtaatgccggtaattaacacgcatcag
+aatatcgccgcctttctcgacatgctggccgtgtccgaagggacggcgaatcatccactg
+acgaaaaaccggggctatgacgtgatagtcaccggactggacgggaagccggaaattttc
+accgactacagtgaccacccgttcgcacatggccgaccggcgaaggtgtttaaccgtcgc
+ggtgaaaaatccacggcctccggtcgctatcagcagctttacctgttctggccgcattac
+cgcaaacagcttgccctgccggatttcagtccgttgtcacaggacagactcgccattcag
+ttgatccgcgaacgcggagcactggatgacatccgggcgggacgcattgagcgcgccatt
+tcacgctgtcgcaatatctgggcgtccctgccgggtgccggttacggtcagcgtgagcat
+tcactggaaaaactggtcaccgtctggcgtaccgctggcggcgtaccggcttaaacggag
+taaataccatgaagaaattatccctttcactgatgctgaacgtgtcgctggcgctgatgc
+tggcactgtccctgatttacccgcagagcgtggccgtcaattttgtcgctgcctgggcga
+ttctggcgacggttatctgtgtggttgccggtggtgtgggcgtgtatgccactgagtatg
+tgctggaacgctacgggcgggagctgccgccggaatcgctggccgtgaagattgtcacgt
+cgctgtttttgcagccggtgccgtggcgcagacgggcggcggctctggtagtggtggtgg
+cgacgtttatctcgctggtcgctgccgggtggatttttaccgcgctgatttatcttgtgg
+tgtcgctgtttttccggctgatacgtaaagcctgtcgtcagcgtcttgaggggcgggaac
+catgtcaaggctgatgattgtgctggtcgtgttgttatcgctggcggtggccggtctgtt
+tctggtgaaacacaaaaatgccagcctgcgcgcctcgctggacagggcgaacaacgtcgc
+cagcggtcagcagacgaccatcaccatgctgaaaaatcagcttcatgttgcgctcaccag
+ggcagataaaaacgagctggcgcaggtggcactgcgtcaggaactggagaacgccgcgaa
+acgtgaagcacagcgcgagaaaaccatcacgaggttacttaatgagaacgaagattttcg
+ccgctggtacggtgctgacctgcctgatgctgtgcgccggttgcaccagcgccccgcctg
+caccgacgccagtgattgtccccaacgcatgcccgaaagtgagcctttgcccgatgccgg
+gcagtgacccgcagacgaacggcgatttaagtgccgatatccggcagcttgagaacgcgc
+tggcacgctgtgccagccaggtaaaaatgattaaacactgtcaggacgaaaacgatgctc
+aaacccgacagcctgcgcagggcgctgactgatgccgtcacggtgctgaaaactaacccc
+gatatgctgcggatattcgtggataacgggagtattgcctccacactggcggcgtcgctg
+tcattcgaaaagcgttacacgctcaatgtgattgtgaccgactttaccggtgattttgac
+ctgctcattgtgccggtgctggcgtggctgcgggaaaatcagcccgacatcatgaccacc
+gacgaaggccagaaaaagggcttcacgttttatgcagacatcaacaatgacagcagcttt
+gatatcagtatcagcctgatgctgaccgagcgcacgctggtcagtgaggtggacggcgca
+ctgcatgtgaagaatatctcggaacccccgccgccggagccggtcacccgcccgatggag
+ctgtatatcaatggcgaactggtgagtaagtgggatgaatgagtttaagcgttttgaaga
+ccggctgaccggactgattgaatcgctgtcaccgtcagggcgtcggcgactgagtgccga
+actggcgaaacgtctgcggcagagtcagcagcgtcgggtgatggcacagaaagccccgga
+cggcacaccctacgcgccacgccagcagcagagcgtcagaaaaaagaccggtcgcgttaa
+gcgaaaaatgtttgcgaaacttattaccagtcgttttttgcatatccgtgccagcccgga
+gcaggcatcaatggaattttacggcgggaagtcgccgaaaatcgccagtgtgcatcagtt
+tggtctgtcggaagaaaaccggaaagacggtaagaaaattgattatccggcgcgtcccct
+gctcggctttaccggtgaggatgtgcagatgattgaagagattatcctggctcaccttga
+gcgttagttttatccaggcagaggctgatgcgcaattaaacattgagcggccatgctggt
+cgctcaatgtttagaggtttatgagtgatttttatttgatgctttgtattctaaaacctt
+cttattggcgtaaaagaattttgtatatgacaggaatataaccagacctgaagtgaaata
+gacgagggatagtattaataatgcttttttgtgactgttattatctttaatctcctggct
+taaccattcggagtcctcctcgtttagctgtaagagcttattgcaggcgatctcaggaag
+tgtgtcttttataaatacgttttgcagtctcttgcaatcggcaaggctataagttttatt
+aaattcaactgctttatttttgaaggataaaagaactttgtcactataaacatagtacat
+catgtttttatatggtatgcctgtggcatcccttactataacggattgttcgttgtgtat
+gtaacatgcgaggagaatgtaaaaaatactggccagaattacaattattgttttaattat
+gtgtggtggttttgttatgtcaccccagatacgagtaaggaaaaaatacgatgtttttag
+ttttccatcaatcagtccctgctgtatcattctcacattttcaatgcctgatacattgat
+tccgttaattattttaaatagttgaatgtcgcgccactcgcggtcaagtctttttaattt
+tttgtctgaatatccaaaattgaaataatgtgcaataagcctcataaggttacttttacc
+aaagctaaaaaatgctaatactgcaaagctacaaaggaaaaaaacgattagcccccacac
+attagtcacattatagctgaccattacgctctccttgaatgttgtctggtagttctacaa
+atgaatccagatagcataacttttatatattgtgcaatctcacatgcatgaacactctcg
+caaatattcaggaactcgcgcgcgcactgcgcaacatgattcgcactggcattatcgtcg
+aaaccgaccttaacgccggtcgctgccgcgtgcagaccggcggcatgtgcaccgactggc
+ttcagtggctgacccatcgcgcaggacgttcgcgcacatggtgggcaccttccgtggggg
+aacaggtgctgattctggccgtgggtggtgaactcgacacggcgttcgttctgccgggga
+tttattccggcgataacccctcgccgtctgtgtcggcggatgccctgcatatccgtttcc
+ctgacggggcggtgattgaatatgaacccgaaaccagtgcactcacggtaagcggaatta
+aaacggccagcgtgacggcttccggttctgttactgccacggtgccggtggtcatggtga
+aagcatcaacccgcgtcaccctggacaccccggaggtggtctgcaccaacaggctgatta
+ccggcacgctggaagtgcagaaaggcgggacgatgcgcggcaacattgaacacaccggcg
+gtgaactctcatcaaacggtaaggtactgcatacccataaacaccccggcgacagcggcg
+gcacaaccgggagtcctttatgacagcgcgttatctcggaatgaatcgcagtgatggcct
+gactgtcactgaccttgagcatatcagccagagtatcggcgatatcctgcgcacaccggt
+cggctcacgggtgatgcgtcgtgattacggctcgttgctggcgtcaatgattgaccagcc
+gcagaccccggcgcttgagttgcagattaaagtcgcctgttacatggcagtgctgaaatg
+ggaaccccgcgtcaccctgtcatccgtcaccacggcgcgcagttttgacgggcgaatgac
+ggtcacgttaaccggccagcacaacgacaccggccagccactttcattaaccatccctgt
+gagttgaaaccatgccgattatcgacctgaaccagctacccgcaccggatgtggtcgagg
+agctggactttgaaagcattctcgctgaacgcaaggcgacactgatttccctttacccgg
+aagatcagcaggaggcggtcgcccgtaccctgacactggaatctgagcctctcgtcaaac
+tgctggaagaaaatgcttatcgtgagcttatctggcgtcagcgtgtgaatgaggccgcac
+gggcggtgatgctggcctgtgccgccggtaatgaccttgatgtgattggtgccaattaca
+acaccacgcgcctgactatcaccccggcagatgattcgaccatcccgccgacaccggcag
+tgatggaatctgacaccgattatcgtctgcgtattcagcaggcttttgagggcttaagcg
+tcgccgggtcagtgggagcctatcagtatcatggtcgcagtgctgacgggcgtgtcgcgg
+atatttctgtcaccagtccgtctccggcctgtgtcaccatctctgtgctgtcacgtgaaa
+ataacggcgtcgcatccgaagacctgctggctgtggtgcgtaacgcccttaatggcgagg
+acgtcaggccggtggccgaccgcgtgaccgtgcagtctgccgccatcgttgaataccaga
+taaacgccacgctttacctttaccctggtcccgaaagcgaacccatccgcgctgccgctg
+tgaaaaagctggaagcgtatatcacggcacagcaccggctggggcgcgacatccgtctgt
+ctgccatttatgccgctttgcatgtggaaggtgtgcagcgtgtcgaactggctgcaccac
+tggccgacatcgtgctcaacagtacgcaggcgtctttctgtaccgaataccgcgtcgtga
+ccggaggctcggatgagtgattcgcgactgctgccgaccggctcatcaccgcttgaggtc
+gccgccgcaaaagcctgtgcggaaattgaaaaaacgccggtcagtattcgtgaactgtgg
+aacccggacacctgtccggcaaatctgctgccgtggctggcgtgggcgttttcggtcgac
+aggtgggatgaaaagtggccggaagcgacaaaacgcgccgttatccgcgatgcctatttc
+atccactgtcataagggcacgataggtgcaatccggcgtgtggtggagccgctcggctat
+ctcatcaacgtgacggagtggtgggaaaacagtgacccgcccggcaccttccggcttgat
+attggtgtactggaaagcggtatcacagaggcaatgtatcaggaaatggaacggctgatt
+gctgatgccaaacctgcaagccgtcaccttattggcctgaacattacccgggacattccc
+ggctatctgttcgccggtggtgtggcttacgacggcgatgtaattacggtttaccccgga
+taagtgaggaataatgagcataaaattcagaaccgttatcaccactgccggtgcagcaaa
+gctggcagcggcaaccgcgccgggaaggcggaaggtcggcattaccacgatggccgtcgg
+ggatggcggtggtaaattgcctgtcccggatgccggacagaccgggcttatccatgaagt
+ctggcgacatgcgctgaacaaaatcagccaggacaaacgaaacagtaattatattatcgc
+cgagctggttattccgccggaggtgggcggtttctggatgcgtgagcttggcctgtacga
+tgatgcgggaacgttaattgccgtggcgaacatggccgaaagctataagccagcccttgc
+cgaaggctcaggacgttggcagacctgtcgcatggtcatcatcgtcagcagtgtggcctc
+agtggagctgaccattgacaccacaacggtgatggcgacgcaggattacgttgatgacaa
+aattgcagagcacgaacagtcacgacgtcacccggacgcctcgctgacagcaaaaggttt
+tactcagttaagcagtgcgaccaacagcacgtctgaaacactggccgcaacgccgaaagc
+ggtaaaggccgcgtatgacctggctaacgggaaatataccgcacaggacgccaccacagc
+gcgaaaaggccttgtccagcttagtagcgccaccaacagcacgtctgaaacgctcgccgc
+aacaccaaaagccgttaagacggtaatggatgaaacgaacaaaaaagcgccattaaacag
+ccctgcactgaccggaacgccaacgacgccaactgcgcgacagggaacgaataatactca
+gatcgcaaacacggctttcgttatggccgcgattgccgcccttgtagactcgtcgcctga
+cgcactgaatacgctgaacgagctggcggcggcgctgggcaatgacccgaattttgctac
+caccatgactaatgcgcttgcgggtaagcaaccgaaagatgctaccctgacggcgctggc
+ggggcttgctactgcggcagacaggtttccgtattttacggggaatgatgttgccagcct
+ggcgaccctgacaaaagtcgggcgggatattctggctaaatcgaccgttgccgccgttat
+cgaatatctcggtttacaggaaacggtaaaccgagccgggaacgccgtgcaaaaaaatgg
+cgataccttgtccggtggacttacttttgaaaacgactcaatccttgcctggattcgaaa
+tactgactgggcgaagattggatttaaaaatgatgccgatggtgacactgattcatacat
+gtggtttgaaacgggggataacggcaatgaatatttcaaatggagaagccgccagagtac
+cacaacaaaagacctgatgacgttgaaatgggatgcactaaatattcttgttaatgccgt
+cattaatggctgttttggagttggtacgacgaatgcactaggtggtagctctattgttct
+tggtgataatgataccggatttaaacagaatggagacggtattcttgatgtttatgctaa
+cagtcagcgtgtattccgttttcagaatggagtggctattgcttttaaaaatattcaggc
+aggtgatagtaaaaagttctcgctatccagctctaatacatccacgaagaatattacctt
+taatttatggggtgcttccacccgtccagtggttgcagagttaggcgatgaggccggatg
+gcatttctatagccagcgaaatacagataactcggtaatatttgctgttaacggtcagat
+gcaacccagcaactggggaaattttgattcccgctatgtgaaagatgttcgcctgggtac
+gcgagttgttcaattgatggcgcgaggtggtcgttatgaaaaagccggacacacgattac
+cggattaagaatcattggtgaagtagatggcgatgatgaagccatcttcaggccgataca
+aaaatacatcaatggcacatggtataacgttgcgcaggtgtaagttatgcagcatttaaa
+gaacattaagtcaggtaatccaaaaacaaaagagcaatatcagctaacaaagaattttga
+tgttatctggttatggtccgaagacggaaaaaactggtatgaggaagtgaagaactttca
+gccagacacaataaagattgtttacgatgaaaataatattattgtcgctatcaccagaga
+tgcttcaacgcttaatcctgaaggttttagcgttgttgaggttcctgatattacctccaa
+ccgacgtgctgacgactcaggtaaatggatgtttaaggatggtgctgtggttaaacggat
+ttatacggcagatgaacagcaacaacaggcagaatcacaaaaggccgcgttactttccga
+agcggaaaacgttattcagccactggaacgcgctgtcaggctgaatatggcgacggatga
+ggaacgtgcacgactggagtcatgggaacgttacagcgttctggtcagccgtgtggatcc
+tgcaaatcctgaatggccggaaatgccgcaataagttgtatgacctctgttgtgaactta
+catatctatggcacagagtaaagcctaatctgaagtccactctgtgccaaaagcggacct
+tataaacaagaacaatggtcatatcagtgtgttttgattgcatagctaacgtgcgtcttc
+ctgtacagaatcataagatgatagggcataggagatgattattatcgcgtgttttaaaaa
+tagctttctgcatcaagtgtcacttgcgaagaggtattggcgctatgattggcatcactc
+agttcagataatattttaaatatttggtaaatgttcagattacacaattcggtctgcgtc
+ccgttaaaattatctactattagttattactatgaggtgaatggcaagtgttttccactc
+gccatttttgttttttatttttttaaagcctttccgacgtttaaggattttgccaagcca
+taaaatatttgatatttcattcctgtttttatttttggtgagatatttgcgtaacttctt
+tctctaaaacaccaacgtataaacctattattatcttcggttgtttctatatagcatatt
+acattgagaccaaaaagaaactgaaggaagtcatttgcagttgtcatgaattttggtttt
+gttgtggaaatggaactaatatgagtttcaagttgtttatatgctaagaggtattcagcg
+taatcaaaagtatcttttccagagaggaattcaaagaactttaaaaaaatctcataatgt
+tcacttccataataaaatgataaatgatcttttatttctccaagtaaatagttagagtaa
+tctctttgcatgctaggactttcaaagtcatctagactaaattgatttttcccatcatca
+ccgctggcgtgtgatttgataatttcgagcatccgtaatatatctcttgggcgataatat
+gaccagcgaaggaaattaataaatgatgtggggtggttataattatcatggacgttgggt
+gaatcccaagggaaataatggtcccatgcctgtccctttttaagggccatgtcttgctga
+gtcctaagcagatgatctaatacctcaaataattgagagctacggtggttaacatattct
+gtccgccagtccaagaatactgaattatctctgatttttgcgttttgattttgtaatcct
+atggattcaaatatatctggcctgatcaagagaacggccttcattctcccttttcctccc
+tttatacttgggaagaaatcgttgttaatctcccagactgcgtgagctaatccttttata
+cattctagataatcatcgtatggaattgaggaagggcggatatcaataccatcgataaat
+aaaatatgattttgagataaacgtatttggctaaaggcctcttcaaattttttttgtata
+taaaataaatttatctgaaatctgctctcagaaaaagataaagactctctttcttcacct
+tttaaggttgcatgcttatgaagtagttcggctgcaacttttgactcttgaacaaaactg
+agggcttgaattatttctggtgaaaatgccttaagataatactcatctattgcatcatta
+agtgatgagaattttgaataatttagtaactttgaaattttcccttctttatctaatact
+tgttttgatattaataaatatagaataactttccatatgccagagaagtcagacaaattt
+aaatgcttttcagatttaagagtgataaatttttgatattctgtctctcttatatattta
+gttgtagctagcgtattgttaatattgttatttgagagatagatagagtatgcggtttta
+ccagtacctttctctcctacaagaaacgatatatttggttcacataatctagataggtga
+ttatcacgtatgaacactttgttaagtaattctttattctcccttctcttataattttca
+gcatcagcatagccaagagttagatctttgattggtatcattattacctcaactaaagca
+attgaaaaacatatggttataaaaacatagcgctgctctgtcgcatattgtggatatcaa
+catatgaaatgtaaaggaactatttgtggatgaatgaaccgaatcgctgtagcttcggta
+gtcatctttcagacttgtataaatgaacaacttccgcttctcgctcaaaggaaactgtca
+gatttgatagcttttgggctatgtaaactgtcagtcggaaaatgagtgagtacaaatcag
+ggcaggtgagcgaattgcccgccttttctttaccggtggttgtgctgtcgattagccaac
+cgggacaaatagcctgacatctccggcgcaactgaaaataccactcacccattaaccacg
+gagttaaacggatgagtgactatcatcacggcgtgcaggtgctggagattaacgagggca
+cccgcgtcatttccaccgtatccacggccattgtcggcatggtctgcacggccagcgatg
+cagatgcggaaaccttccccctcaataaacctgtgctgattaccaatgtgcagagcgcaa
+tttcaaaggccggtaaaaaaggcacgctggcggcatcgttgcaggccatcgctgaccagt
+caaaaccggtcaccgttgtcatgcgcgtggaagacggcaccggtgatgacgaggaaacga
+aactcgcgcagaccgtttccaatatcatcggcaccaccgatgaaaacggtcagtacaccg
+gactaaaagccatgctggcggcggagtcggtaaccggtgttaaaccgcgtattctcggcg
+tgccgggactggataccaaagaggtggctgttgcactggcatcagtctgtcagaagctgc
+gtgctttcgggtatatcagcgcatggggctgtaaaaccatttccgaggtgaaagcctatc
+gtcagaatttcagccagcgtgagctgatggtcatctggccggatttcctcgcatgggata
+cggtcaccagtaccaccgccaccgcgtatgccaccgcccgtgcgctggggctgcgcgcta
+aaatcgaccaggagcagggctggcataaaacgctgtccaatgtcggggtgaacggtgtta
+ccggcatcagcgcatctgtattctgggatttgcaggagtccggcaccgatgctgacctgc
+ttaacgagtcaggcgtcactacgctgattcgccgcgacggtttccgcttctggggtaacc
+gtacctgctctgatgacccgctgttcctctttgaaaactacacccgcaccgcgcaggtcg
+tggccgacacgatggctgaggcgcacatgtgggcggtggacaagcccatcactgcaacgc
+tgattcgcgacatcgttgacggcatcaatgccaaattccgtgagctgaaaacaaacggct
+atatcgtggatgcgacctgctggttcagcgaagaatccaacgatgcggaaaccctcaagg
+ccggaaaactgtatatcgactacgactatacaccggtgcctcctctcgaaaacctgaccc
+tgcgccagcgtattaccgataaatacctggcaaatctggtcacctcggttaacagcaatt
+aaggagcctgaccgatggcaatgccgcgcaaactcaagttaatgaacgtctttctgaacg
+gctacagctatcagggcgttgcaaagtccgtcacgctgccaaaactgacccgtaagctcg
+aaaactatcgcggtgcggggatgaacggcagcgcaccggtagacctcggccttgatgacg
+atgcgctgtcaatggagtggtcgctcggtggcttcccggattcggttatctgggagcttt
+acgccgcaaccggtgtggatgccgtgccgattcgttttgcaggctcttaccagcgcgacg
+ataccggcgaaacggtggccgtcgaagtggtcatgcgtggacgtcagaaagaaatcgaca
+ccggcgagggtaaacagggagaagacactgagtcgaaaatctccgtggtctgcacctatt
+tccggctgacgatggacggtaaggagctggtcgaaattgacaccatcaacatgattgaga
+aggtgaacggcgtcgatcggctggagcaacaccgccgcaatatcggcctgtgattttcat
+ccggtcagcctggctggccggttaaccctgattcagaagtgagaaaaccatgaacaaaga
+aaatgtcattaccctggacaatccggtcaaacgtggtgagcaggttatcgaacaggtcac
+gctgatgaaacccagtgccgggacgctacgcggtgtcagtctggctgcggttgcaaactc
+cgaagtcgatgcactgattaaggtgctgccgcgcatgacggcaccgatgctgaccgagca
+ggaagtcgccgcgctggaactgcctgaccttgtggcgctggccggtaaggtggtcggttt
+tttgtcgccgaactcggtgcagtgacgtttccgaaaaatctctcggtcgatgacctgatg
+gcggatgtggcagtgatatttcactggccgccatcagaactgtatcccatgagcctgacc
+gaactcatcacatggcgcgaaaaggcgctccggcgaagcggaaacacgaatgagtaacaa
+tgtaaaattacaggtattgctcagggctgttgaccaggcatcccgcccgtttaaatccat
+ccgcacagcgagcaagtcgctgtcgggggatatccgggaaacacaaaaatcactgcgcga
+gctgaacggtcacgcatcccgtattgagggattccgcaagaccagtgcacagctcgccgt
+gactggtcatgcacttgaaaaggcacggcaggaggccgaagcccttgccacacagtttaa
+aaacaccgaacgtccgacccgtgctcaggcgaaagtcctggaatccgcaaagcgtgcggc
+ggaggacttacaggcgaaatataaccgcctgacagattccgttaaacgccagcagcggga
+actggccgctgtgggaattaatacccgcaatcttgcacatgatgagcagggactgaaaaa
+ccgtatcagtgaaaccaccgcacagcttaaccgtcagcgtgatgcgctggtgcgtgtcag
+tgcgcaacaggcaaaacttaacgcagtaaaacagcgttatcaggccggaaaggaactggc
+cggaaatatggcctcagtgggcgctgccggtgtggggattgcggcggcgggaacgatggc
+cggtgttaagctactgatgcccggttatgagtttgcgcagaaaaactcagaattacaggc
+tgtgatcggagtggcaaaagactccgccgaaatggccgcactccgcaagcaggcgcgcca
+gctcggcgacaataccgccgcctcggcagatgatgcagccggtgcgcagattattattgc
+gaaagccggtggggatgttgatgccattcaggcggcaacgccggtcacgctgaacatggc
+gctggcgaaccgtcgcacaatggaagaaaacgccgccctgctgatggggatgaaatccgc
+ctttcagctttcaaacgataaggtcgctcatatcggggatgttctctccatgacgatgaa
+caaaaccgccgccgattttgacggcatgagcgatgcgctgacctatgccgcacctgtggc
+aaaaaatgccggtgtcagcattgaagaaaccgccgcaatggtcggggcgctgcatgatgc
+aaaaatcacaggctcaatggcggggacgggaagccgtgccgtgttaagccgcctgcaggc
+accgacgggaaaagcatgggatgcactcaaagagcttggagtgaaaacctcagacagcaa
+aggaaacacccggccaatatttaccattctgaaagaaatgcaggccagttttgagaaaaa
+ccggctcggtactgcccagcaggctgaatacatgaaaactattttcggggaggaggccag
+ctcagccgctgccgtgctgatgactgccgcctcaaccggaaagctggacaaactgaccgc
+tgcgtttaaagcctcagacgggaagaccgccgagctggtaaatatcatgcaggacaacct
+aggcggtgactttaaagcgtttcagtccgcttatgaggcggtggggactgacctgtttga
+ccagcaggaaggcgcgctgcgtaagctcacgcagacggccacaaagtatgtgttaaaact
+cgacggctggatacagaaaaacaaatcactggcgtcaaccatcggcatcattgccggcgg
+tgcactggcgcttactggcatcatcggtgccattggcctcgtagcctggccggttatcac
+cggcatcaatgccatcatcgcggcagcaggcgcaatgggggcagtcttcacgacggttgg
+cagtgctgttatgaccgccatcggggctattagctggccggttgtggccgtggtggctgc
+cattgtcgccggtgcgttgcttatccgtaaatactgggagcctgtcagcgcattctttgg
+tggtgtggttgaagggctgaaagcggcatttgcgccggtgggggaactgttcacgccact
+taaaccggtttttgactggctgggcgaaaagttacaggccgcgtggcagtggtttaaaaa
+cctgattgccccggtcaaagccacccaggacaccctgaaccgttgccgtgacacgggcgt
+catgttcgggcaggcactggctgacgcgttgatgctgccgcttaatgcgttcaacaaact
+gcgcagtggtattgactgggtactggaaaaactcggtgttatcaacaaagagtcagacac
+acttgaccagaccgccgccagaactcataccgccacgtatggtaccggtgactatattcc
+ggcgaccagctcttatgcaggctatcaggcttatcagccggtcacggcaccggctggccg
+ctcttatgtagaccagagtaaaaacgaatatcacatcagcctgacgggggggactgcgcc
+ggggacacagcttgaccgccagttacaggatgcgctcgaaaaatacgagcgggataaacg
+tgcgcgcgcccgtgccagcatgatgcatgacggttaaggaggtgacgaaaaatgatgctc
+gcgttaggtatgtttgtttttatgcgccagacgctgccacaccagaccatgcagcgtgaa
+tcagattatcgctggccgtcaaattcccgtatcggtaaacgggatgcctttcagtttctc
+ggtgtgggtgaggaaaacatcacgctggccggtgtgctttatcccgaactgaccggcggc
+aagctgacgatgaccacgctcaggctgatggcagaggaggggcgggcgtggccgttgctg
+gatggcaccggcatgatttacggcatgtatgtcatcagcagggtgagtgaaacagggagt
+attttctttgcagacggcacaccccggaaaattgattttacgctgtcactcacccgcgtt
+gatgaatcactggccgcgctttatggcgatatcggtaaacaggcggaatcgctcatcggt
+aaggccggcagtatggcgaccagattcacaggtatgacgggggcgggataatgctggatg
+cgctgacatttgatgcaggcagtacgctgacgccggattacatgctgatgctcgacagca
+gggatattaccggcaatatcagcgaccgtctgatgagcatgaccctgacggataaccggg
+gctttgaggctgaccagcttgatattgaactgaacgatgccgacgggcaggtcgggctgc
+cggttcgtggcgctgtcctgacggtgtatatcggctggaaaggttttgccctggtatgca
+aagggaaatttaccgttgatgaggttgaacaccggggcgcaccggatgtagtcaccatcc
+gcgcccggagtgcagattttcgcgggacgctcaattcccgccgggaaggctcctggcatg
+acaccacgctcggtgcgattgttaaggcgatagccacccgtaacaggctggaagccagtg
+tcgctccgtcactggccggaataaaaattccacacatcgaccagtcgcaggagtctgatg
+cgaaattcctgacccgtcttgcagaacgcaacggcggtgaggtgtcggtaaaaatgggaa
+aactgttgtttctcaaagcggggcagggagtgacggccagcggtaaaaaaatcccgcagg
+tcaccataacccgcagcgacggcgaccgccatcattttgcgattgctgaccgtggagcct
+acaccggtgtaacggcaaaatggctacacactaaagacccgaagccgcaaaagcagaagg
+taaaactgaaacgcaaaaagaaagagaaacacctgcgcgcactggagcacccgaaagcga
+aaccggtcaggcagaagaaagcgcctaaagtaccggaagcgcgtgaaggtgaatacatgg
+ccggtgaggctgacaacgtttttgccctgaccacggtatatgccacgaaagcgcaggcca
+tgcgcgccgctcaggcgaagtgggataaactgcaacggggcgttgcggagttctctatca
+gcctggctaccggtcgggcagatatttacacggaaacaccggtcaaagtgtctggcttta
+agcgcgtcatagacgagcaggactggacaatcactaaggtgacacattttctgaataata
+gcggcttcacgacgtccttagagcttgaggtcaggctttctgatgtggagtacgaaacag
+aagatgatgagtgatgtttttgttttatctgtttgttttgtaaggataaattaactaaaa
+tggcaccatcaacaaaaccggaagaggtgctcgcgatgtttcattgtcctttatgccagc
+atgccgcacatgcgcgtacaagtcgctatatcactgacacgacaaaagagcgttatcatc
+agtgccagaacgtgaattgcagcgccacgttcatcacttatgagtcggtacagcgataca
+tcgtgaagccgggagaagtccacgccgtaaggccgcacccgttgccatcagggcagcaaa
+ttatgtggatgtaattacaaacagaaagcccctcagtcgaggggcttttttgtcgatgtg
+gtcaatgtgtggacgtgaccagaaataaatccttttatttcaatttattgtacgtaaaaa
+ataagcccgtgtaagggagatttagggtgtcaccagtaggggctttcaacggtacaatgc
+gggtttgagcggcataaattaccactgaaagcccttaaacgttactctactgtggacact
+gtgtggacactctcggcctcagtaccacctcttagcggattaagagaaatggcgtcctga
+aggtactctggcgcaaaatgagcgtaaaccatagtttgctcaatccgcgtgtgacctagt
+atccgttgtagcgtgataatacttcctccattaatcatgaaatgagtggcaaagctgtgc
+cttagtgcatgtgtggcttgccccattggcaaatccggttttattgctttcattgttcgt
+ctgaagcgagggtaatcagcatcagggaataaaaaacctcgtttgttatccgcgatcatt
+ttggcaacagcctctgagatcgggacggtgcgtggtttgtttgttttcgttttaacaaac
+gtgacgcggttatggatgatattttctgctttcaaacgagctgcttctccccaacgtgct
+cctgtactcaggcaaagaatcgcaatctttttattgtcgccgtcaagtgctgcaagcagt
+aaggcaatttcttcctgtgttagatagcctgtttctggtttttcctccttaagccttttt
+gtccctctgatagggtgctcaccaaagaataactccgcttcaatcagggctgtaaacatg
+ccgctaatacatgttaaatcacgattgatactcgaaggtttaataccctgacttcttcgg
+gtggcgcagtactggctgataagcgatttcgtaatttgaaatgcgcatgggtcattcgtt
+atttttgtgaagatttcaatttttccaagattagatttcccatgctcttcgtgtttaccc
+tttaaatcccaccagatctgtgtcagctccgacagacgtcgcttgtctgttggttttgat
+agccattctttattgtggtggttgtacaacgtgtatttctcgaaagcgacagcttcgctt
+ttcttatcaaacttcctacggatgcgttttccattacgtccagtagggcggatgtccact
+tcatatcgaccatcatcgagttttttgattgccatcagaaaaccctccgagtggtgtgtt
+tttttgcgactactaatcgcttttttcgtggtggctgaaatttagccaccaatagtaggc
+acttgtgatgaatatattcacgatgaattgttaaccagtcttttgaccggagtggggcga
+cgttgtttcgttttgcccaaagtgtgcgagagcgggcgcaatttgcccggactcaggagc
+gatctgattggtcatgaaccataaagtgtatttggtgaattgtggggtctgcaggatgtt
+catcatgacatctgttggaggtgttgaacgaccactttcatagtaactcagcgtgccata
+cggaacccctgttaaatcagcaagttgttgtctgctcaaatactctgattttcgcattaa
+gactatcttctcgcttatcgtgtttgacatggtgtttagatctcaatagtatttagttta
+gatgtagattgtttagtgcttggatgtgggcactaaaaggcattataagacattaaacgc
+aattcatgagggctagaggacgacatgagcaagcaagtaacactcatgactgatgcgatt
+ccttatcaggagttcgcaaaactaataggaaaatcgacaggagcggttcgtcggatgatc
+gataaaggaaagctgcctgtaattgatatgaccgatccacaatcagcttcaggtcgtgca
+ggtgaatattgggtataccttccggcatggaataacggactaaaactggcttatgaaagc
+cgccctaaagagattcgtgacggctggttgatgtggttaggtctcggtgaaccacgttaa
+ggagaaccgtatgaatgagcctcgttgtattgctcagttactgcgtaacgaaagccccag
+ggcgattgacttcaccatcacccacggtaaggggcgtaagggaatcattatccgcaccaa
+aaaacagagtccgttaaaaaaggctctgacctttctgaaaagccggagggtatggaaatg
+acagtgatgacgctcaatctcgttgaaaaacagccagcagctatgcgccggataattggt
+aagcatcttgccgttcctcgctggcaggatacatgtgattattataatcagatgatggag
+cgcgaacggttaacggtttgcttccatgctcagttaaaacagcgtcacgcaacgatgtgt
+tttgaagaaatgaacgacgtcgaacgtgaacgactggtatgtgcaattgatgaattgcgt
+ggtgcattctcaaaacgccgtcaggttggcgcaagtgagtatgcatatattagtttttta
+acagtcagtcagcgtcgtactttatttatgcatgccggattgactgaaaaagaattcaac
+cagccatactggcgaattaatgaagagtcatgttactggcgtgatgctttattccgtgca
+ttacgtgaattattcagtctgtttgagtatgcaccgacaattctgacgtcggtaaaaccg
+gagcaatatctgcattaagtaattaaccagagtttttaacgcacttaattgtgcggggct
+tctttttgcctggagaaagttatgcatacagtttctgaaaatcagtgcggtatatacgca
+ttactgctgcaacaggccagaaccgaagcacaggccgacgctgcgacgcgcttttcttct
+catcttgatgccatgattcgccacatcacaaaggcggagttatcccgcgtggagatagtc
+gagctgctcagtcaggagtcggaaaaatttcacaatatcggattgtctcgcggggaggtg
+ctttgatgttctgttctcgtgcagttgtattactgaataacgccttaaaaatcgccgtta
+tgaaaaatggcgatttgtctcttattcaacttggtcttgataaagaaaaacgcgaaataa
+ctgaatctgttatcgcgatttatcagagtgaattaaacctcctgtctgatgtggtcaatt
+tacttgttaaacgcgctgtatttcacaagcaaatttcctccgtggatgaactgacgaaat
+taacgacagaaatcgccagctattgcgctgatgaatttaaaaaactgaacgacaaaagga
+actggtaatgccggacaacgtagattttattcaggaacaacaggctgaattactggagcg
+ccagattaacgcggcaagggtaaaacattgcggtgcttctgcgctggtttgcgaagagtg
+tgacgcgccaatacctgctgcccgtcgtgcggcttacccgtcagccacgcgttgtgtttc
+ctgtcagtcagtctttgaagcaaaaaacaaacattaccggagaacggcatgagtattcgt
+attgaaattggcgaacgttatgtcgttaccagtgacagctttcagtttattctccacgag
+aaaaagagagcggaaagcggtaaaaacgccggtcaggaatggctggcggtggttggttat
+tacccgaaattaagccagctcgtttcaggcctgatgcatcacgatattctgaccggaagc
+gcaaagtcttttgctgatttaaacgtgcaggttgagcaactcagcaagcgttgttcagag
+gcttttggctcatatggccgttaaagcctccgggcgttttgtccctccgtcagcatttgc
+cgcaggcaccggtaagatgtttaccggtgcttatgcatggaacgcgccacgcgaggccgt
+cgggcgcgaaagaccccttacacgtgacgagatgcgtcagatgcaaggtgttttatccac
+gattaaccgcctgccttactttttgcgctcgctgtttacttcacgctatgactacatccg
+gcgcaataaaagcccggtgcacgggttttatttcctcacatccacttttcagcgtcgttt
+atggccgcgcattgagcgtgtgaatcagcgccatgaaatgaacaccgacgcgtcgttgct
+gtttctggcagagcgtgaccactatgcgcgcctgccgggaatgaatgacaaggagctgaa
+aaagtttgccgcccgtatctcatcgcagcttttcatgatgtatgaggaactcagcgatgc
+ctgggtggatgcacatggcgaaaaagaatcgctgtttacggatgaggcgcaggctcacct
+ctatggtcatgttgctggcgctgcacgtgctttcaatatttccccgctttactggaaaaa
+ataccgtaaaggacagatgaccacgaggcaggcatattctgccattgcccgtctgtttaa
+cgatgagtggtggactcatcagctcaaaggccagcgtatgcgctggcatgagacgttact
+gattgctgtcggggaggtgaataaagaccgttctccttatgccagtaaacatgccattcg
+tgatgtgcgtgcacgccgccaagcaaatctggaatttcttaaatcgtgtgaccttgaaaa
+cagggaaaccggcgagcgcatcgaccttatcagtaaggtgatgggcagtatttctaatcc
+tgaaattcgccggatggagctgatgaacaccattgccggtattgagcgttacgccgccgc
+agagggtgatgtggggatgtttatcacgcttaccgcgccttcaaagtatcacccgacacg
+tcaggtcggaaaaggcgaaagtaaaaccgtccagctaaatcacggctggaacgatgaggc
+atttaatccaaaggatgcgcagcgttatctctgccatatctggagcctgatgcgcacggc
+attcaaagataatgatttacaggtctacggtttgcgtgtcgtcgagccacaccacgacgg
+aacgccgcactggcatatgatgcttttttgtaatccacgccagcgtaaccagattatcga
+aatcatgcgtcgctatgcgctcaaagaggatggcgacgaaagaggagccgcgcgaaaccg
+ttttcaggcaaaacaccttaaccagggcggtgctgcggggtatatcgcgaaatacatctc
+aaaaaacatcgatggctatgcactggatggtcagctcgataacgataccggcagaccgct
+gaaagacactgctgcggctgttaccgcatgggcgtcaacgtggcgcatcccacaatttaa
+aacggttggtctgccgacaatgggggcttaccgtgaactacgcaaattgcctcgcggcgt
+cagcattgctgatgagtttgacgagcgcgtcgaggctgcacgcgccgccgcagacagtgg
+tgattttgcgttgtatatcagcgcgcagggtggggcaaatgtcccgcgcgattgtcagac
+tgtcagggtcgcccgtagtccgtcggatgaggttaacgagtacgaggaagaagtcgagag
+agtggtcggcatttacgcgccgcatctcggcgcgcgtcatattcatatcaccagaacgac
+ggactggcgcattgtgccgaaagttccggtcgttgagcctctgactttaaaaagcggcat
+cgccgcgcctcggagtcctgtcaataactgtggaaagctcaccggtggtgatacttcgtt
+accggctcccacaccttctgagcacgccgcagcagtgcttaatctggttgatgacggtgt
+tattgaatggaatgaaccggaggtcgtgagggcgctcaggggcgcattaaaatacgacat
+gagaacgccaaaccgtcagcaaagaaacggaagcccgttaaaaccgcatgaaattgcacc
+atctgccagactgaccaggtctgaacgattgcagatcacccgtatccgcgttgaccttgc
+tcagaacggtatcaggcctcagcgatgggaacttgaggcgctggcgcgtggagcaaccgt
+aaattatgacgggaaaaaattcacgtatccggtcgctgatgagtggccgggattctcaac
+agtaatggagtggacatgatggcaaaaattcacgaggtaaagctgcacgcaaaatatttc
+gaccttgtactggaaggaaagaaacgcgcagagtttcggaaaaaagatcgtaattatgag
+cgcggggacacgttgattttgcatgaatgggtgcagggtgtgtttacggggcgaaaggtt
+gaagcccggataacagatgttactgacctgtcagactggctggaagattatgtcttgctg
+cacagaatactaggtgagatactgccgctgactgtcaagctggcagtatcctccacattt
+tttataaatctaaggcgaagaacggtggcaatatatttgctttaaattgtaaataagcaa
+attattctaagccacaaatgatatcaattgagtatcgattttcgttcgaatataaccata
+acgccaagcgtcaaatgtaagtcatctatatgtgattcgtattcatattggtcagcatca
+ggagatagtaaatgctctgctgctgtaaaaacatcaattgtaacagatatatcgtctgga
+atttcttcatttaattcggatatgtattttttatatttgttttttaatttccttatcatg
+tcttccttatggtggattgtagtgcagtaattttttttagttgaatcattgtatgaatgg
+aatgaacagtttaatgctaggccaagacttgaatttcctgtagggcctgtgtgtttaaag
+tattcaagatttcttcttatgtcagaaaataaaagacttttacagggggcatttccttta
+acttctattgcacatattggaatgtcgaaaaatggtctgctgtccaatatggcaatatca
+attctgcctgatcttgttgtgtttgtgttttttctgacagttttttttgagaatattttt
+tgggggtcagaccgtttcgataaaggaactgttgcattaatgaatttatttgtatggtac
+tcaaatataactttgtaatcaccatggcgaaaagattttatttctaacaacgatagacct
+atagatacggtagctacatattcagtgtttatttttgcaccagacctgaaatccattaaa
+taagttgcgtcggctgactttttcattccatcttttacagctttcacaatatccatgtta
+ttcatatcaacaccttttatattccagaattataaatcttaatgattgatttgtttgtgt
+gtttaggttactagattgacgtacttatagcacattctgattttgaaatcaccatccttg
+ggtaaagcacagcctatcactattggtttagtactgtgctgtaatagtatcagattaagt
+taaatccattttatgaaatcttccatttcatcatatttttttattactgctctaacatct
+ttgctttcatcacataaacaatctaaaagactatcccattcagtttgttttttaccaaat
+ccataaacagcctctatatcaccggatttccatatatagattccgttatctttcaatttt
+tgatgtatttcatgtatatgcttttgtgttttttcatggttacatattttgatgaagtct
+ttgcttgaaatgcttttgaatgactcaaaagtagtaacttttgtatttaaactaagctct
+cctgagttgattgattcaatcaaagcagtcaatagattatcacattcagtactaagtaag
+tctttatgctctgttaatagaatatttgataagaaatcacaatcagctagaatccttgtt
+tttatgccgatggcattgatgatttgtgacatcttaaataaactacccttaccgtcaacg
+gcaacaatgcagattttactcgggttgagttcatgtccgttaatttttttataaagtgca
+tatagaacgtttgtctctgttttcccttcaacaagcaaaacttcttcagaaaataaaagg
+tatgatgaattagaaagcgtgaatgctgagtgcaattgcggtgatgaagatttatataat
+tcttcgattttttcagatatagtcttccttgctatggttccattagaatccttacaaacc
+tgaatcgcatttgctgcatgctttgcagaaagcatactggctgagtgagttgatattata
+acctgataccctgattcacttaatgtgacaagtgattctctgacagaattaatggctgaa
+gggtgtaaatataactcaggttcatcaatgaaaatcaaagtgtttgatttttttgattcg
+ctgttttctttttttatttcggccaggtattgaattaatgccatttgaatggaacgttgt
+gttccgtgaccaaatcggctgatatctctcattaccggttcatcttcccgagactcaaaa
+actttcagagtgccggatttaaatatctcatctaatgtcggtgtgggaaagtgtaacttt
+acacttacgtcaggaaaaaattggtttacttttttatttacacctgagtctattttatta
+aggctttctaatctgttctcaccgttgtgagaaagatatttacctatttctgatatgttt
+tttgaaaatttttcttcgtgttcttgttttatttcagaaacaattgcggaaagtatcttt
+cctattgtggtcgtgtttttgcattttgttgagtcttcgacagcgtcagacattgcaggg
+atatgaattggttccggaaatatattggagattgcaccatctatgccgccagggtttttc
+ttccacgtggtaccgtcatatacatccagactttttttggcttttcctgtttccttatta
+aattcctgtcttcttgcaaaggtaagagtcccgtcaattataaacggagctattttttgt
+tgattctcttctgttaacaaagacagagtatcatctgttataccttgaataacgccttca
+acggatacggggtgtgtaggatcgtacacatctgattctgaaatcaaagagccatctaac
+agccacttaattgctaagataatatttgattttcctgcgttattataaccaactaaagca
+gtgaaggggcgcaaaatagccgatgttgacttacaagaacgaaagttgctaattgaaact
+gaagcaagacgtacagtcattatttttccttaaatgtgctatttgtatgcaatgagttca
+tacgaaacgcttttttacattttatagtcgttgcattcaagggtgcatgagattgcatta
+agggaaactgtgatatggcttggcttttgactggaaatactgatggctcattagttttat
+taaggtgcattaaaaccgccccgtgaagcgggcgggcgaggcggggaaagcac
diff --git a/etc/af063097_v_b132222.crunch b/etc/af063097_v_b132222.crunch
new file mode 100644
index 0000000000000000000000000000000000000000..b89fbf8e85cc3258dcb73ef351c27d64c7be8411
--- /dev/null
+++ b/etc/af063097_v_b132222.crunch
@@ -0,0 +1,199 @@
+76 50.00 207 440 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 201 434 AF063097 AF063097 Bacteriophage P2, complete genome.
+373 52.00 208 1179 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 202 1173 AF063097 AF063097 Bacteriophage P2, complete genome.
+423 65.00 224 1165 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 218 1159 AF063097 AF063097 Bacteriophage P2, complete genome.
+90 71.00 999 1163 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 993 1157 AF063097 AF063097 Bacteriophage P2, complete genome.
+46 29.00 1665 1958 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2328 2621 AF063097 AF063097 Bacteriophage P2, complete genome.
+104 70.00 1978 2127 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1241 1390 AF063097 AF063097 Bacteriophage P2, complete genome.
+666 77.00 2103 3284 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1366 2547 AF063097 AF063097 Bacteriophage P2, complete genome.
+204 66.00 3360 3794 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2623 3057 AF063097 AF063097 Bacteriophage P2, complete genome.
+571 81.00 3881 4750 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3152 4021 AF063097 AF063097 Bacteriophage P2, complete genome.
+651 76.00 4814 5872 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4068 5126 AF063097 AF063097 Bacteriophage P2, complete genome.
+214 82.00 5895 6236 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5154 5495 AF063097 AF063097 Bacteriophage P2, complete genome.
+148 67.00 6243 6545 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5508 5810 AF063097 AF063097 Bacteriophage P2, complete genome.
+525 58.00 2135 3361 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1398 2624 AF063097 AF063097 Bacteriophage P2, complete genome.
+143 57.00 3446 3793 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2709 3056 AF063097 AF063097 Bacteriophage P2, complete genome.
+210 69.00 3883 4326 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3154 3597 AF063097 AF063097 Bacteriophage P2, complete genome.
+44 47.00 4378 4542 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3649 3813 AF063097 AF063097 Bacteriophage P2, complete genome.
+54 53.00 4582 4722 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3853 3993 AF063097 AF063097 Bacteriophage P2, complete genome.
+49 61.00 2173 2286 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1436 1549 AF063097 AF063097 Bacteriophage P2, complete genome.
+271 53.00 2476 3234 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1739 2497 AF063097 AF063097 Bacteriophage P2, complete genome.
+67 49.00 3640 3867 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2903 3130 AF063097 AF063097 Bacteriophage P2, complete genome.
+226 54.00 3915 4544 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3186 3815 AF063097 AF063097 Bacteriophage P2, complete genome.
+53 48.00 4581 4763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3852 4034 AF063097 AF063097 Bacteriophage P2, complete genome.
+94 61.00 5178 5393 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4432 4647 AF063097 AF063097 Bacteriophage P2, complete genome.
+91 35.00 5424 5879 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4678 5133 AF063097 AF063097 Bacteriophage P2, complete genome.
+140 52.00 5860 6246 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5119 5505 AF063097 AF063097 Bacteriophage P2, complete genome.
+45 36.00 6355 6555 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5620 5820 AF063097 AF063097 Bacteriophage P2, complete genome.
+73 57.00 5182 5388 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4436 4642 AF063097 AF063097 Bacteriophage P2, complete genome.
+68 52.00 5542 5727 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4796 4981 AF063097 AF063097 Bacteriophage P2, complete genome.
+129 58.00 5885 6229 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5144 5488 AF063097 AF063097 Bacteriophage P2, complete genome.
+290 65.00 6734 7306 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5997 6569 AF063097 AF063097 Bacteriophage P2, complete genome.
+137 44.00 6792 7301 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6055 6564 AF063097 AF063097 Bacteriophage P2, complete genome.
+59 54.00 6826 6993 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6089 6256 AF063097 AF063097 Bacteriophage P2, complete genome.
+167 61.00 7078 7449 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6341 6712 AF063097 AF063097 Bacteriophage P2, complete genome.
+188 90.00 7452 7721 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6716 6985 AF063097 AF063097 Bacteriophage P2, complete genome.
+390 90.00 7699 8232 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6961 7494 AF063097 AF063097 Bacteriophage P2, complete genome.
+130 63.00 7442 7714 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6706 6978 AF063097 AF063097 Bacteriophage P2, complete genome.
+151 47.00 7725 8231 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6987 7493 AF063097 AF063097 Bacteriophage P2, complete genome.
+131 66.00 7453 7713 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6717 6977 AF063097 AF063097 Bacteriophage P2, complete genome.
+108 50.00 7721 8035 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6983 7297 AF063097 AF063097 Bacteriophage P2, complete genome.
+58 60.00 8090 8224 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7352 7486 AF063097 AF063097 Bacteriophage P2, complete genome.
+413 50.00 8286 9500 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7991 9205 AF063097 AF063097 Bacteriophage P2, complete genome.
+177 72.00 8485 8775 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8190 8480 AF063097 AF063097 Bacteriophage P2, complete genome.
+259 57.00 8573 9220 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8278 8925 AF063097 AF063097 Bacteriophage P2, complete genome.
+71 43.00 9471 9659 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9179 9367 AF063097 AF063097 Bacteriophage P2, complete genome.
+335 68.00 9720 10343 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10299 10922 AF063097 AF063097 Bacteriophage P2, complete genome.
+161 63.00 10367 10681 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10940 11254 AF063097 AF063097 Bacteriophage P2, complete genome.
+844 62.00 10778 12718 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11349 13289 AF063097 AF063097 Bacteriophage P2, complete genome.
+66 44.00 9826 10089 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10405 10668 AF063097 AF063097 Bacteriophage P2, complete genome.
+78 49.00 10138 10353 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10717 10932 AF063097 AF063097 Bacteriophage P2, complete genome.
+54 45.00 10369 10590 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10942 11163 AF063097 AF063097 Bacteriophage P2, complete genome.
+55 52.00 9968 10117 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10547 10696 AF063097 AF063097 Bacteriophage P2, complete genome.
+53 42.00 10317 10553 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10890 11126 AF063097 AF063097 Bacteriophage P2, complete genome.
+74 44.00 10725 10985 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11296 11556 AF063097 AF063097 Bacteriophage P2, complete genome.
+64 49.00 11040 11255 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11611 11826 AF063097 AF063097 Bacteriophage P2, complete genome.
+140 45.00 10735 11256 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11306 11827 AF063097 AF063097 Bacteriophage P2, complete genome.
+506 68.00 11340 12266 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11911 12837 AF063097 AF063097 Bacteriophage P2, complete genome.
+149 49.00 12378 12908 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12949 13479 AF063097 AF063097 Bacteriophage P2, complete genome.
+650 66.00 11575 12915 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12146 13486 AF063097 AF063097 Bacteriophage P2, complete genome.
+57 65.00 12664 12783 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13367 13486 AF063097 AF063097 Bacteriophage P2, complete genome.
+50 49.00 12964 13080 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13859 13975 AF063097 AF063097 Bacteriophage P2, complete genome.
+99 60.00 13794 14018 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 15011 15235 AF063097 AF063097 Bacteriophage P2, complete genome.
+89 41.00 14145 14480 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17614 17949 AF063097 AF063097 Bacteriophage P2, complete genome.
+89 49.00 14149 14415 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17618 17884 AF063097 AF063097 Bacteriophage P2, complete genome.
+77 45.00 14442 14687 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17920 18165 AF063097 AF063097 Bacteriophage P2, complete genome.
+210 79.00 14153 14488 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17622 17957 AF063097 AF063097 Bacteriophage P2, complete genome.
+596 82.00 14468 15358 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17946 18836 AF063097 AF063097 Bacteriophage P2, complete genome.
+290 68.00 15377 15892 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18855 19370 AF063097 AF063097 Bacteriophage P2, complete genome.
+77 67.00 14617 14763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18095 18241 AF063097 AF063097 Bacteriophage P2, complete genome.
+306 52.00 14814 15746 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18292 19224 AF063097 AF063097 Bacteriophage P2, complete genome.
+46 57.00 15774 15893 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19252 19371 AF063097 AF063097 Bacteriophage P2, complete genome.
+88 63.00 14881 15051 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18359 18529 AF063097 AF063097 Bacteriophage P2, complete genome.
+137 58.00 15154 15495 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18632 18973 AF063097 AF063097 Bacteriophage P2, complete genome.
+43 42.00 15637 15795 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19115 19273 AF063097 AF063097 Bacteriophage P2, complete genome.
+197 53.00 16019 16588 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19429 19998 AF063097 AF063097 Bacteriophage P2, complete genome.
+58 36.00 16685 17026 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20095 20436 AF063097 AF063097 Bacteriophage P2, complete genome.
+262 55.00 17029 17754 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20442 21167 AF063097 AF063097 Bacteriophage P2, complete genome.
+87 46.00 17794 18045 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21207 21458 AF063097 AF063097 Bacteriophage P2, complete genome.
+176 69.00 16032 16367 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19442 19777 AF063097 AF063097 Bacteriophage P2, complete genome.
+276 63.00 16401 16988 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19811 20398 AF063097 AF063097 Bacteriophage P2, complete genome.
+602 78.00 17025 18032 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20438 21445 AF063097 AF063097 Bacteriophage P2, complete genome.
+310 67.00 18108 18650 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21521 22063 AF063097 AF063097 Bacteriophage P2, complete genome.
+141 78.00 18657 18875 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22073 22291 AF063097 AF063097 Bacteriophage P2, complete genome.
+231 60.00 18891 19343 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22312 22764 AF063097 AF063097 Bacteriophage P2, complete genome.
+477 75.00 19373 20152 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22791 23570 AF063097 AF063097 Bacteriophage P2, complete genome.
+186 72.00 20213 20536 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23628 23951 AF063097 AF063097 Bacteriophage P2, complete genome.
+133 63.00 20609 20827 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24036 24254 AF063097 AF063097 Bacteriophage P2, complete genome.
+172 47.00 16231 16806 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19641 20216 AF063097 AF063097 Bacteriophage P2, complete genome.
+47 43.00 16828 17016 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20238 20426 AF063097 AF063097 Bacteriophage P2, complete genome.
+243 49.00 17153 17881 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20566 21294 AF063097 AF063097 Bacteriophage P2, complete genome.
+186 44.00 17924 18643 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21337 22056 AF063097 AF063097 Bacteriophage P2, complete genome.
+68 54.00 18664 18876 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22080 22292 AF063097 AF063097 Bacteriophage P2, complete genome.
+108 45.00 19794 20204 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23212 23622 AF063097 AF063097 Bacteriophage P2, complete genome.
+146 53.00 19798 20181 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23216 23599 AF063097 AF063097 Bacteriophage P2, complete genome.
+49 54.00 20304 20447 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23719 23862 AF063097 AF063097 Bacteriophage P2, complete genome.
+56 48.00 21451 21630 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24517 24696 AF063097 AF063097 Bacteriophage P2, complete genome.
+85 49.00 24663 24875 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27545 27757 AF063097 AF063097 Bacteriophage P2, complete genome.
+120 55.00 25471 25728 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27769 28026 AF063097 AF063097 Bacteriophage P2, complete genome.
+88 39.00 27293 27568 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28592 28867 AF063097 AF063097 Bacteriophage P2, complete genome.
+78 55.00 27563 27763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28865 29065 AF063097 AF063097 Bacteriophage P2, complete genome.
+89 43.00 27776 27982 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29105 29311 AF063097 AF063097 Bacteriophage P2, complete genome.
+106 52.00 28001 28255 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29315 29569 AF063097 AF063097 Bacteriophage P2, complete genome.
+84 42.00 28298 28594 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29615 29911 AF063097 AF063097 Bacteriophage P2, complete genome.
+42 34.00 27999 28259 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29313 29573 AF063097 AF063097 Bacteriophage P2, complete genome.
+64 40.00 28249 27989 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29563 29303 AF063097 AF063097 Bacteriophage P2, complete genome.
+46 53.00 27909 27775 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29238 29104 AF063097 AF063097 Bacteriophage P2, complete genome.
+42 30.00 27997 27785 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29326 29114 AF063097 AF063097 Bacteriophage P2, complete genome.
+75 51.00 25724 25470 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28022 27768 AF063097 AF063097 Bacteriophage P2, complete genome.
+51 38.00 25650 25468 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27948 27766 AF063097 AF063097 Bacteriophage P2, complete genome.
+58 56.00 24874 24719 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27756 27601 AF063097 AF063097 Bacteriophage P2, complete genome.
+56 45.00 22442 22284 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 25484 25326 AF063097 AF063097 Bacteriophage P2, complete genome.
+69 41.00 21869 21672 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24938 24741 AF063097 AF063097 Bacteriophage P2, complete genome.
+116 59.00 21668 21447 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24734 24513 AF063097 AF063097 Bacteriophage P2, complete genome.
+51 38.00 20805 20563 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24232 23990 AF063097 AF063097 Bacteriophage P2, complete genome.
+123 52.00 20536 20192 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23951 23607 AF063097 AF063097 Bacteriophage P2, complete genome.
+375 66.00 20190 19387 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23608 22805 AF063097 AF063097 Bacteriophage P2, complete genome.
+142 53.00 19327 18890 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22748 22311 AF063097 AF063097 Bacteriophage P2, complete genome.
+92 56.00 18881 18657 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22297 22073 AF063097 AF063097 Bacteriophage P2, complete genome.
+225 61.00 18616 18107 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22029 21520 AF063097 AF063097 Bacteriophage P2, complete genome.
+523 71.00 18046 17036 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21459 20449 AF063097 AF063097 Bacteriophage P2, complete genome.
+408 63.00 16966 16007 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20376 19417 AF063097 AF063097 Bacteriophage P2, complete genome.
+580 54.00 15892 14468 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19370 17946 AF063097 AF063097 Bacteriophage P2, complete genome.
+153 78.00 14418 14149 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17887 17618 AF063097 AF063097 Bacteriophage P2, complete genome.
+74 57.00 20516 20295 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23931 23710 AF063097 AF063097 Bacteriophage P2, complete genome.
+95 75.00 20484 20305 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23899 23720 AF063097 AF063097 Bacteriophage P2, complete genome.
+236 43.00 20194 19361 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23612 22779 AF063097 AF063097 Bacteriophage P2, complete genome.
+82 47.00 20072 19797 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23490 23215 AF063097 AF063097 Bacteriophage P2, complete genome.
+68 52.00 18874 18656 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22290 22072 AF063097 AF063097 Bacteriophage P2, complete genome.
+599 52.00 18650 17028 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22063 20441 AF063097 AF063097 Bacteriophage P2, complete genome.
+149 42.00 17015 16431 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20425 19841 AF063097 AF063097 Bacteriophage P2, complete genome.
+126 50.00 16388 16032 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19798 19442 AF063097 AF063097 Bacteriophage P2, complete genome.
+66 50.00 18873 18664 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22289 22080 AF063097 AF063097 Bacteriophage P2, complete genome.
+121 47.00 18651 18238 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22064 21651 AF063097 AF063097 Bacteriophage P2, complete genome.
+88 52.00 18141 17884 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21554 21297 AF063097 AF063097 Bacteriophage P2, complete genome.
+98 51.00 17751 17458 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21164 20871 AF063097 AF063097 Bacteriophage P2, complete genome.
+121 56.00 17361 17038 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20774 20451 AF063097 AF063097 Bacteriophage P2, complete genome.
+190 44.00 16947 16207 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20357 19617 AF063097 AF063097 Bacteriophage P2, complete genome.
+173 72.00 15888 15556 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19366 19034 AF063097 AF063097 Bacteriophage P2, complete genome.
+251 56.00 15572 14904 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19050 18382 AF063097 AF063097 Bacteriophage P2, complete genome.
+302 78.00 15357 14824 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18835 18302 AF063097 AF063097 Bacteriophage P2, complete genome.
+143 73.00 14748 14479 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18226 17957 AF063097 AF063097 Bacteriophage P2, complete genome.
+125 52.00 14479 14144 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17948 17613 AF063097 AF063097 Bacteriophage P2, complete genome.
+67 59.00 14750 14574 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18228 18052 AF063097 AF063097 Bacteriophage P2, complete genome.
+50 45.00 12909 12763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13480 13334 AF063097 AF063097 Bacteriophage P2, complete genome.
+682 53.00 12694 10721 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13265 11292 AF063097 AF063097 Bacteriophage P2, complete genome.
+123 55.00 10710 10366 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11283 10939 AF063097 AF063097 Bacteriophage P2, complete genome.
+246 60.00 10297 9716 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10876 10295 AF063097 AF063097 Bacteriophage P2, complete genome.
+127 77.00 12746 12513 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13317 13084 AF063097 AF063097 Bacteriophage P2, complete genome.
+59 82.00 12413 12315 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12984 12886 AF063097 AF063097 Bacteriophage P2, complete genome.
+437 45.00 12260 10731 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12831 11302 AF063097 AF063097 Bacteriophage P2, complete genome.
+83 40.00 10651 10367 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11224 10940 AF063097 AF063097 Bacteriophage P2, complete genome.
+102 50.00 10280 10029 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10859 10608 AF063097 AF063097 Bacteriophage P2, complete genome.
+61 36.00 9983 9714 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10562 10293 AF063097 AF063097 Bacteriophage P2, complete genome.
+611 55.00 12696 11092 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13267 11663 AF063097 AF063097 Bacteriophage P2, complete genome.
+69 78.00 10935 10801 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11506 11372 AF063097 AF063097 Bacteriophage P2, complete genome.
+57 54.00 10116 9967 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10695 10546 AF063097 AF063097 Bacteriophage P2, complete genome.
+46 32.00 9500 9156 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9205 8861 AF063097 AF063097 Bacteriophage P2, complete genome.
+358 46.00 9499 8228 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9204 7933 AF063097 AF063097 Bacteriophage P2, complete genome.
+199 58.00 9021 8485 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8726 8190 AF063097 AF063097 Bacteriophage P2, complete genome.
+43 40.00 9011 8841 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8716 8546 AF063097 AF063097 Bacteriophage P2, complete genome.
+155 46.00 8774 8229 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8479 7934 AF063097 AF063097 Bacteriophage P2, complete genome.
+156 49.00 8245 7724 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7507 6986 AF063097 AF063097 Bacteriophage P2, complete genome.
+100 66.00 7713 7519 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6977 6783 AF063097 AF063097 Bacteriophage P2, complete genome.
+264 74.00 8228 7731 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7490 6993 AF063097 AF063097 Bacteriophage P2, complete genome.
+135 69.00 7714 7451 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6978 6715 AF063097 AF063097 Bacteriophage P2, complete genome.
+243 53.00 7449 6727 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6712 5990 AF063097 AF063097 Bacteriophage P2, complete genome.
+189 51.00 8223 7723 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7485 6985 AF063097 AF063097 Bacteriophage P2, complete genome.
+125 61.00 7715 7452 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6979 6716 AF063097 AF063097 Bacteriophage P2, complete genome.
+144 52.00 7448 7050 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6711 6313 AF063097 AF063097 Bacteriophage P2, complete genome.
+66 52.00 7007 6825 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6270 6088 AF063097 AF063097 Bacteriophage P2, complete genome.
+170 47.00 7309 6791 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6572 6054 AF063097 AF063097 Bacteriophage P2, complete genome.
+66 40.00 6554 6258 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5819 5523 AF063097 AF063097 Bacteriophage P2, complete genome.
+132 51.00 6236 5880 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5495 5139 AF063097 AF063097 Bacteriophage P2, complete genome.
+351 45.00 5878 4817 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5132 4071 AF063097 AF063097 Bacteriophage P2, complete genome.
+127 46.00 4751 4368 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4022 3639 AF063097 AF063097 Bacteriophage P2, complete genome.
+241 61.00 4372 3881 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3643 3152 AF063097 AF063097 Bacteriophage P2, complete genome.
+611 51.00 3876 2134 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3139 1397 AF063097 AF063097 Bacteriophage P2, complete genome.
+98 52.00 6544 6245 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5809 5510 AF063097 AF063097 Bacteriophage P2, complete genome.
+133 58.00 6235 5894 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5494 5153 AF063097 AF063097 Bacteriophage P2, complete genome.
+301 68.00 5871 5245 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5125 4499 AF063097 AF063097 Bacteriophage P2, complete genome.
+161 68.00 5154 4816 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4408 4070 AF063097 AF063097 Bacteriophage P2, complete genome.
+401 66.00 4749 3880 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4020 3151 AF063097 AF063097 Bacteriophage P2, complete genome.
+1286 85.00 3871 2000 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3134 1263 AF063097 AF063097 Bacteriophage P2, complete genome.
+48 58.00 6228 6130 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5487 5389 AF063097 AF063097 Bacteriophage P2, complete genome.
+72 58.00 6069 5884 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5328 5143 AF063097 AF063097 Bacteriophage P2, complete genome.
+125 50.00 5840 5460 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5094 4714 AF063097 AF063097 Bacteriophage P2, complete genome.
+95 53.00 5393 5109 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4647 4363 AF063097 AF063097 Bacteriophage P2, complete genome.
+44 59.00 4916 4815 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4170 4069 AF063097 AF063097 Bacteriophage P2, complete genome.
+122 47.00 4750 4427 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4021 3698 AF063097 AF063097 Bacteriophage P2, complete genome.
+168 66.00 4319 3975 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3590 3246 AF063097 AF063097 Bacteriophage P2, complete genome.
+128 52.00 3857 3486 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3120 2749 AF063097 AF063097 Bacteriophage P2, complete genome.
+199 58.00 3254 2778 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2517 2041 AF063097 AF063097 Bacteriophage P2, complete genome.
+89 65.00 2729 2544 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1992 1807 AF063097 AF063097 Bacteriophage P2, complete genome.
+63 52.00 2495 2346 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1758 1609 AF063097 AF063097 Bacteriophage P2, complete genome.
+126 54.00 2285 1977 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1548 1240 AF063097 AF063097 Bacteriophage P2, complete genome.
+84 44.00 1958 1665 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2621 2328 AF063097 AF063097 Bacteriophage P2, complete genome.
+58 45.00 1391 1251 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2021 1881 AF063097 AF063097 Bacteriophage P2, complete genome.
+264 47.00 1222 362 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1216 356 AF063097 AF063097 Bacteriophage P2, complete genome.
+645 78.00 1209 208 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1203 202 AF063097 AF063097 Bacteriophage P2, complete genome.
+267 49.00 1145 303 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1139 297 AF063097 AF063097 Bacteriophage P2, complete genome.
diff --git a/etc/b132222.embl b/etc/b132222.embl
new file mode 100644
index 0000000000000000000000000000000000000000..4e4dcccab25a233bb3e0108d7c4d1e4b00bb9b86
--- /dev/null
+++ b/etc/b132222.embl
@@ -0,0 +1,1512 @@
+ID   B132222    standard; DNA; PHG; 30624 BP.
+XX
+AC   U32222; U51471; X04449; X53318;
+XX
+SV   U32222.1
+XX
+DT   27-OCT-1995 (Rel. 45, Created)
+DT   09-SEP-1998 (Rel. 56, Last updated, Version 6)
+XX
+DE   Bacteriophage 186, complete sequence.
+XX
+KW   .
+XX
+OS   Enterobacteria phage 186
+OC   Viruses; dsDNA viruses, no RNA stage; Caudovirales; Myoviridae;
+OC   P2-like Viruses.
+XX
+RN   [1]
+RP   20315-23876
+RX   MEDLINE; 87112711.
+RA   Kalionis B., Dodd I.B., Egan J.B.;
+RT   "Control of gene expression in the P2-related template coliphages. III. DNA
+RT   sequence of the major control region of phage 186";
+RL   J. Mol. Biol. 191(2):199-209(1986).
+XX
+RN   [2]
+RP   23435-24666
+RX   MEDLINE; 89199647.
+RA   Richardson H., Puspurs A., Egan J.B.;
+RT   "Control of gene expression in the P2-related temperate coliphage 186. VI.
+RT   Sequence analysis of the early lytic region";
+RL   J. Mol. Biol. 206(1):251-255(1989).
+XX
+RN   [3]
+RP   22430-23430
+RX   MEDLINE; 90317829.
+RA   Dodd I.B., Kalionis B., Egan J.B.;
+RT   "Control of gene expression in the temperate coliphage 186. VIII. Control
+RT   of lysis and lysogeny by a transcriptional switch involving face-to-face
+RT   promoters";
+RL   J. Mol. Biol. 214(1):27-37(1990).
+XX
+RN   [4]
+RP   12142-14054
+RX   MEDLINE; 95407087.
+RA   Xue Q., Egan J.B.;
+RT   "DNA sequence of tail fiber genes of coliphage 186 and evidence for a
+RT   common ancestor shared by dsDNA phage fiber genes";
+RL   Virology 212(1):128-133(1995).
+XX
+RN   [5]
+RP   14042-15941
+RX   MEDLINE; 95407099.
+RA   Xue Q., Egan J.B.;
+RT   "Tail sheath and tail tube genes of the temperate coliphage 186";
+RL   Virology 212(1):218-221(1995).
+XX
+RN   [6]
+RP   11442-18696
+RA   Xue Q.;
+RT   "Studies on the tail region of the temperate coliphage 186 genome";
+RL   Thesis (1993), University of Adelaide
+XX
+RN   [7]
+RP   1-20866
+RX   MEDLINE; 98371265.
+RA   Portelli R., Dodd I.B., Xue Q., Egan J.B.;
+RT   "The late-expressed region of the temperate coliphage 186 genome";
+RL   Virology 248(1):117-130(1998).
+XX
+RN   [8]
+RP   1-30624
+RA   Dodd I.B., Egan J.B.;
+RT   "Bacteriophage 186 complete genome";
+RL   Unpublished.
+XX
+RN   [9]
+RP   11442-18696
+RA   Xue Q., Egan J.B.;
+RT   ;
+RL   Submitted (25-JUL-1995) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Biochemistry, University of Adelaide, Adelaide, SA 5005,
+RL   Australia
+XX
+RN   [10]
+RP   1-30624
+RA   Xue Q., Egan J.B.;
+RT   ;
+RL   Submitted (15-MAY-1998) to the EMBL/GenBank/DDBJ databases.
+RL   Department of Biochemistry, University of Adelaide, Adelaide, SA 5005,
+RL   Australia
+XX
+DR   SPTREMBL; O80303; O80303.
+DR   SPTREMBL; O80304; O80304.
+DR   SPTREMBL; O80305; O80305.
+DR   SPTREMBL; O80306; O80306.
+DR   SPTREMBL; O80307; O80307.
+DR   SPTREMBL; O80308; O80308.
+DR   SPTREMBL; O80309; O80309.
+DR   SPTREMBL; O80310; O80310.
+DR   SPTREMBL; O80311; O80311.
+DR   SPTREMBL; O80312; O80312.
+DR   SPTREMBL; O80313; O80313.
+DR   SPTREMBL; O80314; O80314.
+DR   SPTREMBL; O80315; O80315.
+DR   SPTREMBL; O80316; O80316.
+DR   SPTREMBL; O80317; O80317.
+DR   SPTREMBL; Q01088; Q01088.
+DR   SPTREMBL; Q37840; Q37840.
+DR   SPTREMBL; Q37841; Q37841.
+DR   SPTREMBL; Q37842; Q37842.
+DR   SPTREMBL; Q37843; Q37843.
+DR   SPTREMBL; Q37844; Q37844.
+DR   SPTREMBL; Q37845; Q37845.
+DR   SPTREMBL; Q37846; Q37846.
+DR   SPTREMBL; Q37848; Q37848.
+DR   SPTREMBL; Q37850; Q37850.
+DR   SPTREMBL; Q37851; Q37851.
+DR   SPTREMBL; Q9T0R3; Q9T0R3.
+DR   SWISS-PROT; P06723; VINT_BP186.
+DR   SWISS-PROT; P08685; CP69_BP186.
+DR   SWISS-PROT; P08707; RPC1_BP186.
+DR   SWISS-PROT; P08711; VPB_BP186.
+DR   SWISS-PROT; P15236; VFIL_BP186.
+DR   SWISS-PROT; P21678; RPC2_BP186.
+DR   SWISS-PROT; P21679; VPD_BP186.
+DR   SWISS-PROT; P21680; VDHR_BP186.
+DR   SWISS-PROT; P21681; VAPL_BP186.
+DR   SWISS-PROT; P21682; CP79_BP186.
+DR   SWISS-PROT; P41059; CP80_BP186.
+DR   SWISS-PROT; P41060; CP81_BP186.
+DR   SWISS-PROT; P41061; CP83_BP186.
+DR   SWISS-PROT; P41062; CP84_BP186.
+DR   SWISS-PROT; P41063; TUM_BP186.
+DR   SWISS-PROT; P41064; VPA_BP186.
+XX
+CC   On Jul 23, 1998 this sequence version replaced gi:14895 gi:15549
+CC   gi:1262241 gi:974436.
+XX
+FH   Key             Location/Qualifiers
+FH
+FT   source          1..30624
+FT                   /db_xref="taxon:29252"
+FT                   /organism="Enterobacteria phage 186"
+FT   misc_recomb     1..19
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="cos; cohesive end; top strand cut at 5' end and
+FT                   bottom strand cut at 3' end"
+FT                   /organism="Enterobacteria phage 186"
+FT   terminator      complement(164..187)
+FT                   /evidence=NOT_EXPERIMENTAL
+FT                   /note="tW"
+FT                   /gene="W"
+FT   CDS             complement(196..1218)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37851"
+FT                   /note="Orf2; P2 Q homolog"
+FT                   /transl_table=11
+FT                   /gene="W"
+FT                   /product="capsid portal protein"
+FT                   /protein_id="AAC34146.1"
+FT                   /translation="MSKRKPRKQVAMTASAPQKMEAFTFGEPVPVLDKRDILDYVECIS
+FT                   NGKWYEPPVSFSGLAKSLRSAVHHSSPIYVKRNVLASTYIPHPLLSRQDFSRFALDYLV
+FT                   FGNAFLEQRHSVTGQLIKLLASPAKYTRRGVDDSVFWFVENFTLPHEFAPDTVFHLLEP
+FT                   DINQEIYGLPEYLSALNSAWLNESATLFRRKYYQNGAHAGYIMYVTDPAQSATDVESLR
+FT                   EAMRNSKGLGNFKNLFFYAPNGKPDGIKIVPLSEVATKDDFFNIKKASAADLMDAHRVP
+FT                   FQLMGGKPENIGSLGDVEKVAKVFVRNDLSPLQDRFREVNDWLGMEVIRFKEYTLDNPE
+FT                   "
+FT   CDS             complement(1215..1961)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80303"
+FT                   /note="similar to Orf12"
+FT                   /transl_table=11
+FT                   /gene="W"
+FT                   /product="W protein"
+FT                   /protein_id="AAC34147.1"
+FT                   /translation="MKNNVFSQSQIQAMADILHNDSFDYQATWLRVGKLNIDRSITKSR
+FT                   QIGATQLFSREALLDALTTGDNHVWFAHTIEHARVALMYMSNLSARVGVSLTSNGHSLQ
+FT                   LDDGAVISFVGEESHCAALAGNVYLDEFGWFNNPLRAAKVAAGIACHKRHSLTMFTSPS
+FT                   DNYDAFRVWNGTTRRHRPSPLINTGDSVFCTDGVWRQSVTLDAACQRGCNLFAPDEIKH
+FT                   EYSDDDYRLLFGCDWSFAVAAGEVAA"
+FT   CDS             complement(1961..3730)
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q9T0R3"
+FT                   /note="Orf12; P2 P homolog; contains putative
+FT                   helix-turn-helix DNA-binding motif"
+FT                   /transl_table=11
+FT                   /product="terminase subunit"
+FT                   /protein_id="AAC34148.1"
+FT                   /translation="MTISTDTTLLHDPRRQASLLYWQGFSVPQIAEMLQVKRPTVQSWK
+FT                   QRDGWDGIAPISRVESSLEARLIQLIAKPQKSGGDFKEIDLLGRQIERLARVNRYSQTG
+FT                   NEADLNPNVANRNKGERKKPKKNFFSDEAIEKLEELFFDQSFEYQLQWYRAGLAHRIRD
+FT                   ILKSRQIGATFYFSREALLRALKTGHNQIFLSASKTQAYVFREYIIQFARLVDVDLTGD
+FT                   PIVIGNNGAKLIFLGTNSNTAQSHNGDLYVDEIFWIPNFQKLRKVASGMASQKHLRSTY
+FT                   FSTPSTLAHGAYPFWSGELFNKGRSRIADRIEIDISHRALAGGQLCDDGQWRQIVTIED
+FT                   ALAGGCTLFDLDQLKRENSDEDFKNLFMCEFVDDKASVFPFEELQRCMVDVMEEWEDFA
+FT                   PFADHPFGSRPVWIGYDPSHTGDSAGCVVLAPPVVSGGKFRMLERHQWKGMDFAAQADG
+FT                   IRKLTEKYSVEYIGIDATGLGLGVFQLVRSFYPAARGIRYTPEMKTAMVLKAKDTIRRG
+FT                   CLEYDAGATDVTQSFMSIRKTMTSSGRSATYEASRTEEASHADIAWATMHALLNEPLSA
+FT                   GSGIQPKSILEFN"
+FT   promoter        complement(3753..3790)
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="p12"
+FT                   /function="B-dependent transcription of orf12 operon"
+FT   protein_bind    3798..3817
+FT                   /evidence=EXPERIMENTAL
+FT                   /bound_moiety="B protein"
+FT                   /function="activation of pV and p12 promoters"
+FT   promoter        3828..3865
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pV"
+FT                   /gene="V"
+FT                   /function="B-dependent transcription of V operon"
+FT   CDS             3896..4750
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q01088"
+FT                   /note="presumed capsid scaffold; P2 O homolog"
+FT                   /transl_table=11
+FT                   /gene="V"
+FT                   /product="V protein"
+FT                   /protein_id="AAC34149.1"
+FT                   /translation="MAKKVSKFFRIGVEGDTCDGRIISASDIQEMAETYDPRVYGCRIN
+FT                   LEHLRGLLPDGIFKRYGDVVELKAEKIDDDSALNGKWALFAKITPTDDLIAMNKAAQKV
+FT                   YTSMEIQPNFANTGKCYLVGLAVTDDPASLGTEYLEFCRTAKHNPLQRFKAHPENVFSA
+FT                   ATLAELEFEDVPDTVLNSLADKVKAIFSRKQVSDDARLNDVHEAVTAVSEHVQTNLTAQ
+FT                   DKRLSDMETAFATFKQELTGKVEETSQAFSVLKTTLDKTESFSQPRRTKASGGGGDELL
+FT                   TDC"
+FT   variation       3980
+FT                   /note="Vam38; glutamine to amber"
+FT                   /replace="t"
+FT                   /gene="V"
+FT   CDS             4826..5893
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80304"
+FT                   /note="T protein; P2 N homolog"
+FT                   /transl_table=11
+FT                   /gene="T"
+FT                   /product="major capsid protein"
+FT                   /protein_id="AAC34150.1"
+FT                   /translation="MRQETRFKFNAYLTQLAKLNGISVDDVSKKFTVEPSVTQTLMNTV
+FT                   QASSAFLQMINILPVAEMKGEKIGVGVTGTIASTTDTSGDKERQTADFTALESNKYECN
+FT                   QINFDFHLTYKRLDLWARFQDFQRRIRDAIVQRQALDFIMAGFNGTTRADTSDRVKNPM
+FT                   LQDVAVGWLQKYRNEAPARVMSNITDADGKVVSAVIRVGKNGDYENLDALVMDGTNTLI
+FT                   DEIYQDDPKLVAIVGRKLLADKYFPLVNKQQENTESLAADIIISQKRIGNLPAVRVPYF
+FT                   PANAVFVTTLENLSIYFMDESHRRSIDENPKKDRVENYESMNIDYVVEAYAAGCLLENI
+FT                   TLGDFTAPAAPEGGE"
+FT   CDS             5898..6647
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80305"
+FT                   /note="terminase subunit; P2 M homolog"
+FT                   /transl_table=11
+FT                   /gene="R"
+FT                   /product="R protein"
+FT                   /protein_id="AAC34151.1"
+FT                   /translation="MTSPAQRHMMRVSASQAAQREQAPLRHATAYEQMLVKLADDRRTL
+FT                   KNIRSNERKAEKKRELLPFYAPWVAGVLTDGRGAQDDIVMTVMLWRLDAGDIAGALEIA
+FT                   PYALKYGLTSDHRRTTPYMLVEEVALAAQRLRDAGESVDLSWLQATIDLTDGADVPDMV
+FT                   RARLHKVTGLTLRDAGMNAEALAQFQRAMQLDRNAGVRKEIERLERALKPKTEAAPRKT
+FT                   TKPRTRKPATKPAAKRGRPPKAAKTAG"
+FT   CDS             6740..7246
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80306"
+FT                   /note="capsid completion protein; P2 L homolog"
+FT                   /transl_table=11
+FT                   /gene="Q"
+FT                   /product="Q protein"
+FT                   /protein_id="AAC34152.1"
+FT                   /translation="MTTVILNQPDEPQDVPGVVIPAPETGGAVIKNTFFFPDVDPKRVR
+FT                   ELMRLEQTVSDARLRNAIKTGMAETNAELYDYRLRQTAAGFKQLADVPAEEIDGENVRV
+FT                   FHYLSAVTAMATATLYERYRGVEATGKGDKKADSVETTIDDLWRDMRWSVARLQDKPRC
+FT                   IVGQL"
+FT   CDS             7246..7449
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80307"
+FT                   /note="Orf23; P2 X homolog; tail protein"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34153.1"
+FT                   /translation="MKVRSMQGDTLDTICARYYGRTEGVVETVLQANPGLSELGVILPN
+FT                   GTEIDLPDVASSPVTKTINLWE"
+FT   CDS             7452..7748
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80308"
+FT                   /note="Orf24; P2 Y homolog; holin"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34154.1"
+FT                   /translation="MTEGEKGVLSLFVIGVMIVVGKVLAGGEPITPRLFIGRMLLGGFV
+FT                   SMVAGVVLVQFPDMSLPAVCGIGSMLGIAGYQVVEIAIQRRFKSQKGESDAGH"
+FT   CDS             7735..8232
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80309"
+FT                   /note="endolysin; P2 K and lambda S homolog"
+FT                   /transl_table=11
+FT                   /gene="P"
+FT                   /product="P protein"
+FT                   /protein_id="AAC34155.1"
+FT                   /translation="MPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTGLDGRP
+FT                   EIFTDYSDHPFAHGRPPKVFNRRGEKSTASGRYQQLYLFWPHYQKQLALPDFSPLSQDK
+FT                   LAIQLIRERGALDDIRAGRIERAVSRCRNIWASLPGAGYGQREHGLEKLVTIWRTAGGV
+FT                   VA"
+FT   variation       7999
+FT                   /note="Pam65"
+FT                   /replace="t"
+FT                   /gene="P"
+FT   CDS             8229..8642
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80310"
+FT                   /note="Orf27; P2 LysB homolog; control of lysis"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34156.1"
+FT                   /translation="MKVLITLLVMAVLGLLWLHHENGNLSRSFETANRVASEQKTTIGM
+FT                   LKNQLSVAGQLARRNESAQVTLREQLAKASAEASRREQTITRLLNENEAFRRWYNAALP
+FT                   DAVRRLHTRTACASAGDCGQRMPEGEPLPYAGK"
+FT   CDS             8497..8787
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80311"
+FT                   /note="Orf28; homologs present in other phages, e.g. P2,
+FT                   HP1"
+FT                   /transl_table=11
+FT                   /product="unknown"
+FT                   /protein_id="AAC34157.1"
+FT                   /translation="MKMKPFAAGITLLCLMLCVGCTPEQPAPVPVIVVNGCPRVSLCPM
+FT                   PGSDPKTNGDLSADIRRLEGALTACALQVKTVKHCQDELDAEAQKPAQSAD"
+FT   CDS             8750..9217
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80312"
+FT                   /note="P2 R homolog; tail completion protein"
+FT                   /transl_table=11
+FT                   /gene="N"
+FT                   /product="N protein"
+FT                   /protein_id="AAC34158.1"
+FT                   /translation="MQKHKSLRKALINAVPQLRNNPDMLRLFADNGHTDSRLASSLSFE
+FT                   KVYVLNVVVTDFTGDLDLIFVPVQAWLREHQPDIMTTDDGREKGFTWIIDINNDDSLDI
+FT                   SISLRLTERTLVKEVGGALHVSYAPEPPLPELVKRPVAMYANGELVSQWDE"
+FT   variation       8877
+FT                   /note="Nam47"
+FT                   /replace="a"
+FT                   /gene="N"
+FT   CDS             9210..9659
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80313"
+FT                   /note="P2 S homolog; tail completion protein"
+FT                   /transl_table=11
+FT                   /gene="O"
+FT                   /product="O protein"
+FT                   /protein_id="AAC34159.1"
+FT                   /translation="MSELTALQERLAGLIASLSPAARRKMAAEIAKKLRTSQQQRIKRQ
+FT                   QAPDGTPYAARKRQPVRSKKGRIKREMFAKLRTSRFMKAKGSDSAAVVEFTGKVQRMAR
+FT                   VHQYGLKDRPNRNSRDVQYEARPLLGFTRDDEQMIEDVIISHLGK"
+FT   variation       9324
+FT                   /note="Oam61"
+FT                   /replace="t"
+FT                   /gene="O"
+FT   variation       9345
+FT                   /note="Oam62"
+FT                   /replace="t"
+FT                   /gene="O"
+FT   CDS             9729..10370
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80314"
+FT                   /note="Orf32; P2 V homolog; baseplate protein"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34160.1"
+FT                   /translation="MNTLSTIQELARAIRNLIRSGVVTEVDTVQGLCRVQSGGIQTTWL
+FT                   NWLTTRAGRSRTWWAPSLGEQVLLLAIGGELDTAFVLPGIFSDDNPAPSASADAWHVVF
+FT                   PDGAVIEYEPETSALTVRGIKTADVTASESITATVPVVLVKAETRITLDTPEVVCTNKL
+FT                   TTATLEVQKGGEMRGDIVHNGGTFKSNGVQLDDHGHGGVQRGGAWTEDTK"
+FT   CDS             10367..10714
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80315"
+FT                   /note="P2 W homolog; putative baseplate protein"
+FT                   /transl_table=11
+FT                   /gene="M"
+FT                   /product="M protein"
+FT                   /protein_id="AAC34161.1"
+FT                   /translation="MTARYMGMNRNTGLGISDTEHISQSMRDILLTPVGSRVMRREYGS
+FT                   LLSALIDMPQNPALRLQIMVACYSAIQKWEPRIRLTSISFETGDAGEMYVDITGMRTDT
+FT                   GASVSTTVSLS"
+FT   CDS             10721..11629
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37840"
+FT                   /note="P2 J homolog; baseplate or base of tail fibre"
+FT                   /transl_table=11
+FT                   /gene="L"
+FT                   /protein_id="AAC34162.1"
+FT                   /translation="MATVDLSLLPVPDVVEELDFETILAERIATLISLYPEDQQEAVAR
+FT                   TLALESEPIVKLLQENAYREVIWRQRVNEAARAGMLAYARDSDLDNLGANFNVERLVVR
+FT                   PADDTTIPPTPAEMELDADFRLRIQQAFEGMSVAGSTGAYEFHGRSADGRVADISVISP
+FT                   SPACVTISVLSRENNGAASDELQSIVRNALNAEDVRPVADRVTVQSAQIIDYQIRATLF
+FT                   VYPGPENEPIRAAAEAKLKAYISAQHRLGRDIRLSAIYAALHVEGVQRVELAAPVADIV
+FT                   LDKTQASFCTDYQIVIGGSDE"
+FT   variation       10818
+FT                   /note="Lam21"
+FT                   /replace="a"
+FT                   /gene="L"
+FT   CDS             11622..12152
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37841"
+FT                   /note="Orf38; P2 I homolog; tail protein"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34163.1"
+FT                   /translation="MSDVRLLPVGSSPLEVAAARACADIENTPVPLRRLWSPDTCPANL
+FT                   LPWLAWAFSVDRWDENWPEKTKRDVIRSAYFTHCHKGTIGAVRRVIEPLGYIINVTEWW
+FT                   ETGDPAGTFRLDIGVLESGITEEMYLEMERLIADAKPASRHLIGLNIIQDIPGYMYTGG
+FT                   VSCDGDIITVYPG"
+FT   CDS             12163..13551
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37842"
+FT                   /note="similar to P2 tail fiber protein H, PIR Accession
+FT                   Number B42291"
+FT                   /transl_table=11
+FT                   /gene="K"
+FT                   /protein_id="AAC34164.1"
+FT                   /translation="MSTKFKTIITTAGAEKLAAATVPGGKKVNITVMAVGDGGGKLPVP
+FT                   DAGQVQLVNEVWRHALNKISQDNRNSNYIVAELVIPPEVGGFWMRELGLYDDEGTLIAV
+FT                   ANMAESYKPELAEGSGRAQTCRMVIIVSSIASVELSIDSTMVMATQEYVDDRIAEHEKS
+FT                   RRHPDATLKEKGFTQLSSATDSASEVLAATPKAVKAAYDLANAKYTAQDASTAQKGIVR
+FT                   LSSAADSTSEAEAATPKAVKIAMDNANARLAKDRNGADIPNPPLFVQNIGLKPTVDKAA
+FT                   NAVDKNGDTMNGNLTLKGDYRLSFIIQNEDGSIRAYIFKDKGGDGIRISNGDDGGGDFV
+FT                   FGKNGQFYCPDIMHVGNTIVWGDGNIEGARWGGLLSDWLTAQLVARDNNINLRAPYEWV
+FT                   NQNFVNRAQRGAQASMTMDGGLVEAPWGCFLTGGNGNEGNQVGVALYRPLQILRNNTWV
+FT                   TIEN"
+FT   misc_recomb     12962..12987
+FT                   /note="Mu-like inversion crossover site"
+FT                   /organism="Enterobacteria phage 186"
+FT                   /gene="K"
+FT   CDS             13554..14054
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37843"
+FT                   /note="unnamed protein product"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34165.1"
+FT                   /translation="MKLINLQRYILMNYFLGDGIQYFIDATGKDWYKSLPKFTKKYSLA
+FT                   IENDTGVIRSISEDASRLYPGGLTVVDVDSIPAGCDIFGGWVFDGEKVIPREYTLAEQQ
+FT                   RQSDEKKKTLLAEAEATISTLERAVRLGMATGEEIRRLEAWERYSVLVSRVKQSDDWPQ
+FT                   KPE"
+FT   terminator      14058..14081
+FT                   /evidence=NOT_EXPERIMENTAL
+FT                   /note="t45"
+FT   protein_bind    14091..14110
+FT                   /evidence=NOT_EXPERIMENTAL
+FT                   /bound_moiety="B protein"
+FT                   /function="activation of transcription from pJ"
+FT   promoter        14122..14159
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pJ"
+FT                   /function="B-dependent transcription of J operon"
+FT   promoter        14159
+FT                   /note="initiation point of late promoter pJ"
+FT   CDS             14183..15361
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37844"
+FT                   /note="similar to P2 tail sheath protein FI, Swiss-Prot
+FT                   Accession Number P22501"
+FT                   /transl_table=11
+FT                   /gene="J"
+FT                   /protein_id="AAC34166.1"
+FT                   /translation="MSDFHHGTKVIEINDGTRVISTVATAIVGMVWTASDADAETFPLN
+FT                   EPVLITNVQSAIAKAGKKGTLSASLQAIADQSKPVTVVVRVAEGTGDDAEAQTTSNIIG
+FT                   GTDENGKYTGIKALLTAEAVTGVKPRILGVPGLDTQEVATALASVCISLRAFGYVSAWG
+FT                   CKTISEAMAYRENFSQRELMVIWPDFLAWDTTANATATAYATARALGLRAYIDQTIGWH
+FT                   KTLSNVGVQGVTGISASVFWDLQASGTDADLLNEAGVTTLVRKDGFRFWGNRTCSDDPL
+FT                   FLFENYTRTAQVLADTMAEAHMWAVDKPITASLIRDIVDGINAKFRELKSNGYIVDGEC
+FT                   WFDEESNDKETLKAGKLYIDYDYTPVPPLESLTLRQRITDKYLVNLAESVNS"
+FT   CDS             15377..15898
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37845"
+FT                   /note="similar to P2 tail tube protein FII, Swiss-Prot
+FT                   Accession Number P22502"
+FT                   /transl_table=11
+FT                   /gene="I"
+FT                   /protein_id="AAC34167.1"
+FT                   /translation="MALPRKLKYLNMFNDGLSYMGVVESVTLPKLTRKLENYRGGGMNG
+FT                   AAAIDLGLDDDALTVEWSVGGLPDVALWAQYAAPGADAVPLRFAGSYQRDDTGEIVAVE
+FT                   VVMRGRHKEIDGGENKQGENTSTKLSTVCTYYRLTIDGSDIIEIDTVNMVEKVNGVDRL
+FT                   EQHRRAIGLL"
+FT   terminator      15906..15932
+FT                   /note="tI; partial terminator of pJ transcript"
+FT   CDS             15960..16295
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37846"
+FT                   /note="Orf51; P2 E homolog; tail protein"
+FT                   /transl_table=11
+FT                   /gene="H"
+FT                   /protein_id="AAC34168.1"
+FT                   /translation="MAKAPRKTPEFIDTAGNEIDTVNPNVVTLDKPIKRAGQTIEKVTL
+FT                   IEPNAGTLRGVSLAAVAQSEVDALIKVLPRMTYPALTTQELTAMNLPDMLSLAAKVIGF
+FT                   LSPASAE"
+FT   CDS             <16271..16447
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80316"
+FT                   /note="Orf52; tail protein; probably produced by a
+FT                   translational frameshift from orf51 into orf52"
+FT                   /transl_table=11
+FT                   /gene="H"
+FT                   /protein_id="AAC34169.1"
+FT                   /translation="FVTGFGGIDFPPGLSTDDLMADIAVIFHWPPSELYSLSLTELITW
+FT                   REKALQRSGNHNE"
+FT   variation       16314
+FT                   /note="Ham50"
+FT                   /replace="a"
+FT                   /gene="H"
+FT   variation       16421
+FT                   /note="Ham56"
+FT                   /replace="t"
+FT                   /gene="H"
+FT   CDS             16440..18878
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37848"
+FT                   /note="P2 T homolog; tail protein"
+FT                   /transl_table=11
+FT                   /gene="G"
+FT                   /product="G protein"
+FT                   /protein_id="AAC34170.1"
+FT                   /translation="MSNNLRLEVLLKAVDQATRPLKSIQTASKSLSGDIRDTQKGLRDL
+FT                   NGQASKIDGFRKASAQLAVTSQALDKAKREAGELAVQFKNTTNPTRAQAQALEAARRAA
+FT                   SELQTKYNSLRTSVQRQRSELMQAGINTRTLSADERRLKTSISETTAHVNRQREALARV
+FT                   SAQQAKLSRVKERYKSGKELAGNMAAAGAAGSVSRHGTMAGVKLLMPGYDFTQKNSELQ
+FT                   AVLGVDKQSPEMQALRKQARHVGDNTAASADDAASAQIIIAKSGGDAAAIQARRRVTLN
+FT                   MALSNRRTMEENAALLTGMKSAFQLSNDKIAHIGDVLSMTMNKTAADFDGLSDALTYAA
+FT                   PVAKNAGVSIEQTAAMVGALHDAKITGSMAGTGSRAILSRLQLPPEKAFEAIKELGVKT
+FT                   SDSKGNTRPIFSILKEMQRSFEKNNLGTSQRGEYMKTIFGEEASSAAAVLMEAASSGKL
+FT                   DRLTAAFKASDGKTEELVKVMQDNLGGDFKEFQSAYEAVGTDLFDQQEGSLRKLTQTAT
+FT                   QYVLKLDGWIQKNKGLATTIGIIAGGALALIGIIGGIGLVAWPVVMGINAIIAAAGVLG
+FT                   TVFTVTGSAIVTALGAITWPIVAVGAAIVAGALLIRKYWEPISAFFSGVIEGIMSAFAP
+FT                   VAEMFAPLAPIFDGLGEKLRGVWQWFKDLIAPVKATQETLDSCKNVGVIFGQALASALM
+FT                   RPLNVFNKLRSGVDWLLEKLGIINKESDNLDQTAAKTNAATQGNSYIPATSTYGGYQAY
+FT                   QPVTAPAGRSYIDQSKSEYKITLPGGAAPGHQLDRQLRDTLEQIEREKRARQRASMSHD
+FT                   "
+FT   CDS             18891..19376
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:O80317"
+FT                   /note="P2 U homolog; tail protein"
+FT                   /transl_table=11
+FT                   /gene="F"
+FT                   /product="F protein"
+FT                   /protein_id="AAC34171.1"
+FT                   /translation="MMLALGMFVFERRTLPYQSMQHSKDYRWASNDRVGKPPAYQFLGE
+FT                   GETSIQLAGTLYPAITGGWISLKAVEVMANEGRAWPLIEGTGNILGMYIVDKVSTTHAE
+FT                   FFSDGAARKIDFTLSLKRVDESLTAMFGDLNKQASELLGSAGNLTDKLQSALGGLTA"
+FT   CDS             19373..20542
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P21679"
+FT                   /note="P2 D homolog; tail protein"
+FT                   /transl_table=11
+FT                   /gene="D"
+FT                   /product="D protein"
+FT                   /protein_id="AAC34172.1"
+FT                   /translation="MITGMTIDAGTSLAPAFMLTLNSQDITSNFSDRLISLTMTDNRGF
+FT                   EADQLDIELDDTDGKVELPLRGAVLTLWLGWQGSALLNKGDFTVDEIEHRGAPDILTIR
+FT                   ARSADFRGTLNSRREESWHDTTIGELVSTIAKRNKLTASVADSLKKIPVPHIDQSQESD
+FT                   AVFLTRLADRNGATVSVKAGKLLFLKAGSAMTASGKPVPQMTLTRNDGDRHQFAIADRG
+FT                   AYTGVTAKWLHTKDPKPQKQKVTLKRKPKEKHLRALEHPKAKPVSKKTKAKKEPEAREG
+FT                   EYMAGEADNVLALTTVYASKAQAMRAAQAKWDKLQRGVAEFSITLALGRADLFPETPVR
+FT                   VSGFKRVIDEQAWLISKVTHNLNNSGFTTGLELEVKLSDVEYNAESDDE"
+FT   variation       20378
+FT                   /note="Dam23"
+FT                   /replace="t"
+FT                   /gene="D"
+FT   variation       20492
+FT                   /note="Dam14"
+FT                   /replace="t"
+FT                   /gene="D"
+FT   protein_bind    20548..20596
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="two CI binding sites for repression of pB"
+FT                   /gene="B"
+FT                   /bound_moiety="CI"
+FT   promoter        20549..20584
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pB; repressed by CI"
+FT                   /gene="B"
+FT                   /function="transcription of B gene"
+FT   -35_signal      20549..20554
+FT                   /gene="B"
+FT   -10_signal      20572..20577
+FT                   /gene="B"
+FT   CDS             20609..20827
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P08711"
+FT                   /note="C4 Zn finger protein; P2 Ogr and P4 Delta homolog"
+FT                   /transl_table=11
+FT                   /gene="B"
+FT                   /function="activate late gene promoters"
+FT                   /product="B protein"
+FT                   /protein_id="AAC34173.1"
+FT                   /translation="MFHCPKCHHAAHARTSRYLTENTKERYHQCQNINCSCTFMTMETI
+FT                   ERFIVTPGAIDPAPPHPTVGGQRPLWL"
+FT   variation       20690
+FT                   /note="Bam57"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   variation       20744
+FT                   /note="Bam17"
+FT                   /replace="t"
+FT                   /gene="B"
+FT   terminator      20845..20866
+FT                   /note="tB; termination of transcription from pB and late
+FT                   promoter"
+FT   protein_bind    20889..21147
+FT                   /note="predicted Int arm-type recognition sequences;
+FT                   consensus = YAYCGCCAYTY; 3 sites to left of attP and 2
+FT                   sites to right"
+FT                   /bound_moiety="Int"
+FT   terminator      complement(20930..20957)
+FT                   /note="predicted terminator of lysogenic operon"
+FT   protein_bind    20959..20985
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="IHF DNase I footprint location"
+FT                   /bound_moiety="IHF"
+FT   tRNA            20985..21030
+FT                   /note="truncated"
+FT                   /product="tRNA-Ile"
+FT   misc_feature    20995..21030
+FT                   /note="in common with attB in Escherichia coli, which is in
+FT                   the 3' end of ileY"
+FT   misc_feature    21023..21029
+FT                   /note="attP; predicted crossover region with attB"
+FT   variation       21030..22865
+FT                   /note="del1 deletion"
+FT   protein_bind    21057..21086
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="IHF DNase I footprint location"
+FT                   /bound_moiety="IHF"
+FT   protein_bind    21075..21121
+FT                   /note="five binding sites for Apl excisionase at attP"
+FT                   /bound_moiety="Apl"
+FT   CDS             complement(21157..21408)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P08685"
+FT                   /note="Orf69"
+FT                   /transl_table=11
+FT                   /protein_id="AAC34174.1"
+FT                   /translation="MSVRLAPDGTYVYGQPMLAPNGTYVGGGAPRLAPDGTYVGGVPRL
+FT                   APNGSYVAGRPTLAPDGTYVGGRYHLAPDGTYVGDGSE"
+FT   CDS             complement(21423..22433)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P06723"
+FT                   /note="integrase"
+FT                   /transl_table=11
+FT                   /gene="int"
+FT                   /product="Int"
+FT                   /protein_id="AAC34175.1"
+FT                   /translation="MTVRKNPAGGWICELYPNGAKGKRIRKKFATKGEALAFEQYTVQN
+FT                   PWQEEKEDRRTLKELVDSWYSAHGITLKDGLKRQLAMHHAFECMGEPLARDFDAQMFSR
+FT                   YREKRLKGEYARSNRVKEVSPRTLNLELAYFRAVFNELNRLGEWKGENPLKNMRPFRTE
+FT                   EMEMTWLTHDQISQLLGECNRHDHPDLETVVRICLATGARWSEAESLRKSQLAKYKITY
+FT                   TNTKGRKNRTVPISKELYESLPDDKKGRLFSDCYGAFRSALERTGIELPAGQLTHVLRH
+FT                   TFASHFMMNGGNILVLQRVLGHTDIKMTMRYAHFAPDHLEDAVKLNPLVHITNSK"
+FT   CDS             complement(22433..23011)
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P08707"
+FT                   /note="immunity repressor; DNA-binding protein; has
+FT                   positive and negative autoregulation by control of pL"
+FT                   /transl_table=11
+FT                   /gene="cI"
+FT                   /function="maintenance of lysogeny; repress pB and pR"
+FT                   /product="CI repressor"
+FT                   /protein_id="AAC34176.1"
+FT                   /translation="MRIDSLGWSNVDVLDRICEAYGFSQKIQLANHFDIASSSLSNRYT
+FT                   RGAISYDFAAHCALETGANLQWLLTGEGEAFVNNRESSDAKRIEGFTLSEEILKSDKQL
+FT                   SVDAQFFTKPLTDGMAIRSEGKIYFVDKQASLSDGLWLVDIEGAISIRELTKLPGRKLH
+FT                   VAGGKVPFECGIDDIKTLGRVVGVYSEVN"
+FT   variation       22684..22685
+FT                   /note="cI10"
+FT                   /replace="g"
+FT                   /gene="cI"
+FT   protein_bind    22726..22742
+FT                   /note="FL; unknown function"
+FT                   /gene="cI"
+FT                   /bound_moiety="CI"
+FT   variation       22989
+FT                   /note="cIam461"
+FT                   /replace="t"
+FT                   /gene="cI"
+FT   protein_bind    23011..23067
+FT                   /note="locus of vir mutations; 3 binding sites for CI
+FT                   repressor"
+FT                   /bound_moiety="CI"
+FT                   /function="repression of pR"
+FT   -35_signal      23026..23031
+FT                   /note="pR"
+FT   promoter        23026..23063
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pR; repressed by CI and Apl"
+FT                   /function="transcription of early lytic operon"
+FT   -10_signal      23049..23054
+FT                   /note="pR"
+FT   protein_bind    23056..23123
+FT                   /note="7 binding sites for Apl; locus of goa mutations"
+FT                   /bound_moiety="Apl"
+FT                   /function="repression of pR and pL"
+FT   promoter        complement(23125..23159)
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pL; repressed by Apl; inhibited by convergent pR
+FT                   promoter; activated by CI repression of pR"
+FT                   /function="transcription of lysogenic operon"
+FT   -10_signal      complement(23131..23136)
+FT                   /note="pL"
+FT   CDS             23141..23404
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P21681"
+FT                   /note="contains putative helix-turn-helix DNA binding
+FT                   motif"
+FT                   /transl_table=11
+FT                   /gene="apl"
+FT                   /function="excisionase; binds to attL"
+FT                   /function="repressor: binds between and represses pR and
+FT                   pL"
+FT                   /function="appears to assist derepression during prophage
+FT                   induction"
+FT                   /product="Apl"
+FT                   /protein_id="AAC34177.1"
+FT                   /translation="MASEIAIIKVPAPIVTLQQFAELEGVSERTAYRWTTGDNPCVPIE
+FT                   PRTIRKGCKKAGGPIRIYYARWKEEQLRKALGHSRFQLVIGA"
+FT   -35_signal      complement(23154..23159)
+FT                   /note="pL"
+FT                   /gene="apl"
+FT   variation       23205..23219
+FT                   /note="apl11 deletion"
+FT                   /gene="apl"
+FT   variation       23236
+FT                   /note="aplam"
+FT                   /replace="g"
+FT                   /gene="apl"
+FT   promoter        complement(23400..23462)
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="pE; activated by CII, allowing transcription of
+FT                   lysogenic operon"
+FT                   /function="transcript for establishment of lysogeny"
+FT   protein_bind    23404..23420
+FT                   /note="FR"
+FT                   /bound_moiety="CI"
+FT                   /function="probably responsible for CI repression of pE
+FT                   promoter"
+FT   protein_bind    23435..23462
+FT                   /gene="cII"
+FT                   /bound_moiety="CII"
+FT                   /function="activate pE"
+FT   CDS             23435..23944
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P21678"
+FT                   /note="DNA binding protein; has putative helix-turn-helix
+FT                   motif"
+FT                   /transl_table=11
+FT                   /gene="cII"
+FT                   /function="required for establishment of lysogeny"
+FT                   /function="activates pE, alternative lysogenic operon
+FT                   promoter"
+FT                   /product="CII"
+FT                   /protein_id="AAC34178.1"
+FT                   /translation="MFDFQVSKHPHYDEACRAFAQRHNMAKLAERAGMNVQTLRNKLNP
+FT                   EQPHQFTPPELWLLTDLTEDSTLVDGFLAQIHCLPCVPVNELAKDKLQSYVMRAMSELG
+FT                   ELASGAVSDERLTTARKHNMIESVNSGIRMLSLSALALHARLQTNPAMSSVVDTMSGIG
+FT                   ASFGLI"
+FT   variation       23440
+FT                   /note="prevents CII binding to pE; cIV476"
+FT                   /replace="a"
+FT                   /gene="cII"
+FT   variation       23657
+FT                   /note="cIIam475"
+FT                   /replace="t"
+FT                   /gene="cII"
+FT   CDS             23952..24179
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P15236"
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="overexpression blocks cell division"
+FT                   /transl_table=11
+FT                   /gene="fil"
+FT                   /product="Fil"
+FT                   /protein_id="AAC34179.1"
+FT                   /translation="MLKSEPSFASLLVKQSPGMHYGHGWIAGKDGKRWHPCRSQSELLK
+FT                   GLKTKSPKSSGFLIIRIVHFVIKGVKHVTR"
+FT   variation       24112
+FT                   /note="CP77am; filam"
+FT                   /replace="a"
+FT                   /gene="fil"
+FT   CDS             24166..24366
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P21680"
+FT                   /transl_table=11
+FT                   /gene="dhr"
+FT                   /function="inhibits host DNA replication"
+FT                   /product="Dhr"
+FT                   /protein_id="AAC34180.1"
+FT                   /translation="MSRDELRIVLGAMIPNMEEGFEIKTRDGAILRVDPEWECCKEFKD
+FT                   GLKAEIIKQLKSKPAVVFGYS"
+FT   variation       24194
+FT                   /note="CP78am; dhram"
+FT                   /replace="a"
+FT                   /gene="dhr"
+FT   terminator      24384..24412
+FT                   /note="tR1; one of a number of transcription terminators in
+FT                   this region that are anti-terminated during early lytic
+FT                   development by an unknown mechanism"
+FT   CDS             24433..24666
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P21682"
+FT                   /note="unknown function; not essential"
+FT                   /transl_table=11
+FT                   /product="Orf79"
+FT                   /protein_id="AAC34181.1"
+FT                   /translation="MSRTIYLSTPSGAGDHLLESLFKEAKKEERKDRRLAVSIRLEDLA
+FT                   VHITNSDMTGKEAAELLRREATRFENESQELH"
+FT   CDS             24666..24893
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41059"
+FT                   /note="unknown function; not essential"
+FT                   /transl_table=11
+FT                   /product="Orf80"
+FT                   /protein_id="AAC34182.1"
+FT                   /translation="MADAMDLAQLREQEDRERHISNARSRRHEVSAFICEECDAPIPEA
+FT                   RRRAIPGVQCCVTCQEILELKSKHYNGGAL"
+FT   CDS             24890..25474
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41060"
+FT                   /note="unknown function; not essential"
+FT                   /transl_table=11
+FT                   /product="Orf81"
+FT                   /protein_id="AAC34183.1"
+FT                   /translation="MSITNATISQRAKKWLEDDRIFIDTETTGLGDDAEIVEICLIDSA
+FT                   GFIMLNTLVKPTKPIPAEATAIHGITDEMVMYAPTWKDIHGAVASLFFEYGFVIYNADY
+FT                   DTRLIYQTAKLYGLENDGFCYFLNERSACAMMLYAEYRGEPGRFKGYKWHKLVDAAAHE
+FT                   GVSVEGKAHRALADCRMTLGIIDALAKGGAA"
+FT   CDS             25471..25746
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41061"
+FT                   /note="unknown function; not essential"
+FT                   /transl_table=11
+FT                   /product="Orf83"
+FT                   /protein_id="AAC34184.1"
+FT                   /translation="MSIRIEIGDKWVITSDQYQFILNEKKVVKTGNKAGEEWLDTIGYY
+FT                   PKINQLISGLVHHHIHTAMIISLSAMAEEIEKLSFICEEAFKAVKK"
+FT   CDS             25743..26747
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41062"
+FT                   /note="unknown function; not essential. translation to end
+FT                   of orf84 appears necessary for translation of A protein"
+FT                   /transl_table=11
+FT                   /product="Orf84"
+FT                   /protein_id="AAC34185.1"
+FT                   /translation="MIDSRCFAESTINIVSVSGGKDSLAQWILAVENDVPRTTVFADTG
+FT                   HEHSQTMEYLDYLESRLGPVIRVKADFTRRIEGKRKFIAEKWPVSLVEECGMSHEQAAE
+FT                   RIAKALEILKPTGNPFLDLCMWKGRFPSTKARFCSLELKHDSVRDKIVLPALEKYDEVI
+FT                   LWQGVRAQESPARAALPMWEEDADNTPGLHVYRPILNWTHEDVFALAKRHGIKPNPLYQ
+FT                   QGCSRVGCMPCIHARKSELAEIFARWPEEIARVAEWERLVAACSRRGNSTFFPSTHDPR
+FT                   RAEKRIEVVTVEEYGIASYRDWAMTTRGGSQYDLLAATNDKTVCSSVYAGVCE"
+FT   variation       25803
+FT                   /note="am43"
+FT                   /replace="t"
+FT                   /phenotype="lethal due to polarity on A"
+FT   variation       25845..26288
+FT                   /note="del444"
+FT                   /replace=""
+FT   variation       26460
+FT                   /note="am11"
+FT                   /replace="t"
+FT                   /phenotype="lethal due to polarity on A"
+FT   CDS             26744..28828
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41064"
+FT                   /note="rolling circle replicase; putative endonuclease;
+FT                   similar to P2 A protein"
+FT                   /transl_table=11
+FT                   /gene="A"
+FT                   /product="A protein"
+FT                   /protein_id="AAC34186.1"
+FT                   /translation="MTGVVYAFPWNAPRSAIASSYLTYDQQHRRDRMFAALLHARKVLF
+FT                   LQPECVRFDVYRTAAVLEQNQGSQRANAFLISFCKKALPRLELVAKKYECSGINSNVSA
+FT                   AVFDGHFDTQLMQYLASRMVNMVARFNRLPDMSRADIDLLAADIANFIRAELADIDDTG
+FT                   FSELKTLYTWYMRAGFISLQFNVTPPKWERVTKKYFCEDEIAPAVMRMFNEVWWRGRLR
+FT                   RIAAAWREHLQIAVGNVSKKRHAYASKNCVTDWREQKRRTREFLKGLDLEDEEGNRISL
+FT                   IEKYDGSVANPAIRRCELMARIRGFENICNELGYVGEFYTLTAPSKYHATTKAGYRNSK
+FT                   WNGASPSDTQSYLTGLWARIRAKLHREEIRIFGIRVAEPHHDGTPHWHMLMFMLPEDVE
+FT                   RVRLIIRDYAWEEDHYELRSDKAKKARFHAEAIDPEKGSATGYVAKYISKNIDGYALDG
+FT                   ETDDESGELLKETAPAVSAWAARWHIRQFQFIGGAPVTVYRELRRMADPETARALSVEF
+FT                   AAVHDAAHYGRWADYVNAQGGPFVRRDDLQVRTLYEPRTEFNQYGEETVCIKGVYDASI
+FT                   GAGSPILTRLTQWKIVPKRAVDLAVDVKGASAPSRSSVNNCTGSESDPPILDLTKPLSR
+FT                   RERRELTNRLRKKKPTTRRKFIHGTDKQNVAITKTIDEIHSDNRHHNQPGRSPAPDGRW
+FT                   "
+FT   terminator      26829..26856
+FT                   /note="tM1; expected terminator for lytic transcripts in
+FT                   absence of translation of A gene"
+FT                   /gene="A"
+FT   variation       27542
+FT                   /note="Aam24"
+FT                   /replace="t"
+FT                   /gene="A"
+FT   rep_origin      28576
+FT                   /note="located by similarity with P2; consistent with
+FT                   electron microscopy mapping"
+FT                   /gene="A"
+FT   -35_signal      29020..29025
+FT                   /note="p95"
+FT   promoter        29020..29056
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="p95"
+FT                   /function="SOS-dependent transcription of SOS operon"
+FT   -10_signal      29044..29049
+FT                   /note="p95"
+FT   protein_bind    29044..29063
+FT                   /note="putative"
+FT                   /bound_moiety="LexA"
+FT   variation       29053..29055
+FT                   /note="cIII"
+FT                   /replace="tt"
+FT   variation       29074
+FT                   /note="tum9"
+FT                   /replace="a"
+FT   CDS             29082..29522
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41063"
+FT                   /note="expression repressed by LexA"
+FT                   /transl_table=11
+FT                   /gene="tum"
+FT                   /function="inhibits CI DNA binding"
+FT                   /product="Tum"
+FT                   /protein_id="AAC34187.1"
+FT                   /translation="MDRELNEHVMIERVEMIARLTAEGTCQERDREIALNLIAEIARGN
+FT                   LMKNNNFSVVFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFP
+FT                   STRVTVKKGSMTGVELMGFDKDSDREALDSILQEVWEDESWR"
+FT   CDS             29109..29522
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41063"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="tum"
+FT                   /function="modulates SOS induction"
+FT                   /product="truncated Tum95.2"
+FT                   /protein_id="AAC34188.1"
+FT                   /translation="MIERVEMIARLTAEGTCQERDREIALNLIAEIARGNLMKNNNFSV
+FT                   VFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFPSTRVTVKKG
+FT                   SMTGVELMGFDKDSDREALDSILQEVWEDESWR"
+FT   variation       29115
+FT                   /note="tum16"
+FT                   /replace="a"
+FT                   /gene="tum"
+FT   variation       29182
+FT                   /note="tum13"
+FT                   /replace="t"
+FT                   /gene="tum"
+FT   variation       29199
+FT                   /note="tum17"
+FT                   /replace="a"
+FT                   /gene="tum"
+FT   CDS             29220..29522
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41063"
+FT                   /evidence=EXPERIMENTAL
+FT                   /transl_table=11
+FT                   /gene="tum"
+FT                   /function="modulates SOS induction"
+FT                   /product="truncated Tum95.4"
+FT                   /protein_id="AAC34189.1"
+FT                   /translation="MKNNNFSVVFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAF
+FT                   QCELTKRIQSVFPSTRVTVKKGSMTGVELMGFDKDSDREALDSILQEVWEDESWR"
+FT   variation       29245..29251
+FT                   /note="tum14"
+FT                   /replace="ttttt"
+FT                   /gene="tum"
+FT   CDS             29292..29522
+FT                   /codon_start=1
+FT                   /db_xref="SWISS-PROT:P41063"
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="truncated Tum - modulates SOS induction of 186
+FT                   prophage. GTG start codon."
+FT                   /transl_table=11
+FT                   /gene="tum"
+FT                   /product="bacteriophage 186 Tum95.5"
+FT                   /protein_id="AAC34190.1"
+FT                   /translation="MKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFPSTRVTVKKGSM
+FT                   TGVELMGFDKDSDREALDSILQEVWEDESWR"
+FT   variation       29391
+FT                   /note="tum2"
+FT                   /replace="t"
+FT                   /gene="tum"
+FT   terminator      29545..29576
+FT                   /evidence=EXPERIMENTAL
+FT                   /note="t95a; partial termination of p95 transcript"
+FT   CDS             29604..30335
+FT                   /codon_start=1
+FT                   /db_xref="SPTREMBL:Q37850"
+FT                   /note="expression from plasmid blocks 186 infection"
+FT                   /transl_table=11
+FT                   /gene="orf97"
+FT                   /product="Orf97"
+FT                   /protein_id="AAC34191.1"
+FT                   /translation="MDTVIAFLSLALFIAFIVGLIKPSLVRMPSRKRSSAVYLGGCLAL
+FT                   GVIGSILWPTEKTQPVAKTDVPAVKAEPATPTFEYADKTLKEYRNEPKETRHEIVKDYV
+FT                   GFKGVQASATDVFYACMSEYTFTKDDALKLSDVLGWCFNDFEKDPQSLNNKINLDEFQG
+FT                   NFSGWDGSYRPLEKLIKASMNDDSSYKHVSTVYHLILNKDPHAVVKTTFRGTNAYGGVV
+FT                   KQTVAARVNVRTGEVDSILDN"
+FT   variation       29691..30304
+FT                   /note="del97"
+FT                   /replace=""
+FT                   /gene="orf97"
+FT   terminator      30436..30463
+FT                   /note="t95b; p95 transcript terminator"
+XX
+SQ   Sequence 30624 BP; 7461 A; 7801 C; 8456 G; 6906 T; 0 other;
+     ggcgtggcgg ggaaagcatt gcgcgccaga ggtggcgcgt gaatgataaa aattatcgtc        60
+     tgagcgcctc gtaatggcgc tatcgtggtg ctgttggttc gttggtggtc gtgtgtgttt       120
+     gtgcgcgtgt ggcgcgtctg agacgtgatg gtggcggggt atgaaaaagc cgccatgctg       180
+     gcggcttgag agggattatt ccgggttgtc gagggtgtac tctttgaacc tgatgacctc       240
+     catgccgagc cagtcgttta cctccctgaa cctgtcctgc agcggcgaca ggtcgttacg       300
+     cacaaatacc tttgccactt tctcaacgtc accgagcgag ccgatattct cgggcttgcc       360
+     gcccatgagc tggaacggta cgcggtgcgc gtccatcagg tcggcggcgc tggctttctt       420
+     gatgttgaaa aagtcatcct ttgtggcgac ctcgctcagt ggcacgattt taatgccgtc       480
+     cggttttcca ttgggagcgt agaaaaacag gtttttaaaa ttgccgagcc ctttcgagtt       540
+     gcgcatcgcc tcgcgcagcg attcgacgtc ggtcgcgctc tgcgccgggt cggtcacata       600
+     catgatgtaa cccgcatgcg cgccgttctg gtaatacttg cggcggaaca gcgttgcgga       660
+     ttcattcagc caggcggaat taagcgcgct gagatattcg ggcaggccgt aaatctcctg       720
+     attaatgtcg ggctccagca ggtgaaacac ggtatcaggc gcgaattcat gcggcagagt       780
+     gaagttttcc acaaaccaga aaaccgaatc gtcgaccccg cggcgggtgt atttggccgg       840
+     tgaggccagt agcttgatta gctggccggt aacgctgtgg cgctgctcaa gaaaggcgtt       900
+     gccgaatacc agatagtcga gcgcaaagcg gctgaaatcc tgacgggaca gcagcgggtg       960
+     cgggatgtag gtgctcgcga gcacgttgcg cttaacgtaa atcggtgagc tgtgatgtac      1020
+     agcagagcgc aggctctttg ccagcccgga gaagctgacc ggcggctcgt accatttgcc      1080
+     gttactgatg cactcgacat aatccagaat gtcgcgctta tcgagtaccg gcactggctc      1140
+     gccaaaggtg aacgcctcca ttttttgcgg ggcgctggcg gtcatggcta cctgtttgcg      1200
+     tggcttgcgc ttgctcatgc tgccacctca cccgctgcaa cagcgaaaga ccagtcgcag      1260
+     ccaaacagca ggcgataatc atcgtcgctg tattcgtgtt taatttcatc gggcgcaaag      1320
+     agattgcacc cgcgctggca tgctgcatcc agagtgaccg actgacgcca gacaccatct      1380
+     gtacaaaata cgctgtcgcc ggtattgatg agcggtgacg gtcggtgcct gcgggttgtg      1440
+     ccgttccata ccctgaaagc gtcataatta tcagagggcg aggtaaacat cgtcaggctg      1500
+     tggcgtttat ggcaggcgat acccgccgcg actttcgcag ctcttagcgg gttattgaac      1560
+     catccgaact catcaagata gacattaccc gccagtgcgg cgcaatggga ttcctcgccg      1620
+     acaaagctga taaccgcacc gtcgtcgagc tgcaggctgt ggccgttact cgtaagactg      1680
+     acgccgacgc gcgccgaaag gttactcatg tacatcagcg ccacgcgcgc atgctcaata      1740
+     gtgtgagcaa accagacatg attatcgcct gttgtcagcg catcgagcag cgcctcacgg      1800
+     ctaaagagct gcgttgcgcc aatctggcgc gatttggtga tgctgcggtc gatattgagt      1860
+     ttcccgacac gcaaccatgt tgcctgatag tcaaagctgt cattgtgcag aatatcggcc      1920
+     attgcctgaa tctggctttg tgagaaaacg ttatttttca ttaattaaac tccagaatgg      1980
+     atttaggctg tatgccgcta ccggcggaaa gcggttcgtt taacagggcg tgcatggtcg      2040
+     cccatgcaat atcggcgtga ctggcttcct cggtgcggct ggcctcgtag gtggcgctgc      2100
+     gcccgctgct ggtcatggtt ttgcggatgg acataaacga ctgcgtgacg tcggttgctc      2160
+     cggcgtcgta ctccagacag ccgcggcgaa tggtgtcttt tgccttgagt accattgcgg      2220
+     ttttcatttc aggcgtgtaa cggatgccgc gtgcggccgg gtagaatgag cgcaccaact      2280
+     ggaacacgcc gaggccgagg ccggttgcgt caatgccgat gtattcgacg ctgtatttct      2340
+     cggtcagttt gcggatgcca tctgcctgcg cggcaaagtc catgcccttc cactggtggc      2400
+     gctccagcat gcggaacttg ccaccagaaa ccaccggcgg cgcgagcacg acgcacccgg      2460
+     cgctgtcgcc agtgtgtgac gggtcgtagc caatccagac ggggcgagag ccgaacggat      2520
+     ggtcggcgaa cggggcgaag tcctcccatt cttccatcac gtcgaccatg cagcgctgca      2580
+     gctcctcgaa cgggaatacc gacgctttat cgtcgacaaa ctcgcacata aacaggtttt      2640
+     taaagtcctc atcactgttt tcgcgtttga gttggtcgag gtcgaacagg gtgcagccac      2700
+     cggcaagggc gtcctcaatg gtgacaatct gccgccactg gccatcgtcg cagagctggc      2760
+     caccggcgag cgcgcggtga ctgatgtcaa tttcgatgcg gtcggcaata cggctgcgcc      2820
+     ccttgttgaa cagctcgcca gaccagaagg gataagcgcc gtgcgccagc gttgagggtg      2880
+     tcgaaaagta ggttgagcgc agatgcttct gcgaggccat gcccgaggcg actttgcgca      2940
+     gcttctgaaa attcgggatc cagaatattt catcgacata caggtcgccg ttatggctct      3000
+     gagccgtgtt ggagttggta ccgagaaaaa tcagctttgc gccgttgttg ccaatgacaa      3060
+     tcgggtcgcc ggtcaggtcg acgtcaacca gtcgcgcaaa ctgtatgatg tattcgcgga      3120
+     acacgtaagc ctgcgtttta ctggccgaca gaaaaatctg gttatggccg gtcttgagtg      3180
+     ctcgcagcag tgcctcacgg gaaaaataga acgtcgcgcc aatctggcgg gatttgagaa      3240
+     tgtcgcgaat acggtgtgcc agtcctgcgc ggtaccactg caactggtac tcgaaagact      3300
+     ggtcgaaaaa taattcctcc agcttttcga tagcctcgtc gctgaaaaaa ttctttttcg      3360
+     gcttcttgcg ctcacccttg ttgcggttgg cgacgttggg gttaaggtcg gcctcgttgc      3420
+     cggtctggct gtagcggtta acgcgtgcca gtcgttcaat ctgccgcccg agcaggtcaa      3480
+     tctctttgaa gtcaccgcct gacttttgcg gcttggcgat gagctgaatc aggcgcgcct      3540
+     caaggctgct ttcaacgcgg gaaatcggtg cgatgccatc ccagccgtcg cgctgtttcc      3600
+     agctctgcac ggtcgggcgc ttgacctgca gcatttcggc aatctgcggc acggaaaaac      3660
+     cctgccagta aagcagcgat gcctgtcgtc gcgggtcatg caacaaggtt gtatcggtgg      3720
+     aaatggtcat tgatgcctcg ccgtaatgga ttcagggcaa ggctacttaa tggccgtcag      3780
+     tgattcgcta aggtgctgtt gtgtgggcgg ttgtccagtc gtcattggtg gtctggcgtg      3840
+     tcctgagtct ggaaactggc ggtgaccagt aaccccaacc tcaggactcc tgacaatggc      3900
+     aaaaaaagtc tcaaaattct ttcgaatcgg cgtcgagggt gatacctgcg acgggcgcat      3960
+     tatcagcgcc agtgatattc aggaaatggc cgaaacctat gacccgcgtg tttacggttg      4020
+     ccgtatcaac cttgaacacc tgcgcggcct gttgcccgat ggcatattca agcgttacgg      4080
+     cgatgtggtc gagctgaaag ccgagaagat tgacgacgat tctgcgctta acggcaagtg      4140
+     ggcgttgttc gctaaaatca ccccgaccga tgaccttatc gcgatgaata aagccgcgca      4200
+     gaaggtctac acctcaatgg aaattcagcc gaattttgcc aataccggca aatgctacct      4260
+     cgtcggcctt gctgtcaccg atgacccggc gagcctcggc actgaatatc tcgaattctg      4320
+     ccgcactgcg aagcacaacc cgctgcagcg ctttaaagcc caccctgaaa acgtcttttc      4380
+     cgccgccacg ctggccgaac tggaatttga agacgttccc gacacggtgc tcaacagcct      4440
+     ggccgataag gtgaaagcca ttttcagccg taagcaggtc agcgacgatg cgcgcctgaa      4500
+     tgatgtacat gaagcggtga ccgccgtcag cgagcatgtg cagaccaacc tcactgcaca      4560
+     ggataagcgt ctttccgata tggaaaccgc gtttgccacc ttcaaacagg aactgaccgg      4620
+     caaggttgaa gaaaccagcc aggcattttc cgtcctgaaa accactctcg acaaaaccga      4680
+     aagtttcagc cagccgcgac gcacgaaagc cagcggcggt ggtggcgatg agctgctgac      4740
+     tgactgctga taaaccgcag accgaaaccg ggcggaaccc ccgcccgatg ctgtgactaa      4800
+     ccgattaaat caaacaggaa atactatgcg tcaggaaacc cgttttaagt tcaatgccta      4860
+     tctgacccag ctcgccaaac tgaacggcat cagcgttgat gacgtcagca aaaaattcac      4920
+     cgtcgagccg tccgtcacgc aaacgctgat gaacaccgtg caggcgtcat ccgcgtttct      4980
+     gcagatgatt aacattctgc cggtcgcaga aatgaagggt gagaaaatcg gtgtcggtgt      5040
+     gaccggcacc atcgccagca cgaccgacac ctcgggcgac aaagagcgcc agaccgcaga      5100
+     ttttaccgcg cttgagtcca acaagtacga gtgcaaccag attaactttg acttccacct      5160
+     gacctataaa cgcctcgacc tgtgggcgcg ttttcaggac tttcagcgtc gtattcgcga      5220
+     cgccattgtc cagcgtcagg cactggattt catcatggcc gggtttaacg gtaccacccg      5280
+     cgctgacacc tctgaccgtg ttaaaaaccc gatgctgcag gatgtggccg ttggctggct      5340
+     gcagaaatac cgcaatgaag ccccggcgcg tgtgatgagc aacatcaccg acgctgacgg      5400
+     taaagtcgtt tcggcagtga ttcgcgtcgg taaaaacggc gactatgaga acctcgacgc      5460
+     actggtgatg gatggtacca ataccctgat tgacgagatt tatcaggatg acccgaaact      5520
+     cgttgccatc gttggccgta agctgctggc cgacaaatat tttccgctgg tcaacaaaca      5580
+     gcaggaaaac accgagtcgc tcgcggcgga tatcatcatc agccagaagc gcatcggcaa      5640
+     cctgccagcc gtacgtgtgc cgtacttccc ggcgaacgcg gtgttcgtga ccacgctgga      5700
+     aaacctctct atctatttca tggatgagag ccaccgccgc agcattgatg aaaacccgaa      5760
+     aaaagaccgc gtggaaaact acgagtcgat gaacatcgac tatgtggtcg aggcgtatgc      5820
+     cgccgggtgc ctgctggaaa acatcaccct gggcgatttc accgcacctg cagcaccgga      5880
+     aggcggagag taaacccatg acgagccccg cacagcgtca catgatgcgg gtctcggcct      5940
+     ctcaagccgc gcagcgggaa caagccccgc tgcgccatgc aaccgcctat gagcagatgc      6000
+     tggttaagct ggccgatgac cgccgcacgt taaaaaacat ccgttcaaac gaacgtaaag      6060
+     ccgagaaaaa gcgcgagctg ctgccgttct atgcgccgtg ggtcgccggt gtgctgactg      6120
+     atggtcgtgg tgcgcaggat gacattgtta tgaccgtcat gctgtggcgt ctcgatgccg      6180
+     gtgatatcgc tggcgcgctg gaaattgccc cctacgcgct gaagtacggc ctcacctctg      6240
+     accatcgccg cacgacacct tacatgctgg tcgaggaagt ggcacttgcc gcgcagcgcc      6300
+     tgcgcgatgc cggtgagtct gtcgaccttt cctggctgca ggccactatc gacctgaccg      6360
+     acggcgctga cgttcccgat atggtgcgcg cccgtctgca taaggtgaca ggcctgaccc      6420
+     tgcgtgatgc cggtatgaat gcagaggcgc tggcgcagtt tcagcgcgcg atgcagctcg      6480
+     accgcaatgc cggtgtgcgc aaggagattg agcgactgga acgggcattg aagccaaaga      6540
+     cagaggccgc gccccgtaaa acgactaaac cgcgcacgcg taaacctgcc accaaaccgg      6600
+     cagcaaagcg cgggcgtcca ccaaaggcgg caaaaaccgc cggttaactg aacgctcccc      6660
+     gagccgggcg gcacgccggt caaagcaggc aaagacctga cggcgaccgg cgtccaccgc      6720
+     ccaacctgat gaggttgtca tgacgacagt gatactgaac cagcccgacg aaccgcagga      6780
+     cgtaccgggc gtggtgattc ccgcaccgga gacgggcggt gcagtgatta aaaacacgtt      6840
+     ctttttccct gatgtggatc cgaagcgcgt gcgcgaactg atgcgccttg agcagacggt      6900
+     ttccgatgcg cgcctgcgca atgccatcaa gaccggcatg gccgagacca atgcggagct      6960
+     ttacgactac cggctgcgcc agactgccgc cgggtttaag caactggccg acgtgcctgc      7020
+     cgaggaaatc gacggcgaga atgtacgtgt tttccactat ctgagtgctg tgacggcaat      7080
+     ggcaaccgcc accctgtatg agcgctatcg cggcgttgag gccaccggca aaggtgacaa      7140
+     aaaagccgac agcgtggaaa ccaccattga tgacctgtgg cgggatatgc gctggtcagt      7200
+     tgcgcgtctg caggacaagc cgcgctgcat tgtggggcag ctctgatgaa agtcaggtcg      7260
+     atgcagggcg ataccctcga cacgatttgc gccaggtatt acgggcgcac tgagggcgtg      7320
+     gttgagacgg tgctgcaggc taatccgggt ctgtctgagc tgggtgtcat tctgccgaat      7380
+     ggtacagaga ttgacctgcc cgatgtggca tcgtcacccg taactaaaac tatcaacctt      7440
+     tgggagtaac catgacagaa ggtgaaaaag gcgtcctgtc actgtttgtg attggcgtga      7500
+     tgattgttgt tgggaaagtg ctggcaggcg gtgaacccat caccccgcgt ctgtttattg      7560
+     gccgcatgct gctcggtggt tttgtttcaa tggtcgccgg tgttgttctg gtgcagtttc      7620
+     ctgacatgtc actgcccgcc gtgtgcggga ttggatccat gctcggtatt gccggttatc      7680
+     aggtggttga aatcgccata cagcgccgct ttaagtcaca aaagggggaa agtgatgccg      7740
+     gtcattaaca ctcaccagaa tatcgctgcg tttctggaca tgctggcgta ttccgaagga      7800
+     acagcgaacc atccgctgac gaaaaatcgt ggctacgacg tcattgtcac tggccttgat      7860
+     ggcagaccag agattttcac cgattacagc gaccaccctt tcgcgcatgg ccgaccaccg      7920
+     aaagtgttta atcgccgtgg cgagaaatcc acagcctcgg gacgttacca gcagctttat      7980
+     ctgttctggc cgcactatca gaaacagctc gcattgcctg atttcagccc actgtcgcag      8040
+     gataagctcg cgatccagtt aatccgggag cgcggtgctc ttgacgatat ccgggcgggg      8100
+     cgtattgagc gtgctgtttc acgttgtcgc aatatctggg cgtcattacc gggggccggt      8160
+     tacggccagc gcgagcacgg tctcgaaaag ctggtcacca tctggcgcac ggctggcggg      8220
+     gtggtggcat gaaagtcctg ataacgctgc ttgtgatggc cgtgctcggg ttgctgtggc      8280
+     tgcaccatga gaacggcaat ttatcccgct catttgagac ggcaaaccgc gtcgcgagcg      8340
+     agcaaaagac gacgattggg atgctgaaaa atcagctcag tgttgccggt cagctcgccc      8400
+     gacgtaatga atccgcgcag gtgacactgc gcgaacagct cgcaaaggca agtgcagaag      8460
+     ccagccgccg tgagcagacg ataacgaggt tacttaatga aaatgaagcc tttcgccgct      8520
+     ggtataacgc tgctctgcct gatgctgtgc gtcggctgca cacccgaaca gcctgcgcca      8580
+     gtgccggtga ttgtggtcaa cggatgcccg agggtgagcc tttgccctat gccgggaagt      8640
+     gacccgaaaa ccaatggtga cctgagcgca gatatccgcc gtcttgaggg ggcgctgact      8700
+     gcctgcgcgc tgcaggtcaa aaccgtcaaa cactgtcagg atgaactcga tgcagaagca      8760
+     caaaagcctg cgcaaagcgc tgattaacgc cgtgccgcag ctccgaaata accccgatat      8820
+     gctgcgcctt tttgccgaca acggccacac cgattcccga ctggcgagct cgctgtcgtt      8880
+     tgaaaaggtg tatgtgctta acgtggtggt gaccgacttt actggcgacc tcgatttgat      8940
+     attcgtgccg gtgcaggcat ggctgcgtga acatcagccg gacattatga ccaccgacga      9000
+     cgggcgggaa aaaggattca cctggattat tgatatcaat aacgacgatt cgctcgatat      9060
+     cagtatcagc ctgaggctca ccgagcgcac gctcgtcaaa gaggtcgggg gcgcgctgca      9120
+     tgtcagttat gcaccagaac cgccactgcc tgagctggtg aagcgcccgg ttgctatgta      9180
+     tgcaaacggt gaattagtga gccagtggga tgagtgaatt aaccgcgctg caggagcgcc      9240
+     tcgccggtct gattgccagc ctgtcaccgg cggcacgtcg caaaatggcg gctgagattg      9300
+     cgaaaaagct gcgtaccagt cagcagcagc gcatcaagcg ccagcaggca cccgacggca      9360
+     ccccgtatgc cgcacgaaag cgccagccgg tacggagcaa gaaaggccgc attaagcgcg      9420
+     aaatgttcgc caaactgcgc accagtcgct ttatgaaagc caaaggcagc gatagtgcgg      9480
+     cggtggtgga gtttaccggc aaggtgcagc gcatggcgcg ggtgcatcag tacggcctca      9540
+     aagaccgccc aaaccgcaac agccgggatg tgcagtacga ggcgcgcccg ttgctcggtt      9600
+     tcacccgcga cgatgagcaa atgattgaag acgtcattat cagccacctc ggcaaataaa      9660
+     tattgtgtga accaccaccg gaggcgcgtg atttggcgcg gctaaagacc agaggcattc      9720
+     tttgcactat gaatacgtta tccacgatac aggagctcgc gcgtgcgatt cgtaacctca      9780
+     tccgctcagg tgtggtgacg gaggtcgata ccgtgcaggg gctgtgccgc gtacaaagcg      9840
+     gcgggatcca gacgacatgg ctgaactggc tgaccacccg cgccggtcgt tcgcgcacat      9900
+     ggtgggctcc ctcgctcggt gagcaggtgc tgctgctggc aatcggtggc gagcttgata      9960
+     ccgctttcgt gctgccgggg attttctccg acgataaccc cgctccgtct gcctcggcgg     10020
+     atgcgtggca tgtggttttt cctgatggcg cggtcattga gtacgagccg gagaccagtg     10080
+     cactgacggt cagaggcatc aaaactgctg acgtgaccgc gtcggaatcc atcacggcca     10140
+     ctgtgcctgt ggtgctggtg aaagcagaaa cccgcatcac cctcgacacc ccggaggtgg     10200
+     tatgcaccaa caaactgacg acggcaacgc ttgaggtgca gaaaggcggg gagatgagag     10260
+     gcgacattgt ccacaacggc ggcacattta aatcaaacgg tgtgcagctc gacgaccacg     10320
+     gtcacggtgg tgtgcaaaga ggcggtgcct ggacggagga caccaaatga cggcgcgcta     10380
+     tatggggatg aaccgcaaca ccggtctcgg tatcagtgac actgaacaca tcagccagag     10440
+     catgcgcgac attctgctga cgccggtcgg ctcgcgggtg atgcgtcgtg aatatggctc     10500
+     gctcctgtct gcgctgattg atatgccgca aaacccggcg ctcaggctgc aaatcatggt     10560
+     ggcgtgctat tcggccatcc agaagtggga gccgcgtatc aggcttacat ccatcagctt     10620
+     tgagactggt gatgctggcg agatgtatgt cgatattacc gggatgcgta ccgatacggg     10680
+     tgcgtcagtt tcaaccactg tttcactgag ttaaatcact atggcaactg ttgacctgag     10740
+     cctgttaccc gttcccgatg tggttgagga actggatttt gaaaccatcc ttgcggaacg     10800
+     cattgcgacg ctaatttcgc tataccccga agaccagcag gaagctgtag cccggacgct     10860
+     cgcacttgag tctgaaccaa ttgttaaatt gctgcaggaa aacgcctacc gtgaggttat     10920
+     ctggcgtcag cgtgttaatg aagctgctcg cgcaggcatg ctggcttatg ccagagatag     10980
+     cgacctcgat aatctcgggg cgaatttcaa tgttgagcgc ctggtcgtca ggcctgctga     11040
+     tgacaccacc atccccccga cccccgctga aatggagctt gatgccgatt ttcgtctgcg     11100
+     tatacagcag gcatttgaag ggatgagcgt tgcgggatcc accggagctt atgaatttca     11160
+     tggccgcagt gctgacgggc gtgtcgcaga tatttctgtt atcagccctt ccccagcatg     11220
+     tgtcacgata tctgtgcttt cgcgtgagaa taacggtgcg gcgtctgatg agcttcagag     11280
+     catcgtgcgc aatgcgctga atgctgagga cgtgaggccg gttgctgacc gggttacagt     11340
+     gcagtcagct cagattattg actaccagat acgcgcaaca cttttcgttt atccggggcc     11400
+     ggaaaatgag ccgattcgtg cggcggctga ggcgaagctc aaagcttata tcagtgcaca     11460
+     gcacaggttg gggcgggata ttcgcctgtc agcaatttat gccgcgttgc atgttgaggg     11520
+     ggtgcaacgt gtcgaactgg ctgcacctgt ggccgacatt gtgcttgata aaacgcaggc     11580
+     atctttttgc acagactatc agatagtgat tggtggctcc gatgagtgat gtccgcctgt     11640
+     tacctgtagg gtcatcacct cttgaggtgg ctgctgccag agcctgcgca gatattgaaa     11700
+     atacacctgt tccgttacgc cgcctgtgga gtcctgacac ctgtcctgca aatcttttgc     11760
+     cgtggctggc gtgggcgttt tccgttgacc gctgggatga gaactggccg gaaaaaacaa     11820
+     agcgcgatgt tattcgcagc gcgtatttca ctcactgcca caaaggcacg ataggcgctg     11880
+     tcaggcgagt tattgagccg ctcggataca taatcaacgt tacggaatgg tgggagacag     11940
+     gtgacccggc gggaacgttt cgtcttgata tcggtgtgct ggaaagcggt attaccgaag     12000
+     aaatgtattt agaaatggag cggttgattg ctgatgcgaa acctgcgagc cgtcatttga     12060
+     ttggcctgaa tattatccag gatattcccg gttatatgta tacaggtggt gtgagctgtg     12120
+     acggcgacat tattacagtt taccccggat aagtgaggaa taatgagcac gaaatttaaa     12180
+     actattatca ccactgccgg agccgaaaaa ctggcagcgg ctactgtgcc gggtggtaaa     12240
+     aaagtgaata tcaccgtgat ggccgttggt gacggaggcg gaaaactgcc agtgccggac     12300
+     gccggtcagg tgcagctcgt gaatgaggtc tggcgccatg ccctgaataa aatcagccag     12360
+     gacaaccgga acagcaatta cattgtagcc gagctggtta ttccgcccga ggtgggagga     12420
+     ttctggatgc gcgagttggg tctttatgat gacgagggca ctctcattgc tgttgccaat     12480
+     atggcagaaa gctacaagcc agaacttgcc gagggctcag gccgtgcgca gacatgtcgc     12540
+     atggtcatta ttgtcagcag tattgcctca gttgaattat ccattgattc gacaatggta     12600
+     atggcgacgc aggaatatgt tgatgacagg attgcggaac atgagaagtc acgtcgacat     12660
+     cctgacgcca cactgaaaga aaaaggcttt actcaactca gtagcgcaac agacagcgcg     12720
+     tctgaggtgc ttgcggcgac gccgaaagcg gttaaagcgg cgtatgacct tgctaatgct     12780
+     aaatataccg ctcaggacgc gagcacagcg caaaaaggca ttgtgaggct gagtagtgcg     12840
+     gcagacagta ccagtgaagc tgaggccgca acaccgaaag ctgtcaaaat tgcgatggat     12900
+     aatgcgaatg cgaggctggc aaaagaccgg aacggcgctg atattccgaa tccgccgttg     12960
+     tttgtccaga atatcggttt aaaacccacg gtcgataaag ctgctaatgc cgttgataaa     13020
+     aatggcgaca cgatgaacgg aaacctgaca ctcaagggtg attaccggct gagttttatt     13080
+     atccagaatg aagacggttc tattcgtgct tatatcttca aggacaaagg tggcgacggt     13140
+     attcgcatca gtaatggcga tgacggcggc ggtgattttg tttttggtaa aaatggacag     13200
+     ttttactgcc cggatattat gcatgttggt aatacgattg tatggggtga cggaaatatc     13260
+     gagggggcgc gatggggcgg tttgttgagc gactggttaa ctgctcaact ggttgcccgt     13320
+     gacaataata ttaacttgcg agcaccctat gaatgggtta accaaaactt tgtcaaccgt     13380
+     gcacagcgcg gcgcacaggc cagcatgact atggacggcg gacttgtaga ggctccatgg     13440
+     ggatgttttc ttacgggggg gaacggtaac gagggtaatc aggttggagt ggctttatac     13500
+     cgtccattgc agattcttcg caataatact tgggtaacga tagagaactg aaaatgaaac     13560
+     tgattaattt gcaacgctac attctgatga attatttttt aggtgatggc attcagtatt     13620
+     ttatagatgc cacaggtaag gactggtata aatcactgcc caaattcaca aagaaataca     13680
+     gccttgctat cgaaaatgat acgggcgtta ttcgtagtat cagcgaagat gcatcccggc     13740
+     tttatcccgg tggtttgacc gttgttgatg ttgacagtat tccggcaggt tgtgacattt     13800
+     tcggcggatg ggtatttgac ggagagaaag tcattcctcg tgagtacaca ttggccgaac     13860
+     agcaacgcca gtcagatgaa aagaaaaaaa cacttcttgc tgaggcggag gcaacaattt     13920
+     ccacgcttga gcgtgcggta aggttaggca tggctaccgg ggaagaaata aggcgactcg     13980
+     aagcatggga gcgttacagc gtattggtga gcagggttaa gcagtcagat gactggccgc     14040
+     aaaaacctga ataacccggc ggcatttgcc cgcttctttc tcatccatta gttgtgccag     14100
+     acatcatcca gccctgacaa atagcccctc acaagaccag ccaggacaat aacactcgcc     14160
+     cactaactac ggagttaacc ggatgagtga ttttcaccac ggcacgaagg tcatcgaaat     14220
+     aaatgacggt acgcgtgtta tttccacggt cgcaaccgca atcgtcggca tggtctggac     14280
+     agccagcgat gcggatgccg agacatttcc cctcaacgag ccggtactga ttaccaatgt     14340
+     gcagagcgcc attgcgaaag ccggtaaaaa aggcactctg tcagcttccc tgcaggccat     14400
+     cgccgaccag tcaaagcctg tcaccgttgt cgtgcgcgtt gccgaaggta ccggagacga     14460
+     tgcagaagcg cagaccacgt ccaacattat cggcggcacg gatgagaacg gtaaatacac     14520
+     cggtatcaag gcgctgctaa ctgccgaagc ggtcaccggc gttaagccgc gcattctcgg     14580
+     tgtgccgggt ctcgatacgc aggaagtcgc aaccgcactt gcatcggtct gtatcagcct     14640
+     gcgtgcgttt ggttacgtca gcgcatgggg ctgtaagacc atttccgagg cgatggcata     14700
+     tcgcgagaat ttcagccagc gcgagctgat ggtcatctgg cctgatttcc tcgcatggga     14760
+     taccaccgcg aacgccaccg ccacggcata cgccaccgcc cgcgcactcg gtctgcgtgc     14820
+     ctacatcgac cagactatcg gctggcacaa aacgctgtct aacgttggcg tgcagggcgt     14880
+     taccggcatc agcgcctcag tcttttggga tttgcaggca tccggcacag atgctgacct     14940
+     gctcaacgag gccggagtca ccacgctggt gcgcaaggat ggtttccgtt tttgggggaa     15000
+     ccgcacatgc tctgatgacc cgcttttcct gtttgagaac tacacccgaa ccgcgcaggt     15060
+     gctggccgac acaatggctg aggcgcacat gtgggcggtc gataagccca tcaccgcatc     15120
+     gctcatccgt gacattgtcg acggcattaa cgccaaattc cgcgagctga aatcaaatgg     15180
+     ctacatcgtg gacggtgaat gctggttcga cgaggaatcg aacgataagg aaaccctcaa     15240
+     ggccgggaaa ctgtatatcg actacgacta tacaccggtt cccccactgg aaagcctgac     15300
+     cctgcgccag cgtatcaccg ataaatatct ggtgaatctg gctgaatcgg tcaacagcta     15360
+     aggagcctga aacaacatgg cactaccccg caaacttaaa tatctgaaca tgttcaatga     15420
+     cggccttagc tacatgggcg ttgttgaatc cgtgacgctg ccgaagctga cccgcaagct     15480
+     cgaaaactat cgcggcggcg gtatgaatgg cgctgcagcg attgacctcg gcctcgacga     15540
+     tgatgcgctt actgtcgaat ggtctgtcgg tggcctgcct gatgtggcgc tgtgggcgca     15600
+     gtatgccgcg ccgggggctg atgccgtgcc gctgcgtttt gctggctctt accagcgtga     15660
+     cgacactggc gaaatcgttg cggtcgaggt ggtcatgcgt ggccgtcata aagaaatcga     15720
+     cggcggcgaa aataagcagg gtgaaaatac ctcgaccaaa ctgtcgaccg tttgcaccta     15780
+     ttaccgcctc acgattgatg gtagcgacat tatcgaaatc gacaccgtca acatggtcga     15840
+     gaaggtgaac ggcgtcgacc gtctggaaca gcaccgccgc gcaatcgggc tgctgtaatt     15900
+     ccctgaccgg tcagcactgc tggccggtta ttacccccat tcagagcaga gaaaaaatca     15960
+     tggcaaaagc accacgcaaa acccctgaat ttattgatac ggctggcaat gaaattgaca     16020
+     ccgtaaaccc gaatgtcgtg accctcgaca agccgattaa acgcgccggt cagacaattg     16080
+     aaaaggtcac gctgattgaa ccgaacgcag gcaccctgcg cggcgtcagt ctggcggcgg     16140
+     tggcgcagtc cgaggtcgat gcgctgatta aggtgctgcc ccgcatgacc tacccggcac     16200
+     tcaccacgca ggagctcacc gcaatgaacc tgcccgatat gctgtcgctg gccgctaagg     16260
+     tgattggttt tttgtcaccg gcttcggcgg aatagacttc ccgcccggcc tgtcgaccga     16320
+     tgacctgatg gcggatatcg cagtgatatt ccactggccg ccatcagagc tctattccct     16380
+     gagcctgacc gagctcatca catggcgcga aaaggcgctg cagcgtagcg gaaaccacaa     16440
+     tgagtaataa cctgaggctt gaggtattgc tgaaagcggt cgaccaggcg acccgaccgc     16500
+     ttaaatccat ccagaccgcg agtaaaagcc tgtcgggcga tattcgcgac acacaaaaag     16560
+     ggctgcgtga cctgaatggt caggcgtcga aaatcgacgg ctttcgtaag gcaagcgcgc     16620
+     aactggccgt aaccagtcag gcgcttgata aggcgaaacg cgaggccggt gagctggccg     16680
+     tgcagtttaa aaacaccacc aatccgaccc gcgcgcaggc gcaggcactt gaagcggcaa     16740
+     ggcgtgccgc ctctgagttg cagacgaaat acaacagcct gagaacgtcg gtacagcgcc     16800
+     agcgctccga gctgatgcag gccggtatta atacccgcac tctctctgca gatgagcgtc     16860
+     ggctcaaaac ctccatcagc gaaacaactg cgcacgttaa tcgacaacgt gaggcactgg     16920
+     cgcgcgtcag tgcgcagcag gcgaaattaa gccgggtgaa agagcgatat aaatcaggca     16980
+     aggagcttgc cggtaacatg gccgcagcag gcgctgcggg gtcggtatcg cgacacggaa     17040
+     cgatggccgg ggttaaatta ctgatgcccg gttatgactt tacgcagaaa aattccgagc     17100
+     tgcaggctgt gctcggggtc gataagcagt cgccagaaat gcaggcgtta cgcaaacagg     17160
+     cgcgccacgt cggcgacaat actgcagcct ctgcagatga tgcagcaagc gcgcaaatca     17220
+     tcattgcgaa aagcggcggt gatgcagctg ccattcaggc gcgacgccga gtcacgctga     17280
+     atatggcgct gtcaaaccgg cgcacgatgg aggaaaacgc agcgctgctg accgggatga     17340
+     aatcagcgtt tcagctttca aacgacaaga ttgcgcacat tggcgacgtt ctctcgatga     17400
+     cgatgaacaa aaccgccgcc gattttgacg gactgagcga cgcgctgacc tatgccgcac     17460
+     cggtggcaaa aaatgccggg gtgagcatcg agcaaaccgc cgcaatggtc ggtgcactgc     17520
+     acgatgccaa aatcaccggg tcaatggcgg gcacgggtag ccgcgccatt ctcagccgcc     17580
+     tgcagctccc accggaaaaa gcgtttgagg ccattaagga gctcggcgtc aaaacgtcag     17640
+     acagcaaggg gaacacgcgc ccgatattct ccatcctgaa agaaatgcag cgcagctttg     17700
+     agaaaaacaa cctcgggaca agccagcgcg gcgagtatat gaaaaccatt ttcggcgagg     17760
+     aggccagctc ggcggcggcg gtactgatgg aagccgcctc aagcggcaaa cttgaccggc     17820
+     tcaccgctgc gtttaaagcc tcggacggta aaaccgagga actggttaag gttatgcagg     17880
+     ataacctcgg cggcgacttt aaagagttcc agtctgctta tgaggcagtc ggtactgacc     17940
+     tttttgacca gcaagagggc tcgctgcgta aactcaccca aaccgccacg caatacgtgt     18000
+     taaagctcga cggctggatc cagaagaaca aagggctggc gacaaccatt ggcatcatcg     18060
+     ccggtggcgc tctagctctg attggtatca tcggcggtat tggcctcgtt gcgtggccgg     18120
+     ttgttatggg gattaacgcc attatcgctg ctgctggcgt gctgggtacg gtctttactg     18180
+     ttaccggtag tgccattgtg accgcacttg gcgcgattac ctggccgatt gtcgcagtgg     18240
+     gggcggctat tgtggctggt gcgttactca tccgtaaata ttgggagccc atcagcgcat     18300
+     ttttctcggg ggtgattgag ggcatcatga gtgcctttgc accggtcgca gaaatgttcg     18360
+     ctccactggc acccattttt gacggtctcg gtgagaaact gcgcggcgtc tggcagtggt     18420
+     ttaaagacct gatagcaccg gtcaaagcca cgcaggaaac gctcgatagc tgcaaaaatg     18480
+     tcggcgtcat atttggtcag gcgctggcct ctgctttgat gcgtccgctc aatgtattta     18540
+     acaagttgcg cagcggtgtc gactggcttc tcgaaaagct cggtatcatc aacaaagagt     18600
+     cagacaacct cgaccagact gccgccaaaa ccaacgccgc cacgcagggt aattcctaca     18660
+     tcccggcaac cagcacatat ggcggctatc aagcttacca gccagttacc gcaccggcgg     18720
+     gacgctctta cattgaccag agtaaaagcg aatacaaaat cactctgccg ggaggtgctg     18780
+     cgccggggca tcagcttgac agacagctac gcgacacgct cgaacagatt gagcgcgaaa     18840
+     agcgtgcgcg tcagcgtgcc agtatgagcc atgactgaga ggaataaacg atgatgcttg     18900
+     cgcttggaat gtttgtgttt gaacgtcgca ccctgcctta tcagtcgatg cagcactcga     18960
+     aggattaccg ctgggcgtct aatgaccggg tgggtaagcc gcctgcttat cagtttctcg     19020
+     gcgaggggga aacgtcgata cagcttgccg gtacactgta cccagccatc accggcggct     19080
+     ggatctcact aaaggctgta gaggtaatgg ctaacgaggg cagagcgtgg ccgttgattg     19140
+     agggaactgg aaacatttta gggatgtata tcgtcgataa ggtgtcgacc acgcacgccg     19200
+     agtttttcag cgacggcgct gccagaaaga ttgatttcac cctttcgctt aaacgggtcg     19260
+     acgaatcact gacggcaatg tttggcgacc tgaataagca ggccagcgag cttctaggct     19320
+     ctgccggaaa tctgactgat aagctgcaga gtgcgctcgg aggactgacc gcatgattac     19380
+     gggcatgact attgacgccg gaactagcct tgcaccggca tttatgttaa cgctgaacag     19440
+     ccaggacatt accagcaatt ttagtgaccg gctgatttct ctcaccatga cagacaaccg     19500
+     gggctttgag gctgaccagc tcgacattga gctcgacgac accgacggca aagtcgaatt     19560
+     accactgcgc ggggcggtgc tgacgttgtg gcttggctgg cagggttcgg cgcttctgaa     19620
+     taagggcgat ttcacggtcg atgagattga gcaccggggc gcgcctgata tcctgaccat     19680
+     ccgcgcgcgt agtgcagact ttcgcggaac gctcaattca cggcgtgaag aatcatggca     19740
+     cgatactacc atcggtgagt tggtcagcac cattgcaaag cgcaataaac tgacggccag     19800
+     tgtcgcggat tcactgaaaa aaattccggt accgcatatc gaccagtcgc aggagtccga     19860
+     cgccgtattt ctgacccgac tggctgaccg caatggggcg acggtgtcag tgaaagcggg     19920
+     gaaactcctg tttctgaaag ccggtagtgc gatgacggcc agcggcaagc ccgtcccgca     19980
+     aatgacacta actcgcaacg atggtgaccg tcatcagttt gctattgccg accgtggggc     20040
+     ttacaccggc gtaaccgcaa aatggttgca caccaaagac ccgaagccgc aaaagcagaa     20100
+     agtaacactg aaacgcaagc caaaagagaa gcacctgcgc gcactggagc acccgaaagc     20160
+     aaagccagtc agcaaaaaga caaaggccaa aaaagagccg gaagcgcgcg agggtgagta     20220
+     tatggccggt gaggccgata acgtgctggc gctgacgacg gtctacgctt ctaaggcgca     20280
+     ggcgatgcgt gccgctcagg ctaagtggga taagctgcag cgaggcgttg cggagttttc     20340
+     aattacgctg gcgcttggta gggctgattt attccctgag acaccggtgc gcgtatcagg     20400
+     ctttaagcgc gtcatagatg agcaggcatg gttaatcagt aaggtaactc acaatctgaa     20460
+     taatagcggc ttcacgacgg gcttagagct tgaggttaaa ctctctgatg tggagtacaa     20520
+     cgcggaatcg gatgatgaat aaaatgtatt cacaaaaagt gaatttatga ttatcattta     20580
+     ttcacgaatt gagaataaag ggtgggttat gtttcattgt ccgaagtgcc atcatgccgc     20640
+     acatgcgcga acaagccgct atctaaccga aaacacgaaa gaacgctacc accagtgcca     20700
+     gaacatcaac tgtagttgta cgtttatgac aatggaaacg atagagcgct ttattgttac     20760
+     tccgggagcc attgacccgg caccgcctca cccgactgtc ggtggtcagc ggccattgtg     20820
+     gctctgataa atttccgcta aatgcccgcc gcgtgcgggt ttttttatgc actcaggaaa     20880
+     gtggcggtaa aaaatccacc gccattctat cgccactcga aaacgaggca acaaaaaggc     20940
+     cactcgagag agtggcctaa ctgtatgtat ttactactta aatttggtgg cccctgctgg     21000
+     acttgaacca gcgaccaagc gattatgagt tcctacaaga acaaccgaaa atcaatagta     21060
+     tgcgttattt atcattgaca tagattgcca ttgtttgcca ataattacct attattcgcc     21120
+     atttctaccg ccactttatc gccattctat tatctgttac tcagaaccat cgccgacata     21180
+     ggttccatca ggtgcgagat gatatcttcc accaacataa gtcccatctg gggcaagtgt     21240
+     tgggcggcca gcaacataac ttccatttgg cgctaagcgt ggaacgccac cgacataagt     21300
+     tccatcgggt gcaaggcgtg gtgctcctcc tccaacataa gtcccattag gggcaagcat     21360
+     aggttgtccg taaacatagg taccatcagg tgctaatcga actgacatac aacctccata     21420
+     acttatttgc tgttagtaat gtgaactaaa ggatttagtt taactgcatc ctctaaatgg     21480
+     tcgggtgcaa agtgcgcata tcgcatggtc atttttatat ctgtatggcc gagtacgcgc     21540
+     tgcaacacca aaatattacc gccattcatc ataaagtgac tagcgaaggt gtgacgtaaa     21600
+     acgtgggtaa gttgtcctgc cggtagttcg atacctgttc tttccaaagc tgaccggaac     21660
+     gcgccataac aatcactgaa caaccggccc tttttatcat caggcagaga ctcatagagc     21720
+     tctttgctga ttgggacggt gcgatttttt ctacctttcg tgttggtgta tgtgattttg     21780
+     tatttcgcga gttggctttt tctcagactc tcggcctcag accaccgtgc gccagttgcg     21840
+     agacagattc ttaccacggt ttctaaatca gggtggtcat gtcggttaca ctctccgagc     21900
+     agttgcgaaa tttggtcgtg agttagccaa gtcatttcca tttcttctgt gcggaatggg     21960
+     cgcatatttt ttagtgggtt ttcacccttc cattctccga ggcggtttag ctcattgaac     22020
+     accgcccgga agtaggccag ctcaagatta agcgtgcgag gcgatacctc tttcactctg     22080
+     tttgaacggg catactcacc ttttaaccgt ttttctcggt agcgggaaaa catctgcgca     22140
+     tcgaaatcgc gtgcgagtgg ttcgcccata cactcaaaag catggtgcat ggctaactgg     22200
+     cgtttcaaac catctttcag tgtaatgcca tgagcgctat accatgaatc aaccagctct     22260
+     tttaacgtgc gcctgtcttc cttttcttcc tgccacgggt tttgaacggt gtactgctca     22320
+     aacgccagag cctcgccttt agtagcgaat ttctttctga tacgtttgcc ttttgcaccg     22380
+     tttgggtaga gttcacaaat ccaaccgcca gccggatttt tacggacggt cattagttaa     22440
+     cctcgctgta tacacccacc acacgcccca acgttttaat atcatcaatg ccgcattcga     22500
+     aaggaacctt cccgcctgca acatgtagtt ttctacccgg tagttttgtt aactctcgaa     22560
+     tgcttattgc tccctcaatg tcgactagcc ataagccgtc agacaatgat gcttgcttgt     22620
+     ccacaaaata aattttcccc tcggaacgga tagccatccc atctgtgagc ggttttgtga     22680
+     aaaattgggc atcaacactc aattgtttat cggatttgag gatttcttca cttaatgtga     22740
+     atccctcaat cctttttgcg tcgctcgatt ctctgttatt tacaaatgct tctccttctc     22800
+     cggtaagtaa ccactggaga ttagcacctg tttcaagggc acagtgagcc gcaaagtcat     22860
+     aggagatagc gcctcgggtg tacctgtttg acaatgagct ggacgcgata tcgaagtggt     22920
+     tagctaattg aattttctgc gaaaatccgt acgcctcgca gatgcggtca agtacatcca     22980
+     cgttgctcca tcctaaagaa tctattctca tttcgataaa acctatttac tatctctcaa     23040
+     ttgggagata tattttggct aaacccacgc aattgatggc aagtgttggc aaacagagtc     23100
+     aaatcaattg caaactttgg ctaataggga atcatgcaat atggcttctg aaatcgcaat     23160
+     catcaaagtg cctgcaccta tcgttactct gcaacaattc gcagagcttg agggtgtttc     23220
+     tgaacgcacc gcctaccgct ggacaaccgg cgacaaccct tgtgtaccaa tcgaaccccg     23280
+     cacaatccgt aaaggctgca agaaagcagg tggcccgatt cgcatttatt acgcacgctg     23340
+     gaaagaagag cagttgcgta aggcgttggg acattcccgt tttcaactcg tcatcggtgc     23400
+     ttaattcact ttatgtgaat tgtaaggatg caacatgttt gattttcagg tttccaaaca     23460
+     tccccactat gacgaagcgt gccgggcttt tgcgcagcgt cacaacatgg cgaagctggc     23520
+     cgagcgtgcg ggtatgaatg ttcaaacgtt acgtaacaag ctcaacccag aacagcctca     23580
+     ccagttcacg ccgcctgaat tgtggctgct gactgacctg accgaagact caaccctcgt     23640
+     tgatggtttt ctggcgcaga ttcattgtct gccatgcgtg ccggttaatg agctggctaa     23700
+     agataaattg cagtcttacg tcatgcgcgc aatgagtgaa ctcggtgaac tggcgagcgg     23760
+     tgcggtatct gatgagcgtc tgaccactgc ccgtaagcac aacatgattg aaagcgttaa     23820
+     ctccggcatt cgcatgttgt cattgtcggc tctggcgctg catgcacgtc tgcagactaa     23880
+     tcccgctatg tcgagcgtgg tcgataccat gagcggtatt ggcgcatcgt ttggtctgat     23940
+     ttgaggtgcg tatgctgaaa agtgaaccgt catttgcgtc tctgctcgtt aagcaaagcc     24000
+     ccggtatgca ttacggccac ggctggatcg caggtaagga cggcaagcgc tggcacccgt     24060
+     gccgctcaca gtccgaatta ttaaaagggc tgaaaacaaa gtcgccgaaa tcgtcaggtt     24120
+     ttttaattat tcgtattgtc cactttgtaa ttaaaggagt gaaacatgtc acgcgatgaa     24180
+     ttaagaattg ttttgggtgc catgattcca aatatggagg aaggttttga aattaaaacc     24240
+     cgcgacggcg caatacttcg cgttgaccct gagtgggagt gctgcaaaga atttaaggat     24300
+     ggattaaaag ccgaaatcat caagcagtta aaaagcaaac ctgctgttgt atttggatat     24360
+     agttaattaa ttaaacgtaa ttacttggcg taaacccgcc gggcattctt ttgccaaaaa     24420
+     acaggaggat atatgagtcg aactatttat ttatcaacgc cgagtggtgc tggcgaccac     24480
+     ttgctggagt ctttgtttaa agaagccaaa aaagaagagc gcaaagaccg ccgtctcgcc     24540
+     gtttcaatcc gtctcgaaga tctggccgtt cacattacca attcagatat gacaggcaaa     24600
+     gaagcggccg agctactgcg ccgcgaagcc actcgctttg agaacgaatc acaggagctt     24660
+     cactaatggc cgacgcaatg gatttagcac aactgcgcga gcaggaagac cgcgaacgcc     24720
+     acataagcaa cgcgcgcagc cgtcgccatg aggtttctgc atttatctgt gaggaatgcg     24780
+     atgcacctat cccggaagcg cgccgccgag ccataccggg cgtgcagtgc tgcgttacct     24840
+     gtcaggaaat cttagagctg aaaagtaaac attataacgg aggtgcttta tgagcattac     24900
+     caatgcaact attagccagc gtgcaaaaaa atggcttgaa gatgaccgta tatttattga     24960
+     caccgaaact acgggtttgg gtgatgatgc ggaaatagta gaaatctgtt taatagatag     25020
+     cgctggtttt atcatgctaa atacattggt taaaccaact aaaccaattc cagcagaggc     25080
+     tacggccatt catggaataa ctgatgaaat ggttatgtat gcgccaacgt ggaaagatat     25140
+     tcacggcgca gtagcttctt tattttttga gtatggcttt gttatttata acgccgatta     25200
+     cgacacaaga cttatatatc aaactgcgaa attatatggg cttgagaatg acggcttttg     25260
+     ttatttttta aatgagcgtt cggcctgcgc catgatgcta tatgcagagt atcgcggcga     25320
+     gccagggcga tttaaaggtt ataaatggca caaattagtt gatgccgctg cacatgaagg     25380
+     ggttagcgtt gaaggaaagg cacaccgtgc attagcagat tgccggatga ctcttggcat     25440
+     tatcgacgct ttggcaaaag gcggtgcagc atgagtatcc gtatcgaaat aggtgataaa     25500
+     tgggtaatca ccagcgacca atatcaattc atcctgaatg aaaaaaaagt cgttaagacc     25560
+     ggcaataaag ctggcgagga atggctcgac accatcggtt attacccgaa gattaatcag     25620
+     ctcatttctg gtctggtaca tcaccacatt catacggcaa tgattatttc ccttagtgca     25680
+     atggcagagg aaatagagaa gttatctttt atctgtgaag aagcatttaa ggcggttaaa     25740
+     aaatgattga ttcccgctgc tttgctgaaa gcacaataaa tattgtttct gtttctggtg     25800
+     gaaaggacag ccttgctcaa tggattcttg cggtagagaa cgacgtaccg cgcaccactg     25860
+     tttttgcaga taccgggcat gagcattccc aaacaatgga gtatctggat tatcttgaat     25920
+     ccagactcgg cccggttatt cgagtgaaag ccgattttac tcggcggatt gaaggcaaac     25980
+     ggaaattcat tgctgaaaaa tggcctgtct ctctcgttga agaatgcgga atgtctcatg     26040
+     agcaggctgc agaacgaatc gcaaaggcac tggaaatcct taagccaacc ggtaatccgt     26100
+     ttctcgattt gtgcatgtgg aaaggacggt tcccgagcac gaaagcaagg ttttgttcac     26160
+     tggaactgaa acatgactca gtacgggaca agattgtact cccagcgctg gagaaatatg     26220
+     acgaagtaat tctatggcag ggtgttcgtg ctcaggagtc accagcccgc gctgcgttac     26280
+     ctatgtggga ggaggatgca gataataccc ccggtttgca tgtgtatcgc ccaattctta     26340
+     actggacaca tgaagacgta tttgccttag ctaaacgaca cggaattaaa ccgaacccac     26400
+     tctatcagca aggttgtagc agagttggct gcatgccatg tattcatgca agaaaatctg     26460
+     agctggcaga gatttttgct cgctggccgg aggagattgc gcgcgttgca gagtgggaac     26520
+     gtcttgttgc tgcctgttca cgtcggggaa actcaacatt tttcccttcg actcacgacc     26580
+     cgcggcgagc agaaaaacgt attgaagttg ttaccgtaga agaatatggg atagcttcat     26640
+     atcgtgactg ggcgatgact acgcgtggcg gttctcagta cgatttgctc gctgctacaa     26700
+     acgacaaaac tgtgtgcagt agcgtttatg ccggtgtatg tgaatgacgg gtgtcgttta     26760
+     cgcgtttccg tggaatgccc cacggtcggc aatagccagc tcatatctta cctatgacca     26820
+     acagcatcgc cgcgaccgta tgttcgcggc tttgctgcat gcgagaaagg tgctttttct     26880
+     ccagccagaa tgtgtgcgct ttgacgttta tcgcaccgct gcagttctgg agcaaaatca     26940
+     gggcagtcaa cgagccaatg cctttttaat cagcttctgc aaaaaggcat taccacgtct     27000
+     tgaactggtc gcaaaaaaat acgagtgctc gggcatcaac agcaatgtat cagccgctgt     27060
+     tttcgatggt cattttgata cccagcttat gcaatatctg gcgtcacgca tggtcaatat     27120
+     ggtcgccaga tttaaccgcc tcccggatat gtcgcgcgcc gatattgacc tgctggccgc     27180
+     ggatatcgct aattttattc gcgctgaact ggccgacatt gatgacaccg gatttagcga     27240
+     actcaaaacg ctgtacactt ggtacatgcg cgccggtttt atttccctgc aattcaacgt     27300
+     tacaccgccg aaatgggagc gtgtgactaa aaaatatttt tgtgaggatg aaatcgcacc     27360
+     ggcagtaatg cgcatgttta atgaggtttg gtggcgcggc cgcttgcgac gcattgcggc     27420
+     tgcatggcgc gaacatctgc aaattgcagt cggcaacgta agcaagaaac gacacgcata     27480
+     cgcgagtaaa aactgcgtca ccgactggcg cgagcagaag cgccgcacgc gcgaatttct     27540
+     caaggggctg gatctcgaag acgaagaagg caaccgcatc agtctgattg aaaaatacga     27600
+     cggctcggtc gctaatccag caatacgccg ctgtgagctg atggcccgca ttcgtgggtt     27660
+     tgaaaatatc tgtaatgagc tcggttatgt cggggagttc tatactctga ctgcaccgtc     27720
+     taaatatcac gccaccacca aagcgggcta ccgtaacagc aaatggaacg gtgcaagccc     27780
+     gtcagacacg cagagctatc tcacaggcct ttgggcacgc atacgcgcca agctgcaccg     27840
+     ggaagaaatc cgcattttcg gaatacgcgt cgctgaaccg catcacgatg gaacgccgca     27900
+     ctggcatatg cttatgttca tgttgccgga agatgtcgag cgtgtgcgac tcatcatccg     27960
+     agattatgcg tgggaggaag accactacga actgagaagc gataaagcca aaaaggcgcg     28020
+     cttccatgct gaggccattg acccggaaaa aggcagtgct actggctatg tcgctaaata     28080
+     catttccaaa aatatcgacg gttatgctct cgatggtgaa accgatgacg aaagtggtga     28140
+     gttgttaaaa gagactgcac ccgccgtttc agcatgggcg gcgcgctggc acatccgtca     28200
+     gtttcaattt atcggcggtg cgccggtgac ggtatacagg gagctacgca gaatggctga     28260
+     ccctgaaaca gccagggcgc tcagtgttga attcgccgca gtgcatgatg ctgctcacta     28320
+     tggacgctgg gctgattatg tgaatgctca aggcggacca ttcgttcgcc gtgacgattt     28380
+     acaggtacgt acattgtatg aacctcgaac tgaatttaat cagtatggcg aagaaactgt     28440
+     gtgcatcaaa ggtgtctacg atgcctcgat aggtgctggc tctcctattc taacccggtt     28500
+     aacgcagtgg aagattgttc caaagcgtgc cgttgatttg gccgttgacg ttaagggcgc     28560
+     ttctgcgccc tctcggagtt ctgtcaataa ctgtacggga agcgaaagcg atccaccgat     28620
+     actcgattta acaaaaccgc tgagtcggcg tgaaagacga gagttgacga accgactcag     28680
+     gaagaaaaag ccaacaacac ggcgaaaatt catccacgga acggataagc aaaacgtcgc     28740
+     tataacgaaa actatcgacg agatacactc tgacaaccgg catcacaatc agccggggcg     28800
+     aagccctgca cctgatggcc ggtggtaaaa gttgttttaa cggtcgatgg gtgcgcggaa     28860
+     cgtcaaaagg tgaaatcttt gctgcagctc cttcacatca ggcgagacgc ggaaaatcct     28920
+     taatcgtgtt gcagatttag ctgagctggc aacgaaaatg taaccgctaa tattcatcca     28980
+     tatcatgtac atacagtgta tttaactgtg atttttttct tcacaccttt tgccaatacg     29040
+     tgctactgta tgtttataca gtatctcgta gtggaggttg tgtggataga gagctaaatg     29100
+     agcacgttat gattgagcgg gtcgaaatga ttgcgcgtct gactgctgaa ggtacttgtc     29160
+     aggaaagaga ccgtgaaatc gcattgaatc taattgcgga aatagcaaga ggcaacctaa     29220
+     tgaaaaataa taatttttct gttgtttttt ccgcaccgcc tgttggtgaa acatttgcaa     29280
+     aggagggcaa agtgaaagta aatatcacgt tggataaaga ccaaaaaatc ggccagccgg     29340
+     taattgatgc ttttcagtgc gaattgacca agcgaataca gtccgttttc ccgtcaacgc     29400
+     gcgttactgt taaaaaggga tccatgaccg gtgtcgagct gatggggttc gataaagatt     29460
+     cagaccgcga agcgctggat agcatccttc aggaagtgtg ggaagatgag agctggcgtt     29520
+     aatccctgaa aaatgtgcaa ccatcgaccc catgtttgat agcatggggt tgttttgtat     29580
+     gggattacac acaaaggaaa atcatggata ccgtaatagc atttttatct ctggctctct     29640
+     ttattgcttt tatcgtcggg ttaatcaagc cgtcgctggt tcgaatgccg agccgtaagc     29700
+     gctccagtgc tgtttatctc ggtggctgtc tggcgctggg cgttattggc tcaatcttat     29760
+     ggccgactga aaaaactcag ccggtggcaa aaactgacgt accggcggtt aaagcggaac     29820
+     cggctacgcc aacgtttgag tacgcagata aaaccctcaa agaatatcgc aacgagccaa     29880
+     aagaaacccg gcacgaaatc gttaaagact atgttggatt caaaggtgtg caggccagcg     29940
+     ctaccgatgt tttttatgcc tgtatgagcg agtacacttt taccaaagat gatgcgttaa     30000
+     agctcagtga tgtgttgggg tggtgtttca acgacttcga gaaagatcca caatctctga     30060
+     ataataaaat caaccttgac gaatttcagg gtaattttag cggttgggat ggctcttatc     30120
+     gcccgttaga gaagctgata aaagccagta tgaatgatga ttcctcttat aaacatgttt     30180
+     caacggtcta ccatctgatt ttgaataaag acccgcatgc cgttgtaaaa acaacgtttc     30240
+     gcggcactaa tgcttatggt ggcgtggtca aacagaccgt agcagcacgc gtcaacgtgc     30300
+     gaacgggcga ggtcgattca atactcgaca attaaacatg acaaacgccg ccggtgctga     30360
+     aactcgcttt cagtgctggc ggggttgaac aacgagcccc gcgaggcgtt agcctacccc     30420
+     tgagcaaccg cccaagaccg gtactattaa agccggtttt tttatgccac ttttccacga     30480
+     atttcccgtt tttttagccg tgcatgcaac aggtgcattg ttttgcatgc gtcaggcttg     30540
+     cccgttctgg ttgtgcgtcg ccagagctgg cgcggctcca gagtggtcat gcaactgcat     30600
+     taaaaccgac ccataaagtg ggca                                            30624
+//
diff --git a/etc/b132222.fasta b/etc/b132222.fasta
new file mode 100644
index 0000000000000000000000000000000000000000..03a6c625156a5c0760a445a0e642b27d7fc8c34d
--- /dev/null
+++ b/etc/b132222.fasta
@@ -0,0 +1,512 @@
+>B132222 U32222 Bacteriophage 186, complete sequence.
+ggcgtggcggggaaagcattgcgcgccagaggtggcgcgtgaatgataaaaattatcgtc
+tgagcgcctcgtaatggcgctatcgtggtgctgttggttcgttggtggtcgtgtgtgttt
+gtgcgcgtgtggcgcgtctgagacgtgatggtggcggggtatgaaaaagccgccatgctg
+gcggcttgagagggattattccgggttgtcgagggtgtactctttgaacctgatgacctc
+catgccgagccagtcgtttacctccctgaacctgtcctgcagcggcgacaggtcgttacg
+cacaaatacctttgccactttctcaacgtcaccgagcgagccgatattctcgggcttgcc
+gcccatgagctggaacggtacgcggtgcgcgtccatcaggtcggcggcgctggctttctt
+gatgttgaaaaagtcatcctttgtggcgacctcgctcagtggcacgattttaatgccgtc
+cggttttccattgggagcgtagaaaaacaggtttttaaaattgccgagccctttcgagtt
+gcgcatcgcctcgcgcagcgattcgacgtcggtcgcgctctgcgccgggtcggtcacata
+catgatgtaacccgcatgcgcgccgttctggtaatacttgcggcggaacagcgttgcgga
+ttcattcagccaggcggaattaagcgcgctgagatattcgggcaggccgtaaatctcctg
+attaatgtcgggctccagcaggtgaaacacggtatcaggcgcgaattcatgcggcagagt
+gaagttttccacaaaccagaaaaccgaatcgtcgaccccgcggcgggtgtatttggccgg
+tgaggccagtagcttgattagctggccggtaacgctgtggcgctgctcaagaaaggcgtt
+gccgaataccagatagtcgagcgcaaagcggctgaaatcctgacgggacagcagcgggtg
+cgggatgtaggtgctcgcgagcacgttgcgcttaacgtaaatcggtgagctgtgatgtac
+agcagagcgcaggctctttgccagcccggagaagctgaccggcggctcgtaccatttgcc
+gttactgatgcactcgacataatccagaatgtcgcgcttatcgagtaccggcactggctc
+gccaaaggtgaacgcctccattttttgcggggcgctggcggtcatggctacctgtttgcg
+tggcttgcgcttgctcatgctgccacctcacccgctgcaacagcgaaagaccagtcgcag
+ccaaacagcaggcgataatcatcgtcgctgtattcgtgtttaatttcatcgggcgcaaag
+agattgcacccgcgctggcatgctgcatccagagtgaccgactgacgccagacaccatct
+gtacaaaatacgctgtcgccggtattgatgagcggtgacggtcggtgcctgcgggttgtg
+ccgttccataccctgaaagcgtcataattatcagagggcgaggtaaacatcgtcaggctg
+tggcgtttatggcaggcgatacccgccgcgactttcgcagctcttagcgggttattgaac
+catccgaactcatcaagatagacattacccgccagtgcggcgcaatgggattcctcgccg
+acaaagctgataaccgcaccgtcgtcgagctgcaggctgtggccgttactcgtaagactg
+acgccgacgcgcgccgaaaggttactcatgtacatcagcgccacgcgcgcatgctcaata
+gtgtgagcaaaccagacatgattatcgcctgttgtcagcgcatcgagcagcgcctcacgg
+ctaaagagctgcgttgcgccaatctggcgcgatttggtgatgctgcggtcgatattgagt
+ttcccgacacgcaaccatgttgcctgatagtcaaagctgtcattgtgcagaatatcggcc
+attgcctgaatctggctttgtgagaaaacgttatttttcattaattaaactccagaatgg
+atttaggctgtatgccgctaccggcggaaagcggttcgtttaacagggcgtgcatggtcg
+cccatgcaatatcggcgtgactggcttcctcggtgcggctggcctcgtaggtggcgctgc
+gcccgctgctggtcatggttttgcggatggacataaacgactgcgtgacgtcggttgctc
+cggcgtcgtactccagacagccgcggcgaatggtgtcttttgccttgagtaccattgcgg
+ttttcatttcaggcgtgtaacggatgccgcgtgcggccgggtagaatgagcgcaccaact
+ggaacacgccgaggccgaggccggttgcgtcaatgccgatgtattcgacgctgtatttct
+cggtcagtttgcggatgccatctgcctgcgcggcaaagtccatgcccttccactggtggc
+gctccagcatgcggaacttgccaccagaaaccaccggcggcgcgagcacgacgcacccgg
+cgctgtcgccagtgtgtgacgggtcgtagccaatccagacggggcgagagccgaacggat
+ggtcggcgaacggggcgaagtcctcccattcttccatcacgtcgaccatgcagcgctgca
+gctcctcgaacgggaataccgacgctttatcgtcgacaaactcgcacataaacaggtttt
+taaagtcctcatcactgttttcgcgtttgagttggtcgaggtcgaacagggtgcagccac
+cggcaagggcgtcctcaatggtgacaatctgccgccactggccatcgtcgcagagctggc
+caccggcgagcgcgcggtgactgatgtcaatttcgatgcggtcggcaatacggctgcgcc
+ccttgttgaacagctcgccagaccagaagggataagcgccgtgcgccagcgttgagggtg
+tcgaaaagtaggttgagcgcagatgcttctgcgaggccatgcccgaggcgactttgcgca
+gcttctgaaaattcgggatccagaatatttcatcgacatacaggtcgccgttatggctct
+gagccgtgttggagttggtaccgagaaaaatcagctttgcgccgttgttgccaatgacaa
+tcgggtcgccggtcaggtcgacgtcaaccagtcgcgcaaactgtatgatgtattcgcgga
+acacgtaagcctgcgttttactggccgacagaaaaatctggttatggccggtcttgagtg
+ctcgcagcagtgcctcacgggaaaaatagaacgtcgcgccaatctggcgggatttgagaa
+tgtcgcgaatacggtgtgccagtcctgcgcggtaccactgcaactggtactcgaaagact
+ggtcgaaaaataattcctccagcttttcgatagcctcgtcgctgaaaaaattctttttcg
+gcttcttgcgctcacccttgttgcggttggcgacgttggggttaaggtcggcctcgttgc
+cggtctggctgtagcggttaacgcgtgccagtcgttcaatctgccgcccgagcaggtcaa
+tctctttgaagtcaccgcctgacttttgcggcttggcgatgagctgaatcaggcgcgcct
+caaggctgctttcaacgcgggaaatcggtgcgatgccatcccagccgtcgcgctgtttcc
+agctctgcacggtcgggcgcttgacctgcagcatttcggcaatctgcggcacggaaaaac
+cctgccagtaaagcagcgatgcctgtcgtcgcgggtcatgcaacaaggttgtatcggtgg
+aaatggtcattgatgcctcgccgtaatggattcagggcaaggctacttaatggccgtcag
+tgattcgctaaggtgctgttgtgtgggcggttgtccagtcgtcattggtggtctggcgtg
+tcctgagtctggaaactggcggtgaccagtaaccccaacctcaggactcctgacaatggc
+aaaaaaagtctcaaaattctttcgaatcggcgtcgagggtgatacctgcgacgggcgcat
+tatcagcgccagtgatattcaggaaatggccgaaacctatgacccgcgtgtttacggttg
+ccgtatcaaccttgaacacctgcgcggcctgttgcccgatggcatattcaagcgttacgg
+cgatgtggtcgagctgaaagccgagaagattgacgacgattctgcgcttaacggcaagtg
+ggcgttgttcgctaaaatcaccccgaccgatgaccttatcgcgatgaataaagccgcgca
+gaaggtctacacctcaatggaaattcagccgaattttgccaataccggcaaatgctacct
+cgtcggccttgctgtcaccgatgacccggcgagcctcggcactgaatatctcgaattctg
+ccgcactgcgaagcacaacccgctgcagcgctttaaagcccaccctgaaaacgtcttttc
+cgccgccacgctggccgaactggaatttgaagacgttcccgacacggtgctcaacagcct
+ggccgataaggtgaaagccattttcagccgtaagcaggtcagcgacgatgcgcgcctgaa
+tgatgtacatgaagcggtgaccgccgtcagcgagcatgtgcagaccaacctcactgcaca
+ggataagcgtctttccgatatggaaaccgcgtttgccaccttcaaacaggaactgaccgg
+caaggttgaagaaaccagccaggcattttccgtcctgaaaaccactctcgacaaaaccga
+aagtttcagccagccgcgacgcacgaaagccagcggcggtggtggcgatgagctgctgac
+tgactgctgataaaccgcagaccgaaaccgggcggaacccccgcccgatgctgtgactaa
+ccgattaaatcaaacaggaaatactatgcgtcaggaaacccgttttaagttcaatgccta
+tctgacccagctcgccaaactgaacggcatcagcgttgatgacgtcagcaaaaaattcac
+cgtcgagccgtccgtcacgcaaacgctgatgaacaccgtgcaggcgtcatccgcgtttct
+gcagatgattaacattctgccggtcgcagaaatgaagggtgagaaaatcggtgtcggtgt
+gaccggcaccatcgccagcacgaccgacacctcgggcgacaaagagcgccagaccgcaga
+ttttaccgcgcttgagtccaacaagtacgagtgcaaccagattaactttgacttccacct
+gacctataaacgcctcgacctgtgggcgcgttttcaggactttcagcgtcgtattcgcga
+cgccattgtccagcgtcaggcactggatttcatcatggccgggtttaacggtaccacccg
+cgctgacacctctgaccgtgttaaaaacccgatgctgcaggatgtggccgttggctggct
+gcagaaataccgcaatgaagccccggcgcgtgtgatgagcaacatcaccgacgctgacgg
+taaagtcgtttcggcagtgattcgcgtcggtaaaaacggcgactatgagaacctcgacgc
+actggtgatggatggtaccaataccctgattgacgagatttatcaggatgacccgaaact
+cgttgccatcgttggccgtaagctgctggccgacaaatattttccgctggtcaacaaaca
+gcaggaaaacaccgagtcgctcgcggcggatatcatcatcagccagaagcgcatcggcaa
+cctgccagccgtacgtgtgccgtacttcccggcgaacgcggtgttcgtgaccacgctgga
+aaacctctctatctatttcatggatgagagccaccgccgcagcattgatgaaaacccgaa
+aaaagaccgcgtggaaaactacgagtcgatgaacatcgactatgtggtcgaggcgtatgc
+cgccgggtgcctgctggaaaacatcaccctgggcgatttcaccgcacctgcagcaccgga
+aggcggagagtaaacccatgacgagccccgcacagcgtcacatgatgcgggtctcggcct
+ctcaagccgcgcagcgggaacaagccccgctgcgccatgcaaccgcctatgagcagatgc
+tggttaagctggccgatgaccgccgcacgttaaaaaacatccgttcaaacgaacgtaaag
+ccgagaaaaagcgcgagctgctgccgttctatgcgccgtgggtcgccggtgtgctgactg
+atggtcgtggtgcgcaggatgacattgttatgaccgtcatgctgtggcgtctcgatgccg
+gtgatatcgctggcgcgctggaaattgccccctacgcgctgaagtacggcctcacctctg
+accatcgccgcacgacaccttacatgctggtcgaggaagtggcacttgccgcgcagcgcc
+tgcgcgatgccggtgagtctgtcgacctttcctggctgcaggccactatcgacctgaccg
+acggcgctgacgttcccgatatggtgcgcgcccgtctgcataaggtgacaggcctgaccc
+tgcgtgatgccggtatgaatgcagaggcgctggcgcagtttcagcgcgcgatgcagctcg
+accgcaatgccggtgtgcgcaaggagattgagcgactggaacgggcattgaagccaaaga
+cagaggccgcgccccgtaaaacgactaaaccgcgcacgcgtaaacctgccaccaaaccgg
+cagcaaagcgcgggcgtccaccaaaggcggcaaaaaccgccggttaactgaacgctcccc
+gagccgggcggcacgccggtcaaagcaggcaaagacctgacggcgaccggcgtccaccgc
+ccaacctgatgaggttgtcatgacgacagtgatactgaaccagcccgacgaaccgcagga
+cgtaccgggcgtggtgattcccgcaccggagacgggcggtgcagtgattaaaaacacgtt
+ctttttccctgatgtggatccgaagcgcgtgcgcgaactgatgcgccttgagcagacggt
+ttccgatgcgcgcctgcgcaatgccatcaagaccggcatggccgagaccaatgcggagct
+ttacgactaccggctgcgccagactgccgccgggtttaagcaactggccgacgtgcctgc
+cgaggaaatcgacggcgagaatgtacgtgttttccactatctgagtgctgtgacggcaat
+ggcaaccgccaccctgtatgagcgctatcgcggcgttgaggccaccggcaaaggtgacaa
+aaaagccgacagcgtggaaaccaccattgatgacctgtggcgggatatgcgctggtcagt
+tgcgcgtctgcaggacaagccgcgctgcattgtggggcagctctgatgaaagtcaggtcg
+atgcagggcgataccctcgacacgatttgcgccaggtattacgggcgcactgagggcgtg
+gttgagacggtgctgcaggctaatccgggtctgtctgagctgggtgtcattctgccgaat
+ggtacagagattgacctgcccgatgtggcatcgtcacccgtaactaaaactatcaacctt
+tgggagtaaccatgacagaaggtgaaaaaggcgtcctgtcactgtttgtgattggcgtga
+tgattgttgttgggaaagtgctggcaggcggtgaacccatcaccccgcgtctgtttattg
+gccgcatgctgctcggtggttttgtttcaatggtcgccggtgttgttctggtgcagtttc
+ctgacatgtcactgcccgccgtgtgcgggattggatccatgctcggtattgccggttatc
+aggtggttgaaatcgccatacagcgccgctttaagtcacaaaagggggaaagtgatgccg
+gtcattaacactcaccagaatatcgctgcgtttctggacatgctggcgtattccgaagga
+acagcgaaccatccgctgacgaaaaatcgtggctacgacgtcattgtcactggccttgat
+ggcagaccagagattttcaccgattacagcgaccaccctttcgcgcatggccgaccaccg
+aaagtgtttaatcgccgtggcgagaaatccacagcctcgggacgttaccagcagctttat
+ctgttctggccgcactatcagaaacagctcgcattgcctgatttcagcccactgtcgcag
+gataagctcgcgatccagttaatccgggagcgcggtgctcttgacgatatccgggcgggg
+cgtattgagcgtgctgtttcacgttgtcgcaatatctgggcgtcattaccgggggccggt
+tacggccagcgcgagcacggtctcgaaaagctggtcaccatctggcgcacggctggcggg
+gtggtggcatgaaagtcctgataacgctgcttgtgatggccgtgctcgggttgctgtggc
+tgcaccatgagaacggcaatttatcccgctcatttgagacggcaaaccgcgtcgcgagcg
+agcaaaagacgacgattgggatgctgaaaaatcagctcagtgttgccggtcagctcgccc
+gacgtaatgaatccgcgcaggtgacactgcgcgaacagctcgcaaaggcaagtgcagaag
+ccagccgccgtgagcagacgataacgaggttacttaatgaaaatgaagcctttcgccgct
+ggtataacgctgctctgcctgatgctgtgcgtcggctgcacacccgaacagcctgcgcca
+gtgccggtgattgtggtcaacggatgcccgagggtgagcctttgccctatgccgggaagt
+gacccgaaaaccaatggtgacctgagcgcagatatccgccgtcttgagggggcgctgact
+gcctgcgcgctgcaggtcaaaaccgtcaaacactgtcaggatgaactcgatgcagaagca
+caaaagcctgcgcaaagcgctgattaacgccgtgccgcagctccgaaataaccccgatat
+gctgcgcctttttgccgacaacggccacaccgattcccgactggcgagctcgctgtcgtt
+tgaaaaggtgtatgtgcttaacgtggtggtgaccgactttactggcgacctcgatttgat
+attcgtgccggtgcaggcatggctgcgtgaacatcagccggacattatgaccaccgacga
+cgggcgggaaaaaggattcacctggattattgatatcaataacgacgattcgctcgatat
+cagtatcagcctgaggctcaccgagcgcacgctcgtcaaagaggtcgggggcgcgctgca
+tgtcagttatgcaccagaaccgccactgcctgagctggtgaagcgcccggttgctatgta
+tgcaaacggtgaattagtgagccagtgggatgagtgaattaaccgcgctgcaggagcgcc
+tcgccggtctgattgccagcctgtcaccggcggcacgtcgcaaaatggcggctgagattg
+cgaaaaagctgcgtaccagtcagcagcagcgcatcaagcgccagcaggcacccgacggca
+ccccgtatgccgcacgaaagcgccagccggtacggagcaagaaaggccgcattaagcgcg
+aaatgttcgccaaactgcgcaccagtcgctttatgaaagccaaaggcagcgatagtgcgg
+cggtggtggagtttaccggcaaggtgcagcgcatggcgcgggtgcatcagtacggcctca
+aagaccgcccaaaccgcaacagccgggatgtgcagtacgaggcgcgcccgttgctcggtt
+tcacccgcgacgatgagcaaatgattgaagacgtcattatcagccacctcggcaaataaa
+tattgtgtgaaccaccaccggaggcgcgtgatttggcgcggctaaagaccagaggcattc
+tttgcactatgaatacgttatccacgatacaggagctcgcgcgtgcgattcgtaacctca
+tccgctcaggtgtggtgacggaggtcgataccgtgcaggggctgtgccgcgtacaaagcg
+gcgggatccagacgacatggctgaactggctgaccacccgcgccggtcgttcgcgcacat
+ggtgggctccctcgctcggtgagcaggtgctgctgctggcaatcggtggcgagcttgata
+ccgctttcgtgctgccggggattttctccgacgataaccccgctccgtctgcctcggcgg
+atgcgtggcatgtggtttttcctgatggcgcggtcattgagtacgagccggagaccagtg
+cactgacggtcagaggcatcaaaactgctgacgtgaccgcgtcggaatccatcacggcca
+ctgtgcctgtggtgctggtgaaagcagaaacccgcatcaccctcgacaccccggaggtgg
+tatgcaccaacaaactgacgacggcaacgcttgaggtgcagaaaggcggggagatgagag
+gcgacattgtccacaacggcggcacatttaaatcaaacggtgtgcagctcgacgaccacg
+gtcacggtggtgtgcaaagaggcggtgcctggacggaggacaccaaatgacggcgcgcta
+tatggggatgaaccgcaacaccggtctcggtatcagtgacactgaacacatcagccagag
+catgcgcgacattctgctgacgccggtcggctcgcgggtgatgcgtcgtgaatatggctc
+gctcctgtctgcgctgattgatatgccgcaaaacccggcgctcaggctgcaaatcatggt
+ggcgtgctattcggccatccagaagtgggagccgcgtatcaggcttacatccatcagctt
+tgagactggtgatgctggcgagatgtatgtcgatattaccgggatgcgtaccgatacggg
+tgcgtcagtttcaaccactgtttcactgagttaaatcactatggcaactgttgacctgag
+cctgttacccgttcccgatgtggttgaggaactggattttgaaaccatccttgcggaacg
+cattgcgacgctaatttcgctataccccgaagaccagcaggaagctgtagcccggacgct
+cgcacttgagtctgaaccaattgttaaattgctgcaggaaaacgcctaccgtgaggttat
+ctggcgtcagcgtgttaatgaagctgctcgcgcaggcatgctggcttatgccagagatag
+cgacctcgataatctcggggcgaatttcaatgttgagcgcctggtcgtcaggcctgctga
+tgacaccaccatccccccgacccccgctgaaatggagcttgatgccgattttcgtctgcg
+tatacagcaggcatttgaagggatgagcgttgcgggatccaccggagcttatgaatttca
+tggccgcagtgctgacgggcgtgtcgcagatatttctgttatcagcccttccccagcatg
+tgtcacgatatctgtgctttcgcgtgagaataacggtgcggcgtctgatgagcttcagag
+catcgtgcgcaatgcgctgaatgctgaggacgtgaggccggttgctgaccgggttacagt
+gcagtcagctcagattattgactaccagatacgcgcaacacttttcgtttatccggggcc
+ggaaaatgagccgattcgtgcggcggctgaggcgaagctcaaagcttatatcagtgcaca
+gcacaggttggggcgggatattcgcctgtcagcaatttatgccgcgttgcatgttgaggg
+ggtgcaacgtgtcgaactggctgcacctgtggccgacattgtgcttgataaaacgcaggc
+atctttttgcacagactatcagatagtgattggtggctccgatgagtgatgtccgcctgt
+tacctgtagggtcatcacctcttgaggtggctgctgccagagcctgcgcagatattgaaa
+atacacctgttccgttacgccgcctgtggagtcctgacacctgtcctgcaaatcttttgc
+cgtggctggcgtgggcgttttccgttgaccgctgggatgagaactggccggaaaaaacaa
+agcgcgatgttattcgcagcgcgtatttcactcactgccacaaaggcacgataggcgctg
+tcaggcgagttattgagccgctcggatacataatcaacgttacggaatggtgggagacag
+gtgacccggcgggaacgtttcgtcttgatatcggtgtgctggaaagcggtattaccgaag
+aaatgtatttagaaatggagcggttgattgctgatgcgaaacctgcgagccgtcatttga
+ttggcctgaatattatccaggatattcccggttatatgtatacaggtggtgtgagctgtg
+acggcgacattattacagtttaccccggataagtgaggaataatgagcacgaaatttaaa
+actattatcaccactgccggagccgaaaaactggcagcggctactgtgccgggtggtaaa
+aaagtgaatatcaccgtgatggccgttggtgacggaggcggaaaactgccagtgccggac
+gccggtcaggtgcagctcgtgaatgaggtctggcgccatgccctgaataaaatcagccag
+gacaaccggaacagcaattacattgtagccgagctggttattccgcccgaggtgggagga
+ttctggatgcgcgagttgggtctttatgatgacgagggcactctcattgctgttgccaat
+atggcagaaagctacaagccagaacttgccgagggctcaggccgtgcgcagacatgtcgc
+atggtcattattgtcagcagtattgcctcagttgaattatccattgattcgacaatggta
+atggcgacgcaggaatatgttgatgacaggattgcggaacatgagaagtcacgtcgacat
+cctgacgccacactgaaagaaaaaggctttactcaactcagtagcgcaacagacagcgcg
+tctgaggtgcttgcggcgacgccgaaagcggttaaagcggcgtatgaccttgctaatgct
+aaatataccgctcaggacgcgagcacagcgcaaaaaggcattgtgaggctgagtagtgcg
+gcagacagtaccagtgaagctgaggccgcaacaccgaaagctgtcaaaattgcgatggat
+aatgcgaatgcgaggctggcaaaagaccggaacggcgctgatattccgaatccgccgttg
+tttgtccagaatatcggtttaaaacccacggtcgataaagctgctaatgccgttgataaa
+aatggcgacacgatgaacggaaacctgacactcaagggtgattaccggctgagttttatt
+atccagaatgaagacggttctattcgtgcttatatcttcaaggacaaaggtggcgacggt
+attcgcatcagtaatggcgatgacggcggcggtgattttgtttttggtaaaaatggacag
+ttttactgcccggatattatgcatgttggtaatacgattgtatggggtgacggaaatatc
+gagggggcgcgatggggcggtttgttgagcgactggttaactgctcaactggttgcccgt
+gacaataatattaacttgcgagcaccctatgaatgggttaaccaaaactttgtcaaccgt
+gcacagcgcggcgcacaggccagcatgactatggacggcggacttgtagaggctccatgg
+ggatgttttcttacgggggggaacggtaacgagggtaatcaggttggagtggctttatac
+cgtccattgcagattcttcgcaataatacttgggtaacgatagagaactgaaaatgaaac
+tgattaatttgcaacgctacattctgatgaattattttttaggtgatggcattcagtatt
+ttatagatgccacaggtaaggactggtataaatcactgcccaaattcacaaagaaataca
+gccttgctatcgaaaatgatacgggcgttattcgtagtatcagcgaagatgcatcccggc
+tttatcccggtggtttgaccgttgttgatgttgacagtattccggcaggttgtgacattt
+tcggcggatgggtatttgacggagagaaagtcattcctcgtgagtacacattggccgaac
+agcaacgccagtcagatgaaaagaaaaaaacacttcttgctgaggcggaggcaacaattt
+ccacgcttgagcgtgcggtaaggttaggcatggctaccggggaagaaataaggcgactcg
+aagcatgggagcgttacagcgtattggtgagcagggttaagcagtcagatgactggccgc
+aaaaacctgaataacccggcggcatttgcccgcttctttctcatccattagttgtgccag
+acatcatccagccctgacaaatagcccctcacaagaccagccaggacaataacactcgcc
+cactaactacggagttaaccggatgagtgattttcaccacggcacgaaggtcatcgaaat
+aaatgacggtacgcgtgttatttccacggtcgcaaccgcaatcgtcggcatggtctggac
+agccagcgatgcggatgccgagacatttcccctcaacgagccggtactgattaccaatgt
+gcagagcgccattgcgaaagccggtaaaaaaggcactctgtcagcttccctgcaggccat
+cgccgaccagtcaaagcctgtcaccgttgtcgtgcgcgttgccgaaggtaccggagacga
+tgcagaagcgcagaccacgtccaacattatcggcggcacggatgagaacggtaaatacac
+cggtatcaaggcgctgctaactgccgaagcggtcaccggcgttaagccgcgcattctcgg
+tgtgccgggtctcgatacgcaggaagtcgcaaccgcacttgcatcggtctgtatcagcct
+gcgtgcgtttggttacgtcagcgcatggggctgtaagaccatttccgaggcgatggcata
+tcgcgagaatttcagccagcgcgagctgatggtcatctggcctgatttcctcgcatggga
+taccaccgcgaacgccaccgccacggcatacgccaccgcccgcgcactcggtctgcgtgc
+ctacatcgaccagactatcggctggcacaaaacgctgtctaacgttggcgtgcagggcgt
+taccggcatcagcgcctcagtcttttgggatttgcaggcatccggcacagatgctgacct
+gctcaacgaggccggagtcaccacgctggtgcgcaaggatggtttccgtttttgggggaa
+ccgcacatgctctgatgacccgcttttcctgtttgagaactacacccgaaccgcgcaggt
+gctggccgacacaatggctgaggcgcacatgtgggcggtcgataagcccatcaccgcatc
+gctcatccgtgacattgtcgacggcattaacgccaaattccgcgagctgaaatcaaatgg
+ctacatcgtggacggtgaatgctggttcgacgaggaatcgaacgataaggaaaccctcaa
+ggccgggaaactgtatatcgactacgactatacaccggttcccccactggaaagcctgac
+cctgcgccagcgtatcaccgataaatatctggtgaatctggctgaatcggtcaacagcta
+aggagcctgaaacaacatggcactaccccgcaaacttaaatatctgaacatgttcaatga
+cggccttagctacatgggcgttgttgaatccgtgacgctgccgaagctgacccgcaagct
+cgaaaactatcgcggcggcggtatgaatggcgctgcagcgattgacctcggcctcgacga
+tgatgcgcttactgtcgaatggtctgtcggtggcctgcctgatgtggcgctgtgggcgca
+gtatgccgcgccgggggctgatgccgtgccgctgcgttttgctggctcttaccagcgtga
+cgacactggcgaaatcgttgcggtcgaggtggtcatgcgtggccgtcataaagaaatcga
+cggcggcgaaaataagcagggtgaaaatacctcgaccaaactgtcgaccgtttgcaccta
+ttaccgcctcacgattgatggtagcgacattatcgaaatcgacaccgtcaacatggtcga
+gaaggtgaacggcgtcgaccgtctggaacagcaccgccgcgcaatcgggctgctgtaatt
+ccctgaccggtcagcactgctggccggttattacccccattcagagcagagaaaaaatca
+tggcaaaagcaccacgcaaaacccctgaatttattgatacggctggcaatgaaattgaca
+ccgtaaacccgaatgtcgtgaccctcgacaagccgattaaacgcgccggtcagacaattg
+aaaaggtcacgctgattgaaccgaacgcaggcaccctgcgcggcgtcagtctggcggcgg
+tggcgcagtccgaggtcgatgcgctgattaaggtgctgccccgcatgacctacccggcac
+tcaccacgcaggagctcaccgcaatgaacctgcccgatatgctgtcgctggccgctaagg
+tgattggttttttgtcaccggcttcggcggaatagacttcccgcccggcctgtcgaccga
+tgacctgatggcggatatcgcagtgatattccactggccgccatcagagctctattccct
+gagcctgaccgagctcatcacatggcgcgaaaaggcgctgcagcgtagcggaaaccacaa
+tgagtaataacctgaggcttgaggtattgctgaaagcggtcgaccaggcgacccgaccgc
+ttaaatccatccagaccgcgagtaaaagcctgtcgggcgatattcgcgacacacaaaaag
+ggctgcgtgacctgaatggtcaggcgtcgaaaatcgacggctttcgtaaggcaagcgcgc
+aactggccgtaaccagtcaggcgcttgataaggcgaaacgcgaggccggtgagctggccg
+tgcagtttaaaaacaccaccaatccgacccgcgcgcaggcgcaggcacttgaagcggcaa
+ggcgtgccgcctctgagttgcagacgaaatacaacagcctgagaacgtcggtacagcgcc
+agcgctccgagctgatgcaggccggtattaatacccgcactctctctgcagatgagcgtc
+ggctcaaaacctccatcagcgaaacaactgcgcacgttaatcgacaacgtgaggcactgg
+cgcgcgtcagtgcgcagcaggcgaaattaagccgggtgaaagagcgatataaatcaggca
+aggagcttgccggtaacatggccgcagcaggcgctgcggggtcggtatcgcgacacggaa
+cgatggccggggttaaattactgatgcccggttatgactttacgcagaaaaattccgagc
+tgcaggctgtgctcggggtcgataagcagtcgccagaaatgcaggcgttacgcaaacagg
+cgcgccacgtcggcgacaatactgcagcctctgcagatgatgcagcaagcgcgcaaatca
+tcattgcgaaaagcggcggtgatgcagctgccattcaggcgcgacgccgagtcacgctga
+atatggcgctgtcaaaccggcgcacgatggaggaaaacgcagcgctgctgaccgggatga
+aatcagcgtttcagctttcaaacgacaagattgcgcacattggcgacgttctctcgatga
+cgatgaacaaaaccgccgccgattttgacggactgagcgacgcgctgacctatgccgcac
+cggtggcaaaaaatgccggggtgagcatcgagcaaaccgccgcaatggtcggtgcactgc
+acgatgccaaaatcaccgggtcaatggcgggcacgggtagccgcgccattctcagccgcc
+tgcagctcccaccggaaaaagcgtttgaggccattaaggagctcggcgtcaaaacgtcag
+acagcaaggggaacacgcgcccgatattctccatcctgaaagaaatgcagcgcagctttg
+agaaaaacaacctcgggacaagccagcgcggcgagtatatgaaaaccattttcggcgagg
+aggccagctcggcggcggcggtactgatggaagccgcctcaagcggcaaacttgaccggc
+tcaccgctgcgtttaaagcctcggacggtaaaaccgaggaactggttaaggttatgcagg
+ataacctcggcggcgactttaaagagttccagtctgcttatgaggcagtcggtactgacc
+tttttgaccagcaagagggctcgctgcgtaaactcacccaaaccgccacgcaatacgtgt
+taaagctcgacggctggatccagaagaacaaagggctggcgacaaccattggcatcatcg
+ccggtggcgctctagctctgattggtatcatcggcggtattggcctcgttgcgtggccgg
+ttgttatggggattaacgccattatcgctgctgctggcgtgctgggtacggtctttactg
+ttaccggtagtgccattgtgaccgcacttggcgcgattacctggccgattgtcgcagtgg
+gggcggctattgtggctggtgcgttactcatccgtaaatattgggagcccatcagcgcat
+ttttctcgggggtgattgagggcatcatgagtgcctttgcaccggtcgcagaaatgttcg
+ctccactggcacccatttttgacggtctcggtgagaaactgcgcggcgtctggcagtggt
+ttaaagacctgatagcaccggtcaaagccacgcaggaaacgctcgatagctgcaaaaatg
+tcggcgtcatatttggtcaggcgctggcctctgctttgatgcgtccgctcaatgtattta
+acaagttgcgcagcggtgtcgactggcttctcgaaaagctcggtatcatcaacaaagagt
+cagacaacctcgaccagactgccgccaaaaccaacgccgccacgcagggtaattcctaca
+tcccggcaaccagcacatatggcggctatcaagcttaccagccagttaccgcaccggcgg
+gacgctcttacattgaccagagtaaaagcgaatacaaaatcactctgccgggaggtgctg
+cgccggggcatcagcttgacagacagctacgcgacacgctcgaacagattgagcgcgaaa
+agcgtgcgcgtcagcgtgccagtatgagccatgactgagaggaataaacgatgatgcttg
+cgcttggaatgtttgtgtttgaacgtcgcaccctgccttatcagtcgatgcagcactcga
+aggattaccgctgggcgtctaatgaccgggtgggtaagccgcctgcttatcagtttctcg
+gcgagggggaaacgtcgatacagcttgccggtacactgtacccagccatcaccggcggct
+ggatctcactaaaggctgtagaggtaatggctaacgagggcagagcgtggccgttgattg
+agggaactggaaacattttagggatgtatatcgtcgataaggtgtcgaccacgcacgccg
+agtttttcagcgacggcgctgccagaaagattgatttcaccctttcgcttaaacgggtcg
+acgaatcactgacggcaatgtttggcgacctgaataagcaggccagcgagcttctaggct
+ctgccggaaatctgactgataagctgcagagtgcgctcggaggactgaccgcatgattac
+gggcatgactattgacgccggaactagccttgcaccggcatttatgttaacgctgaacag
+ccaggacattaccagcaattttagtgaccggctgatttctctcaccatgacagacaaccg
+gggctttgaggctgaccagctcgacattgagctcgacgacaccgacggcaaagtcgaatt
+accactgcgcggggcggtgctgacgttgtggcttggctggcagggttcggcgcttctgaa
+taagggcgatttcacggtcgatgagattgagcaccggggcgcgcctgatatcctgaccat
+ccgcgcgcgtagtgcagactttcgcggaacgctcaattcacggcgtgaagaatcatggca
+cgatactaccatcggtgagttggtcagcaccattgcaaagcgcaataaactgacggccag
+tgtcgcggattcactgaaaaaaattccggtaccgcatatcgaccagtcgcaggagtccga
+cgccgtatttctgacccgactggctgaccgcaatggggcgacggtgtcagtgaaagcggg
+gaaactcctgtttctgaaagccggtagtgcgatgacggccagcggcaagcccgtcccgca
+aatgacactaactcgcaacgatggtgaccgtcatcagtttgctattgccgaccgtggggc
+ttacaccggcgtaaccgcaaaatggttgcacaccaaagacccgaagccgcaaaagcagaa
+agtaacactgaaacgcaagccaaaagagaagcacctgcgcgcactggagcacccgaaagc
+aaagccagtcagcaaaaagacaaaggccaaaaaagagccggaagcgcgcgagggtgagta
+tatggccggtgaggccgataacgtgctggcgctgacgacggtctacgcttctaaggcgca
+ggcgatgcgtgccgctcaggctaagtgggataagctgcagcgaggcgttgcggagttttc
+aattacgctggcgcttggtagggctgatttattccctgagacaccggtgcgcgtatcagg
+ctttaagcgcgtcatagatgagcaggcatggttaatcagtaaggtaactcacaatctgaa
+taatagcggcttcacgacgggcttagagcttgaggttaaactctctgatgtggagtacaa
+cgcggaatcggatgatgaataaaatgtattcacaaaaagtgaatttatgattatcattta
+ttcacgaattgagaataaagggtgggttatgtttcattgtccgaagtgccatcatgccgc
+acatgcgcgaacaagccgctatctaaccgaaaacacgaaagaacgctaccaccagtgcca
+gaacatcaactgtagttgtacgtttatgacaatggaaacgatagagcgctttattgttac
+tccgggagccattgacccggcaccgcctcacccgactgtcggtggtcagcggccattgtg
+gctctgataaatttccgctaaatgcccgccgcgtgcgggtttttttatgcactcaggaaa
+gtggcggtaaaaaatccaccgccattctatcgccactcgaaaacgaggcaacaaaaaggc
+cactcgagagagtggcctaactgtatgtatttactacttaaatttggtggcccctgctgg
+acttgaaccagcgaccaagcgattatgagttcctacaagaacaaccgaaaatcaatagta
+tgcgttatttatcattgacatagattgccattgtttgccaataattacctattattcgcc
+atttctaccgccactttatcgccattctattatctgttactcagaaccatcgccgacata
+ggttccatcaggtgcgagatgatatcttccaccaacataagtcccatctggggcaagtgt
+tgggcggccagcaacataacttccatttggcgctaagcgtggaacgccaccgacataagt
+tccatcgggtgcaaggcgtggtgctcctcctccaacataagtcccattaggggcaagcat
+aggttgtccgtaaacataggtaccatcaggtgctaatcgaactgacatacaacctccata
+acttatttgctgttagtaatgtgaactaaaggatttagtttaactgcatcctctaaatgg
+tcgggtgcaaagtgcgcatatcgcatggtcatttttatatctgtatggccgagtacgcgc
+tgcaacaccaaaatattaccgccattcatcataaagtgactagcgaaggtgtgacgtaaa
+acgtgggtaagttgtcctgccggtagttcgatacctgttctttccaaagctgaccggaac
+gcgccataacaatcactgaacaaccggccctttttatcatcaggcagagactcatagagc
+tctttgctgattgggacggtgcgattttttctacctttcgtgttggtgtatgtgattttg
+tatttcgcgagttggctttttctcagactctcggcctcagaccaccgtgcgccagttgcg
+agacagattcttaccacggtttctaaatcagggtggtcatgtcggttacactctccgagc
+agttgcgaaatttggtcgtgagttagccaagtcatttccatttcttctgtgcggaatggg
+cgcatattttttagtgggttttcacccttccattctccgaggcggtttagctcattgaac
+accgcccggaagtaggccagctcaagattaagcgtgcgaggcgatacctctttcactctg
+tttgaacgggcatactcaccttttaaccgtttttctcggtagcgggaaaacatctgcgca
+tcgaaatcgcgtgcgagtggttcgcccatacactcaaaagcatggtgcatggctaactgg
+cgtttcaaaccatctttcagtgtaatgccatgagcgctataccatgaatcaaccagctct
+tttaacgtgcgcctgtcttccttttcttcctgccacgggttttgaacggtgtactgctca
+aacgccagagcctcgcctttagtagcgaatttctttctgatacgtttgccttttgcaccg
+tttgggtagagttcacaaatccaaccgccagccggatttttacggacggtcattagttaa
+cctcgctgtatacacccaccacacgccccaacgttttaatatcatcaatgccgcattcga
+aaggaaccttcccgcctgcaacatgtagttttctacccggtagttttgttaactctcgaa
+tgcttattgctccctcaatgtcgactagccataagccgtcagacaatgatgcttgcttgt
+ccacaaaataaattttcccctcggaacggatagccatcccatctgtgagcggttttgtga
+aaaattgggcatcaacactcaattgtttatcggatttgaggatttcttcacttaatgtga
+atccctcaatcctttttgcgtcgctcgattctctgttatttacaaatgcttctccttctc
+cggtaagtaaccactggagattagcacctgtttcaagggcacagtgagccgcaaagtcat
+aggagatagcgcctcgggtgtacctgtttgacaatgagctggacgcgatatcgaagtggt
+tagctaattgaattttctgcgaaaatccgtacgcctcgcagatgcggtcaagtacatcca
+cgttgctccatcctaaagaatctattctcatttcgataaaacctatttactatctctcaa
+ttgggagatatattttggctaaacccacgcaattgatggcaagtgttggcaaacagagtc
+aaatcaattgcaaactttggctaatagggaatcatgcaatatggcttctgaaatcgcaat
+catcaaagtgcctgcacctatcgttactctgcaacaattcgcagagcttgagggtgtttc
+tgaacgcaccgcctaccgctggacaaccggcgacaacccttgtgtaccaatcgaaccccg
+cacaatccgtaaaggctgcaagaaagcaggtggcccgattcgcatttattacgcacgctg
+gaaagaagagcagttgcgtaaggcgttgggacattcccgttttcaactcgtcatcggtgc
+ttaattcactttatgtgaattgtaaggatgcaacatgtttgattttcaggtttccaaaca
+tccccactatgacgaagcgtgccgggcttttgcgcagcgtcacaacatggcgaagctggc
+cgagcgtgcgggtatgaatgttcaaacgttacgtaacaagctcaacccagaacagcctca
+ccagttcacgccgcctgaattgtggctgctgactgacctgaccgaagactcaaccctcgt
+tgatggttttctggcgcagattcattgtctgccatgcgtgccggttaatgagctggctaa
+agataaattgcagtcttacgtcatgcgcgcaatgagtgaactcggtgaactggcgagcgg
+tgcggtatctgatgagcgtctgaccactgcccgtaagcacaacatgattgaaagcgttaa
+ctccggcattcgcatgttgtcattgtcggctctggcgctgcatgcacgtctgcagactaa
+tcccgctatgtcgagcgtggtcgataccatgagcggtattggcgcatcgtttggtctgat
+ttgaggtgcgtatgctgaaaagtgaaccgtcatttgcgtctctgctcgttaagcaaagcc
+ccggtatgcattacggccacggctggatcgcaggtaaggacggcaagcgctggcacccgt
+gccgctcacagtccgaattattaaaagggctgaaaacaaagtcgccgaaatcgtcaggtt
+ttttaattattcgtattgtccactttgtaattaaaggagtgaaacatgtcacgcgatgaa
+ttaagaattgttttgggtgccatgattccaaatatggaggaaggttttgaaattaaaacc
+cgcgacggcgcaatacttcgcgttgaccctgagtgggagtgctgcaaagaatttaaggat
+ggattaaaagccgaaatcatcaagcagttaaaaagcaaacctgctgttgtatttggatat
+agttaattaattaaacgtaattacttggcgtaaacccgccgggcattcttttgccaaaaa
+acaggaggatatatgagtcgaactatttatttatcaacgccgagtggtgctggcgaccac
+ttgctggagtctttgtttaaagaagccaaaaaagaagagcgcaaagaccgccgtctcgcc
+gtttcaatccgtctcgaagatctggccgttcacattaccaattcagatatgacaggcaaa
+gaagcggccgagctactgcgccgcgaagccactcgctttgagaacgaatcacaggagctt
+cactaatggccgacgcaatggatttagcacaactgcgcgagcaggaagaccgcgaacgcc
+acataagcaacgcgcgcagccgtcgccatgaggtttctgcatttatctgtgaggaatgcg
+atgcacctatcccggaagcgcgccgccgagccataccgggcgtgcagtgctgcgttacct
+gtcaggaaatcttagagctgaaaagtaaacattataacggaggtgctttatgagcattac
+caatgcaactattagccagcgtgcaaaaaaatggcttgaagatgaccgtatatttattga
+caccgaaactacgggtttgggtgatgatgcggaaatagtagaaatctgtttaatagatag
+cgctggttttatcatgctaaatacattggttaaaccaactaaaccaattccagcagaggc
+tacggccattcatggaataactgatgaaatggttatgtatgcgccaacgtggaaagatat
+tcacggcgcagtagcttctttattttttgagtatggctttgttatttataacgccgatta
+cgacacaagacttatatatcaaactgcgaaattatatgggcttgagaatgacggcttttg
+ttattttttaaatgagcgttcggcctgcgccatgatgctatatgcagagtatcgcggcga
+gccagggcgatttaaaggttataaatggcacaaattagttgatgccgctgcacatgaagg
+ggttagcgttgaaggaaaggcacaccgtgcattagcagattgccggatgactcttggcat
+tatcgacgctttggcaaaaggcggtgcagcatgagtatccgtatcgaaataggtgataaa
+tgggtaatcaccagcgaccaatatcaattcatcctgaatgaaaaaaaagtcgttaagacc
+ggcaataaagctggcgaggaatggctcgacaccatcggttattacccgaagattaatcag
+ctcatttctggtctggtacatcaccacattcatacggcaatgattatttcccttagtgca
+atggcagaggaaatagagaagttatcttttatctgtgaagaagcatttaaggcggttaaa
+aaatgattgattcccgctgctttgctgaaagcacaataaatattgtttctgtttctggtg
+gaaaggacagccttgctcaatggattcttgcggtagagaacgacgtaccgcgcaccactg
+tttttgcagataccgggcatgagcattcccaaacaatggagtatctggattatcttgaat
+ccagactcggcccggttattcgagtgaaagccgattttactcggcggattgaaggcaaac
+ggaaattcattgctgaaaaatggcctgtctctctcgttgaagaatgcggaatgtctcatg
+agcaggctgcagaacgaatcgcaaaggcactggaaatccttaagccaaccggtaatccgt
+ttctcgatttgtgcatgtggaaaggacggttcccgagcacgaaagcaaggttttgttcac
+tggaactgaaacatgactcagtacgggacaagattgtactcccagcgctggagaaatatg
+acgaagtaattctatggcagggtgttcgtgctcaggagtcaccagcccgcgctgcgttac
+ctatgtgggaggaggatgcagataatacccccggtttgcatgtgtatcgcccaattctta
+actggacacatgaagacgtatttgccttagctaaacgacacggaattaaaccgaacccac
+tctatcagcaaggttgtagcagagttggctgcatgccatgtattcatgcaagaaaatctg
+agctggcagagatttttgctcgctggccggaggagattgcgcgcgttgcagagtgggaac
+gtcttgttgctgcctgttcacgtcggggaaactcaacatttttcccttcgactcacgacc
+cgcggcgagcagaaaaacgtattgaagttgttaccgtagaagaatatgggatagcttcat
+atcgtgactgggcgatgactacgcgtggcggttctcagtacgatttgctcgctgctacaa
+acgacaaaactgtgtgcagtagcgtttatgccggtgtatgtgaatgacgggtgtcgttta
+cgcgtttccgtggaatgccccacggtcggcaatagccagctcatatcttacctatgacca
+acagcatcgccgcgaccgtatgttcgcggctttgctgcatgcgagaaaggtgctttttct
+ccagccagaatgtgtgcgctttgacgtttatcgcaccgctgcagttctggagcaaaatca
+gggcagtcaacgagccaatgcctttttaatcagcttctgcaaaaaggcattaccacgtct
+tgaactggtcgcaaaaaaatacgagtgctcgggcatcaacagcaatgtatcagccgctgt
+tttcgatggtcattttgatacccagcttatgcaatatctggcgtcacgcatggtcaatat
+ggtcgccagatttaaccgcctcccggatatgtcgcgcgccgatattgacctgctggccgc
+ggatatcgctaattttattcgcgctgaactggccgacattgatgacaccggatttagcga
+actcaaaacgctgtacacttggtacatgcgcgccggttttatttccctgcaattcaacgt
+tacaccgccgaaatgggagcgtgtgactaaaaaatatttttgtgaggatgaaatcgcacc
+ggcagtaatgcgcatgtttaatgaggtttggtggcgcggccgcttgcgacgcattgcggc
+tgcatggcgcgaacatctgcaaattgcagtcggcaacgtaagcaagaaacgacacgcata
+cgcgagtaaaaactgcgtcaccgactggcgcgagcagaagcgccgcacgcgcgaatttct
+caaggggctggatctcgaagacgaagaaggcaaccgcatcagtctgattgaaaaatacga
+cggctcggtcgctaatccagcaatacgccgctgtgagctgatggcccgcattcgtgggtt
+tgaaaatatctgtaatgagctcggttatgtcggggagttctatactctgactgcaccgtc
+taaatatcacgccaccaccaaagcgggctaccgtaacagcaaatggaacggtgcaagccc
+gtcagacacgcagagctatctcacaggcctttgggcacgcatacgcgccaagctgcaccg
+ggaagaaatccgcattttcggaatacgcgtcgctgaaccgcatcacgatggaacgccgca
+ctggcatatgcttatgttcatgttgccggaagatgtcgagcgtgtgcgactcatcatccg
+agattatgcgtgggaggaagaccactacgaactgagaagcgataaagccaaaaaggcgcg
+cttccatgctgaggccattgacccggaaaaaggcagtgctactggctatgtcgctaaata
+catttccaaaaatatcgacggttatgctctcgatggtgaaaccgatgacgaaagtggtga
+gttgttaaaagagactgcacccgccgtttcagcatgggcggcgcgctggcacatccgtca
+gtttcaatttatcggcggtgcgccggtgacggtatacagggagctacgcagaatggctga
+ccctgaaacagccagggcgctcagtgttgaattcgccgcagtgcatgatgctgctcacta
+tggacgctgggctgattatgtgaatgctcaaggcggaccattcgttcgccgtgacgattt
+acaggtacgtacattgtatgaacctcgaactgaatttaatcagtatggcgaagaaactgt
+gtgcatcaaaggtgtctacgatgcctcgataggtgctggctctcctattctaacccggtt
+aacgcagtggaagattgttccaaagcgtgccgttgatttggccgttgacgttaagggcgc
+ttctgcgccctctcggagttctgtcaataactgtacgggaagcgaaagcgatccaccgat
+actcgatttaacaaaaccgctgagtcggcgtgaaagacgagagttgacgaaccgactcag
+gaagaaaaagccaacaacacggcgaaaattcatccacggaacggataagcaaaacgtcgc
+tataacgaaaactatcgacgagatacactctgacaaccggcatcacaatcagccggggcg
+aagccctgcacctgatggccggtggtaaaagttgttttaacggtcgatgggtgcgcggaa
+cgtcaaaaggtgaaatctttgctgcagctccttcacatcaggcgagacgcggaaaatcct
+taatcgtgttgcagatttagctgagctggcaacgaaaatgtaaccgctaatattcatcca
+tatcatgtacatacagtgtatttaactgtgatttttttcttcacaccttttgccaatacg
+tgctactgtatgtttatacagtatctcgtagtggaggttgtgtggatagagagctaaatg
+agcacgttatgattgagcgggtcgaaatgattgcgcgtctgactgctgaaggtacttgtc
+aggaaagagaccgtgaaatcgcattgaatctaattgcggaaatagcaagaggcaacctaa
+tgaaaaataataatttttctgttgttttttccgcaccgcctgttggtgaaacatttgcaa
+aggagggcaaagtgaaagtaaatatcacgttggataaagaccaaaaaatcggccagccgg
+taattgatgcttttcagtgcgaattgaccaagcgaatacagtccgttttcccgtcaacgc
+gcgttactgttaaaaagggatccatgaccggtgtcgagctgatggggttcgataaagatt
+cagaccgcgaagcgctggatagcatccttcaggaagtgtgggaagatgagagctggcgtt
+aatccctgaaaaatgtgcaaccatcgaccccatgtttgatagcatggggttgttttgtat
+gggattacacacaaaggaaaatcatggataccgtaatagcatttttatctctggctctct
+ttattgcttttatcgtcgggttaatcaagccgtcgctggttcgaatgccgagccgtaagc
+gctccagtgctgtttatctcggtggctgtctggcgctgggcgttattggctcaatcttat
+ggccgactgaaaaaactcagccggtggcaaaaactgacgtaccggcggttaaagcggaac
+cggctacgccaacgtttgagtacgcagataaaaccctcaaagaatatcgcaacgagccaa
+aagaaacccggcacgaaatcgttaaagactatgttggattcaaaggtgtgcaggccagcg
+ctaccgatgttttttatgcctgtatgagcgagtacacttttaccaaagatgatgcgttaa
+agctcagtgatgtgttggggtggtgtttcaacgacttcgagaaagatccacaatctctga
+ataataaaatcaaccttgacgaatttcagggtaattttagcggttgggatggctcttatc
+gcccgttagagaagctgataaaagccagtatgaatgatgattcctcttataaacatgttt
+caacggtctaccatctgattttgaataaagacccgcatgccgttgtaaaaacaacgtttc
+gcggcactaatgcttatggtggcgtggtcaaacagaccgtagcagcacgcgtcaacgtgc
+gaacgggcgaggtcgattcaatactcgacaattaaacatgacaaacgccgccggtgctga
+aactcgctttcagtgctggcggggttgaacaacgagccccgcgaggcgttagcctacccc
+tgagcaaccgcccaagaccggtactattaaagccggtttttttatgccacttttccacga
+atttcccgtttttttagccgtgcatgcaacaggtgcattgttttgcatgcgtcaggcttg
+cccgttctggttgtgcgtcgccagagctggcgcggctccagagtggtcatgcaactgcat
+taaaaccgacccataaagtgggca
diff --git a/etc/c1215.blastn.crunch b/etc/c1215.blastn.crunch
new file mode 100644
index 0000000000000000000000000000000000000000..13215ee9432a16ebbeec3f0db0578aef3007662b
--- /dev/null
+++ b/etc/c1215.blastn.crunch
@@ -0,0 +1,126 @@
+9583 99.00 1474 6490 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1474 6490 SPBC1215 AL096846 S.pombe chromosome II cosmid c1215.
+2712 98.00 1 1437 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 1437 SPBC1215 AL096846 S.pombe chromosome II cosmid c1215.
+276 99.00 429 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 7588 7734 SPAC1142 AL159951 S.pombe chromosome I cosmid c1142.
+274 99.00 429 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 174 319 SPRG5SC K00770 yeast (s.pombe) 5s rrna gene and flanks, clone pspr36.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 48 169 SPRG5S K00569 yeast (s.pombe) 5s rrna gene, clone pym3.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21075 20954 SPCC63 AL049522 S.pombe chromosome III cosmid c63.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 33755 33876 SPCC417 AL035076 S.pombe chromosome III cosmid c417.
+228 99.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 22579 22697 SPCC417 AL035076 S.pombe chromosome III cosmid c417.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 31087 30966 SPCC338 AL023781 S.pombe chromosome III cosmid c338.
+129 97.00 35 107 big_blast_2_50000_embl_other_c1215.seq.00000001.out 22094 22022 SPCC338 AL023781 S.pombe chromosome III cosmid c338.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6258 6379 SPBC17A3 AL109652 S.pombe chromosome II cosmid c17A3.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3214 3335 SPAC5H10 Z49811 S.pombe chromosome I cosmid c5H10.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 8450 8571 SPAC4H3 Z69380 S.pombe chromosome I cosmid c4H3.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 30828 30707 SPAC25B8 AL133225 S.pombe chromosome I cosmid c25B8.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24568 24447 SPAC1F7 Z67998 S.pombe chromosome I cosmid c1F7.
+242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 17220 17099 SPAB4537 AB004537 Schizosaccharomyces pombe 37 kb genomic DNA, clone c213.
+240 100.00 453 573 big_blast_2_50000_embl_other_c1215.seq.00000001.out 7867 7747 SPAC926 AL110469 S.pombe chromosome I cosmid c926.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 29615 29496 SPCC965 AL023590 S.pombe chromosome III cosmid c965.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24228 24347 SPCC24B10 AL157991 S.pombe chromosome III cosmid c24B10.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5316 5435 SPCC10H11 AL162771 S.pombe chromosome III cosmid c10H11.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 23752 23871 SPBC428 AL034382 S.pombe chromosome II cosmid c428.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 15895 16014 SPBC4 AL121863 S.pombe chromosome II cosmid c4.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9473 9354 SPBC342 AL096809 S.pombe chromosome II cosmid c342.
+238 100.00 456 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9665 9546 SPBC21H7 AL023286 S.pombe chromosome II cosmid c21H7.
+238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24026 24145 SPBC1685 AL031154 S.pombe chromosome II cosmid c1685.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 202 320 SPRG5SE K00570 yeast (s.pombe) 5s rrna and asp-trna genes, clone pym116.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 34701 34819 SPBP23A10 AL136535 S.pombe chromosome II p1 p23A10.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 31520 31638 SPBC577 AL110506 S.pombe chromosome II cosmid c577.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6163 6281 SPBC1677 AL035581 S.pombe chromosome II cosmid c1677.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 18162 18044 SPAC3G9 AL021046 S.pombe chromosome I cosmid c3G9.
+236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 119 SPA K01049 Yeast (S.pombe) 5S ribosomal RNA.
+234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1664 1543 SPCC188 AL049662 S.pombe chromosome III cosmid c188.
+234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 20839 20718 SPCC11E10 AL121783 S.pombe chromosome III cosmid c11E10.
+234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 23408 23287 SPBC21D10 AL031536 S.pombe chromosome II cosmid c21D10.
+232 99.00 455 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3099 3219 SPBC24C6 AL031786 S.pombe chromosome II cosmid c24C6.
+230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 200 319 SPRG5SA K00768 yeast (s.pombe) 5s rrna gene and flanks, clone pspr1.
+230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24833 24952 SPBC354 AL022071 S.pombe chromosome II cosmid c354.
+230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14612 14731 SPAC167 AL035248 S.pombe chromosome I cosmid c167.
+228 99.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 201 319 SPRG5SD K00771 yeast (s.pombe) 5s rrna gene and flanks, clone pspr41.
+226 98.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 198 319 SPRG5SB K00769 yeast (s.pombe) 5s rrna gene and flanks, clone pspr11.
+226 99.00 455 572 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2544 2661 SPAC24H6 Z54142 S.pombe chromosome I cosmid c24H6.
+226 98.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 13105 12984 SPAC1B1 Z98532 S.pombe chromosome I cosmid c1B1.
+222 99.00 457 572 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9084 8969 SPAC1687 AL035064 S.pombe chromosome I cosmid c1687.
+220 100.00 454 564 big_blast_2_50000_embl_other_c1215.seq.00000001.out 11460 11350 SPBC14F5 AL023780 S.pombe chromosome II cosmid c14F5.
+206 100.00 6387 6490 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 104 SPBC83 AL035536 S.pombe chromosome II cosmid c83.
+163 100.00 1 82 big_blast_2_50000_embl_other_c1215.seq.00000001.out 82 1 SPAB4534 AB004534 Schizosaccharomyces pombe 38 kb genomic DNA, clone 1750.
+157 100.00 496 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 79 SPBC725 AL034352 S.pombe chromosome II cosmid c725.
+157 100.00 496 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 79 SPBC530 AL023634 S.pombe chromosome II cosmid c530.
+103 100.00 455 506 big_blast_2_50000_embl_other_c1215.seq.00000001.out 52 1 SPRHP9 Y09431 S.pombe rhp9 gene
+93 85.00 463 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14821 14716 SPBC609 AL035226 S.pombe chromosome II cosmid c609.
+65 89.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 UURNA1 X00998 Urechis unicinctus 5S rRNA sequence
+58 95.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PGRNA01 X00994 Phascolopsis gouldii 5S rRNA sequence
+58 95.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 904 868 CFRRN285 X06056 Calanus finmarchicus DNA for 23S and 5S rRNA
+56 93.00 477 516 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1113 1074 SPBC1778 AL049489 S.pombe chromosome II cosmid c1778.
+52 100.00 6059 6084 big_blast_2_50000_embl_other_c1215.seq.00000001.out 233479 233504 AE003531 AE003531 Drosophila melanogaster genomic scaffold 142000013386050 section 37 of 54, complete sequence.
+50 92.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PRRRN5S X01550 Planocera reticulata 5S ribosomal RNA
+50 92.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 EGRN01 X00022 Ribbon worm Emplectonema gracile 5S rRNA (Short)
+50 94.00 480 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 25 57 AMRRN5S X01518 Acyrthosiphon magnoliae (aphid) 5S ribosomal RNA
+50 89.00 461 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6 58 CR1619 D10528 Candida rugosa 5S rRNA.
+50 88.00 521 569 big_blast_2_50000_embl_other_c1215.seq.00000001.out 66 114 AERRA K03161 Agaricus edulis 5S ribosomal RNA (5S rRNA).
+48 96.00 2466 2493 big_blast_2_50000_embl_other_c1215.seq.00000001.out 10841 10814 AC010292 AC010292 Homo sapiens chromosome 5 clone CTB-131H22, complete sequence.
+46 85.00 458 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5564 5510 PDHISTCL X53330 P.dumerilii histone gene cluster for core histones H2A, H2B, H3 and H4
+46 100.00 4802 4824 big_blast_2_50000_embl_other_c1215.seq.00000001.out 28075 28053 HSU165H7 Z70225 Human DNA sequence from cosmid U165H7, between markers DXS366 and DXS87 on chromosome X.
+46 88.00 526 568 big_blast_2_50000_embl_other_c1215.seq.00000001.out 72 114 TDRRA M58385 Taphrina deformans 5S ribosomal RNA.
+46 96.00 487 513 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3 29 SPRRAAS M19951 Schizosaccharomyces pombe 5S ribosomal RNA gene, partial sequence.
+44 100.00 4816 4837 big_blast_2_50000_embl_other_c1215.seq.00000001.out 88073 88052 AC084760 AC084760 Gallus gallus clone 65N20, complete sequence.
+44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 69197 69238 CHPTTRPG D17510 Pinus thunbergii chloroplast DNA, complete sequence.
+44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 48563 48522 CHNTXX Z00044 Nicotiana tabacum chloroplast genome DNA
+44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 138 97 CHNTTB2 M16897 Tobacco Thr-tRNA gene.
+44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14879 14920 AP002983 AP002983 Lotus japonicus chloroplast DNA, complete genome.
+44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 46263 46222 AP000423 AP000423 Arabidopsis thaliana chloroplast genomic DNA, complete sequence, strain:Columbia.
+44 100.00 893 914 big_blast_2_50000_embl_other_c1215.seq.00000001.out 49861 49882 HSEVMHC X87344 H.sapiens DMA, DMB, HLA-Z1, IPP2, LMP2, TAP1, LMP7, TAP2, DOB, DQB2 and RING8, 9, 13 and 14 genes
+44 100.00 6061 6082 big_blast_2_50000_embl_other_c1215.seq.00000001.out 143317 143296 HS377H14 AL022723 Human DNA sequence from clone 377H14 on chromosome 6p21.32-22.1. Contains the HLA-G gene for major histocompatibility complex, class I, G (HLA 6.0) two MHC class I pseudogenes, an RPL7A (60S Ribosomal Protein L7A) pseudogene, a gene for a novel MHC class 1 protein, an interferon-inducible protein 1-8U pseudogene, an RPL23A (60S Ribosomal Protein L23A) pseudogene, an HCGIX pseudogene, an MICB or PERB11.1 pseudogene,the HLA-F gene for major histocompatibility complex, class I, F (CDA12), and four P5-1 pseudogenes. Contains EST, STSs, GSS and six putative CpG islands.
+44 100.00 1237 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3149 3128 AP001207 AP001207 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1562D12.
+44 100.00 1237 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 201930 201909 AP000426 AP000426 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1107E3.
+44 93.00 2454 2483 big_blast_2_50000_embl_other_c1215.seq.00000001.out 75294 75323 AC023426 AC023426 Homo sapiens 12 BAC RP11-396L8 (Roswell Park Cancer Institute Human BAC Library) complete sequence.
+44 100.00 6061 6082 big_blast_2_50000_embl_other_c1215.seq.00000001.out 34756 34735 AC004213 AC004213 Homo sapiens clone UWGC:y19c060 from 6p21, complete sequence.
+44 86.00 521 570 big_blast_2_50000_embl_other_c1215.seq.00000001.out 364 413 AI5SRRNA2 X99089 A.immersus 5S rRNA gene, b2-type
+42 100.00 1245 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 12979 12959 BBU43414 U43414 Borrelia burgdorferi linear plasmid lp16 DNA, complete sequence.
+42 100.00 2454 2474 big_blast_2_50000_embl_other_c1215.seq.00000001.out 278691 278671 AP001119 AP001119 Buchnera sp. APS genomic DNA, complete sequence, segment 2/2.
+42 100.00 1245 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 12951 12931 AE000793 AE000793 Borrelia burgdorferi plasmid lp17, complete plasmid sequence.
+42 100.00 818 838 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2471 2451 OSU77637 U77637 Oryza sativa class III ADH enzyme (AdhIII) gene, complete cds.
+42 96.00 1241 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 79773 79797 H0505A02 AL512543 Oryza sativa genomic DNA, chromosome 4, BAC clone: H0505A02, complete sequence
+42 93.00 343 371 big_blast_2_50000_embl_other_c1215.seq.00000001.out 29118 29146 AB018121 AB018121 Arabidopsis thaliana genomic DNA, chromosome 3, P1 clone: MXE2.
+42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 SSRRAB K02349 Jellyfish (Spirocodon saltatrix) 5S ribosomal RNA.
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PCRN5SA X13039 Philosamia cynthia ricini 5S rRNA
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PCRN5S K02354 Philosamia cythia ricini (silkworm) 5S ribosomal RNA.
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 OV5SRRN X06835 Octopus vulgaris 5S rRNA
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 ME5SRNA J01869 Mussel (Mytilus edulis) 5S ribosomal RNA.
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 LGRNO1 X00020 Ribbon worm Lineus geniculatus 5S rRNA
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 HSRRN5S X01535 Hymeniacidon sanguinea 5S ribosomal RNA
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 HJRN01 V00475 Halichondria japonica 5S ribosomal RNA (complete sequence).
+42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 EARRN5S X03911 Enchytraeus albidus 5S rRNA
+42 100.00 6340 6360 big_blast_2_50000_embl_other_c1215.seq.00000001.out 25954 25974 CEK02B12 Z75711 Caenorhabditis elegans cosmid K02B12
+42 100.00 1213 1233 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5436 5456 CEF14B8 U28737 Caenorhabditis elegans cosmid F14B8.
+42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 CED132199 AJ132199 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 4
+42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 CED132198 AJ132198 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 3
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 BN5SRRN X06834 Bugula neritina (moss-animal) 5S rRNA
+42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2219 2239 BMU86876 U86876 Bombyx mori chitinase-like protein mRNA, complete cds.
+42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 APRN5SA X13035 Antheraea pernyi 5S rRNA
+42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2256 2276 AF326596 AF326596 Bombyx mandarina chitinase mRNA, complete cds.
+42 100.00 136 156 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6370 6350 AC084626 AC084626 Caenorhabditis briggsae cosmid G45C20, complete sequence.
+42 100.00 6091 6111 big_blast_2_50000_embl_other_c1215.seq.00000001.out 27211 27231 AC006830 AC006830 Caenorhabditis elegans cosmid ZK105, complete sequence.
+42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2225 2245 AB052914 AB052914 Bombyx mori chiB mRNA for chitinase precursor, complete cds.
+42 100.00 1395 1415 big_blast_2_50000_embl_other_c1215.seq.00000001.out 145576 145596 HSMX1A AL442166 Homo sapiens chromosome 21 from 5 PACs and 5 Cosmids map 21q22.2,D21S349-MX1; segment 1/2
+42 100.00 6065 6085 big_blast_2_50000_embl_other_c1215.seq.00000001.out 70745 70765 HS994L9 AL034554 Human DNA sequence from clone 994L9 on chromosome 20p12.3-13 Contains STS and GSSs.
+42 100.00 1395 1415 big_blast_2_50000_embl_other_c1215.seq.00000001.out 173941 173961 HS21C084 AL163284 Homo sapiens chromosome 21 segment HS21C084.
+42 100.00 5172 5192 big_blast_2_50000_embl_other_c1215.seq.00000001.out 8899 8879 HS21C013 AL163213 Homo sapiens chromosome 21 segment HS21C013.
+42 96.00 3691 3715 big_blast_2_50000_embl_other_c1215.seq.00000001.out 222756 222780 AP001732 AP001732 Homo sapiens genomic DNA, chromosome 21q, section 76/105.
+42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 234259 234235 AP001677 AP001677 Homo sapiens genomic DNA, chromosome 21q, section 21/105.
+42 96.00 3691 3715 big_blast_2_50000_embl_other_c1215.seq.00000001.out 97170 97194 AP001038 AP001038 Homo sapiens genomic DNA, chromosome 21, clone:P178O22, ERG-ETS2 region.
+42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 117565 117541 AP000946 AP000946 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B335N5, LL56-APP region.
+42 100.00 6106 6126 big_blast_2_50000_embl_other_c1215.seq.00000001.out 179419 179439 AP000810 AP000810 Homo sapiens genomic DNA, chromosome 11q, clone:RP11-765H23.
+42 100.00 5172 5192 big_blast_2_50000_embl_other_c1215.seq.00000001.out 94404 94384 AP000473 AP000473 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B291N6, LL56-APP region.
+42 96.00 1801 1825 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6090 6114 AL355365 AL355365 Human DNA sequence from clone RP11-361F15 on chromosome 6
+42 96.00 5531 5555 big_blast_2_50000_embl_other_c1215.seq.00000001.out 79645 79669 AL354861 AL354861 Human DNA sequence from clone RP11-180I4 on chromosome 9
+42 100.00 1 21 big_blast_2_50000_embl_other_c1215.seq.00000001.out 28666 28686 AL139378 AL139378 Human DNA sequence from clone RP11-271B5 on chromosome 13 Contains a gene for a protein similar to ribosomal protein S7, the FGF9 (fibroblast growth factor 9 (glia-activating factor)) gene, ESTs, STSs, GSSs and CpG islands.
+42 100.00 5783 5803 big_blast_2_50000_embl_other_c1215.seq.00000001.out 15259 15279 AL139163 AL139163 Human DNA sequence from clone RP11-523O15 on chromosome 20 Contains GSSs and STSs.
+42 100.00 3803 3823 big_blast_2_50000_embl_other_c1215.seq.00000001.out 20782 20802 AL136301 AL136301 Human DNA sequence from clone RP11-195L15 on chromosome 13
+42 91.00 5752 5784 big_blast_2_50000_embl_other_c1215.seq.00000001.out 74511 74543 AL133462 AL133462 Human DNA sequence from clone RP11-108A16 on chromosome 20 Contains ESTs, STSs and GSSs.
+42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 119422 119446 AF238375 AF238375 Homo sapiens chromosome 21 clone BAC 49B5 map 21q21, complete sequence.
+42 100.00 1242 1262 big_blast_2_50000_embl_other_c1215.seq.00000001.out 42069 42089 AF130342 AF130342 Homo sapiens chromosome 8 clone PAC 87.1 map 8q24.1, complete sequence.
+42 91.00 5752 5784 big_blast_2_50000_embl_other_c1215.seq.00000001.out 49339 49371 AC012380 AC012380 Genomic Sequence For Homo sapiens Clone 125H5, Chromosome 20, complete sequence.
+42 93.00 1230 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 135503 135475 AC007392 AC007392 Homo sapiens BAC clone RP11-444B4 from 2, complete sequence.
+42 100.00 1414 1434 big_blast_2_50000_embl_other_c1215.seq.00000001.out 4290 4310 PCAROMX L18918 Pneumocystis carinii pentafunctional enzyme (arom) gene, complete cds.
+42 87.00 521 565 big_blast_2_50000_embl_other_c1215.seq.00000001.out 66 110 CH1457 D10531 Cryptococcus humicolus 5S rRNA.
diff --git a/etc/c1215.blastn.tab b/etc/c1215.blastn.tab
new file mode 100644
index 0000000000000000000000000000000000000000..e2113c43909a69058c06f066978549e0934e719c
--- /dev/null
+++ b/etc/c1215.blastn.tab
@@ -0,0 +1,630 @@
+FT   BLASTN_HIT      1474..6490
+FT                   /note="match to SPBC1215 1474..6490  blast score 9583  percent identity 99  AL096846 S.pombe chromosome II cosmid c1215."
+FT                   /label=SPBC1215
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      1..1437
+FT                   /note="match to SPBC1215 1..1437  blast score 2712  percent identity 98  AL096846 S.pombe chromosome II cosmid c1215."
+FT                   /label=SPBC1215
+FT                   /score=98
+FT                   /colour=255 5 5
+FT   BLASTN_HIT      429..574
+FT                   /note="match to SPAC1142 7588..7734  blast score 276  percent identity 99  AL159951 S.pombe chromosome I cosmid c1142."
+FT                   /label=SPAC1142
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      429..574
+FT                   /note="match to SPRG5SC 174..319  blast score 274  percent identity 99  K00770 yeast (s.pombe) 5s rrna gene and flanks, clone pspr36."
+FT                   /label=SPRG5SC
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPRG5S 48..169  blast score 242  percent identity 100  K00569 yeast (s.pombe) 5s rrna gene, clone pym3."
+FT                   /label=SPRG5S
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPCC63 20954..21075  blast score 242  percent identity 100  AL049522 S.pombe chromosome III cosmid c63."
+FT                   /label=SPCC63
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPCC417 33755..33876  blast score 242  percent identity 100  AL035076 S.pombe chromosome III cosmid c417."
+FT                   /label=SPCC417
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPCC417 22579..22697  blast score 228  percent identity 99  AL035076 S.pombe chromosome III cosmid c417."
+FT                   /label=SPCC417
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPCC338 30966..31087  blast score 242  percent identity 100  AL023781 S.pombe chromosome III cosmid c338."
+FT                   /label=SPCC338
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      35..107
+FT                   /note="match to SPCC338 22022..22094  blast score 129  percent identity 97  AL023781 S.pombe chromosome III cosmid c338."
+FT                   /label=SPCC338
+FT                   /score=97
+FT                   /colour=255 7 7
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPBC17A3 6258..6379  blast score 242  percent identity 100  AL109652 S.pombe chromosome II cosmid c17A3."
+FT                   /label=SPBC17A3
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAC5H10 3214..3335  blast score 242  percent identity 100  Z49811 S.pombe chromosome I cosmid c5H10."
+FT                   /label=SPAC5H10
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAC4H3 8450..8571  blast score 242  percent identity 100  Z69380 S.pombe chromosome I cosmid c4H3."
+FT                   /label=SPAC4H3
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAC25B8 30707..30828  blast score 242  percent identity 100  AL133225 S.pombe chromosome I cosmid c25B8."
+FT                   /label=SPAC25B8
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAC1F7 24447..24568  blast score 242  percent identity 100  Z67998 S.pombe chromosome I cosmid c1F7."
+FT                   /label=SPAC1F7
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAB4537 17099..17220  blast score 242  percent identity 100  AB004537 Schizosaccharomyces pombe 37 kb genomic DNA, clone c213."
+FT                   /label=SPAB4537
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..573
+FT                   /note="match to SPAC926 7747..7867  blast score 240  percent identity 100  AL110469 S.pombe chromosome I cosmid c926."
+FT                   /label=SPAC926
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPCC965 29496..29615  blast score 238  percent identity 100  AL023590 S.pombe chromosome III cosmid c965."
+FT                   /label=SPCC965
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPCC24B10 24228..24347  blast score 238  percent identity 100  AL157991 S.pombe chromosome III cosmid c24B10."
+FT                   /label=SPCC24B10
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPCC10H11 5316..5435  blast score 238  percent identity 100  AL162771 S.pombe chromosome III cosmid c10H11."
+FT                   /label=SPCC10H11
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPBC428 23752..23871  blast score 238  percent identity 100  AL034382 S.pombe chromosome II cosmid c428."
+FT                   /label=SPBC428
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPBC4 15895..16014  blast score 238  percent identity 100  AL121863 S.pombe chromosome II cosmid c4."
+FT                   /label=SPBC4
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPBC342 9354..9473  blast score 238  percent identity 100  AL096809 S.pombe chromosome II cosmid c342."
+FT                   /label=SPBC342
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..575
+FT                   /note="match to SPBC21H7 9546..9665  blast score 238  percent identity 100  AL023286 S.pombe chromosome II cosmid c21H7."
+FT                   /label=SPBC21H7
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPBC1685 24026..24145  blast score 238  percent identity 100  AL031154 S.pombe chromosome II cosmid c1685."
+FT                   /label=SPBC1685
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPRG5SE 202..320  blast score 236  percent identity 100  K00570 yeast (s.pombe) 5s rrna and asp-trna genes, clone pym116."
+FT                   /label=SPRG5SE
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPBP23A10 34701..34819  blast score 236  percent identity 100  AL136535 S.pombe chromosome II p1 p23A10."
+FT                   /label=SPBP23A10
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPBC577 31520..31638  blast score 236  percent identity 100  AL110506 S.pombe chromosome II cosmid c577."
+FT                   /label=SPBC577
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPBC1677 6163..6281  blast score 236  percent identity 100  AL035581 S.pombe chromosome II cosmid c1677."
+FT                   /label=SPBC1677
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPAC3G9 18044..18162  blast score 236  percent identity 100  AL021046 S.pombe chromosome I cosmid c3G9."
+FT                   /label=SPAC3G9
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPA 1..119  blast score 236  percent identity 100  K01049 Yeast (S.pombe) 5S ribosomal RNA."
+FT                   /label=SPA
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPCC188 1543..1664  blast score 234  percent identity 99  AL049662 S.pombe chromosome III cosmid c188."
+FT                   /label=SPCC188
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPCC11E10 20718..20839  blast score 234  percent identity 99  AL121783 S.pombe chromosome III cosmid c11E10."
+FT                   /label=SPCC11E10
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPBC21D10 23287..23408  blast score 234  percent identity 99  AL031536 S.pombe chromosome II cosmid c21D10."
+FT                   /label=SPBC21D10
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      455..575
+FT                   /note="match to SPBC24C6 3099..3219  blast score 232  percent identity 99  AL031786 S.pombe chromosome II cosmid c24C6."
+FT                   /label=SPBC24C6
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPRG5SA 200..319  blast score 230  percent identity 99  K00768 yeast (s.pombe) 5s rrna gene and flanks, clone pspr1."
+FT                   /label=SPRG5SA
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPBC354 24833..24952  blast score 230  percent identity 99  AL022071 S.pombe chromosome II cosmid c354."
+FT                   /label=SPBC354
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      455..574
+FT                   /note="match to SPAC167 14612..14731  blast score 230  percent identity 99  AL035248 S.pombe chromosome I cosmid c167."
+FT                   /label=SPAC167
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      456..574
+FT                   /note="match to SPRG5SD 201..319  blast score 228  percent identity 99  K00771 yeast (s.pombe) 5s rrna gene and flanks, clone pspr41."
+FT                   /label=SPRG5SD
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPRG5SB 198..319  blast score 226  percent identity 98  K00769 yeast (s.pombe) 5s rrna gene and flanks, clone pspr11."
+FT                   /label=SPRG5SB
+FT                   /score=98
+FT                   /colour=255 5 5
+FT   BLASTN_HIT      455..572
+FT                   /note="match to SPAC24H6 2544..2661  blast score 226  percent identity 99  Z54142 S.pombe chromosome I cosmid c24H6."
+FT                   /label=SPAC24H6
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      453..574
+FT                   /note="match to SPAC1B1 12984..13105  blast score 226  percent identity 98  Z98532 S.pombe chromosome I cosmid c1B1."
+FT                   /label=SPAC1B1
+FT                   /score=98
+FT                   /colour=255 5 5
+FT   BLASTN_HIT      457..572
+FT                   /note="match to SPAC1687 8969..9084  blast score 222  percent identity 99  AL035064 S.pombe chromosome I cosmid c1687."
+FT                   /label=SPAC1687
+FT                   /score=99
+FT                   /colour=255 2 2
+FT   BLASTN_HIT      454..564
+FT                   /note="match to SPBC14F5 11350..11460  blast score 220  percent identity 100  AL023780 S.pombe chromosome II cosmid c14F5."
+FT                   /label=SPBC14F5
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      6387..6490
+FT                   /note="match to SPBC83 1..104  blast score 206  percent identity 100  AL035536 S.pombe chromosome II cosmid c83."
+FT                   /label=SPBC83
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1..82
+FT                   /note="match to SPAB4534 1..82  blast score 163  percent identity 100  AB004534 Schizosaccharomyces pombe 38 kb genomic DNA, clone 1750."
+FT                   /label=SPAB4534
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      496..574
+FT                   /note="match to SPBC725 1..79  blast score 157  percent identity 100  AL034352 S.pombe chromosome II cosmid c725."
+FT                   /label=SPBC725
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      496..574
+FT                   /note="match to SPBC530 1..79  blast score 157  percent identity 100  AL023634 S.pombe chromosome II cosmid c530."
+FT                   /label=SPBC530
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      455..506
+FT                   /note="match to SPRHP9 1..52  blast score 103  percent identity 100  Y09431 S.pombe rhp9 gene"
+FT                   /label=SPRHP9
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      463..575
+FT                   /note="match to SPBC609 14716..14821  blast score 93.7  percent identity 85  AL035226 S.pombe chromosome II cosmid c609."
+FT                   /label=SPBC609
+FT                   /score=85
+FT                   /colour=255 38 38
+FT   BLASTN_HIT      456..512
+FT                   /note="match to UURNA1 1..57  blast score 65.9  percent identity 89  X00998 Urechis unicinctus 5S rRNA sequence"
+FT                   /label=UURNA1
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to PGRNA01 21..57  blast score 58.0  percent identity 95  X00994 Phascolopsis gouldii 5S rRNA sequence"
+FT                   /label=PGRNA01
+FT                   /score=95
+FT                   /colour=255 12 12
+FT   BLASTN_HIT      476..512
+FT                   /note="match to CFRRN285 868..904  blast score 58.0  percent identity 95  X06056 Calanus finmarchicus DNA for 23S and 5S rRNA"
+FT                   /label=CFRRN285
+FT                   /score=95
+FT                   /colour=255 12 12
+FT   BLASTN_HIT      477..516
+FT                   /note="match to SPBC1778 1074..1113  blast score 56.0  percent identity 93  AL049489 S.pombe chromosome II cosmid c1778."
+FT                   /label=SPBC1778
+FT                   /score=93
+FT                   /colour=255 17 17
+FT   BLASTN_HIT      6059..6084
+FT                   /note="match to AE003531 233479..233504  blast score 52.0  percent identity 100  AE003531 Drosophila melanogaster genomic scaffold 142000013386050 section 37 of 54, complete sequence."
+FT                   /label=AE003531
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      476..512
+FT                   /note="match to PRRRN5S 21..57  blast score 50.1  percent identity 92  X01550 Planocera reticulata 5S ribosomal RNA"
+FT                   /label=PRRRN5S
+FT                   /score=92
+FT                   /colour=255 20 20
+FT   BLASTN_HIT      476..512
+FT                   /note="match to EGRN01 21..57  blast score 50.1  percent identity 92  X00022 Ribbon worm Emplectonema gracile 5S rRNA (Short)"
+FT                   /label=EGRN01
+FT                   /score=92
+FT                   /colour=255 20 20
+FT   BLASTN_HIT      480..512
+FT                   /note="match to AMRRN5S 25..57  blast score 50.1  percent identity 94  X01518 Acyrthosiphon magnoliae (aphid) 5S ribosomal RNA"
+FT                   /label=AMRRN5S
+FT                   /score=94
+FT                   /colour=255 15 15
+FT   BLASTN_HIT      461..512
+FT                   /note="match to CR1619 6..58  blast score 50.1  percent identity 89  D10528 Candida rugosa 5S rRNA."
+FT                   /label=CR1619
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      521..569
+FT                   /note="match to AERRA 66..114  blast score 50.1  percent identity 88  K03161 Agaricus edulis 5S ribosomal RNA (5S rRNA)."
+FT                   /label=AERRA
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      2466..2493
+FT                   /note="match to AC010292 10814..10841  blast score 48.1  percent identity 96  AC010292 Homo sapiens chromosome 5 clone CTB-131H22, complete sequence."
+FT                   /label=AC010292
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      458..512
+FT                   /note="match to PDHISTCL 5510..5564  blast score 46.1  percent identity 85  X53330 P.dumerilii histone gene cluster for core histones H2A, H2B, H3 and H4"
+FT                   /label=PDHISTCL
+FT                   /score=85
+FT                   /colour=255 38 38
+FT   BLASTN_HIT      4802..4824
+FT                   /note="match to HSU165H7 28053..28075  blast score 46.1  percent identity 100  Z70225 Human DNA sequence from cosmid U165H7, between markers DXS366 and DXS87 on chromosome X."
+FT                   /label=HSU165H7
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      526..568
+FT                   /note="match to TDRRA 72..114  blast score 46.1  percent identity 88  M58385 Taphrina deformans 5S ribosomal RNA."
+FT                   /label=TDRRA
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      487..513
+FT                   /note="match to SPRRAAS 3..29  blast score 46.1  percent identity 96  M19951 Schizosaccharomyces pombe 5S ribosomal RNA gene, partial sequence."
+FT                   /label=SPRRAAS
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      4816..4837
+FT                   /note="match to AC084760 88052..88073  blast score 44.1  percent identity 100  AC084760 Gallus gallus clone 65N20, complete sequence."
+FT                   /label=AC084760
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      57..98
+FT                   /note="match to CHPTTRPG 69197..69238  blast score 44.1  percent identity 88  D17510 Pinus thunbergii chloroplast DNA, complete sequence."
+FT                   /label=CHPTTRPG
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      57..98
+FT                   /note="match to CHNTXX 48522..48563  blast score 44.1  percent identity 88  Z00044 Nicotiana tabacum chloroplast genome DNA"
+FT                   /label=CHNTXX
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      57..98
+FT                   /note="match to CHNTTB2 97..138  blast score 44.1  percent identity 88  M16897 Tobacco Thr-tRNA gene."
+FT                   /label=CHNTTB2
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      57..98
+FT                   /note="match to AP002983 14879..14920  blast score 44.1  percent identity 88  AP002983 Lotus japonicus chloroplast DNA, complete genome."
+FT                   /label=AP002983
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      57..98
+FT                   /note="match to AP000423 46222..46263  blast score 44.1  percent identity 88  AP000423 Arabidopsis thaliana chloroplast genomic DNA, complete sequence, strain:Columbia."
+FT                   /label=AP000423
+FT                   /score=88
+FT                   /colour=255 30 30
+FT   BLASTN_HIT      893..914
+FT                   /note="match to HSEVMHC 49861..49882  blast score 44.1  percent identity 100  X87344 H.sapiens DMA, DMB, HLA-Z1, IPP2, LMP2, TAP1, LMP7, TAP2, DOB, DQB2 and RING8, 9, 13 and 14 genes"
+FT                   /label=HSEVMHC
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      6061..6082
+FT                   /note="match to HS377H14 143296..143317  blast score 44.1  percent identity 100  AL022723 Human DNA sequence from clone 377H14 on chromosome 6p21.32-22.1. Contains the HLA-G gene for major histocompatibility complex, class I, G (HLA 6.0) two MHC class I pseudogenes, an RPL7A (60S Ribosomal Protein L7A) pseudogene, a gene for a novel MHC class 1 protein, an interferon-inducible protein 1-8U pseudogene, an RPL23A (60S Ribosomal Protein L23A) pseudogene, an HCGIX pseudogene, an MICB or PERB11.1 pseudogene,the HLA-F gene for major histocompatibility complex, class I, F (CDA12), and four P5-1 pseudogenes. Contains EST, STSs, GSS and six putative CpG islands."
+FT                   /label=HS377H14
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1237..1258
+FT                   /note="match to AP001207 3128..3149  blast score 44.1  percent identity 100  AP001207 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1562D12."
+FT                   /label=AP001207
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1237..1258
+FT                   /note="match to AP000426 201909..201930  blast score 44.1  percent identity 100  AP000426 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1107E3."
+FT                   /label=AP000426
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      2454..2483
+FT                   /note="match to AC023426 75294..75323  blast score 44.1  percent identity 93  AC023426 Homo sapiens 12 BAC RP11-396L8 (Roswell Park Cancer Institute Human BAC Library) complete sequence."
+FT                   /label=AC023426
+FT                   /score=93
+FT                   /colour=255 17 17
+FT   BLASTN_HIT      6061..6082
+FT                   /note="match to AC004213 34735..34756  blast score 44.1  percent identity 100  AC004213 Homo sapiens clone UWGC:y19c060 from 6p21, complete sequence."
+FT                   /label=AC004213
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      521..570
+FT                   /note="match to AI5SRRNA2 364..413  blast score 44.1  percent identity 86  X99089 A.immersus 5S rRNA gene, b2-type"
+FT                   /label=AI5SRRNA2
+FT                   /score=86
+FT                   /colour=255 35 35
+FT   BLASTN_HIT      1245..1265
+FT                   /note="match to BBU43414 12959..12979  blast score 42.1  percent identity 100  U43414 Borrelia burgdorferi linear plasmid lp16 DNA, complete sequence."
+FT                   /label=BBU43414
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      2454..2474
+FT                   /note="match to AP001119 278671..278691  blast score 42.1  percent identity 100  AP001119 Buchnera sp. APS genomic DNA, complete sequence, segment 2/2."
+FT                   /label=AP001119
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1245..1265
+FT                   /note="match to AE000793 12931..12951  blast score 42.1  percent identity 100  AE000793 Borrelia burgdorferi plasmid lp17, complete plasmid sequence."
+FT                   /label=AE000793
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      818..838
+FT                   /note="match to OSU77637 2451..2471  blast score 42.1  percent identity 100  U77637 Oryza sativa class III ADH enzyme (AdhIII) gene, complete cds."
+FT                   /label=OSU77637
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1241..1265
+FT                   /note="match to H0505A02 79773..79797  blast score 42.1  percent identity 96  AL512543 Oryza sativa genomic DNA, chromosome 4, BAC clone: H0505A02, complete sequence"
+FT                   /label=H0505A02
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      343..371
+FT                   /note="match to AB018121 29118..29146  blast score 42.1  percent identity 93  AB018121 Arabidopsis thaliana genomic DNA, chromosome 3, P1 clone: MXE2."
+FT                   /label=AB018121
+FT                   /score=93
+FT                   /colour=255 17 17
+FT   BLASTN_HIT      456..512
+FT                   /note="match to SSRRAB 1..57  blast score 42.1  percent identity 84  K02349 Jellyfish (Spirocodon saltatrix) 5S ribosomal RNA."
+FT                   /label=SSRRAB
+FT                   /score=84
+FT                   /colour=255 40 40
+FT   BLASTN_HIT      476..512
+FT                   /note="match to PCRN5SA 21..57  blast score 42.1  percent identity 89  X13039 Philosamia cynthia ricini 5S rRNA"
+FT                   /label=PCRN5SA
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to PCRN5S 21..57  blast score 42.1  percent identity 89  K02354 Philosamia cythia ricini (silkworm) 5S ribosomal RNA."
+FT                   /label=PCRN5S
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to OV5SRRN 21..57  blast score 42.1  percent identity 89  X06835 Octopus vulgaris 5S rRNA"
+FT                   /label=OV5SRRN
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to ME5SRNA 21..57  blast score 42.1  percent identity 89  J01869 Mussel (Mytilus edulis) 5S ribosomal RNA."
+FT                   /label=ME5SRNA
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to LGRNO1 21..57  blast score 42.1  percent identity 89  X00020 Ribbon worm Lineus geniculatus 5S rRNA"
+FT                   /label=LGRNO1
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to HSRRN5S 21..57  blast score 42.1  percent identity 89  X01535 Hymeniacidon sanguinea 5S ribosomal RNA"
+FT                   /label=HSRRN5S
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      476..512
+FT                   /note="match to HJRN01 21..57  blast score 42.1  percent identity 89  V00475 Halichondria japonica 5S ribosomal RNA (complete sequence)."
+FT                   /label=HJRN01
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      456..512
+FT                   /note="match to EARRN5S 1..57  blast score 42.1  percent identity 84  X03911 Enchytraeus albidus 5S rRNA"
+FT                   /label=EARRN5S
+FT                   /score=84
+FT                   /colour=255 40 40
+FT   BLASTN_HIT      6340..6360
+FT                   /note="match to CEK02B12 25954..25974  blast score 42.1  percent identity 100  Z75711 Caenorhabditis elegans cosmid K02B12"
+FT                   /label=CEK02B12
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1213..1233
+FT                   /note="match to CEF14B8 5436..5456  blast score 42.1  percent identity 100  U28737 Caenorhabditis elegans cosmid F14B8."
+FT                   /label=CEF14B8
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      456..512
+FT                   /note="match to CED132199 1..57  blast score 42.1  percent identity 84  AJ132199 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 4"
+FT                   /label=CED132199
+FT                   /score=84
+FT                   /colour=255 40 40
+FT   BLASTN_HIT      456..512
+FT                   /note="match to CED132198 1..57  blast score 42.1  percent identity 84  AJ132198 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 3"
+FT                   /label=CED132198
+FT                   /score=84
+FT                   /colour=255 40 40
+FT   BLASTN_HIT      476..512
+FT                   /note="match to BN5SRRN 21..57  blast score 42.1  percent identity 89  X06834 Bugula neritina (moss-animal) 5S rRNA"
+FT                   /label=BN5SRRN
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      5756..5776
+FT                   /note="match to BMU86876 2219..2239  blast score 42.1  percent identity 100  U86876 Bombyx mori chitinase-like protein mRNA, complete cds."
+FT                   /label=BMU86876
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      476..512
+FT                   /note="match to APRN5SA 21..57  blast score 42.1  percent identity 89  X13035 Antheraea pernyi 5S rRNA"
+FT                   /label=APRN5SA
+FT                   /score=89
+FT                   /colour=255 28 28
+FT   BLASTN_HIT      5756..5776
+FT                   /note="match to AF326596 2256..2276  blast score 42.1  percent identity 100  AF326596 Bombyx mandarina chitinase mRNA, complete cds."
+FT                   /label=AF326596
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      136..156
+FT                   /note="match to AC084626 6350..6370  blast score 42.1  percent identity 100  AC084626 Caenorhabditis briggsae cosmid G45C20, complete sequence."
+FT                   /label=AC084626
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      6091..6111
+FT                   /note="match to AC006830 27211..27231  blast score 42.1  percent identity 100  AC006830 Caenorhabditis elegans cosmid ZK105, complete sequence."
+FT                   /label=AC006830
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5756..5776
+FT                   /note="match to AB052914 2225..2245  blast score 42.1  percent identity 100  AB052914 Bombyx mori chiB mRNA for chitinase precursor, complete cds."
+FT                   /label=AB052914
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1395..1415
+FT                   /note="match to HSMX1A 145576..145596  blast score 42.1  percent identity 100  AL442166 Homo sapiens chromosome 21 from 5 PACs and 5 Cosmids map 21q22.2,D21S349-MX1; segment 1/2"
+FT                   /label=HSMX1A
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      6065..6085
+FT                   /note="match to HS994L9 70745..70765  blast score 42.1  percent identity 100  AL034554 Human DNA sequence from clone 994L9 on chromosome 20p12.3-13 Contains STS and GSSs."
+FT                   /label=HS994L9
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1395..1415
+FT                   /note="match to HS21C084 173941..173961  blast score 42.1  percent identity 100  AL163284 Homo sapiens chromosome 21 segment HS21C084."
+FT                   /label=HS21C084
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5172..5192
+FT                   /note="match to HS21C013 8879..8899  blast score 42.1  percent identity 100  AL163213 Homo sapiens chromosome 21 segment HS21C013."
+FT                   /label=HS21C013
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      3691..3715
+FT                   /note="match to AP001732 222756..222780  blast score 42.1  percent identity 96  AP001732 Homo sapiens genomic DNA, chromosome 21q, section 76/105."
+FT                   /label=AP001732
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      334..358
+FT                   /note="match to AP001677 234235..234259  blast score 42.1  percent identity 96  AP001677 Homo sapiens genomic DNA, chromosome 21q, section 21/105."
+FT                   /label=AP001677
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      3691..3715
+FT                   /note="match to AP001038 97170..97194  blast score 42.1  percent identity 96  AP001038 Homo sapiens genomic DNA, chromosome 21, clone:P178O22, ERG-ETS2 region."
+FT                   /label=AP001038
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      334..358
+FT                   /note="match to AP000946 117541..117565  blast score 42.1  percent identity 96  AP000946 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B335N5, LL56-APP region."
+FT                   /label=AP000946
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      6106..6126
+FT                   /note="match to AP000810 179419..179439  blast score 42.1  percent identity 100  AP000810 Homo sapiens genomic DNA, chromosome 11q, clone:RP11-765H23."
+FT                   /label=AP000810
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5172..5192
+FT                   /note="match to AP000473 94384..94404  blast score 42.1  percent identity 100  AP000473 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B291N6, LL56-APP region."
+FT                   /label=AP000473
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      1801..1825
+FT                   /note="match to AL355365 6090..6114  blast score 42.1  percent identity 96  AL355365 Human DNA sequence from clone RP11-361F15 on chromosome 6"
+FT                   /label=AL355365
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      5531..5555
+FT                   /note="match to AL354861 79645..79669  blast score 42.1  percent identity 96  AL354861 Human DNA sequence from clone RP11-180I4 on chromosome 9"
+FT                   /label=AL354861
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      1..21
+FT                   /note="match to AL139378 28666..28686  blast score 42.1  percent identity 100  AL139378 Human DNA sequence from clone RP11-271B5 on chromosome 13 Contains a gene for a protein similar to ribosomal protein S7, the FGF9 (fibroblast growth factor 9 (glia-activating factor)) gene, ESTs, STSs, GSSs and CpG islands."
+FT                   /label=AL139378
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5783..5803
+FT                   /note="match to AL139163 15259..15279  blast score 42.1  percent identity 100  AL139163 Human DNA sequence from clone RP11-523O15 on chromosome 20 Contains GSSs and STSs."
+FT                   /label=AL139163
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      3803..3823
+FT                   /note="match to AL136301 20782..20802  blast score 42.1  percent identity 100  AL136301 Human DNA sequence from clone RP11-195L15 on chromosome 13"
+FT                   /label=AL136301
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5752..5784
+FT                   /note="match to AL133462 74511..74543  blast score 42.1  percent identity 91  AL133462 Human DNA sequence from clone RP11-108A16 on chromosome 20 Contains ESTs, STSs and GSSs."
+FT                   /label=AL133462
+FT                   /score=91
+FT                   /colour=255 22 22
+FT   BLASTN_HIT      334..358
+FT                   /note="match to AF238375 119422..119446  blast score 42.1  percent identity 96  AF238375 Homo sapiens chromosome 21 clone BAC 49B5 map 21q21, complete sequence."
+FT                   /label=AF238375
+FT                   /score=96
+FT                   /colour=255 10 10
+FT   BLASTN_HIT      1242..1262
+FT                   /note="match to AF130342 42069..42089  blast score 42.1  percent identity 100  AF130342 Homo sapiens chromosome 8 clone PAC 87.1 map 8q24.1, complete sequence."
+FT                   /label=AF130342
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      5752..5784
+FT                   /note="match to AC012380 49339..49371  blast score 42.1  percent identity 91  AC012380 Genomic Sequence For Homo sapiens Clone 125H5, Chromosome 20, complete sequence."
+FT                   /label=AC012380
+FT                   /score=91
+FT                   /colour=255 22 22
+FT   BLASTN_HIT      1230..1258
+FT                   /note="match to AC007392 135475..135503  blast score 42.1  percent identity 93  AC007392 Homo sapiens BAC clone RP11-444B4 from 2, complete sequence."
+FT                   /label=AC007392
+FT                   /score=93
+FT                   /colour=255 17 17
+FT   BLASTN_HIT      1414..1434
+FT                   /note="match to PCAROMX 4290..4310  blast score 42.1  percent identity 100  L18918 Pneumocystis carinii pentafunctional enzyme (arom) gene, complete cds."
+FT                   /label=PCAROMX
+FT                   /score=100
+FT                   /colour=255 0 0
+FT   BLASTN_HIT      521..565
+FT                   /note="match to CH1457 66..110  blast score 42.1  percent identity 87  D10531 Cryptococcus humicolus 5S rRNA."
+FT                   /label=CH1457
+FT                   /score=87
+FT                   /colour=255 33 33
diff --git a/etc/c1215.embl b/etc/c1215.embl
new file mode 100644
index 0000000000000000000000000000000000000000..5acb69e996234db7294b82cdda9ee7300b45d926
--- /dev/null
+++ b/etc/c1215.embl
@@ -0,0 +1,258 @@
+ID   SPBC1215 standard; DNA; FUN; 6490 BP.
+XX
+AC   AL096846;
+XX
+DE   S.pombe chromosome II cosmid c1215.
+XX
+KW   SURF-family protein; COX complex biogenesis; DEC1 homologue;
+KW   mitochondrial inheritance; actin cytoskeleton organisation.
+XX
+OS   Schizosaccharomyces pombe (yeast)
+OC   Eukaryota; Plantae; Thallobionta; Eumycota; Hemiascomycetes;
+OC   Endomycetales; Saccharomycetaceae.
+XX
+RN   [1]
+RP   1-6490
+RA   Lyne M.H., Rajandream M.A., Barrell B.G., Seeger K., Quail M., Harris D.;
+RT   ;
+RL   Submitted (16-JUL-1999) to the EMBL/GenBank/DDBJ databases.      
+RL   European Schizosaccharomyces genome sequencing project,
+RL   Sanger Centre, The Wellcome Trust Genome Campus, Hinxton, 
+RL   Cambridge CB10 1SA, E-mail: barrell@sanger.ac.uk and  
+XX
+CC   Notes:
+CC
+CC   Details of yeast sequencing at the Sanger Centre are available on
+CC   the World Wide Web. 
+CC   (URL, http://www.sanger.ac.uk/Projects/S_pombe/)
+CC   During 1995 to 1996 about 66% of S. pombe chromosome 1 was sequenced 
+CC   by the Sanger Centre.  The sequencing of the S. pombe genome is now 
+CC   being continued with funding from The European Commission.  
+CC   Fourteen European sequencing laboratories, including the Sanger Centre,  
+CC   are participating in the project.
+CC
+CC   Protein coding regions (CDS) have been predicted with the help 
+CC   of computer analysis using the Genefinder program in PomBase
+CC   (an ACEDB database) with additional predictions for the
+CC   branch-acceptor sites supplied by the program Sp3splice.
+CC   CAUTION: It is possible that for any individual CDS we may have
+CC   underestimated or overestimated the number of introns/exons or
+CC   we may not have chosen the correct splice donor/acceptor sites.
+CC   
+CC   CDS are numbered using the following system eg SPBC25H2.01c.
+CC   SP (S. pombe), B (chromosome 2), c25H2 (cosmid name),
+CC   .01 (first CDS), c (complementary strand).
+CC
+CC   The more significant matches with motifs in the PROSITE
+CC   database are also included but some of these may be fortuitous.
+CC
+CC   The length in codons is given for each CDS.
+CC   
+CC   IMPORTANT: This sequence MAY NOT be the entire insert of
+CC   the sequenced clone.  It may be shorter because we only
+CC   sequence overlapping sections once, or longer, because we
+CC   arrange for a small overlap between neighbouring submissions.
+CC
+CC   Cosmid c1215 is overlapped at the 5' end by cosmid c1750, 
+CC   EMBL entry SPAB4534, accession number AB004534, and at the 3' 
+CC   end by cosmid c83, EMBL entry SPBC83, accession number AL035536.
+XX
+XX
+FH   Key             Location/Qualifiers
+FH
+FT   source          1..6490
+FT                   /organism="Schizosaccharomyces pombe"
+FT                   /strain="972h-"
+FT                   /chromosome="II"
+FT                   /clone="cosmid c1215"
+FT                   /map="IIL"
+FT   misc_feature    complement(1..82)
+FT                   /note="nominal overlap with cosmid SPAB4534 (c1750) S.
+FT                   pombe chromosome 2"
+FT   tRNA            36..107
+FT                   /note="tRNA Thr anticodon TGT, Cove score 78.51"
+FT   rRNA            415..581
+FT                   /note="SPRG5SD K00771 Yeast (s.pombe) 5s rrna gene and
+FT                   flanks"
+FT   CDS             join(1501..1760,1844..2456)
+FT                   /fasta_file="fasta/gf.tab.seq.00001.out"
+FT                   /note="SPBC1215.01, len:290, SIMILARITY:Saccharomyces
+FT                   cerevisiae, YG2X_YEAST, hypothetical 45.1 kd protein in
+FT                   clb6-spt6 intergenic region, (389 aa), fasta scores: opt:
+FT                   385, E():2.8e-19, (29.0% identity in 314 aa)"
+FT                   /gene="SPBC1215.01"
+FT                   /product="putative SURF-family protein"
+FT                   /colour=7
+FT                   /label=SPBC1215.01
+FT   misc_feature    1761..1766
+FT                   /note="gtacgt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    1827..1843
+FT                   /note="ctaacataatcacttag, splice branch and acceptor"
+FT                   /colour=6
+FT   CDS             complement(join(2495..2602,2663..2881,2953..4071,4111..4372,4413..4849,4889..5007,5251..5389,5434..5466))
+FT                   /fasta_file="fasta/gf.tab.seq.00002.out"
+FT                   /note="SPBC1215.02c, len:811, SIMILARITY:Saccharomyces
+FT                   cerevisiae, DEC1_YEAST, dec1 protein, (796 aa), fasta
+FT                   scores: opt: 184, E():0.00014, (23.4% identity in 577 aa)"
+FT                   /gene="SPBC1215.02c"
+FT                   /product="similar to yeast DEC1 mitochondrial inheritance
+FT                   and actin cytoskeleton organisation protein"
+FT                   /colour=7
+FT                   /label=SPBC1215.02c
+FT   misc_feature    complement(2603..2612)
+FT                   /note="ctaataatag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(2657..2662)
+FT                   /note="gtacgt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(2882..2896)
+FT                   /note="ctaaccgaattatag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(2947..2952)
+FT                   /note="gtaagt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(4072..4085)
+FT                   /note="ttaactcgtcgtag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(4105..4110)
+FT                   /note="gtaagt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(4373..4387)
+FT                   /note="ctaacttctccatag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(4407..4412)
+FT                   /note="gtaagt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(4850..4861)
+FT                   /note="ctaactcctcag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(4883..4888)
+FT                   /note="gtaaga, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(5008..5021)
+FT                   /note="ttaactatttgaag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(5245..5250)
+FT                   /note="gtaagt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    complement(5390..5405)
+FT                   /note="ttaacatcctttttag, splice branch and acceptor"
+FT                   /colour=6
+FT   misc_feature    complement(5428..5433)
+FT                   /note="gtaagt, splice donor sequence"
+FT                   /colour=6
+FT   misc_feature    6387..6490
+FT                   /note="nominal overlap with cosmid SPBC83 S. pombe
+FT                   chromosome 2"
+SQ   Sequence 6490 BP; 2097 A; 1138 C; 1138 G; 2117 T; 0 other;
+     tatatataat ttaataaata cattccgacg atactgcctc tatggcttag tggtacagca        60
+     tcgcacttgt aatgcgaaga tccttggttc gattccgagt ggaggcatat acattatatt       120
+     atattctttt tcatgcggaa aaaagatttc aaatttttgg gtatgatatt aatatgactg       180
+     taacgttaat agcaaagtga gtgttaataa tgataaaata gcagcaaaat ctcttttccg       240
+     agtaagacgt tttccagtct aaatttggag tctgcagttg tttcgcaatt cttaatgtat       300
+     ggttatacta aatacaaact ttaaagctct gatttatgtt tgcaataaac taaaataaaa       360
+     gcacaaaaac ctttacccat taatttcaaa caacttataa actaccggta aacttttttt       420
+     ctaaccttta taatttataa actagaatgt ttaatgtcta cggccatacc taggcgaaaa       480
+     caccagttcc cgtccgatca ctgcagttaa gcgtctgagg gcctcgttag tactatggtt       540
+     ggagacaaca tgggaatccg gggtgctgta ggctattttt ttatatccgt ctttcttact       600
+     acttgcctaa caagtcatga tgtactctca aaatatgttt gcatgccttg taatattggt       660
+     tatggatagc tccttctgga cttgatcttt tgtagccaag aacaatgggt atagactctg       720
+     accttgtgat gttgtagcca cagattataa taggtatttt caagtacagt aacaaaaatc       780
+     ttctagtttt tttttagaaa ggatacacca agtataagca aattcaggaa ttgttgatta       840
+     aactgtcaac ttcggtaaaa ctttgggcat aagtagtgtg ggagcaagtt taactaaaat       900
+     tctattcaga tgtcgaatcc aaaccgctaa ttttgctcaa ctagcttttc ataaaaacca       960
+     attcatagtt tcatactaat aaagacgatt gtttacttta aaacatacgt cgtaagaaca      1020
+     tatattgctt tatcgaaaga taacaaatgt taagctatta tattatttaa ctatagcgca      1080
+     gatttcgctt cctttactta aaaaagacat gtgacttgta gaagcttgga gtgaatacgc      1140
+     aaaggtacct acttagacat tcgcgtctct cttagctgtc aacatcaaca aactggcccc      1200
+     gtattgaaca gtatcttact tgtcgaagga tttgactaag aaaattttat ttctttatag      1260
+     caatattccg ttttcgctta gaagattcta gtcaattgcc ctattctact tacgctttac      1320
+     agtagtatca gaagacctga gtgggatttt gctgctagta gaggccattc aagttaactc      1380
+     cgttttgcaa cattttaaaa gtttttgaat tgaatataaa tatcaattgt ttgattcctt      1440
+     ttaggattta atcttttctt tttatttttg tttcgattga atcttggatt cctgtctatc      1500
+     atgttttggt ggaaaagtgc tactaaattc acattctcaa agcgtggacc gtgtgtcttt      1560
+     cgctatttga gtactcttga aggaacaact gtgaggccta aaaaaaataa atttttagtt      1620
+     ggattgcttt ctgccgttcc aattgtcacg tttgctttag gaacttggca ggtaaagcga      1680
+     cgagaatgga aaatgggtat catcaataca ctcacggaaa ggcttcaaca gcccgcaatt      1740
+     ttattaccga aaactgttac gtacgttaag ttaacatata cacaaattgc acgttttgca      1800
+     attgaactgt cgttttttac attaagctaa cataatcact tagagagcaa gatacaaaaa      1860
+     aacttgagtg gactagggtt ttgcttcgtg gtgtgttttg tcacgaccaa gaaatgttgg      1920
+     tcggtccaag aacgaaggaa ggccaacctg gctatcacgt agtaacccca tttattttag      1980
+     acgatgggcg tcgaatttta gtcaacagag gatggattgc tcgatcattt gctgaacagt      2040
+     cttctcgaga tcctagttct ttacctaaag gtccagtggt cattgaaggt cttttgagac      2100
+     aacatactga taagccaaga tttatgatga agaatgagcc tgaaaaaaat tctttttact      2160
+     tcttaaatgt tcgtgagttt gcacaattga aaggaactct ccccattttg ataacagaac      2220
+     tacaaccatc gcttacaccg ttgcaagaag ccgatcatgt taagagaggc ttgcctcttg      2280
+     gtcatcctct aaaagttgaa attttcaaca gtcatacaga atatattatc acttggtatt      2340
+     ctctaagtgt ggtatcagct ataatgcttt acgtctattt taagagaggt tcaggcacat      2400
+     cttctctgaa ttctgcatac gaaagaagca agattctaaa caacaaacga ttataaaaaa      2460
+     ttttcatatt tataagtttc taaatattat ctacctaaaa ttttacaaat tttggaagct      2520
+     tgcttactgc gtccgtcgtt tgaatgtatg aatcgatcat tccttcacca acttgttttg      2580
+     caaacttcgg atcgtaagga acctattatt aggaagttag ttctcatgcc tataatttta      2640
+     atgctctata atcatcacgt acctgagttt cagataaatt gctcagccaa gagtttgaca      2700
+     acaattctga tacatatttt ctggcggcct tctttttatg cttcgtaatt ccagagatac      2760
+     ttcctaattt gttactgctg atgtttttaa gaagttggta ttgtctggta aattcttttt      2820
+     tcttggtagc tgacacgtga tataggaagc tgtttagaca agtgataagg tcatttatga      2880
+     tctataattc ggttagttta gaaattttta tatcattttt tttaaaaaaa aaaaccagtt      2940
+     tggtaaactt acttcagtgt actttgtcaa ttgacttaaa ggcgtggagt tctcataatc      3000
+     gaatgactca attaaatttt caatcgtttc gaacgaggaa ttttcgtagt ctccgttctt      3060
+     gacctttacc gaaagtaatc ccagttggat caataatttc atatgaacaa tttcttccga      3120
+     agttaattgc ttcgataaat cattgttttc gcacaaaact tccatttcct tagcacttaa      3180
+     aacggccttt tcaaaatcgc cgtttactat gctgtcttga acgagagaat gaccaatgac      3240
+     agtcaaatgg atccaaagcg tgtccggttt aggcgaattt cttaaacttt cttcaactgt      3300
+     tggcaattta tcagatccat aatctgcaaa gacctttaaa tctcgattat ctttcggaga      3360
+     tgaacatttg ggaagatact gtttgggtgg tttaaaagcg gtaagataat gtatcctagc      3420
+     ccgctcgacc aaagaaatgc ttttccaggt actgtggtct aaacgggatc ggaaattacg      3480
+     catatcttcg atttgagagt aagcaccatc ttcataagcc atagaaatca tctctggtgt      3540
+     ttcaaactca ttcgaaccat atattttgag acttgagtta atatagtgag aagtaacaga      3600
+     agatggataa taggtagtag cacgagtcaa gagataatga tcaagggtat cgttttgaat      3660
+     ttgcttaatg gacatagtgt cgtaaacttt agcagcagca gggaagcctc catcaagaag      3720
+     aagatataaa cgaataaggg gtagctttaa atgaaagtta tgttgactat aagtaatgcc      3780
+     tttttctaaa agacagattg cgtcaaaaat taaagcttgt ttttcggcag gttttaaatc      3840
+     cttattcccc tcccacatat atatcaatga atgaactgct aataacaaag cttcataacc      3900
+     gtgcgtaaag tcagtgggta ataagccttt acttaaagac aaaccctttt caaatgcgac      3960
+     gaagcatcta cgcacgtaat cgacaaccga ttctgcagta aacgactcaa agagcaaaaa      4020
+     atggatcttc agaagcaaaa cctcagcata taatttatcg actttttgag actacgacga      4080
+     gttaatattg aaagatgaat aaatacttac ttcattggat tcacctagat cagccaactt      4140
+     aaatgcatct aataaccggt gttgtgcatc aacattcagc ttcaatagat aaggtctcaa      4200
+     atcttcaaaa acaattggtt tcatatacag ctttttgata tagccaagta atgctgattc      4260
+     gtgttcttca ggaaaaaacc gtgcgctggc ttcaatccaa agtaaatgaa gatttctttt      4320
+     tgtgctgctg gttgacaacg ctttcaatat acaatccttt aatgggacta atctatggag      4380
+     aagttagtaa taatgcaaaa aaaaaaactt actttgaatc atcattggaa gcactatcca      4440
+     gcaaagcttt gcaaaccttc caatcagtat tcccagtttg gaaaagagaa agcgaaaacg      4500
+     tgaataaaga atcccaacgc gcacaggaag caagcaattc aagcttcctc aaaagaaggt      4560
+     cggcgtcagc atcaacaaag cgatcagcat cttgatgtat taaagcatct aacgctctgt      4620
+     ccttgtctcc cactaaaagc aacacgtcta aataaagatg aaactcctca caagaatcga      4680
+     tataacctgt tggtttttcg aaaatgagtt tagcagtttt ttcagctagt gctttcagca      4740
+     aacgttgttc aacctcattt tccgactttt tggacaaaag atacaaagat gagataaccc      4800
+     ataaggtatg tttcctagaa ggaaagttct tttgcaattc tacagcagcc tgaggagtta      4860
+     gtaaaaaaaa aacaaattaa gatcttacct ttctttggtg agacaatgat ttgatgcgaa      4920
+     tagatgcttt gaagtaagct aataagtttt tttcctgctt tccataagtt tgcaagaact      4980
+     tttcccaaaa tacaaacgat tcttctcctt caaatagtta ataacttaaa agtaagaggg      5040
+     taaaaacaag tccattgaga aataaaacgt tgcacttgaa tcatcaagct acgaaaagaa      5100
+     caaagatcgt ttttcttaag caaagtttaa ccgatcaaat aactaaagcc tttatctcaa      5160
+     ggaaatagta gaatattcaa aataaaaaat acgaccaaag tgctatcaac atttatgttc      5220
+     atctgttcaa tagaacctaa ttatacttac ccttcttttg atcatcataa acagcttgta      5280
+     taatgtctaa aagttccaag ctgttgatgg gagtcgattt taacggttct aaaagtgcta      5340
+     gagcctcggg accacgtcct gcctgagcca aggataacgc tgaataaacc taaaaaggat      5400
+     gttaacagct aaaaacataa ctcgattact tacaattgtt gattctttac tcccagaacg      5460
+     acgcattgta gtaggcaatg aaattaaagc ccaaacagta gtcagaagtt ggtaggtgtt      5520
+     gcagtcaaat tattattcta cagaggagaa tattatagcc agcgtggtag aatctggata      5580
+     tatatctact gcaaaagtgt aattgcattg gtttaaaggg tatactatgg ttaagtaata      5640
+     tattcacagc tgtacaattt acagtcataa ctaaaacttc cttaagccgt aaagaaatac      5700
+     ctggtgttgt aaaatttgtt gtatatccac ggcatggtca tataatgtga ttttgtgctc      5760
+     aaataaatat aaaatatgca taatttttgt acatttaatt tgagaaaccc atcttttgtt      5820
+     gagaggctgt caatgaatag cagtttcatt gaaaagcagc gggatgacca gaaaagtatt      5880
+     ttacaatggc aagggagtag aaagctagcg taatattcag aaagctaggt aattgagcaa      5940
+     tcctttaatt cattgctaag catgctaggt aaacgcagta aacctttcag ttttcattta      6000
+     ggtataaggc tgtttaatga gtatctccac taaatttaaa gatcaaaact cagtatcaat      6060
+     tcttaaaagt tttattttat ttaataatca tatacttctc ataatctttc aattttttcc      6120
+     ccattttgat gatattttta ttaatcctac agtaagctct atgatatcgt tattcttcaa      6180
+     ataggctggt cagcacgtgg acggtgttac ttatcgttaa ataaatcgta ctaaggaggt      6240
+     gcgatgtaaa tgatatgctt gtcaagtatt aactgctctc caccaaccgc cggtttaact      6300
+     gattattgtt gaaaagcgca gacgaagttt agagaattac tagcgtattt taaatttaat      6360
+     caacggacta ttttttattc ctttgagatc cgactttatc gctttgcttc taattttcca      6420
+     aaattcagtc tatctacgcg atccagccct gtttgcgtaa atttcatatt atttttcttt      6480
+     aaacgtttgg                                                             6490
+//
diff --git a/etc/c1215.genbank b/etc/c1215.genbank
new file mode 100644
index 0000000000000000000000000000000000000000..9e3c3d8739a1d710f015f889db476ce4055b912c
--- /dev/null
+++ b/etc/c1215.genbank
@@ -0,0 +1,277 @@
+LOCUS       SPBC1215     6490 bp    DNA             PLN       16-JUL-1999
+DEFINITION  S.pombe chromosome II cosmid c1215.
+ACCESSION   AL096846
+VERSION     AL096846.1  GI:5531459
+KEYWORDS    actin cytoskeleton organisation; COX complex biogenesis; DEC1
+            homologue; mitochondrial inheritance; SURF-family protein.
+SOURCE      fission yeast.
+  ORGANISM  Schizosaccharomyces pombe
+            Eukaryota; Fungi; Ascomycota; Schizosaccharomycetes;
+            Schizosaccharomycetales; Schizosaccharomycetaceae;
+            Schizosaccharomyces.
+REFERENCE   1  (bases 1 to 6490)
+  AUTHORS   Lyne,M.H., Rajandream,M.A., Barrell,B.G., Seeger,K., Quail,M. and
+            Harris,D.
+  TITLE     Direct Submission
+  JOURNAL   Submitted (16-JUL-1999) European Schizosaccharomyces genome
+            sequencing project, Sanger Centre, The Wellcome Trust Genome
+            Campus, Hinxton, Cambridge CB10 1SA, E-mail: barrell@sanger.ac.uk
+            and
+COMMENT     Notes:
+            Details of yeast sequencing at the Sanger Centre are available on
+            the World Wide Web.
+            (URL, http://www.sanger.ac.uk/Projects/S_pombe/)
+            During 1995 to 1996 about 66% of S. pombe chromosome 1 was
+            sequenced by the Sanger Centre.  The sequencing of the S. pombe
+            genome is now being continued with funding from The European
+            Commission. Fourteen European sequencing laboratories, including
+            the Sanger Centre, are participating in the project.
+            Protein coding regions (CDS) have been predicted with the help of
+            computer analysis using the Genefinder program in PomBase (an ACEDB
+            database) with additional predictions for the branch-acceptor sites
+            supplied by the program Sp3splice. CAUTION: It is possible that for
+            any individual CDS we may have underestimated or overestimated the
+            number of introns/exons or we may not have chosen the correct
+            splice donor/acceptor sites. 
+            CDS are numbered using the following system eg SPBC25H2.01c. SP (S.
+            pombe), B (chromosome 2), c25H2 (cosmid name), .01 (first CDS), c
+            (complementary strand).
+            The more significant matches with motifs in the PROSITE database
+            are also included but some of these may be fortuitous. 
+            The length in codons is given for each CDS.
+            IMPORTANT: This sequence MAY NOT be the entire insert of the
+            sequenced clone.  It may be shorter because we only sequence
+            overlapping sections once, or longer, because we arrange for a
+            small overlap between neighbouring submissions. 
+            Cosmid c1215 is overlapped at the 5' end by cosmid c1750, EMBL
+            entry SPAB4534, accession number AB004534, and at the 3' end by
+            cosmid c83, EMBL entry SPBC83, accession number AL035536.
+FEATURES             Location/Qualifiers
+     source          1..6490
+                     /organism="Schizosaccharomyces pombe"
+                     /strain="972h-"
+                     /db_xref="taxon:4896"
+                     /chromosome="II"
+                     /map="IIL"
+                     /clone="cosmid c1215"
+     misc_feature    complement(1..82)
+                     /note="nominal overlap with cosmid SPAB4534 (c1750) S.
+                     pombe chromosome 2"
+     tRNA            36..107
+                     /note="tRNA Thr anticodon TGT, Cove score 78.51"
+                     /product="tRNA-Thr"
+     rRNA            415..581
+                     /note="SPRG5SD K00771 Yeast (s.pombe) 5s rrna gene and
+                     flanks"
+     gene            join(1501..1760,1844..2456)
+                     /gene="SPBC1215.01"
+     CDS             join(1501..1760,1844..2456)
+                     /gene="SPBC1215.01"
+                     /note="SPBC1215.01, len:290, SIMILARITY:Saccharomyces
+                     cerevisiae, YG2X_YEAST, hypothetical 45.1 kd protein in
+                     clb6-spt6 intergenic region, (389 aa), fasta scores: opt:
+                     385, E():2.8e-19, (29.0% identity in 314 aa)"
+                     /codon_start=1
+                     /label=SPBC1215.01
+                     /product="putative SURF-family protein"
+                     /protein_id="CAB50922.1"
+                     /db_xref="GI:5531460"
+                     /translation="MFWWKSATKFTFSKRGPCVFRYLSTLEGTTVRPKKNKFLVGLLS
+                     AVPIVTFALGTWQVKRREWKMGIINTLTERLQQPAILLPKTVTEQDTKKLEWTRVLLR
+                     GVFCHDQEMLVGPRTKEGQPGYHVVTPFILDDGRRILVNRGWIARSFAEQSSRDPSSL
+                     PKGPVVIEGLLRQHTDKPRFMMKNEPEKNSFYFLNVREFAQLKGTLPILITELQPSLT
+                     PLQEADHVKRGLPLGHPLKVEIFNSHTEYIITWYSLSVVSAIMLYVYFKRGSGTSSLN
+                     SAYERSKILNNKRL"
+     misc_feature    1761..1766
+                     /gene="SPBC1215.01"
+                     /note="gtacgt, splice donor sequence"
+     misc_feature    1827..1843
+                     /gene="SPBC1215.01"
+                     /note="ctaacataatcacttag, splice branch and acceptor"
+     gene            complement(join(2495..2602,2663..2881,2953..4071,
+                     4111..4372,4413..4849,4889..5007,5251..5389,5434..5466))
+                     /gene="SPBC1215.02c"
+     CDS             complement(join(2495..2602,2663..2881,2953..4071,
+                     4111..4372,4413..4849,4889..5007,5251..5389,5434..5466))
+                     /gene="SPBC1215.02c"
+                     /note="SPBC1215.02c, len:811, SIMILARITY:Saccharomyces
+                     cerevisiae, DEC1_YEAST, dec1 protein, (796 aa), fasta
+                     scores: opt: 184, E():0.00014, (23.4% identity in 577 aa)"
+                     /codon_start=1
+                     /label=SPBC1215.02c
+                     /product="similar to yeast DEC1 mitochondrial inheritance
+                     and actin cytoskeleton organisation protein"
+                     /protein_id="CAB50923.1"
+                     /db_xref="GI:5531461"
+                     /translation="MRRSGSKESTIVYSALSLAQAGRGPEALALLEPLKSTPINSLEL
+                     LDIIQAVYDDQKKGEESFVFWEKFLQTYGKQEKNLLAYFKASIRIKSLSHQRKAAVEL
+                     QKNFPSRKHTLWVISSLYLLSKKSENEVEQRLLKALAEKTAKLIFEKPTGYIDSCEEF
+                     HLYLDVLLLVGDKDRALDALIHQDADRFVDADADLLLRKLELLASCARWDSLFTFSLS
+                     LFQTGNTDWKVCKALLDSASNDDSKLVPLKDCILKALSTSSTKRNLHLLWIEASARFF
+                     PEEHESALLGYIKKLYMKPIVFEDLRPYLLKLNVDAQHRLLDAFKLADLGESNESQKV
+                     DKLYAEVLLLKIHFLLFESFTAESVVDYVRRCFVAFEKGLSLSKGLLPTDFTHGYEAL
+                     LLAVHSLIYMWEGNKDLKPAEKQALIFDAICLLEKGITYSQHNFHLKLPLIRLYLLLD
+                     GGFPAAAKVYDTMSIKQIQNDTLDHYLLTRATTYYPSSVTSHYINSSLKIYGSNEFET
+                     PEMISMAYEDGAYSQIEDMRNFRSRLDHSTWKSISLVERARIHYLTAFKPPKQYLPKC
+                     SSPKDNRDLKVFADYGSDKLPTVEESLRNSPKPDTLWIHLTVIGHSLVQDSIVNGDFE
+                     KAVLSAKEMEVLCENNDLSKQLTSEEIVHMKLLIQLGLLSVKVKNGDYENSSFETIEN
+                     LIESFDYENSTPLSQLTKYTEIINDLITCLNSFLYHVSATKKKEFTRQYQLLKNISSN
+                     KLGSISGITKHKKKAARKYVSELLSNSWLSNLSETQVPYDPKFAKQVGEGMIDSYIQT
+                     TDAVSKLPKFVKF"
+     misc_feature    complement(2603..2612)
+                     /gene="SPBC1215.02c"
+                     /note="ctaataatag, splice branch and acceptor"
+     misc_feature    complement(2657..2662)
+                     /gene="SPBC1215.02c"
+                     /note="gtacgt, splice donor sequence"
+     misc_feature    complement(2882..2896)
+                     /gene="SPBC1215.02c"
+                     /note="ctaaccgaattatag, splice branch and acceptor"
+     misc_feature    complement(2947..2952)
+                     /gene="SPBC1215.02c"
+                     /note="gtaagt, splice donor sequence"
+     misc_feature    complement(4072..4085)
+                     /gene="SPBC1215.02c"
+                     /note="ttaactcgtcgtag, splice branch and acceptor"
+     misc_feature    complement(4105..4110)
+                     /gene="SPBC1215.02c"
+                     /note="gtaagt, splice donor sequence"
+     misc_feature    complement(4373..4387)
+                     /gene="SPBC1215.02c"
+                     /note="ctaacttctccatag, splice branch and acceptor"
+     misc_feature    complement(4407..4412)
+                     /gene="SPBC1215.02c"
+                     /note="gtaagt, splice donor sequence"
+     misc_feature    complement(4850..4861)
+                     /gene="SPBC1215.02c"
+                     /note="ctaactcctcag, splice branch and acceptor"
+     misc_feature    complement(4883..4888)
+                     /gene="SPBC1215.02c"
+                     /note="gtaaga, splice donor sequence"
+     misc_feature    complement(5008..5021)
+                     /gene="SPBC1215.02c"
+                     /note="ttaactatttgaag, splice branch and acceptor"
+     misc_feature    complement(5245..5250)
+                     /gene="SPBC1215.02c"
+                     /note="gtaagt, splice donor sequence"
+     misc_feature    complement(5390..5405)
+                     /gene="SPBC1215.02c"
+                     /note="ttaacatcctttttag, splice branch and acceptor"
+     misc_feature    complement(5428..5433)
+                     /gene="SPBC1215.02c"
+                     /note="gtaagt, splice donor sequence"
+     misc_feature    6387..6490
+                     /note="nominal overlap with cosmid SPBC83 S. pombe
+                     chromosome 2"
+BASE COUNT     2097 a   1138 c   1138 g   2117 t
+ORIGIN      
+        1 tatatataat ttaataaata cattccgacg atactgcctc tatggcttag tggtacagca
+       61 tcgcacttgt aatgcgaaga tccttggttc gattccgagt ggaggcatat acattatatt
+      121 atattctttt tcatgcggaa aaaagatttc aaatttttgg gtatgatatt aatatgactg
+      181 taacgttaat agcaaagtga gtgttaataa tgataaaata gcagcaaaat ctcttttccg
+      241 agtaagacgt tttccagtct aaatttggag tctgcagttg tttcgcaatt cttaatgtat
+      301 ggttatacta aatacaaact ttaaagctct gatttatgtt tgcaataaac taaaataaaa
+      361 gcacaaaaac ctttacccat taatttcaaa caacttataa actaccggta aacttttttt
+      421 ctaaccttta taatttataa actagaatgt ttaatgtcta cggccatacc taggcgaaaa
+      481 caccagttcc cgtccgatca ctgcagttaa gcgtctgagg gcctcgttag tactatggtt
+      541 ggagacaaca tgggaatccg gggtgctgta ggctattttt ttatatccgt ctttcttact
+      601 acttgcctaa caagtcatga tgtactctca aaatatgttt gcatgccttg taatattggt
+      661 tatggatagc tccttctgga cttgatcttt tgtagccaag aacaatgggt atagactctg
+      721 accttgtgat gttgtagcca cagattataa taggtatttt caagtacagt aacaaaaatc
+      781 ttctagtttt tttttagaaa ggatacacca agtataagca aattcaggaa ttgttgatta
+      841 aactgtcaac ttcggtaaaa ctttgggcat aagtagtgtg ggagcaagtt taactaaaat
+      901 tctattcaga tgtcgaatcc aaaccgctaa ttttgctcaa ctagcttttc ataaaaacca
+      961 attcatagtt tcatactaat aaagacgatt gtttacttta aaacatacgt cgtaagaaca
+     1021 tatattgctt tatcgaaaga taacaaatgt taagctatta tattatttaa ctatagcgca
+     1081 gatttcgctt cctttactta aaaaagacat gtgacttgta gaagcttgga gtgaatacgc
+     1141 aaaggtacct acttagacat tcgcgtctct cttagctgtc aacatcaaca aactggcccc
+     1201 gtattgaaca gtatcttact tgtcgaagga tttgactaag aaaattttat ttctttatag
+     1261 caatattccg ttttcgctta gaagattcta gtcaattgcc ctattctact tacgctttac
+     1321 agtagtatca gaagacctga gtgggatttt gctgctagta gaggccattc aagttaactc
+     1381 cgttttgcaa cattttaaaa gtttttgaat tgaatataaa tatcaattgt ttgattcctt
+     1441 ttaggattta atcttttctt tttatttttg tttcgattga atcttggatt cctgtctatc
+     1501 atgttttggt ggaaaagtgc tactaaattc acattctcaa agcgtggacc gtgtgtcttt
+     1561 cgctatttga gtactcttga aggaacaact gtgaggccta aaaaaaataa atttttagtt
+     1621 ggattgcttt ctgccgttcc aattgtcacg tttgctttag gaacttggca ggtaaagcga
+     1681 cgagaatgga aaatgggtat catcaataca ctcacggaaa ggcttcaaca gcccgcaatt
+     1741 ttattaccga aaactgttac gtacgttaag ttaacatata cacaaattgc acgttttgca
+     1801 attgaactgt cgttttttac attaagctaa cataatcact tagagagcaa gatacaaaaa
+     1861 aacttgagtg gactagggtt ttgcttcgtg gtgtgttttg tcacgaccaa gaaatgttgg
+     1921 tcggtccaag aacgaaggaa ggccaacctg gctatcacgt agtaacccca tttattttag
+     1981 acgatgggcg tcgaatttta gtcaacagag gatggattgc tcgatcattt gctgaacagt
+     2041 cttctcgaga tcctagttct ttacctaaag gtccagtggt cattgaaggt cttttgagac
+     2101 aacatactga taagccaaga tttatgatga agaatgagcc tgaaaaaaat tctttttact
+     2161 tcttaaatgt tcgtgagttt gcacaattga aaggaactct ccccattttg ataacagaac
+     2221 tacaaccatc gcttacaccg ttgcaagaag ccgatcatgt taagagaggc ttgcctcttg
+     2281 gtcatcctct aaaagttgaa attttcaaca gtcatacaga atatattatc acttggtatt
+     2341 ctctaagtgt ggtatcagct ataatgcttt acgtctattt taagagaggt tcaggcacat
+     2401 cttctctgaa ttctgcatac gaaagaagca agattctaaa caacaaacga ttataaaaaa
+     2461 ttttcatatt tataagtttc taaatattat ctacctaaaa ttttacaaat tttggaagct
+     2521 tgcttactgc gtccgtcgtt tgaatgtatg aatcgatcat tccttcacca acttgttttg
+     2581 caaacttcgg atcgtaagga acctattatt aggaagttag ttctcatgcc tataatttta
+     2641 atgctctata atcatcacgt acctgagttt cagataaatt gctcagccaa gagtttgaca
+     2701 acaattctga tacatatttt ctggcggcct tctttttatg cttcgtaatt ccagagatac
+     2761 ttcctaattt gttactgctg atgtttttaa gaagttggta ttgtctggta aattcttttt
+     2821 tcttggtagc tgacacgtga tataggaagc tgtttagaca agtgataagg tcatttatga
+     2881 tctataattc ggttagttta gaaattttta tatcattttt tttaaaaaaa aaaaccagtt
+     2941 tggtaaactt acttcagtgt actttgtcaa ttgacttaaa ggcgtggagt tctcataatc
+     3001 gaatgactca attaaatttt caatcgtttc gaacgaggaa ttttcgtagt ctccgttctt
+     3061 gacctttacc gaaagtaatc ccagttggat caataatttc atatgaacaa tttcttccga
+     3121 agttaattgc ttcgataaat cattgttttc gcacaaaact tccatttcct tagcacttaa
+     3181 aacggccttt tcaaaatcgc cgtttactat gctgtcttga acgagagaat gaccaatgac
+     3241 agtcaaatgg atccaaagcg tgtccggttt aggcgaattt cttaaacttt cttcaactgt
+     3301 tggcaattta tcagatccat aatctgcaaa gacctttaaa tctcgattat ctttcggaga
+     3361 tgaacatttg ggaagatact gtttgggtgg tttaaaagcg gtaagataat gtatcctagc
+     3421 ccgctcgacc aaagaaatgc ttttccaggt actgtggtct aaacgggatc ggaaattacg
+     3481 catatcttcg atttgagagt aagcaccatc ttcataagcc atagaaatca tctctggtgt
+     3541 ttcaaactca ttcgaaccat atattttgag acttgagtta atatagtgag aagtaacaga
+     3601 agatggataa taggtagtag cacgagtcaa gagataatga tcaagggtat cgttttgaat
+     3661 ttgcttaatg gacatagtgt cgtaaacttt agcagcagca gggaagcctc catcaagaag
+     3721 aagatataaa cgaataaggg gtagctttaa atgaaagtta tgttgactat aagtaatgcc
+     3781 tttttctaaa agacagattg cgtcaaaaat taaagcttgt ttttcggcag gttttaaatc
+     3841 cttattcccc tcccacatat atatcaatga atgaactgct aataacaaag cttcataacc
+     3901 gtgcgtaaag tcagtgggta ataagccttt acttaaagac aaaccctttt caaatgcgac
+     3961 gaagcatcta cgcacgtaat cgacaaccga ttctgcagta aacgactcaa agagcaaaaa
+     4021 atggatcttc agaagcaaaa cctcagcata taatttatcg actttttgag actacgacga
+     4081 gttaatattg aaagatgaat aaatacttac ttcattggat tcacctagat cagccaactt
+     4141 aaatgcatct aataaccggt gttgtgcatc aacattcagc ttcaatagat aaggtctcaa
+     4201 atcttcaaaa acaattggtt tcatatacag ctttttgata tagccaagta atgctgattc
+     4261 gtgttcttca ggaaaaaacc gtgcgctggc ttcaatccaa agtaaatgaa gatttctttt
+     4321 tgtgctgctg gttgacaacg ctttcaatat acaatccttt aatgggacta atctatggag
+     4381 aagttagtaa taatgcaaaa aaaaaaactt actttgaatc atcattggaa gcactatcca
+     4441 gcaaagcttt gcaaaccttc caatcagtat tcccagtttg gaaaagagaa agcgaaaacg
+     4501 tgaataaaga atcccaacgc gcacaggaag caagcaattc aagcttcctc aaaagaaggt
+     4561 cggcgtcagc atcaacaaag cgatcagcat cttgatgtat taaagcatct aacgctctgt
+     4621 ccttgtctcc cactaaaagc aacacgtcta aataaagatg aaactcctca caagaatcga
+     4681 tataacctgt tggtttttcg aaaatgagtt tagcagtttt ttcagctagt gctttcagca
+     4741 aacgttgttc aacctcattt tccgactttt tggacaaaag atacaaagat gagataaccc
+     4801 ataaggtatg tttcctagaa ggaaagttct tttgcaattc tacagcagcc tgaggagtta
+     4861 gtaaaaaaaa aacaaattaa gatcttacct ttctttggtg agacaatgat ttgatgcgaa
+     4921 tagatgcttt gaagtaagct aataagtttt tttcctgctt tccataagtt tgcaagaact
+     4981 tttcccaaaa tacaaacgat tcttctcctt caaatagtta ataacttaaa agtaagaggg
+     5041 taaaaacaag tccattgaga aataaaacgt tgcacttgaa tcatcaagct acgaaaagaa
+     5101 caaagatcgt ttttcttaag caaagtttaa ccgatcaaat aactaaagcc tttatctcaa
+     5161 ggaaatagta gaatattcaa aataaaaaat acgaccaaag tgctatcaac atttatgttc
+     5221 atctgttcaa tagaacctaa ttatacttac ccttcttttg atcatcataa acagcttgta
+     5281 taatgtctaa aagttccaag ctgttgatgg gagtcgattt taacggttct aaaagtgcta
+     5341 gagcctcggg accacgtcct gcctgagcca aggataacgc tgaataaacc taaaaaggat
+     5401 gttaacagct aaaaacataa ctcgattact tacaattgtt gattctttac tcccagaacg
+     5461 acgcattgta gtaggcaatg aaattaaagc ccaaacagta gtcagaagtt ggtaggtgtt
+     5521 gcagtcaaat tattattcta cagaggagaa tattatagcc agcgtggtag aatctggata
+     5581 tatatctact gcaaaagtgt aattgcattg gtttaaaggg tatactatgg ttaagtaata
+     5641 tattcacagc tgtacaattt acagtcataa ctaaaacttc cttaagccgt aaagaaatac
+     5701 ctggtgttgt aaaatttgtt gtatatccac ggcatggtca tataatgtga ttttgtgctc
+     5761 aaataaatat aaaatatgca taatttttgt acatttaatt tgagaaaccc atcttttgtt
+     5821 gagaggctgt caatgaatag cagtttcatt gaaaagcagc gggatgacca gaaaagtatt
+     5881 ttacaatggc aagggagtag aaagctagcg taatattcag aaagctaggt aattgagcaa
+     5941 tcctttaatt cattgctaag catgctaggt aaacgcagta aacctttcag ttttcattta
+     6001 ggtataaggc tgtttaatga gtatctccac taaatttaaa gatcaaaact cagtatcaat
+     6061 tcttaaaagt tttattttat ttaataatca tatacttctc ataatctttc aattttttcc
+     6121 ccattttgat gatattttta ttaatcctac agtaagctct atgatatcgt tattcttcaa
+     6181 ataggctggt cagcacgtgg acggtgttac ttatcgttaa ataaatcgta ctaaggaggt
+     6241 gcgatgtaaa tgatatgctt gtcaagtatt aactgctctc caccaaccgc cggtttaact
+     6301 gattattgtt gaaaagcgca gacgaagttt agagaattac tagcgtattt taaatttaat
+     6361 caacggacta ttttttattc ctttgagatc cgactttatc gctttgcttc taattttcca
+     6421 aaattcagtc tatctacgcg atccagccct gtttgcgtaa atttcatatt atttttcttt
+     6481 aaacgtttgg 
+//
diff --git a/etc/c1215.seq b/etc/c1215.seq
new file mode 100644
index 0000000000000000000000000000000000000000..94d788aba2bf0fc3317ce6f1814239b1a9c58394
--- /dev/null
+++ b/etc/c1215.seq
@@ -0,0 +1,110 @@
+>all bases
+tatatataatttaataaatacattccgacgatactgcctctatggcttagtggtacagca
+tcgcacttgtaatgcgaagatccttggttcgattccgagtggaggcatatacattatatt
+atattctttttcatgcggaaaaaagatttcaaatttttgggtatgatattaatatgactg
+taacgttaatagcaaagtgagtgttaataatgataaaatagcagcaaaatctcttttccg
+agtaagacgttttccagtctaaatttggagtctgcagttgtttcgcaattcttaatgtat
+ggttatactaaatacaaactttaaagctctgatttatgtttgcaataaactaaaataaaa
+gcacaaaaacctttacccattaatttcaaacaacttataaactaccggtaaacttttttt
+ctaacctttataatttataaactagaatgtttaatgtctacggccatacctaggcgaaaa
+caccagttcccgtccgatcactgcagttaagcgtctgagggcctcgttagtactatggtt
+ggagacaacatgggaatccggggtgctgtaggctatttttttatatccgtctttcttact
+acttgcctaacaagtcatgatgtactctcaaaatatgtttgcatgccttgtaatattggt
+tatggatagctccttctggacttgatcttttgtagccaagaacaatgggtatagactctg
+accttgtgatgttgtagccacagattataataggtattttcaagtacagtaacaaaaatc
+ttctagtttttttttagaaaggatacaccaagtataagcaaattcaggaattgttgatta
+aactgtcaacttcggtaaaactttgggcataagtagtgtgggagcaagtttaactaaaat
+tctattcagatgtcgaatccaaaccgctaattttgctcaactagcttttcataaaaacca
+attcatagtttcatactaataaagacgattgtttactttaaaacatacgtcgtaagaaca
+tatattgctttatcgaaagataacaaatgttaagctattatattatttaactatagcgca
+gatttcgcttcctttacttaaaaaagacatgtgacttgtagaagcttggagtgaatacgc
+aaaggtacctacttagacattcgcgtctctcttagctgtcaacatcaacaaactggcccc
+gtattgaacagtatcttacttgtcgaaggatttgactaagaaaattttatttctttatag
+caatattccgttttcgcttagaagattctagtcaattgccctattctacttacgctttac
+agtagtatcagaagacctgagtgggattttgctgctagtagaggccattcaagttaactc
+cgttttgcaacattttaaaagtttttgaattgaatataaatatcaattgtttgattcctt
+ttaggatttaatcttttctttttatttttgtttcgattgaatcttggattcctgtctatc
+atgttttggtggaaaagtgctactaaattcacattctcaaagcgtggaccgtgtgtcttt
+cgctatttgagtactcttgaaggaacaactgtgaggcctaaaaaaaataaatttttagtt
+ggattgctttctgccgttccaattgtcacgtttgctttaggaacttggcaggtaaagcga
+cgagaatggaaaatgggtatcatcaatacactcacggaaaggcttcaacagcccgcaatt
+ttattaccgaaaactgttacgtacgttaagttaacatatacacaaattgcacgttttgca
+attgaactgtcgttttttacattaagctaacataatcacttagagagcaagatacaaaaa
+aacttgagtggactagggttttgcttcgtggtgtgttttgtcacgaccaagaaatgttgg
+tcggtccaagaacgaaggaaggccaacctggctatcacgtagtaaccccatttattttag
+acgatgggcgtcgaattttagtcaacagaggatggattgctcgatcatttgctgaacagt
+cttctcgagatcctagttctttacctaaaggtccagtggtcattgaaggtcttttgagac
+aacatactgataagccaagatttatgatgaagaatgagcctgaaaaaaattctttttact
+tcttaaatgttcgtgagtttgcacaattgaaaggaactctccccattttgataacagaac
+tacaaccatcgcttacaccgttgcaagaagccgatcatgttaagagaggcttgcctcttg
+gtcatcctctaaaagttgaaattttcaacagtcatacagaatatattatcacttggtatt
+ctctaagtgtggtatcagctataatgctttacgtctattttaagagaggttcaggcacat
+cttctctgaattctgcatacgaaagaagcaagattctaaacaacaaacgattataaaaaa
+ttttcatatttataagtttctaaatattatctacctaaaattttacaaattttggaagct
+tgcttactgcgtccgtcgtttgaatgtatgaatcgatcattccttcaccaacttgttttg
+caaacttcggatcgtaaggaacctattattaggaagttagttctcatgcctataatttta
+atgctctataatcatcacgtacctgagtttcagataaattgctcagccaagagtttgaca
+acaattctgatacatattttctggcggccttctttttatgcttcgtaattccagagatac
+ttcctaatttgttactgctgatgtttttaagaagttggtattgtctggtaaattcttttt
+tcttggtagctgacacgtgatataggaagctgtttagacaagtgataaggtcatttatga
+tctataattcggttagtttagaaatttttatatcattttttttaaaaaaaaaaaccagtt
+tggtaaacttacttcagtgtactttgtcaattgacttaaaggcgtggagttctcataatc
+gaatgactcaattaaattttcaatcgtttcgaacgaggaattttcgtagtctccgttctt
+gacctttaccgaaagtaatcccagttggatcaataatttcatatgaacaatttcttccga
+agttaattgcttcgataaatcattgttttcgcacaaaacttccatttccttagcacttaa
+aacggccttttcaaaatcgccgtttactatgctgtcttgaacgagagaatgaccaatgac
+agtcaaatggatccaaagcgtgtccggtttaggcgaatttcttaaactttcttcaactgt
+tggcaatttatcagatccataatctgcaaagacctttaaatctcgattatctttcggaga
+tgaacatttgggaagatactgtttgggtggtttaaaagcggtaagataatgtatcctagc
+ccgctcgaccaaagaaatgcttttccaggtactgtggtctaaacgggatcggaaattacg
+catatcttcgatttgagagtaagcaccatcttcataagccatagaaatcatctctggtgt
+ttcaaactcattcgaaccatatattttgagacttgagttaatatagtgagaagtaacaga
+agatggataataggtagtagcacgagtcaagagataatgatcaagggtatcgttttgaat
+ttgcttaatggacatagtgtcgtaaactttagcagcagcagggaagcctccatcaagaag
+aagatataaacgaataaggggtagctttaaatgaaagttatgttgactataagtaatgcc
+tttttctaaaagacagattgcgtcaaaaattaaagcttgtttttcggcaggttttaaatc
+cttattcccctcccacatatatatcaatgaatgaactgctaataacaaagcttcataacc
+gtgcgtaaagtcagtgggtaataagcctttacttaaagacaaacccttttcaaatgcgac
+gaagcatctacgcacgtaatcgacaaccgattctgcagtaaacgactcaaagagcaaaaa
+atggatcttcagaagcaaaacctcagcatataatttatcgactttttgagactacgacga
+gttaatattgaaagatgaataaatacttacttcattggattcacctagatcagccaactt
+aaatgcatctaataaccggtgttgtgcatcaacattcagcttcaatagataaggtctcaa
+atcttcaaaaacaattggtttcatatacagctttttgatatagccaagtaatgctgattc
+gtgttcttcaggaaaaaaccgtgcgctggcttcaatccaaagtaaatgaagatttctttt
+tgtgctgctggttgacaacgctttcaatatacaatcctttaatgggactaatctatggag
+aagttagtaataatgcaaaaaaaaaaacttactttgaatcatcattggaagcactatcca
+gcaaagctttgcaaaccttccaatcagtattcccagtttggaaaagagaaagcgaaaacg
+tgaataaagaatcccaacgcgcacaggaagcaagcaattcaagcttcctcaaaagaaggt
+cggcgtcagcatcaacaaagcgatcagcatcttgatgtattaaagcatctaacgctctgt
+ccttgtctcccactaaaagcaacacgtctaaataaagatgaaactcctcacaagaatcga
+tataacctgttggtttttcgaaaatgagtttagcagttttttcagctagtgctttcagca
+aacgttgttcaacctcattttccgactttttggacaaaagatacaaagatgagataaccc
+ataaggtatgtttcctagaaggaaagttcttttgcaattctacagcagcctgaggagtta
+gtaaaaaaaaaacaaattaagatcttacctttctttggtgagacaatgatttgatgcgaa
+tagatgctttgaagtaagctaataagtttttttcctgctttccataagtttgcaagaact
+tttcccaaaatacaaacgattcttctccttcaaatagttaataacttaaaagtaagaggg
+taaaaacaagtccattgagaaataaaacgttgcacttgaatcatcaagctacgaaaagaa
+caaagatcgtttttcttaagcaaagtttaaccgatcaaataactaaagcctttatctcaa
+ggaaatagtagaatattcaaaataaaaaatacgaccaaagtgctatcaacatttatgttc
+atctgttcaatagaacctaattatacttacccttcttttgatcatcataaacagcttgta
+taatgtctaaaagttccaagctgttgatgggagtcgattttaacggttctaaaagtgcta
+gagcctcgggaccacgtcctgcctgagccaaggataacgctgaataaacctaaaaaggat
+gttaacagctaaaaacataactcgattacttacaattgttgattctttactcccagaacg
+acgcattgtagtaggcaatgaaattaaagcccaaacagtagtcagaagttggtaggtgtt
+gcagtcaaattattattctacagaggagaatattatagccagcgtggtagaatctggata
+tatatctactgcaaaagtgtaattgcattggtttaaagggtatactatggttaagtaata
+tattcacagctgtacaatttacagtcataactaaaacttccttaagccgtaaagaaatac
+ctggtgttgtaaaatttgttgtatatccacggcatggtcatataatgtgattttgtgctc
+aaataaatataaaatatgcataatttttgtacatttaatttgagaaacccatcttttgtt
+gagaggctgtcaatgaatagcagtttcattgaaaagcagcgggatgaccagaaaagtatt
+ttacaatggcaagggagtagaaagctagcgtaatattcagaaagctaggtaattgagcaa
+tcctttaattcattgctaagcatgctaggtaaacgcagtaaacctttcagttttcattta
+ggtataaggctgtttaatgagtatctccactaaatttaaagatcaaaactcagtatcaat
+tcttaaaagttttattttatttaataatcatatacttctcataatctttcaattttttcc
+ccattttgatgatatttttattaatcctacagtaagctctatgatatcgttattcttcaa
+ataggctggtcagcacgtggacggtgttacttatcgttaaataaatcgtactaaggaggt
+gcgatgtaaatgatatgcttgtcaagtattaactgctctccaccaaccgccggtttaact
+gattattgttgaaaagcgcagacgaagtttagagaattactagcgtattttaaatttaat
+caacggactattttttattcctttgagatccgactttatcgctttgcttctaattttcca
+aaattcagtctatctacgcgatccagccctgtttgcgtaaatttcatattatttttcttt
+aaacgtttgg
diff --git a/etc/feature_keys b/etc/feature_keys
new file mode 100644
index 0000000000000000000000000000000000000000..67d773c1d8402ffe909423f0fba7b500ec034061
--- /dev/null
+++ b/etc/feature_keys
@@ -0,0 +1,72 @@
+# All feature keys and qualifiers for EMBL/GenBank feature tables
+
+# From: http://www.ebi.ac.uk/~faruque/art/keyqual.txt
+
+# key           Qualifiers (@=mandatory)
+# =======       ========================
+-               EC_number PCR_conditions allele anticodon bound_moiety cell_line cell_type chromosome citation clone clone_lib codon codon_start cons_splice country cultivar db_xref dev_stage direction ecotype environmental_sa evidence exception focus frequency function gene germline haplotype insertion_seq isolate isolation_source lab_host label locus_tag macronuclear map mod_base mol_type note number organelle organism partial phenotype plasmid pop_variant product protein_id proviral pseudo rearranged replace rpt_family rpt_type rpt_unit segment sequenced_mol serotype serovar sex specific_host specimen_voucher standard_name strain sub_clone sub_species sub_strain tissue_lib tissue_type transgenic transl_except transl_table translation transposon usedin variety virion
+-10_signal      allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin
+-35_signal      allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin
+3'UTR           allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+3'clip          allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+5'UTR           allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+5'clip          allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+CAAT_signal     allele citation db_xref evidence gene label locus_tag map note partial usedin
+CDS             EC_number allele citation codon codon_start db_xref evidence exception function gene label locus_tag map note number operon partial product protein_id pseudo standard_name transl_except transl_table translation usedin
+C_region        allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+D-loop          allele citation db_xref evidence gene label locus_tag map note partial usedin
+D_segment       allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+GC_signal       allele citation db_xref evidence gene label locus_tag map note partial usedin
+J_segment       allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+LTR             allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+N_region        allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+RBS             allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin
+STS             allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin
+S_region        allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+TATA_signal     allele citation db_xref evidence gene label locus_tag map note partial usedin
+V_region        allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+V_segment       allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin
+attenuator      allele citation db_xref evidence gene label locus_tag map note operon partial phenotype usedin
+conflict        @citation allele db_xref evidence gene label locus_tag map note replace usedin
+enhancer        allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin
+exon            EC_number allele citation codon codon_start db_xref evidence function gene label locus_tag map note number partial product pseudo standard_name transl_except usedin
+gap             @estimated_length
+gene            allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype product pseudo standard_name usedin
+iDNA            allele citation db_xref evidence function gene label locus_tag map note number partial standard_name usedin
+intron          allele citation cons_splice db_xref evidence function gene label locus_tag map note number partial standard_name usedin
+mRNA            allele citation db_xref evidence exception function gene label locus_tag map note operon partial product pseudo standard_name transcript_id usedin
+mat_peptide     EC_number allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin
+misc_RNA        allele citation db_xref evidence function gene label locus_tag map note operon partial product standard_name usedin
+misc_binding    @bound_moiety allele citation db_xref evidence function gene label locus_tag map note partial usedin
+misc_difference allele citation clone db_xref evidence gene label locus_tag map note partial phenotype replace standard_name usedin
+misc_feature    allele citation db_xref evidence function gene label locus_tag map note number partial phenotype product pseudo standard_name usedin
+misc_recomb     allele citation db_xref evidence gene label locus_tag map note organism partial standard_name usedin
+misc_signal     allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype standard_name usedin
+misc_structure  allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+modified_base   @mod_base allele citation db_xref evidence frequency gene label locus_tag map note usedin
+old_sequence    @citation allele db_xref evidence gene label locus_tag map note partial replace usedin
+operon          @operon allele citation db_xref evidence function label map note phenotype pseudo standard_name usedin
+oriT            allele bound_moiety citation db_xref direction evidence gene label locus_tag map note rpt_family rpt_type rpt_unit standard_name usedin
+polyA_signal    allele citation db_xref evidence gene label locus_tag map note partial usedin
+polyA_site      allele citation db_xref evidence gene label locus_tag map note usedin
+precursor_RNA   allele citation db_xref evidence function gene label locus_tag map note operon partial product standard_name usedin
+prim_transcript allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin
+primer_bind     PCR_conditions allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin
+promoter        allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype pseudo standard_name usedin
+protein_bind    @bound_moiety allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin
+rRNA            allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin
+rep_origin      allele citation db_xref direction evidence gene label locus_tag map note partial standard_name usedin
+repeat_region   allele citation db_xref evidence function gene insertion_seq label locus_tag map note partial rpt_family rpt_type rpt_unit standard_name transposon usedin
+repeat_unit     allele citation db_xref evidence function gene label locus_tag map note partial rpt_family rpt_type rpt_unit usedin
+satellite       allele citation db_xref evidence gene label locus_tag map note partial rpt_family rpt_type rpt_unit standard_name usedin
+scRNA           allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin
+sig_peptide     allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin
+snRNA           allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin
+snoRNA          allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin
+source          @organism cell_line cell_type chloroplast chromoplast chromosome citation clone clone_lib country cultivar cyanelle db_xref dev_stage ecotype environmental_sample evidence focus frequency germline haplotype insertion_seq isolate isolation_source kinetoplast lab_host label macronuclear map mitochondrion mol_type note organelle plasmid pop_variant proviral rearranged segment sequenced_mol serotype serovar sex specific_host specimen_voucher strain sub_clone sub_species sub_strain tissue_lib tissue_type transgenic transposon usedin variety virion
+stem_loop       allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin
+tRNA            allele anticodon citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin
+terminator      allele citation db_xref evidence gene label locus_tag map note operon partial standard_name usedin
+transit_peptide allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin
+unsure          allele citation db_xref evidence gene label locus_tag map note replace usedin
+variation       allele citation db_xref evidence frequency gene label locus_tag map note partial phenotype product replace standard_name usedin
diff --git a/etc/options b/etc/options
new file mode 100644
index 0000000000000000000000000000000000000000..d1929492393492790ca36dd50414663a5059ee90
--- /dev/null
+++ b/etc/options
@@ -0,0 +1,508 @@
+# The standard options file for Artemis
+
+# (Note that comment lines start with a hash (#) symbol)
+
+# $Header: //tmp/pathsoft/artemis/etc/options,v 1.1 2004-06-09 10:02:52 tjc Exp $
+
+# This file should contain option settings that look like this:
+#
+# option_name = option_value
+#
+# If the value of an options is too long to fit on one line it can be split
+# over several lines by ending each line with a backslash like this:
+#
+# option_name = option_value another_option_value \
+#     a_third_option_value a_forth_option_value
+
+
+# This option will set the font size for all the Artemis windows.
+
+font_size = 12
+
+
+# Set the name of the font to use in Artemis.  These possibilites are
+# available on all platforms:
+#   Dialog, DialogInput, Monospaced, Serif, SansSerif, Symbol.
+
+font_name = Monospaced
+
+# This option is used to set the default minimum size (in amino acids)
+# of a "large" open reading frame, which controls which ORFS are
+# marked by the "Mark Open Reading Frames" menu item.
+
+minimum_orf_size = 100
+
+# Set the default value for the direct edit option (see
+# http://www.sanger.ac.uk/Software/Artemis/stable/manual/launch-window.html#LAUNCH-WINDOW-OPTIONS-DIRECT-EDIT
+# for more)
+direct_edit = yes
+
+# This setting controls which set of codons will be used for start codons.
+# This can be changed from the options menu.
+# There are two possible settings: eukaryote or prokaryote
+organism_type = eukaryote
+
+# This option gives the bases of the possible start codons
+eukaryotic_start_codons = atg
+prokaryotic_start_codons = atg gtg ttg
+
+
+# The translation_table option is used to lookup codon translations.  The
+# table must have exactly 64 entries, and there is one entry for each codon.
+# The entries should appear in this order:
+#   TTT, TTC, TTA, TTG,
+#   TCT, TCC, ...,
+#   ...
+
+# this is the default table:
+#
+# translation_table = \
+#     f f l l \
+#     s s s s \
+#     y y # + \
+#     c c * w \
+#             \
+#     l l l l \
+#     p p p p \
+#     h h q q \
+#     r r r r \
+#             \
+#     i i i m \
+#     t t t t \
+#     n n k k \
+#     s s r r \
+#             \
+#     v v v v \
+#     a a a a \
+#     d d e e \
+#     g g g g
+
+# this is the eukaryotic mitochondrial table:
+#
+# translation_table = \
+#     f f l l \
+#     s s s s \
+#     y y * * \
+#     c c w w \
+#             \
+#     l l l l \
+#     p p p p \
+#     h h q q \
+#     r r r r \
+#             \
+#     i i m m \
+#     t t t t \
+#     n n k k \
+#     s s * * \
+#             \
+#     v v v v \
+#     a a a a \
+#     d d e e \
+#     g g g g
+
+
+# the sequence of colour numbers must not have any gaps - if for example
+# colour_5 is missing then all colours with higher numbers will be ignored
+
+# the three numbers for each colour correspond to red, green and blue
+# respectively.  each number is an intensity from 0 to 255
+
+# white
+colour_0 = 255 255 255
+# dark grey
+colour_1 = 100 100 100
+# red
+colour_2 = 255 0 0
+# green
+colour_3 = 0 255 0
+# blue
+colour_4 = 0 0 255
+# cyan
+colour_5 = 0 255 255
+# magenta
+colour_6 = 255 0 255
+# yellow
+colour_7 = 245 245 0
+# pale green
+colour_8 = 152 251 152
+# light sky blue
+colour_9 = 135 206 250
+# orange
+colour_10 = 255 165 0
+# brown
+colour_11 = 200 150 100
+# pink
+colour_12 = 255 200 200
+# light grey
+colour_13 = 170 170 170
+# black
+colour_14 = 0 0 0
+# reds:
+colour_15 = 255  63  63
+colour_16 = 255 127 127
+colour_17 = 255 191 191
+
+colour_of_CDS = 5
+colour_of_cds? = 7
+colour_of_BLASTCDS = 2
+colour_of_BLASTN_HIT = 6
+colour_of_CRUNCH_D = 2
+colour_of_CRUNCH_X = 15
+colour_of_source = 0
+colour_of_prim_tran = 0
+colour_of_stem_loop = 2
+colour_of_misc_feature = 3
+colour_of_misc_RNA = 12
+colour_of_delta = 3
+colour_of_LTR = 4
+colour_of_repeat_region = 9
+colour_of_repeat_unit = 9
+colour_of_terminator = 3
+colour_of_promoter = 3
+colour_of_intron = 1
+colour_of_exon = 7
+colour_of_mRNA = 1
+colour_of_tRNA = 8
+colour_of_TATA = 3
+colour_of_bldA = 2
+colour_of_GFF = 11
+
+colour_of_start_codon = 6
+
+# suffixes used on files that contain features - used in file requesters
+feature_file_suffixes = tab embl gbk genbank tab_embl gff feature feat \
+   art artemis
+
+# suffixes used on files that contain sequence - used in file requesters
+sequence_file_suffixes = embl gbk genbank tab_embl seq dna \
+   art artemis
+
+# this is the URL that contains the IOR of the EMBL server
+embl_ior_url = http://corba.ebi.ac.uk/EMBL/IOR/Embl.IOR
+
+# this is the URL that contains the IOR of the EnsEMBL server
+# ensembl_ior_url = file:///nfs/disk12/kmr/powmap/db.ior
+
+
+# the default height for the base plot window
+base_plot_height = 150
+
+
+# the default height for the feature plot window
+feature_plot_height = 160
+
+
+# if this option is no then the feature labels in the overview will be off at
+# startup (the default is yes)
+# overview_feature_labels = no
+
+
+# if this option is yes then the overview will start in one line per entry
+# mode (the default is no)
+# overview_one_line_per_entry = yes
+
+
+# if this option is "yes" then the feature list will be displayed on startup
+# (this is the default)
+show_list = yes
+
+
+# if this option is "yes" then the base view will be displayed on startup
+# (this is the default)
+show_base_view = yes
+
+
+# if this option is "yes" then the entry buttons will be displayed on
+# startup
+show_entry_buttons = yes
+
+
+# if this option is "yes" then artemis will offer to show the results of a
+# search when it finishes
+show_results = no
+
+
+# if this option is "yes" the "all features on frame lines" option will
+# default to true on start up
+features_on_frame_lines = no
+
+
+# if this option is "yes" the "feature labels" option will
+# default to true on start up
+feature_labels = yes
+
+
+# if this option is "yes" the "one line per entry" option will default to
+# true on start up 
+one_line_per_entry = no
+
+
+# if this option is "yes" Sanger specific menu items and functions will be
+# visible in the display
+sanger_options = no
+
+
+# the full path to the editor used for editing the qualifiers
+#external_editor = emacs
+
+
+# if set to yes, borders will be drawn around each feature and each exon.  if
+# set to no borders will only be drawn around the selected features.
+draw_feature_borders = yes
+
+
+# if set to yes, a direction arrow will be drawn around at the end of each
+# feature.  if set to no, no arrows will be drawn.
+draw_feature_arrows = yes
+
+
+# the number of levels of undo to save or 0 if undo is disabled.  more undo
+# levels will require more memory.
+undo_levels = 20
+
+
+# this list is added to the keys from the feature_keys file
+extra_keys = \
+    BLASTN_HIT CDS_BEFORE CDS_AFTER CDS_before CDS_after \
+    CDS_motif BLASTCDS polymorphism GFF WUBLASTN_HIT \
+    WUBLASTX_HIT BLASTX_HIT TBLASTX_HIT BLASTN_HIT \
+    CRUNCH_D CRUNCH_X fasta_record allele mutation splicesite \
+    TMM signalP
+
+# Names of qualifiers to search when attempting to find the primary or display
+# name of a gene.  These qualifiers names are searched in order when looking
+# for gene names.
+display_name_qualifiers = primary_name synonym systematic_id \
+    temporary_systematic_id gene locus_tag label
+
+# Names of qualifiers to search when attempting to find the systematic name of
+# a gene
+systematic_name_qualifiers = systematic_id temporary_systematic_id \
+     locus_tag gene label
+
+
+# this list is added to the qualifiers from the qualifier_types file
+extra_qualifiers = \
+    CHROMO_LINK text \
+    C_processing "text" \  
+    C_processing_BigPi "text" \
+    C_processing_DGPI "text" \ 
+    COM_NAME "text" \
+    FEAT_NAME text \
+    GO_component "text" \
+    GO_function "text" \
+    GO_process "text" \
+    GO_slim "text" \
+    GO "text" \
+    LOCUS "text"  \
+    PUB_LOCUS text \
+    PUB_COMMENT "text" \
+    REPEAT_TYPE "text" \
+    SNP "text" \
+    algorithm "text" \
+    anchor "text" \ 
+    annotation_source "text" \
+    assembly_id "text" \
+    bb_orthologue "text" \
+    bound_moiety "text" \
+    bpp_orthologue "text" \
+    bp_orthologue "text" \
+    bicsw_file "text" \
+    blast_score text \
+    blast_file "text" \
+    blastn_file "text" \
+    blastp_file "text" \
+    blastp+go_file "text" \
+    blastp_match "text" \
+    blastx_file "text" \
+    cds_id "text" \
+    chloroplast "text" \
+    chromoplast "text" \
+    class "text" \
+    cleavage "text" \
+    cluster "text" \
+    color text \
+    colour text \
+    comment_Cterm "text" \
+    comment_Nterm "text" \
+    confidence_level "text" \
+    coord "text" \
+    contig_id "text" \
+    created "text" \
+    curation "text" \
+    curated_ortholog "text" \
+    cyanelle "text" \
+    domain "text" \
+    end_phase text \
+    exon_id "text" \
+    fasta_file "text" \
+    fasta_match "text" \
+    fastx_file "text" \
+    filename "text" \
+    function "text" \
+    gene "text" \
+    gene_id "text" \
+    gff_feature text \
+    gff_group text \
+    gff_seqname text \
+    gff_source text \
+    go_from_interpro "text" \
+    hp_match "text" \
+    hth_file "text" \
+    id "text" \
+    interaction "text" \
+    interpro "text" \
+    job "text" \
+    label text \
+    literature "text" \
+    manual none \
+    mitochondrion "text" \
+    modified "text" \
+    mutation "text" \
+    obsolete_name "text" \
+    obsolete_product "text" \
+    origid "text" \
+    ortholog "text" \
+    paralog "text" \
+    pepstats_file "text" \
+    percent_id text \
+    pfam_match "text" \
+    previous_systematic_id "text" \
+    primary_name "text" \
+    prosite_match "text" \
+    psu_db_xref "text" \
+    psu_domain "text" \
+    reserved_name "text" \
+    query_id text \
+    score text \
+    sequence_source "text" \
+    sequence_status "text" \
+    sigcleave_file "text" \
+    signal "text" \
+    similarity "text" \
+    smart_file "text" \
+    sptr_display "text" \
+    start_phase text \
+    subject_end text \
+    subject_id text \
+    subject_start text \
+    synonym "text" \
+    synteny "text" \
+    systematic_id "text" \
+    taxon_id "text" \
+    tblastn_file "text" \
+    tblastx_file "text" \
+    tb_orthologue "text" \
+    temporary_systematic_id "text" \
+    tmhelix "text" \
+    transferred_gene "text" \
+    transferred_locus_tag "text" \
+    transferred_note "text" \
+    transferred_primary_name "text" \
+    transferred_product "text" \
+    transferred_synonym "text" \
+    transferred_systematic_id "text" \
+    type "text"
+
+# this is a list of extra qualifiers that are legal but are not displayed in
+# popup menus (such as the one in the feature editor window).  this hack is
+# used by diana.components.QualifierChoice to limit the number of qualifers
+# that are displayed in the popup menu.  on some VMs if there are too many in
+# the popup the bottom ones aren't visible
+invisible_qualifiers = \
+    CHROMO_LINK    \
+    C_processing       \ 
+    C_processing_BigPi \
+    C_processing_DGPI  \
+    COM_NAME       \
+    FEAT_NAME      \
+    LOCUS          \
+    PUB_LOCUS      \
+    PUB_COMMENT    \
+    REPEAT_TYPE    \
+    SNP            \
+    bicsw_file     \
+    blast_file     \
+    blast_score    \
+    blastn_file    \
+    blastp+go_file \
+    blastp_file    \
+    blastx_file    \
+    cds_id         \
+    chloroplast    \
+    chromoplast    \
+    codon          \
+    comment_Cterm  \
+    comment_Nterm  \
+    created        \
+    cyanelle       \
+    end_phase      \
+    exception      \
+    exon_id        \
+    fasta_file     \
+    fasta_match    \
+    gene_id        \
+    gff_feature    \
+    gff_group      \
+    gff_seqname    \
+    gff_source     \
+    go_from_interpro \
+    hp_match       \
+    hth_file       \
+    interpro       \
+    map            \
+    mitochondrion  \
+    modified       \
+    number         \
+    obsolete_gene_name \
+    pepstats_file  \
+    percent_id     \
+    pfam_match     \
+    prosite_match  \
+    psu_domain     \
+    reserved_gene_name \
+    query_id       \
+    sigcleave_file \
+    score          \
+    smart_file     \
+    start_phase    \
+    tblastn_file   \
+    tblastx_file   \
+    temporary_systematic_id \
+    transl_table   \
+    translation    \
+    type           \
+    usedin
+
+
+# These pairs consist of a program name and a parameter string.
+# For blast and fasta the parameter string is the name of the database to
+# search.
+feature_protein_programs = \
+    fasta %L \
+    sigcleave 0 \
+    pepstats - \
+    blastp swall \
+    tblastn embl_other \
+    hth - \
+    smart - \
+    clustalx PROTEIN \
+    jalview -
+
+feature_dna_programs = \
+    tblastx embl_other \
+    blastn embl_other \
+    blastx swall \
+    fastx %L \ 
+    clustalx DNA
+
+application_programs = \
+
+# this is the list of keys that should be displayed by default in the edit
+# window
+common_keys = \
+    allele attenuator CDS conflict exon intron LTR misc_feature misc_RNA mRNA \
+    mutation polyA_signal polyA_site promoter protein_bind RBS repeat_region \
+    repeat_unit rRNA scRNA snRNA source stem_loop STS TATA_signal terminator \
+    tRNA unsure variation -10_signal -35_signal CDS_motif gene \
+    BLASTN_HIT BLASTCDS 3'UTR 5'UTR
diff --git a/etc/pombe.usage b/etc/pombe.usage
new file mode 100644
index 0000000000000000000000000000000000000000..bb7176ed17ae6efc63d8dad9426c19be3e2d4009
--- /dev/null
+++ b/etc/pombe.usage
@@ -0,0 +1,20 @@
+UUU 32.2( 48423)  UCU 30.5( 45913)  UAU 21.8( 32829)  UGU  8.9( 13371)
+UUC 13.0( 19519)  UCC 12.1( 18149)  UAC 11.8( 17721)  UGC  5.6(  8372)
+UUA 26.0( 39138)  UCA 17.9( 26850)  UAA  1.3(  1944)  UGA  0.5(   733)
+UUG 24.0( 36134)  UCG  8.0( 12055)  UAG  0.5(   705)  UGG 10.9( 16364)
+
+CUU 25.3( 38015)  CCU 21.9( 32964)  CAU 16.3( 24577)  CGU 16.3( 24495)
+CUC  7.3( 10922)  CCC  8.4( 12619)  CAC  6.4(  9653)  CGC  6.2(  9316)
+CUA  8.6( 12957)  CCA 12.7( 19075)  CAA 27.3( 41066)  CGA  7.9( 11896)
+CUG  6.3(  9503)  CCG  4.6(  6910)  CAG 10.9( 16457)  CGG  3.0(  4487)
+
+AUU 35.0( 52636)  ACU 22.9( 34419)  AAU 33.9( 51009)  AGU 14.7( 22108)
+AUC 12.6( 19000)  ACC 10.9( 16378)  AAC 17.9( 26895)  AGC  9.2( 13905)
+AUA 13.1( 19726)  ACA 13.9( 20898)  AAA 39.3( 59079)  AGA 11.1( 16742)
+AUG 20.9( 31376)  ACG  6.5(  9744)  AAG 25.2( 37825)  AGG  5.1(  7615)
+
+GUU 29.3( 44015)  GCU 30.2( 45397)  GAU 38.1( 57240)  GGU 22.0( 33101)
+GUC 11.0( 16497)  GCC 11.6( 17518)  GAC 15.8( 23749)  GGC  8.5( 12717)
+GUA 12.3( 18451)  GCA 15.7( 23649)  GAA 44.3( 66550)  GGA 15.7( 23623)
+GUG  8.3( 12422)  GCG  5.3(  8011)  GAG 21.3( 31979)  GGG  4.3(  6497)
+
diff --git a/etc/qualifier_types b/etc/qualifier_types
new file mode 100644
index 0000000000000000000000000000000000000000..f860210db44e7da055fa54019fa9fa3caebeea2b
--- /dev/null
+++ b/etc/qualifier_types
@@ -0,0 +1,110 @@
+# Feature qualifiers for EMBL/GenBank feature tables
+# 
+# From: http://www.ebi.ac.uk/~faruque/art/keyqual.txt
+#
+# valid qualifier types are:
+#         (::)		(text:text,text:text)
+#         EC		"n.n.n.n"
+#         feature		dbname::accno:location
+#         item		single text item
+#         list		one of the listed values
+#         modbase         one of the stored modbase values
+#         none		no value
+#         number		nn
+#         (other)		(text)
+#         location	a valid location range (or feature label)
+#         real		n.n within specified range
+#         ref     	[nn]
+#         text		any text, no quotes added, spaces allowed if quoted
+#         "text"		quoted text, double any contained quotes
+#         "opt"		optional quoted text, double any contained quotes
+#         "list"		quoted text, list of accepted values
+# 
+# if not specified, the default is text (so anything is accepted)
+# 
+# Name           required   Type    Value(s) ..
+allele           no         "text"
+anticodon        yes        (::)    pos aa
+bound_moiety     no         "text"
+cell_line        no         "text"
+cell_type        no         "text"
+chromosome       no         "opt"
+citation         no         ref
+clone            no         "text"
+clone_lib        no         "text"
+codon            no         (::)    seq aa
+codon_start      yes        number  1 3
+cons_splice      yes        (::)    5'site 3'site
+country          no         "text"
+cultivar         no         "text"
+db_xref          no         "text"
+dev_stage        no         "text"
+direction        yes        list    LEFT RIGHT BOTH
+ecotype          no         "text"
+EC_number        no         "text"
+environmental_sample   no   none
+estimated_length no         "text"
+evidence         yes        list    EXPERIMENTAL NOT_EXPERIMENTAL
+exception        no         "text"
+focus            no         none
+frequency        yes        real    0.0  1.0
+function         yes        "text"
+gene             no         "text"
+germline         yes        none
+haplotype        no         "text"
+insertion_seq    no         "text"
+isolation_source no         "text"
+isolate          no         "text"
+kinetoplast      no         "opt"
+label            yes        item
+lab_host         no         "text"
+locus_tag        no         "text"
+macronuclear     no         none
+map              no         "text"
+mod_base         no         modbase
+mol_type         no         "text"
+note             no         "text"
+number           yes        number  1 99999999
+operon           no         "text"
+organell         no         "text"
+organism         yes        "text"
+partial          yes        none
+PCR_conditions   no         "text"
+phenotype        no         "text"
+plasmid          no         "text"
+pop_variant      no         "text"
+product          no         "text"
+protein_id       no         "text"
+proviral         yes        none
+pseudo           yes        none
+rearranged       yes        none
+replace          no         "text"
+rpt_family       no         "text"
+rpt_type         no         list    TANDEM INVERTED FLANKING TERMINAL DIRECT \
+                                    DISPERSED OTHER
+rpt_unit         no         location
+segment          no         "text"
+sequenced_mol    no         "list"  "cDNA" "cDNA to genomic RNA" \
+                                    "cDNA to mRNA" "cDNA to other RNA" \
+                                    "cDNA to rRNA" "DNA" "mRNA" \
+                                    "RNA" "rRNA" "scRNA" "snRNA" "tRNA"
+serotype         no         "text"
+serovar          no         "text"
+sex              no         "text"
+specific_host    no         "text"
+specimen_voucher no         "text"
+standard_name    no         "text"
+strain           no         "text"
+sub_clone        no         "text"
+sub_species      no         "text"
+sub_strain       no         "text"
+tissue_lib       no         "text"  
+tissue_type      no         "text"
+transgenic       no         "text"
+translation      no         "text"
+transl_except    no         (::)    pos aa
+transl_table     no         number  1 11
+transposon       no         "text"
+usedin           no         feature
+variety          no         "text"
+virion           no         none
diff --git a/etc/results_to_netscape b/etc/results_to_netscape
new file mode 100755
index 0000000000000000000000000000000000000000..3de1626a4737efddf073dc2c91c54577dd232e59
--- /dev/null
+++ b/etc/results_to_netscape
@@ -0,0 +1,214 @@
+#!/bin/sh -
+
+# This script will send a file to netscape with database IDs linked to SRS.
+# To customize this script edit the $DATABASES and $SRS_SERVER variable in the
+# perl code below and the NETSCAPE variable at the top of the script.
+
+# To enable this in Artemis, sanger_options must be set to true in the options
+# file.
+
+NETSCAPE=/usr/bin/X11/real-netscape
+
+if [ -f "$DIANA_ENVIRONMENT_FILE" ]
+then
+   . $DIANA_ENVIRONMENT_FILE
+fi
+
+if [ $# = 0 ]
+then
+    echo no argument given 1>&2
+    exit 1
+fi
+
+file_arg=$1
+
+unique_bit=$$.`hostname`
+
+# sanger hack:
+file_arg=`echo $file_arg | sed 's@^/tmp_mnt/nfs/@/nfs/@' | sed 's@^/tmp_mnt/tmp_nfs/@/nfs/@'`
+# fix for pcs3:
+file_arg=`echo $file_arg | sed 's@^/yeastpub4/@/nfs/disk222/yeastpub4/@'`
+
+
+if [ -f ./$file_arg ]
+then
+    # the file is in the current directory - we need the full path so netscape
+    # can find the file
+    new_file=$PWD/$file_arg.$unique_bit.html
+else
+    new_file=$file_arg.$unique_bit.html
+fi
+
+cat <<EOF > $new_file
+<HTML>
+ <HEAD>
+  <TITLE>
+  Results for $file_arg
+ </TITLE>
+ </HEAD>
+ <BODY>
+<PRE>
+EOF
+
+perl -e '
+BEGIN {
+  # change these variable to list the databases to search for the IDs - the
+  # database names should be separated by spaces
+  $PROTEIN_DATABASES = "swall";
+  $DNA_DATABASES = "embl";
+
+  # change this to point to the wgetz script of your SRS server
+  $SRS_SERVER = "www.sanger.ac.uk/srs6bin/cgi-bin/wgetz?-e+";
+
+  $PROTEIN_DATABASES =~ s/ /%20/g;
+  $DNA_DATABASES =~ s/ /%20/g;
+
+  %GENEDB_PATTERNS = (tryp => q!Tb\d+\.\d+\.\d+|TRYP_\S+!,
+                      leish => q!LmjF\d+.\d+!);
+
+  $GENEDB_PATTERN = join ("|", values %GENEDB_PATTERNS);
+
+  $BLAST_START_LINE = "Sequences producing High-scoring Segment Pairs|" .
+    "Sequences producing significant alignments:";
+  $FASTA_START_LINE = "The best scores are";
+
+  # the list of IDs we have seen so far
+  @ids = ();
+
+  # the list of IDs we have made anchors for so far
+  @anchored_ids = ();
+
+  $db_type = "unknown";
+}
+
+sub hyperlink_to_anchor
+{
+  $id = shift;
+  qq(<a href="#$id">$id</a>);
+}
+
+sub hyperlink_id
+{
+  $id = shift;
+
+  if ($db_type eq "dna") {
+    $r = qq#<a href="http://$SRS_SERVER\[\{$DNA_DATABASES\}-ID:$id*]|[\{$DNA_DATABASES\}-AccNumber:$id*]">$id</a>#;
+  } else {
+    for my $org (keys %GENEDB_PATTERNS) {
+      my $pattern = $GENEDB_PATTERNS{$org};
+
+      if ($id =~ /$pattern/) {
+        $r = qq#<a href="http://www.genedb.org/genedb/Search?organism=$org&name=$id">$id</a>#;
+        return $r
+      }
+    }
+
+    $r = qq#<a href="http://$SRS_SERVER\[\{$PROTEIN_DATABASES\}-ID:$id*]|[\{$PROTEIN_DATABASES\}-AccNumber:$id*]">$id</a>#;
+  }
+  return $r
+}
+
+$file_name = $ARGV[0];
+
+if ($file_name =~ /\.gz$/) {
+  open IN_FILE, "gzip -d < $file_name |" or die "failed to open $file_name\n";
+} else {
+  open IN_FILE, "$file_name" or die "failed to open $file_name\n";
+}
+
+while (<IN_FILE>) {
+  if ($. == 1) {
+    if (/^\s*([^\s]+)/) {
+      if (lc $1 eq "blastn" or lc $1 eq "tblastn" or lc $1 eq "tblastx") {
+        $db_type = "dna";
+      } else {
+        if (lc $1 eq "fasta" or lc $1 eq "blastp" or lc $1 eq "blastx") {
+          $db_type = "protein";
+        } else {
+          print "\nWARNING: could not identify file type: $1\n";
+        }
+      }
+    } else {
+      print "\nWARNING: could not identify file type\n";
+    }
+  }
+
+
+  # ignore header lines
+  if (1..m/$BLAST_START_LINE|$FASTA_START_LINE/) {
+    print;
+    next;
+  }
+
+  if (@ids && /^\s*$/) {
+    $summary_finished = 1;
+  }
+
+  if (/^(?:(?:>?>?(?:[A-Z]+:)?)(\w+)|($GENEDB_PATTERN)) /) {
+    $id = $1;
+
+    if (!defined $id) {
+      $id = $2;
+    }
+
+    if ($summary_finished) {
+      if ((grep {$_ eq $id} @ids) && (!grep {$_ eq $id} @anchored_ids)) {
+        # not anchored yet so make it an anchor
+        if (s/\b$id\b/"<a name=\"$id\">" . (hyperlink_id($id)) . "<\/a>"/e) {
+          push @anchored_ids, $id;
+        }
+      }
+    } else {
+      if (!grep {$_ eq $id} @ids) {
+        push @ids, $id;
+      }
+
+      s/$id/hyperlink_to_anchor($id)/ei;
+
+      if (!s/ $id/" " . hyperlink_id($id)/ei) {
+        # if the id occurs once in the line put a link at end of line
+        s/$/"  LINK:" . hyperlink_id($id)/e;
+      }
+    }
+  }
+  print;
+}
+
+' $file_arg >> $new_file
+
+cat <<EOF >> $new_file;
+</PRE>
+  </BODY>
+</HTML>
+EOF
+
+# delete it at some point
+echo "rm -f $new_file > /dev/null 2>&1" | at now + 36 hours
+
+if $NETSCAPE -remote "openURL($new_file)"
+then
+    exit 0
+else
+    echo starting new netscape 2>&1
+    # netscape isn't running - so start it
+    ($NETSCAPE &)&
+
+    # now send the URL.  we do things this way so that the script doesn't exit
+    # until netscape has successfully shown the URL
+
+    sleep 1
+
+    # don't exit the script until the file is successfully displayed or until
+    # 40 seconds is up
+    for i in 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20
+    do
+        if $NETSCAPE -remote "openURL($new_file)" 2> /dev/null
+        then
+            exit 0
+        else
+            sleep 2
+        fi
+    done
+
+    exit 1
+fi
diff --git a/etc/run_blastn b/etc/run_blastn
new file mode 100755
index 0000000000000000000000000000000000000000..ef5297bd16b83b8b4ede61a949641a40220bffa2
--- /dev/null
+++ b/etc/run_blastn
@@ -0,0 +1,87 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastn,v 1.1 2004-06-09 10:02:58 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database
+        echo    or: $0 file_of_filenames database
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+    EXEC=blastall
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to"
+    echo "$OUTPUT_FILE using database $DATABASE"
+
+
+    EXTRA_ARGS=
+
+    # add/change the flags to suit your site:
+    lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastn \
+      $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_blastp b/etc/run_blastp
new file mode 100755
index 0000000000000000000000000000000000000000..2ac573c1b1c306ed2a4cdc9d2535dde5f0040e93
--- /dev/null
+++ b/etc/run_blastp
@@ -0,0 +1,88 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastp,v 1.1 2004-06-09 10:02:59 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database
+        echo    or: $0 file_of_filenames database
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+    EXEC=blastall
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to"
+    echo "$OUTPUT_FILE using database $DATABASE"
+
+
+    EXTRA_ARGS=
+
+    # add/change the flags to suit your site:
+    lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v \
+      blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastp \
+      $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_blastx b/etc/run_blastx
new file mode 100755
index 0000000000000000000000000000000000000000..21c88d11b21760719b8286077f5c09b37e609cc2
--- /dev/null
+++ b/etc/run_blastx
@@ -0,0 +1,87 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastx,v 1.1 2004-06-09 10:03:00 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database
+        echo    or: $0 file_of_filenames database
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+    EXEC=blastall
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to"
+    echo "$OUTPUT_FILE using database $DATABASE"
+
+
+    EXTRA_ARGS=
+
+    # add/change the flags to suit your site:
+    lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastx \
+      $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_clustalx b/etc/run_clustalx
new file mode 100755
index 0000000000000000000000000000000000000000..1e40a7c0eb91ff028d1ddea7640514d4dfcfd29e
--- /dev/null
+++ b/etc/run_clustalx
@@ -0,0 +1,41 @@
+#!/bin/sh -
+
+# this script will run clustalx on a temporary file containing the concatenated
+# contents of files listed in a file of filenames
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_clustalx,v 1.1 2004-06-09 10:03:01 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# != 1 ]
+then
+    echo usage: $0 file_of_filenames
+fi
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+file_of_filenames=$1
+date=`date +"%y_%m_%d"`
+hostname=`hostname`
+temp_file_name=/tmp/artemis_temp.$$.$hostname.$date.clustalx_input.fasta
+
+cat $file_of_filenames | xargs cat > $temp_file_name
+
+# make sure that the identifiers are unique for clustalx
+perl -pne 'if (/^>(\S+)/) {
+  $name = $1;
+  if (exists $h{$name}) {
+    $i = $h{$name}++;
+    s/^>(\S+)/>$name.$i/;
+  } else {
+    $h{$name} = 0;
+  }
+}' $temp_file_name > $temp_file_name.processed
+
+clustalx $temp_file_name.processed
+
+exit 0
diff --git a/etc/run_fasta b/etc/run_fasta
new file mode 100755
index 0000000000000000000000000000000000000000..b46d0dd56bd147e660d98957c0c9828a80ed4609
--- /dev/null
+++ b/etc/run_fasta
@@ -0,0 +1,90 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fasta,v 1.1 2004-06-09 10:03:03 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database 1>&2
+        echo    or: $0 file_of_filenames database 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+
+    FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS
+    EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fasta33
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $DATABASE" 1>&2
+
+    # add/change the flags to suit your site:
+    COMMAND="$EXEC -B -S -q -b 100 -H $INPUT_FILE $DATABASE ktup 2"
+
+    echo "command line: $COMMAND" 1>&2
+
+#    lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v $COMMAND 2>&1 > $OUTPUT_FILE | 
+     bsub -q longblastq -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -I $COMMAND 2>&1 > $OUTPUT_FILE |
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_fasta_orig b/etc/run_fasta_orig
new file mode 100755
index 0000000000000000000000000000000000000000..63c87b3e35c5363d8e246a3bd14694a62e332c94
--- /dev/null
+++ b/etc/run_fasta_orig
@@ -0,0 +1,90 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fasta_orig,v 1.1 2004-06-09 10:03:04 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database 1>&2
+        echo    or: $0 file_of_filenames database 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+
+    FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS
+    EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fasta33
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $DATABASE" 1>&2
+
+    # add/change the flags to suit your site:
+    COMMAND="$EXEC -B -S -q -b 40 -H $INPUT_FILE $DATABASE ktup 2"
+
+    echo "command line: $COMMAND" 1>&2
+
+    lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v \
+      $COMMAND 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_fastx b/etc/run_fastx
new file mode 100644
index 0000000000000000000000000000000000000000..b04a259a909a3921f654e2340fb6a1e14d5110f8
--- /dev/null
+++ b/etc/run_fastx
@@ -0,0 +1,89 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fastx,v 1.1 2004-06-09 10:03:05 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database 1>&2
+        echo    or: $0 file_of_filenames database 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+
+    FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS
+    EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fastx33_t
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $DATABASE" 1>&2
+
+    # add/change the flags to suit your site:
+    COMMAND="$EXEC -B -S -q -b 40 -H $INPUT_FILE $DATABASE ktup 2"
+
+    echo "command line: $COMMAND" 1>&2
+
+    $COMMAND 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_hth b/etc/run_hth
new file mode 100755
index 0000000000000000000000000000000000000000..a61aeca54b06f0a1bfae60d7fb8fa82e38639e69
--- /dev/null
+++ b/etc/run_hth
@@ -0,0 +1,148 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_hth,v 1.1 2004-06-09 10:03:06 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    PARAMETERS=$3 export PARAMETERS
+else
+    if [ $# = 2 ]
+    then
+        PARAMETERS=$2 export PARAMETERS
+    else
+        echo usage: $0 -onefile input_file output_file parameters 1>&2
+        echo    or: $0 file_of_filenames parameters 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_PARAMETERS=`echo "echo $PARAMETERS" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    PARAMETERS=$3
+
+
+    ### change these lines:
+    EXEC=helixturnhelix
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $PARAMETERS" 1>&2
+    echo "command line: $EXEC $PARAMETERS $INPUT_FILE" 1>&2
+
+    $EXEC $INPUT_FILE $OUTPUT_FILE $PARAMETERS 2> hth_errors.new
+
+    # add/change the flags to suit your site:
+    $EXEC $INPUT_FILE -outfile $OUTPUT_FILE $PARAMETERS 2>&1 | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_PARAMETERS
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_PARAMETERS
+fi
+
+if [ x$ONEFILE = x ]
+then
+    PEPFILES=`cat $1`
+else
+    PEPFILES=$1
+fi
+
+if [ -e hth/hth.tab ]
+then
+    mv -f hth/hth.tab hth/hth.tab.old
+fi
+
+for i in $PEPFILES
+do
+# write a tab file containing a feature for each hth
+perl -e '
+open PEPFILE, "$ARGV[0]" or die "$0: cannot open $ARGV[0]\n";
+
+my $first_line = <PEPFILE>;
+
+close PEPFILE;
+
+if ($first_line !~ m/^>(.*?), (.*) (\d+):(\d+)\s+(\S+)/) {
+  die "first line of $ARGV[0] is badly formatted\n";
+}
+
+my ($gene_name, $description, $pep_first_base,
+    $pep_last_base, $forward_or_back) = ($1, $2, $3, $4, $5);
+
+open HTHFILE, "$ARGV[1]" or die "$0: cannot open $ARGV[1]\n";
+
+my $score;
+my $first_match_base;
+
+while (<HTHFILE>) {
+  if (m/^Score (\d+) .* in .* at residue (\d+)/) {
+    $score = $1;
+    $first_match_base = $2;
+  }
+
+  if (m/^\s+Sequence:\s+(\S+)/ && 
+      defined ($score) && defined ($pep_first_base)) {
+    if ($forward_or_back eq "forward") {
+      my $start_base = $pep_first_base + ($first_match_base - 1) * 3;
+      my $end_base = $start_base + (length $1) * 3 - 1;
+      print <<EOF;
+FT   CDS_motif       $start_base..$end_base
+FT                   /note="Helix-turn-helix from $gene_name score $score"
+FT                   /label=hth
+EOF
+    } else {
+      my $end_base = $pep_last_base - ($first_match_base - 1) * 3;
+      my $start_base = $end_base - ((length $1) * 3 - 1);
+      print <<EOF;
+FT   CDS_motif       complement($start_base..$end_base)
+FT                   /note="Helix-turn-helix from $gene_name score $score"
+FT                   /label=hth
+EOF
+    }
+  }
+}
+' $i $i.out >> hth/hth.tab
+
+done
+
+exit 0
diff --git a/etc/run_jalview b/etc/run_jalview
new file mode 100755
index 0000000000000000000000000000000000000000..bf214db58819f454661629c01ba0889c5e46bdb9
--- /dev/null
+++ b/etc/run_jalview
@@ -0,0 +1,51 @@
+#!/bin/sh -
+
+# This script needs one argument - a file of file names.
+
+PERL_PROG='
+
+use strict;
+
+if (@ARGV < 1)
+{ 
+  die "$0 needs one argument - a file of sequence file names\n";
+}
+
+my $file = $ARGV[0];
+
+chomp $file;
+
+if (-e $file)
+{
+  my $msf_file = "$file.fasta_msf";   
+
+  my $seqnum = 1;
+  open(LIST_FILE,$file);
+  while(my $line = <LIST_FILE>)
+  {
+    chomp($line);
+
+    #
+    # run descseq to ensure unique names
+    #
+    my $emboss_command_line = "descseq -append -name _$seqnum $line $line.new -auto";
+
+    open EMBOSS, "|$emboss_command_line" or
+              die "cannot open pipe to descseq: $!\n";
+    close EMBOSS;
+
+    unlink("$line");
+    rename("$line.new","$line");
+    $seqnum++;
+  }
+
+  my $emboss_command_line = "emma \"\@$file\" -filter -stdout -osf msf  -dendoutfile /dev/null -outseq $msf_file";
+
+  open EMBOSS, "|$emboss_command_line" or
+            die "cannot open pipe to emma: $!\n";
+  close EMBOSS;
+  system "jalview", "$msf_file";
+}
+'
+
+perl -w -e "$PERL_PROG" "$@" 
diff --git a/etc/run_jalview.orig b/etc/run_jalview.orig
new file mode 100755
index 0000000000000000000000000000000000000000..03e6e537b15854ad412609f5fcd3411adcedadc6
--- /dev/null
+++ b/etc/run_jalview.orig
@@ -0,0 +1,167 @@
+#!/bin/sh -
+
+# This script needs one argument - a file of file names.
+# Each name should refer to a file that contains a EMBL format feature.
+# The feature must have a /fasta_file= qualifier which is used to read the
+# FASTA search results for the feature and to find the protein sequence of the
+# feature.  The sequence and the sequence of the FASTA hits will be passed to
+# jalview.
+
+PERL_PROG='
+
+use strict;
+
+if (@ARGV != 1) {
+  die "$0 needs one argument - a file of feature file names\n";
+}
+
+
+sub process_fasta
+{
+  my $feature_file = shift;
+  my $fasta_results_file = shift;
+
+  my $sequence_file;
+
+  if ($fasta_results_file =~ /(.*).out/) {
+    $sequence_file = $1;
+  } else {
+    die "cannot understand $fasta_results_file\n";
+  }
+
+  if (! -e $sequence_file) {
+    die "cannot find $sequence_file\n";
+  }
+
+  my $fasta_seq_for_alignment = "";
+
+  open SEQ_FILE, $sequence_file or die "cannot open $sequence_file: $!\n";
+
+  while (<SEQ_FILE>) {
+    $fasta_seq_for_alignment .= $_;
+  }
+
+  close SEQ_FILE;
+
+  if (-e $fasta_results_file) {
+    open FASTA_OUTPUT, $fasta_results_file
+      or die "cannot open $fasta_results_file: $!\n";
+  } else {
+    my $gzip_fasta_results_file = $fasta_results_file . ".gz";
+    if (-e $gzip_fasta_results_file) {
+      open FASTA_OUTPUT, "gzip -d < $gzip_fasta_results_file |"
+        or die "cannot open $gzip_fasta_results_file: $!\n";
+    } else {
+      die "cannot find $fasta_results_file or $gzip_fasta_results_file\n";
+    }
+  }
+
+
+  my $top_re = "^The best scores are:";
+
+  my $seen_top = 0;
+  my $seen_bottom = 0;
+
+  my @protein_ids = ();
+
+  while (<FASTA_OUTPUT>) {
+    if (/$top_re/) {
+      $seen_top = 1;
+      next;
+    }
+
+    if ($seen_top && /^\s*$/) {
+      $seen_bottom = 1;
+      next;
+    }
+
+    if ($seen_top && !$seen_bottom) {
+      if (/^(\S+)/) {
+        if (@protein_ids < 20) {
+          push @protein_ids, "$1"
+        } else {
+          last;
+        }
+      } else {
+        warn "cannot understand this line:\n$_\n";
+      }
+    }
+  }
+
+  my %hash = ();
+
+  @hash{@protein_ids} = (1) x @protein_ids;
+
+  @protein_ids = sort keys %hash;
+
+  my $protein_db = "swall";
+
+  # look for each of the IDs from the FASTA output in each of the DBs
+
+  for my $id (@protein_ids) {
+    my $fetch = "getz -sf fasta -f seq [swall-id:$id]";
+
+    my $temp_seq = "";
+
+    open FETCH, "$fetch |" or
+      die "cannot open pipe to $fetch: $!\n";
+
+    while (<FETCH>) {
+      $temp_seq .= $_;
+    }
+
+    close FETCH;
+
+    if ($? == 0) {
+      $fasta_seq_for_alignment .= $temp_seq;
+    } else {
+      print STDERR "$id was not found in $protein_db\n";
+    }
+  }
+
+  my $msf_file = "$feature_file.fasta_msf";
+
+  my $emboss_prog = "emma";
+
+  my $emboss_command_line = "$emboss_prog -filter -stdout -osf msf  -dendoutfile /dev/null > $msf_file";
+
+  open EMBOSS, "|$emboss_command_line" or
+     die "cannot open pipe to $emboss_prog: $!\n";
+
+  print EMBOSS $fasta_seq_for_alignment;
+
+  close EMBOSS;
+
+  my $jalview_prog = "jalview";
+
+  print STDERR "\nstarting $jalview_prog:\n";
+
+  system "$jalview_prog", "$msf_file";
+}
+
+
+my $file;
+
+while (defined ($file = <>)) {
+  chomp $file;
+
+  if (-e $file) {
+    open IN_FILE, "$file\n" or die "cannot open $file\n";
+
+    my $line;
+
+    while (defined ($line = <IN_FILE>)) {
+      if ($line  =~ m!/fasta_file="(.*)"!) {
+        my $fasta_results_file = $1;
+
+        process_fasta $file, $fasta_results_file;
+
+        last;
+      }
+    }
+
+    close IN_FILE;
+  }
+}'
+
+perl -w -e "$PERL_PROG" "$@"
diff --git a/etc/run_pepstats b/etc/run_pepstats
new file mode 100755
index 0000000000000000000000000000000000000000..22239de3a9161d69056b9ff7f1f016320a25ea24
--- /dev/null
+++ b/etc/run_pepstats
@@ -0,0 +1,77 @@
+#!/bin/sh -
+
+# this script will run pepstats on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_pepstats,v 1.1 2004-06-09 10:03:10 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    PARAMETERS=$3 export PARAMETERS
+else
+    if [ $# = 2 ]
+    then
+        PARAMETERS=$2 export PARAMETERS
+    else
+        echo usage: $0 -onefile input_file output_file parameters 1>&2
+        echo    or: $0 file_of_filenames parameters 1>&2
+        exit 1
+    fi
+fi
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+
+    ### change these lines:
+    EXEC=pepstats
+
+    COMMAND_LINE="$EXEC -filter $INPUT_FILE"
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using parameters: $PARAMETERS" 1>&2
+    echo "command line: $COMMAND_LINE" 1>&2
+
+    # add/change the flags to suit your site:
+    (head -1 $INPUT_FILE | sed 's/^>//'; echo;
+     $COMMAND_LINE) 2>&1 > $OUTPUT_FILE | tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out
+    done
+
+else
+    run_one_prog $1 $2
+fi
+
+exit 0
diff --git a/etc/run_sigcleave b/etc/run_sigcleave
new file mode 100755
index 0000000000000000000000000000000000000000..a8a0733679b7fe49ba086b07242c3d84c3f572ab
--- /dev/null
+++ b/etc/run_sigcleave
@@ -0,0 +1,78 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_sigcleave,v 1.1 2004-06-09 10:03:11 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    MINWEIGHT=$3
+else
+    if [ $# = 2 ]
+    then
+        MINWEIGHT=$2
+    else
+        echo usage: $0 -onefile input_file output_file minimum_weight 1>&2
+        echo    or: $0 file_of_filenames minimum_weight 1>&2
+        exit 1
+    fi
+fi
+
+PARAMETERS="-minweight $MINWEIGHT"
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    PARAMETERS="$3 $4 $5 $6 $7 $8 $9"
+
+    ### change these lines:
+    EXEC=sigcleave
+
+    COMMAND_LINE="$EXEC $INPUT_FILE -outfile $OUTPUT_FILE $PARAMETERS"
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using parameters: $PARAMETERS" 1>&2
+    echo "command line: $COMMAND_LINE" 1>&2
+
+    # add/change the flags to suit your site:
+    $COMMAND_LINE 2>&1 | tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $PARAMETERS
+    done
+
+else
+    run_one_prog $1 $2 $PARAMETERS
+fi
+
+exit 0
diff --git a/etc/run_smart b/etc/run_smart
new file mode 100755
index 0000000000000000000000000000000000000000..cc9ffb592854a0434a771208eeeebb5a47d4730c
--- /dev/null
+++ b/etc/run_smart
@@ -0,0 +1,95 @@
+#!/bin/sh -
+
+# this script will run SMART (http://smart.embl-heidelberg.de/) for an
+# sequence input file or on each file in a file of filenames.  it uses
+# lynx to access send a query to the SMART web site and then writes
+# the output to a file in the same way as run_fasta and run_blastp.
+# see:
+#   http://www.sanger.ac.uk/Software/Artemis/stable/manual/runmenu.html#RUNMENU-CONFIGURATION
+# for more details.
+
+# you will need the "GET" command from the perl LWP module to use this script
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_smart,v 1.1 2004-06-09 10:03:12 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 3 -a x$1 = x-onefile -o $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+else
+    if [ $# != 2 -a $# = != 1 ]
+    then
+        echo usage: $0 -onefile input_file output_file 1>&2
+        echo    or: $0 file_of_filenames 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_PARAMETERS=`echo "echo $PARAMETERS" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    PARAMETERS=$3
+
+    # remove the rubbish from the FASTA header and change the sequence
+    # into URL form
+    SEQUENCE=`perl -pne 'chomp; s/^>.*/>sequence/; s/ /\%20/g; $_ .= "%0D"' $INPUT_FILE`
+
+    SEQUENCE=`echo $SEQUENCE | sed 's/%0D$//'`
+
+    URL='http://smart.embl-heidelberg.de/smart/show_motifs.pl?INCLUDE_SIGNALP=INCLUDE_SIGNALP&DO_PROSPERO=DO_PROSPERO&DO_PFAM=DO_PFAM&SEQUENCE='"$SEQUENCE"
+
+    ### change these lines:
+    EXEC=lynx
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE" 1>&2
+
+    COMMAND="$EXEC -force_html -dump $URL"
+
+    echo "command line: $COMMAND" 1>&2
+
+    (echo "read from $URL"; echo) > $OUTPUT_FILE
+
+    $COMMAND 2>&1 >> $OUTPUT_FILE |
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo;
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_PARAMETERS
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_PARAMETERS
+fi
+
+exit 0
diff --git a/etc/run_tblastn b/etc/run_tblastn
new file mode 100755
index 0000000000000000000000000000000000000000..321853d7ae9d0b274976722d5cc4fb948c9091f2
--- /dev/null
+++ b/etc/run_tblastn
@@ -0,0 +1,88 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_tblastn,v 1.1 2004-06-09 10:03:13 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database 1>&2
+        echo    or: $0 file_of_filenames database 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+    EXEC=blastall
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $DATABASE" 1>&2
+    echo "command line: $EXEC $DATABASE $INPUT_FILE" 1>&2
+
+
+    EXTRA_ARGS=
+
+    # add/change the flags to suit your site:
+    lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p tblastn \
+      $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0
diff --git a/etc/run_tblastx b/etc/run_tblastx
new file mode 100755
index 0000000000000000000000000000000000000000..92fd500f014c721ff5aeebaa24e3e7caaa7c7713
--- /dev/null
+++ b/etc/run_tblastx
@@ -0,0 +1,87 @@
+#!/bin/sh -
+
+# this script will run a search program on a sequence input file or on each
+# file in a file of filenames
+
+# to customise this script see the function called run_one_prog below
+
+
+RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_tblastx,v 1.1 2004-06-09 10:03:14 tjc Exp $"
+
+PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'`
+
+
+if [ $# = 4 -a x$1 = x-onefile ]
+then
+    shift
+    ONEFILE=t
+    DATABASE=$3 export DATABASE
+else
+    if [ $# = 2 ]
+    then
+        DATABASE=$2 export DATABASE
+    else
+        echo usage: $0 -onefile input_file output_file database 1>&2
+        echo    or: $0 file_of_filenames database 1>&2
+        exit 1
+    fi
+fi
+
+
+# expand any ~ or environment variables
+EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f`
+
+
+### change this function to suit your site:
+
+run_one_prog () {
+    INPUT_FILE=$1
+    OUTPUT_FILE=$2
+    DATABASE=$3
+
+
+    ### change these lines:
+    EXEC=blastall
+
+    echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2
+    echo "$OUTPUT_FILE using database $DATABASE" 1>&2
+
+
+    EXTRA_ARGS=
+
+    # add/change the flags to suit your site:
+    lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p tblastx \
+      $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | 
+      tee ${PROG}_errors.new 1>&2
+
+    #### end of changes
+
+
+    # Artemis can read compressed files
+    gzip -9 $OUTPUT_FILE &
+
+    if [ -s ${PROG}_errors.new ]
+    then
+        ( echo ERROR running $PROG: ; echo; 
+          echo ===================================================
+          cat ${PROG}_errors.new ) >> $OUTPUT_FILE
+        cat ${PROG}_errors.new >> ${PROG}_errors
+    fi
+}
+
+(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill
+
+chmod a+x $PROG.kill
+
+if [ x$ONEFILE = x ]
+then
+    for i in `cat $1`
+    do
+        run_one_prog $i $i.out $EXPANDED_DATABASE
+    done
+
+else
+    run_one_prog $1 $2 $EXPANDED_DATABASE
+fi
+
+exit 0