From 528a70f1a695b681702ee440b4232edea58e84dc Mon Sep 17 00:00:00 2001 From: tjc <tjc@ee4ac58c-ac51-4696-9907-e4b3aa274f04> Date: Wed, 9 Jun 2004 10:03:14 +0000 Subject: [PATCH] java2 version git-svn-id: svn+ssh://svn.internal.sanger.ac.uk/repos/svn/pathsoft/artemis/trunk@1637 ee4ac58c-ac51-4696-9907-e4b3aa274f04 --- etc/af063097.embl | 1903 +++++++++++++++++++++++++++++++++ etc/af063097.fasta | 561 ++++++++++ etc/af063097_v_b132222.crunch | 199 ++++ etc/b132222.embl | 1512 ++++++++++++++++++++++++++ etc/b132222.fasta | 512 +++++++++ etc/c1215.blastn.crunch | 126 +++ etc/c1215.blastn.tab | 630 +++++++++++ etc/c1215.embl | 258 +++++ etc/c1215.genbank | 277 +++++ etc/c1215.seq | 110 ++ etc/feature_keys | 72 ++ etc/options | 508 +++++++++ etc/pombe.usage | 20 + etc/qualifier_types | 110 ++ etc/results_to_netscape | 214 ++++ etc/run_blastn | 87 ++ etc/run_blastp | 88 ++ etc/run_blastx | 87 ++ etc/run_clustalx | 41 + etc/run_fasta | 90 ++ etc/run_fasta_orig | 90 ++ etc/run_fastx | 89 ++ etc/run_hth | 148 +++ etc/run_jalview | 51 + etc/run_jalview.orig | 167 +++ etc/run_pepstats | 77 ++ etc/run_sigcleave | 78 ++ etc/run_smart | 95 ++ etc/run_tblastn | 88 ++ etc/run_tblastx | 87 ++ 30 files changed, 8375 insertions(+) create mode 100644 etc/af063097.embl create mode 100644 etc/af063097.fasta create mode 100644 etc/af063097_v_b132222.crunch create mode 100644 etc/b132222.embl create mode 100644 etc/b132222.fasta create mode 100644 etc/c1215.blastn.crunch create mode 100644 etc/c1215.blastn.tab create mode 100644 etc/c1215.embl create mode 100644 etc/c1215.genbank create mode 100644 etc/c1215.seq create mode 100644 etc/feature_keys create mode 100644 etc/options create mode 100644 etc/pombe.usage create mode 100644 etc/qualifier_types create mode 100755 etc/results_to_netscape create mode 100755 etc/run_blastn create mode 100755 etc/run_blastp create mode 100755 etc/run_blastx create mode 100755 etc/run_clustalx create mode 100755 etc/run_fasta create mode 100755 etc/run_fasta_orig create mode 100644 etc/run_fastx create mode 100755 etc/run_hth create mode 100755 etc/run_jalview create mode 100755 etc/run_jalview.orig create mode 100755 etc/run_pepstats create mode 100755 etc/run_sigcleave create mode 100755 etc/run_smart create mode 100755 etc/run_tblastn create mode 100755 etc/run_tblastx diff --git a/etc/af063097.embl b/etc/af063097.embl new file mode 100644 index 000000000..99cf9f44a --- /dev/null +++ b/etc/af063097.embl @@ -0,0 +1,1903 @@ +ID AF063097 standard; DNA; PHG; 33593 BP. +XX +AC AF063097; J02474; L29304; M12772; M13202; M27131; M27836; M34756; M58023; +AC M59752; M64677; U02597; X02300; X02301; X05655; X61229; X87173; X99627; +AC X99628; Z11483; +XX +SV AF063097.1 +XX +DT 21-MAY-1998 (Rel. 55, Created) +DT 07-JAN-1999 (Rel. 58, Last updated, Version 2) +XX +DE Bacteriophage P2, complete genome. +XX +KW . +XX +OS Enterobacteria phage P2 +OC Viruses; dsDNA viruses, no RNA stage; Caudovirales; Myoviridae; +OC P2-like Viruses. +XX +RN [1] +RP 1-9, 33582-33593 +RX MEDLINE; 73220701. +RA Murray K., Murray N.E.; +RT "Terminal nucleotide sequences of DNA from temperate coliphages"; +RL Nature New Biol. 243(126):134-139(1973). +XX +RN [2] +RP 1-26, 33568-33593 +RX MEDLINE; 77209985. +RA Murray K., Isaksson-Forsen A.G., Challberg M., Englund P.T.; +RT "Symmetrical nucleotide sequences in the recognition sites for the ter +RT function of bacteriophages P2, 299 and 186"; +RL J. Mol. Biol. 112(3):471-489(1977). +XX +RN [3] +RP 1-26, 33568-33593 +RX MEDLINE; 82051282. +RA Lindqvist B.H.; +RT "Recombination between satellite phage P4 and its helper P2. I. In vivo and +RT in vitro construction of P4: :P2 hybrid satellite phage"; +RL Gene 14(4):231-241(1981). +XX +RN [4] +RP 2929-3589 +RX MEDLINE; 83268689. +RA Christie G.E., Calendar R.; +RT "Bacteriophage P2 late promoters. Transcription initiation sites for two +RT late mRNAs"; +RL J. Mol. Biol. 167(4):773-790(1983). +XX +RN [5] +RP 25456-25995 +RX MEDLINE; 84248044. +RA Ljungquist E., Kockum K., Bertani E.L.; +RT "DNA sequence of the repressor gene and operator region of bacteriophage +RT P2"; +RL Proc. Natl. Acad. Sci. U.S.A. 81:3988-3992(1984). +XX +RN [6] +RP 10188-10518, 17510-17996 +RX MEDLINE; 85160858. +RA Christie G.E., Calender R.; +RT "Bacteriophage P2 late promoters - comparison of the four late promoter +RT sequences"; +RL J. Mol. Biol. 181:373-382(1985). +XX +RN [7] +RP 23909-24339 +RX MEDLINE; 86281704. +RA Birkeland N.K., Lindquist B.H.; +RT "Coliphage P2 late control gene ogr. DNA sequence and product +RT identification"; +RL J. Mol. Biol. 188(3):487-490(1986). +XX +RN [8] +RP 23889-24333 +RX MEDLINE; 86205872. +RA Christie G.E., Haggard-Ljungquist E., Feiwell R., Calendar R.; +RT "Regulation of bacteriophage P2 late-gene expression: the ogr gene"; +RL Proc. Natl. Acad. Sci. U.S.A. 83(10):3238-3242(1986). +XX +RN [9] +RP 25849-27048 +RX MEDLINE; 87286423. +RA Haggard-Ljungquist E., Kockum K., Bertani L.E.; +RT "DNA sequences of bacteriophage P2 early genes cox and B and their +RT regulatory sites"; +RL Mol. Gen. Genet. 208(1-2):52-56(1987). +XX +RN [10] +RP 25849-27048 +RX MEDLINE; 88082694. +RA Saha S., Haggard-Ljungquist E., Nordstrom K.; +RT "The cox protein of bacteriophage P2 inhibits the formation of the +RT repressor protein and autoregulates the early operon"; +RL EMBO J. 6(10):3191-3199(1987). +XX +RN [11] +RP 24252-25595 +RX MEDLINE; 90006769. +RA Yu A., Bertani L.E., Haggard-Ljungquist E.; +RT "Control of prophage integration and excision in bacteriophage P2: +RT nucleotide sequences of the int gene and att sites"; +RL Gene 80(1):1-11(1989). +XX +RN [12] +RP 31590-33593 +RX MEDLINE; 90152373. +RA Haggard-Ljungquist E., Barreiro V., Calendar R., Kurnit D.M., Cheng H.; +RT "The P2 phage old gene: sequence, transcription and translational control"; +RL Gene 85(1):25-33(1989). +XX +RN [13] +RP 1-266, 33200-33593 +RX MEDLINE; 91092507. +RA Ziermann R., Calendar R.; +RT "Characterization of the cos sites of bacteriophages P2 and P4"; +RL Gene 96(1):9-15(1990). +XX +RN [14] +RP 17627-19373 +RX MEDLINE; 91135001. +RA Temple L.M., Forsburg S.L., Calendar R., Christie G.E.; +RT "Nucleotide sequence of the genes encoding the major tail sheath and tail +RT tube proteins of bacteriophage P2"; +RL Virology 181(1):353-358(1991). +XX +RN [15] +RP 4050-5178 +RX MEDLINE; 91220668. +RA Six E.W., Sunshine M.G., Williams J., Haggard-Ljungquist E., +RA Lindqvist B.H.; +RT "Morphopoietic switch mutations of bacteriophage P2"; +RL Virology 182(1):34-46(1991). +XX +RN [16] +RP 1-6551 +RX MEDLINE; 92115571. +RA Linderoth N.A., Ziermann R., Haggard-Ljungquist E., Christie G.E., +RA Calendar R.; +RT "Nucleotide sequence of the DNA packaging and capsid synthesis genes of +RT bacteriophage P2"; +RL Nucleic Acids Res. 19(25):7207-7214(1991). +XX +RN [17] +RP 12173-15684 +RX MEDLINE; 92165720. +RA Haggard-Ljungquist E., Halling C., Calendar R.; +RT "DNA sequence of two tail genes of bacteriophage P2: Further evidence for +RT horizontal transfer of tail fiber genes among unrelated bacteriophages"; +RL J. Bacteriol. 174:1462-1477(1992). +XX +RN [18] +RP 26923-30721 +RX MEDLINE; 93287108. +RA Liu Y., Saha S., Haggard-Ljungquist E.; +RT "Studies of bacteriophage P2 DNA replication. The DNA sequence of the +RT cis-acting gene A and ori region and construction of a P2 mini-chromosome"; +RL J. Mol. Biol. 231(2):361-374(1993). +XX +RN [19] +RP 6288-8381 +RX MEDLINE; 94327465. +RA Ziermann R., Bartlett B., Calendar R., Christie G.E.; +RT "Functions involved in bacteriophage P2-induced host cell lysis and +RT identification of a new tail gene"; +RL J. Bacteriol. 176:4974-4984(1994). +XX +RN [20] +RP 8376-10381 +RX MEDLINE; 94233699. +RA Linderoth N.A., Julien B., Flick K.E., Calendar R., Christie G.E.; +RT "Molecular cloning and characterization of bacteriophage P2 genes R and S +RT involved in tail completion"; +RL Virology 200:347-359(1994). +XX +RN [21] +RP 10276-12739 +RX MEDLINE; 96036485. +RA Haggard-Liungquist E., Jacobsen E., Rishovd S., Six W.S., Nilssen O., +RA Sunshine M.G., Lindqvist B.H., Kim K.J., Barreiro V., Koonin E.V., +RA Calendar R.; +RT "Bacteriophage P2: genes involved in baseplate assembly"; +RL Virology 213(1):109-121(1995). +XX +RN [22] +RP 15627-17626, 30643-31622 +RA Calendar R., Yu S., Myung H., Barreiro V., Odegrip R., Bertani L.E., +RA Carlson K., Davenport L., Mosig G., Christie G.E., Haggard-Ljungquist E.; +RT "The lysogenic conversion genes of coliphage P2 have unusually high AT +RT content"; +RL (in) Syvanen M., Kado C. (eds.); +RL HORIZONTAL GENE TRANSFER:1-1; +RL Chapman and Hall, London (1998) +XX +RN [23] +RP 19374-23954 +RA Christie G.E., Temple L.M., Bartlett B.A., Goodwin T.S.; +RT "Bacteriophage P2 tail assembly genes: Gene organization and a programmed +RT translational frameshift parallel those of bacteriophage lambda"; +RL Unpublished. +XX +RN [24] +RP 1-33593 +RA Christie G.E., Haggard-Ljungquist E., Calendar R.; +RT "The complete genome of bacteriophage P2"; +RL Unpublished. +XX +RN [25] +RP 24351-25595 +RA Haggard-Ljungquist E.; +RT ; +RL Submitted (15-SEP-1989) to the EMBL/GenBank/DDBJ databases. +RL Department of Microbial Genetics, Karolinska Institutet, Stockholm, Sweden +XX +RN [26] +RP 1-6551 +RA Linderoth N.A.; +RT ; +RL Submitted (13-AUG-1991) to the EMBL/GenBank/DDBJ databases. +RL Dept of Mol and Cell Biology, Div of Biochemistry and Molecular Biology, +RL University of California, 401 Barker Hall, Berkeley, CA 94720, USA +XX +RN [27] +RP 26923-30721 +RA Haggard-Ljungquist E.; +RT ; +RL Submitted (12-NOV-1991) to the EMBL/GenBank/DDBJ databases. +RL Department of Microbial Genetics, Karolinska Institutet, S-10401, +RL Stockholm, Sweden +XX +RN [28] +RP 8376-10381 +RA Linderoth N.A.; +RT ; +RL Submitted (18-OCT-1993) to the EMBL/GenBank/DDBJ databases. +RL Nora A. Linderoth, Laboratory of Genetics, The Rockefeller University, 1230 +RL York Avenue, New York, NY 10021, USA +XX +RN [29] +RP 10276-12739 +RA Haggard E.B.; +RT ; +RL Submitted (12-MAY-1995) to the EMBL/GenBank/DDBJ databases. +RL Department of Genetics, Stockholm University, S-10691, Stockholm, Sweden +XX +RN [30] +RP 15627-17626, 30643-31622 +RA Haggard-Ljungquist E.; +RT ; +RL Submitted (30-JUL-1996) to the EMBL/GenBank/DDBJ databases. +RL Department of Genetics, Stockholm University, S-106 91, Stockholm, Sweden +XX +RN [31] +RP 17510-23954 +RA Christie G.E.; +RT ; +RL Submitted (21-NOV-1996) to the EMBL/GenBank/DDBJ databases. +RL Department of Microbiology and Immunology, Virginia Commonwealth +RL University, Box 980678, Richmond, VA 23298-0678, USA +XX +RN [32] +RP 1-33593 +RA Christie G.E.; +RT ; +RL Submitted (05-MAY-1998) to the EMBL/GenBank/DDBJ databases. +RL Department of Microbiology and Immunology, Virginia Commonwealth +RL University, Richmond, VA 23298-0678, USA +XX +DR SPTREMBL; O64312; O64312. +DR SPTREMBL; O64313; O64313. +DR SPTREMBL; O64314; O64314. +DR SPTREMBL; O64315; O64315. +DR SPTREMBL; P79669; P79669. +DR SPTREMBL; P79670; P79670. +DR SPTREMBL; Q38498; Q38498. +DR SWISS-PROT; P04132; RPC_BPP2. +DR SWISS-PROT; P07695; VCOX_BPP2. +DR SWISS-PROT; P07696; VPB_BPP2. +DR SWISS-PROT; P08762; VOGR_BPP2. +DR SWISS-PROT; P10312; VPD_BPP2. +DR SWISS-PROT; P13520; VOLD_BPP2. +DR SWISS-PROT; P22501; VPF1_BPP2. +DR SWISS-PROT; P22502; VPF2_BPP2. +DR SWISS-PROT; P25475; VPL_BPP2. +DR SWISS-PROT; P25476; VPM_BPP2. +DR SWISS-PROT; P25477; VPN_BPP2. +DR SWISS-PROT; P25478; VPO_BPP2. +DR SWISS-PROT; P25479; VPP_BPP2. +DR SWISS-PROT; P25480; VPQ_BPP2. +DR SWISS-PROT; P26699; TFA_BPP2. +DR SWISS-PROT; P26700; VPH_BPP2. +DR SWISS-PROT; P26701; VPI_BPP2. +DR SWISS-PROT; P31340; VPV_BPP2. +DR SWISS-PROT; P36932; VINT_BPP2. +DR SWISS-PROT; P36933; VPR_BPP2. +DR SWISS-PROT; P36934; VPS_BPP2. +DR SWISS-PROT; P36935; YSV_BPP2. +DR SWISS-PROT; P51767; VPJ_BPP2. +DR SWISS-PROT; P51768; VPW_BPP2. +DR SWISS-PROT; P51769; LYSA_BPP2. +DR SWISS-PROT; P51770; LYSB_BPP2. +DR SWISS-PROT; P51771; LYCV_BPP2. +DR SWISS-PROT; P51772; VPX_BPP2. +DR SWISS-PROT; P51773; HOLI_BPP2. +DR SWISS-PROT; Q06419; VPA_BPP2. +DR SWISS-PROT; Q06422; YO80_BPP2. +DR SWISS-PROT; Q06423; YO81_BPP2. +DR SWISS-PROT; Q06424; YO82_BPP2. +DR SWISS-PROT; Q06425; YO83_BPP2. +DR SWISS-PROT; Q06426; YO91_BPP2. +XX +CC On May 20, 1998 this sequence version replaced gi:506838 gi:15821 +CC gi:1806573 gi:215666 gi:506836 gi:508561 gi:1061043 gi:215669 +CC gi:1769975 gi:494974 gi:215664 gi:15620 gi:393451 gi:1769977 +CC gi:215681 gi:215675 gi:215676 gi:15141 gi:414530. +XX +FH Key Location/Qualifiers +FH +FT source 1..33593 +FT /db_xref="taxon:10679" +FT /organism="Enterobacteria phage P2" +FT /lab_host="Escherichia coli" +FT misc_feature 1..19 +FT /note="cosL; left cohesive end" +FT terminator complement(160..181) +FT /note="tQ; putative rho-independent terminator for P +FT operon" +FT CDS complement(187..1221) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25480" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="Q" +FT /function="presumed portal protein" +FT /product="gpQ" +FT /protein_id="AAD03268.1" +FT /translation="MSKKKGKTPQPAAKTMTASGPKMEAFTFGEPVPVLDRRDILDYVE +FT CISNGRWYEPPVSFTGLAKSLRAAVHHSSPIYVKRNILASTFIPHPWLSQQDFSRFVLD +FT FLVFGNAFLEKRYSTTGKVIRLETSPAKYTRRGVEEDVYWWVPSFNEPTAFAPGSVFHL +FT LEPDINQELYGLPEYLSALNSAWLNESATLFRRKYYENGAHAGYIMYVTDAVQDRNDIE +FT MLRENMVKSKGRNNFKNLFLYAPQGKADGIKIIPLSEVATKDDFFNIKKASAADLLDAH +FT RIPFQLMGGKPENVGSLGDIEKVAKVFVRNELIPLQDRIREINGWLGQEVIRFKNYSLD +FT TDND" +FT variation complement(653) +FT /note="Qam34 mutation" +FT /replace="t" +FT /gene="Q" +FT CDS complement(1221..2993) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25479" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="P" +FT /function="terminase; DNA-dependent ATPase" +FT /product="gpP" +FT /protein_id="AAD03269.1" +FT /translation="MTITTDTTLLHDPRRQAALLYWQGFSVPQIAAMLQMKRPTVQSWK +FT QRDGWDSVAPISRVEMSLEARLTQLIIKPQKTGGDFKEIDLLGRQIERLARVNRYSQTG +FT NEADLNPNVANRNKGGRRKPKKNFFSDEAIEKLEQIFFEQSFDYQLHWYRAGLEHRIRD +FT ILKSRQIGATFYFSREALLRALKTGHNQIFLSASKTQAYVFREYIIAFARLVDVDLTGD +FT PIVLGNNGAKLIFLGTNSNTAQSHNGDLYVDEIFWIPNFQVLRKVASGMASQSHLRSTY +FT FSTPSTLAHDAYPFWSGELFNRGRASAAERVEIDVSHNALAGGLLCADGQWRQIVTIED +FT ALKGGCTLFDIEQLKRENSADDFKNLFMCEFVDDKASVFPFEELQRCMVDTLEEWEDYA +FT PFAANPFGSRPVWIGYDPSHRGDSAGCVVLAPPVVAGGKFRILERHQWKGMDFATQAES +FT IRKLTEKYNVEYIGIDATGLGVGVFQLVRSFYPAARDIRYTPEMKTAMVLKAKDVIRRG +FT CLEYDVSATDITSSFMAIRKTMTSSGRSATYEASRSEEASHADLAWATMHALLNEPLTA +FT GISTPLTSTILEFY" +FT variation complement(2210) +FT /note="Pam24 and Pam137 mutations" +FT /replace="a" +FT /gene="P" +FT variation complement(2948) +FT /note="Pam253 mutation" +FT /replace="a" +FT /gene="P" +FT misc_feature complement(3016) +FT /note="transcription start site for P operon; encodes P,Q" +FT /gene="P" +FT misc_feature 3057..3087 +FT /evidence=EXPERIMENTAL +FT /note="activator binding site; pO, pP promoters" +FT misc_feature 3127 +FT /evidence=EXPERIMENTAL +FT /note="transcription start site for O operon; encodes O, N, +FT M, L, X, Y, K, lysA, lysB, R, S" +FT CDS 3167..4021 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25478" +FT /transl_table=11 +FT /gene="O" +FT /function="presumed capsid scaffolding protein" +FT /product="gpO" +FT /protein_id="AAD03270.1" +FT /translation="MAKKVSKFFRIGVEGDTCDGRVISAQDIQEMAETFDPRVYGCRIN +FT LEHLRGILPDGIFKRYGDVAELKAEKIDDDSALKGKWALFAKITPTDDLIAMNKAAQKV +FT YTSMEIQPNFANTGKCYLVGLAVTDDPASLGTEYLEFCRTAKHNPLNRFKLSPENLISV +FT ATPVELEFEDLPETVFTALTEKVKSIFGRKQASDDARLNDVHEAVTAVAEHVQEKLSAT +FT EQRLAEMETAFSALKQEVTDRADETSQAFTRLKNSLDHTESLTQQRRSKATGGGGDALM +FT TNC" +FT variation 3206 +FT /note="Oam71 mutation" +FT /replace="t" +FT /gene="O" +FT variation 3411 +FT /note="Oam7 mutation" +FT /replace="a" +FT /gene="O" +FT variation 3878 +FT /note="Oam279 mutation" +FT /replace="t" +FT /gene="O" +FT CDS 4080..5153 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25477" +FT /transl_table=11 +FT /gene="N" +FT /function="major capsid precursor" +FT /product="gpN" +FT /protein_id="AAD03271.1" +FT /translation="MRQETRFKFNAYLSRVAELNGIDAGDVSKKFTVEPSVTQTLMNTM +FT QESSDFLTRINIVPVSEMKGEKIGIGVTGSIASTTDTAGGTERQPKDFSKLASNKYECD +FT QINFDFYIRYKTLDLWARYQDFQLRIRNAIIKRQSLDFIMAGFNGVKRAETSDRSSNPM +FT LQDVAVGWLQKYRNEAPARVMSKVTDEEGRTTSEVIRVGKGGDYASLDALVMDATNNLI +FT EPWYQEDPDLVVIVGRQLLADKYFPIVNKEQDNSEMLAADVIISQKRIGNLPAVRVPYF +FT PADAMLITKLENLSIYYMDDSHRRVIEENPKLDRVENYESMNIDYVVEDYAAGCLVEKI +FT KVGDFSTPAKATAEPGA" +FT variation 4349..4350 +FT /note="Nam209 mutation" +FT /replace="at" +FT /gene="N" +FT variation 4630 +FT /note="sir3 mutation; defective for choice of small capsids +FT by satellite phage P4" +FT /replace="c" +FT /gene="N" +FT variation 4695 +FT /note="sir5 mutation; defective for choice of small capsids +FT by satellite phage P4" +FT /replace="t" +FT /gene="N" +FT variation 4695..4697 +FT /note="sir9 mutation; defective for choice of small capsids +FT by satellite phage P4" +FT /replace="" +FT /gene="N" +FT variation 4699 +FT /note="sir2, sir6 and sir8 mutations; defective for choice +FT of small capsids by satellite phage P4" +FT /replace="t" +FT /gene="N" +FT variation 4740 +FT /note="sir1 mutation; defective for choice of small capsids +FT by satellite phage P4" +FT /replace="g" +FT /gene="N" +FT variation 4741 +FT /note="sir4 mutation; defective for choice of small capsids +FT by satellite phage P4" +FT /replace="a" +FT /gene="N" +FT CDS 5157..5900 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25476" +FT /transl_table=11 +FT /gene="M" +FT /function="terminase" +FT /product="gpM" +FT /protein_id="AAD03272.1" +FT /translation="MTSPAQRHMMRVSAAMTAQREAAPLRHATVYEQMLVKLAADQRTL +FT KAIYSKELKAAKKRELLPFWLPWVNGVLELGKGAQDDILMTVMLWRLDTGDIAGALEIA +FT RYALKYGLTMPGKHRRTPPYMFTEEVALAAMRAHAAGESVDTRLLTETLELTATADMPD +FT EVRAKLHKITGLFLRDGGDAAGALAHLQRATQLDCQAGVKKEIERLERELKPKPEPQPK +FT AATRAPRKTRSVTPAKRGRPKKKAS" +FT variation 5361 +FT /note="Mts52 mutation" +FT /replace="a" +FT /gene="M" +FT variation 5751 +FT /note="Mam32 mutation" +FT /replace="t" +FT /gene="M" +FT CDS 6000..6509 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P25475" +FT /transl_table=11 +FT /gene="L" +FT /function="capsid completion protein" +FT /product="gpL" +FT /protein_id="AAD03273.1" +FT /translation="MMTLIIPRKEAPVSGEGTVVIPQPAGDEPVIKNTFFFPDIDPKRV +FT RERMRLEQTVAPARLREAIKSGMAETNAELYEYREQKIAAGFTRLADVPADDIDGESIK +FT VFYYERAVCAMATASLYERYRGVDASAKGDKKADSIDSTIDELWRDMRWAVARIQGKPR +FT CIVSQI" +FT variation 6024 +FT /note="Lam79 mutation" +FT /replace="t" +FT /gene="L" +FT variation 6240 +FT /note="Lam9 mutation" +FT /replace="t" +FT /gene="L" +FT CDS 6509..6712 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51772" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="X" +FT /function="essential tail gene" +FT /product="gpX" +FT /protein_id="AAD03274.1" +FT /translation="MKTFALQGDTLDAICVRYYGRTEGVVETVLAANPGLAELGAVLPH +FT GTAVELPDVQTAPVAETVNLWE" +FT variation 6562 +FT /note="Xam95 mutation" +FT /replace="g" +FT /gene="X" +FT CDS 6716..6997 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51773" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="Y" +FT /function="holin; essential for host cell cell lysis" +FT /product="gpY" +FT /protein_id="AAD03275.1" +FT /translation="MTAEEKSVLSLFMIGVLIVVGKVLAGGEPITPRLFIGRMLLGGFV +FT SMVAGVVLVQFPDLSLPAVCGIGSMLGIAGYQVIEIAIQRRFKGRGKQ" +FT variation 6852 +FT /note="Yam94 mutation" +FT /replace="a" +FT /gene="Y" +FT CDS 6997..7494 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51771" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="K" +FT /function="endolysin; essential for host cell lysis" +FT /product="gpK" +FT /protein_id="AAD03276.1" +FT /translation="MPVINTHQNIAAFLDMLAVSEGTANHPLTKNRGYDVIVTGLDGKP +FT EIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYLFWPHYRKQLALPDFSPLSQDR +FT LAIQLIRERGALDDIRAGRIERAISRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGV +FT PA" +FT variation 7114 +FT /note="Kts60 mutation" +FT /replace="a" +FT /gene="K" +FT variation 7126 +FT /note="Kam218 mutation" +FT /replace="t" +FT /gene="K" +FT variation 7318 +FT /note="Kam12 mutation" +FT /replace="t" +FT /gene="K" +FT variation 7322 +FT /note="Kam76 mutation" +FT /replace="a" +FT /gene="K" +FT CDS 7509..7934 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51769" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="lysA" +FT /function="nonessential; affects timing of lysis" +FT /product="LysA" +FT /protein_id="AAD03277.1" +FT /translation="MKKLSLSLMLNVSLALMLALSLIYPQSVAVNFVAAWAILATVICV +FT VAGGVGVYATEYVLERYGRELPPESLAVKIVTSLFLQPVPWRRRAAALVVVVATFISLV +FT AAGWIFTALIYLVVSLFFRLIRKACRQRLEGREPCQG" +FT variation 7694 +FT /note="lysAam96 mutation" +FT /replace="g" +FT /gene="lysA" +FT CDS 7922..8347 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51770" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="lysB" +FT /function="nonessential; affects timing of lysis" +FT /product="LysB" +FT /protein_id="AAD03278.1" +FT /translation="MSRLMIVLVVLLSLAVAGLFLVKHKNASLRASLDRANNVASGQQT +FT TITMLKNQLHVALTRADKNELAQVALRQELENAAKREAQREKTITRLLNENEDFRRWYG +FT ADLPDAVRRLHQRPACTDASDCPQRMPESEPLPDAGQ" +FT variation 8099..8100 +FT /note="lysBam97 mutation" +FT /replace="ta" +FT /gene="lysB" +FT attenuator 8399..8417 +FT /note="putative transcription attenuator; O operon" +FT CDS 8455..8922 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P36933" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="R" +FT /function="essential tail gene; tail completion" +FT /product="gpR" +FT /protein_id="AAD03279.1" +FT /translation="MLKPDSLRRALTDAVTVLKTNPDMLRIFVDNGSIASTLAASLSFE +FT KRYTLNVIVTDFTGDFDLLIVPVLAWLRENQPDIMTTDEGQKKGFTFYADINNDSSFDI +FT SISLMLTERTLVSEVDGALHVKNISEPPPPEPVTRPMELYINGELVSKWDE" +FT variation 8680 +FT /note="Ram3 mutation" +FT /replace="t" +FT /gene="R" +FT variation 8710 +FT /note="Ram42 mutation" +FT /replace="t" +FT /gene="R" +FT variation 8857 +FT /note="Ram23 mutation" +FT /replace="t" +FT /gene="R" +FT CDS 8915..9367 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P36934" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="S" +FT /function="essential tail gene; tail completion" +FT /product="gpS" +FT /protein_id="AAD03280.1" +FT /translation="MNEFKRFEDRLTGLIESLSPSGRRRLSAELAKRLRQSQQRRVMAQ +FT KAPDGTPYAPRQQQSVRKKTGRVKRKMFAKLITSRFLHIRASPEQASMEFYGGKSPKIA +FT SVHQFGLSEENRKDGKKIDYPARPLLGFTGEDVQMIEEIILAHLER" +FT variation 9209 +FT /note="Sam75 mutation" +FT /replace="t" +FT /gene="S" +FT variation 9213 +FT /note="Sam89 mutation" +FT /replace="a" +FT /gene="S" +FT terminator 9397..9433 +FT /note="putative rho-independent terminator for O operon" +FT CDS complement(9439..10224) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P36935" +FT /transl_table=11 +FT /gene="orf30" +FT /function="nonessential" +FT /product="Orf30" +FT /protein_id="AAD03281.1" +FT /translation="MVSYNVTNVWGLIVFFLCSFAVLAFFSFGKSNLMRLIAHYFNFGY +FT SDKKLKRLDREWRDIQLFKIINGINVSGIENVRMIQQGLIDGKLKTSYFFLTRIWGDIT +FT KPPHIIKTIIVILASIFYILLACYIHNEQSVIVRDATGIPYKNMMYYVYSDKVLLSFKN +FT KAVEFNKTYSLADCKRLQNVFIKDTLPEIACNKLLQLNEEDSEWLSQEIKDNNSHKKAL +FT LILSLVYFTSGLVIFLSYTKFFYANKKVLEYKASNKNHS" +FT misc_feature 10239..10266 +FT /evidence=EXPERIMENTAL +FT /note="activator binding site; activation of pV promoter" +FT CDS 10308..10943 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P31340" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="V" +FT /function="baseplate assembly protein" +FT /product="gpV" +FT /protein_id="AAD03282.1" +FT /translation="MNTLANIQELARALRNMIRTGIIVETDLNAGRCRVQTGGMCTDWL +FT QWLTHRAGRSRTWWAPSVGEQVLILAVGGELDTAFVLPGIYSGDNPSPSVSADALHIRF +FT PDGAVIEYEPETSALTVSGIKTASVTASGSVTATVPVVMVKASTRVTLDTPEVVCTNRL +FT ITGTLEVQKGGTMRGNIEHTGGELSSNGKVLHTHKHPGDSGGTTGSPL" +FT misc_feature 10308 +FT /evidence=EXPERIMENTAL +FT /note="transcription start site for V operon; encodes V, W, +FT J, I, H, G" +FT /gene="V" +FT variation 10329 +FT /note="Vam42, Vam203 and Vam205 mutations" +FT /replace="t" +FT /gene="V" +FT variation 10498 +FT /note="Vts199 mutation" +FT /replace="a" +FT /gene="V" +FT CDS 10940..11287 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51768" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="W" +FT /function="baseplate assembly protein" +FT /product="gpW" +FT /protein_id="AAD03283.1" +FT /translation="MTARYLGMNRSDGLTVTDLEHISQSIGDILRTPVGSRVMRRDYGS +FT LLASMIDQPQTPALELQIKVACYMAVLKWEPRVTLSSVTTARSFDGRMTVTLTGQHNDT +FT GQPLSLTIPVS" +FT variation 11237 +FT /note="Wam50 mutation" +FT /replace="t" +FT /gene="W" +FT CDS 11292..12200 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P51767" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="J" +FT /function="baseplate assembly protein" +FT /product="gpJ" +FT /protein_id="AAD03284.1" +FT /translation="MPIIDLNQLPAPDVVEELDFESILAERKATLISLYPEDQQEAVAR +FT TLTLESEPLVKLLEENAYRELIWRQRVNEAARAVMLACAAGNDLDVIGANYNTTRLTIT +FT PADDSTIPPTPAVMESDTDYRLRIQQAFEGLSVAGSVGAYQYHGRSADGRVADISVTSP +FT SPACVTISVLSRENNGVASEDLLAVVRNALNGEDVRPVADRVTVQSAAIVEYQINATLY +FT LYPGPESEPIRAAAVKKLEAYITAQHRLGRDIRLSAIYAALHVEGVQRVELAAPLADIV +FT LNSTQASFCTEYRVVTGGSDE" +FT variation 11937 +FT /note="Jam31 mutation" +FT /replace="t" +FT /gene="J" +FT CDS 12193..12723 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P26701" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="I" +FT /function="baseplate assembly protein" +FT /product="gpI" +FT /protein_id="AAD03285.1" +FT /translation="MSDSRLLPTGSSPLEVAAAKACAEIEKTPVSIRELWNPDTCPANL +FT LPWLAWAFSVDRWDEKWPEATKRAVIRDAYFIHCHKGTIGAIRRVVEPLGYLINVTEWW +FT ENSDPPGTFRLDIGVLESGITEAMYQEMERLIADAKPASRHLIGLNITRDIPGYLFAGG +FT VAYDGDVITVYPG" +FT variation 12235 +FT /note="Iam78 mutation" +FT /replace="t" +FT /gene="I" +FT CDS 12734..14743 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P26700" +FT /transl_table=11 +FT /gene="H" +FT /function="probable tail fiber protein" +FT /product="gpH" +FT /protein_id="AAD03286.1" +FT /translation="MSIKFRTVITTAGAAKLAAATAPGRRKVGITTMAVGDGGGKLPVP +FT DAGQTGLIHEVWRHALNKISQDKRNSNYIIAELVIPPEVGGFWMRELGLYDDAGTLIAV +FT ANMAESYKPALAEGSGRWQTCRMVIIVSSVASVELTIDTTTVMATQDYVDDKIAEHEQS +FT RRHPDASLTAKGFTQLSSATNSTSETLAATPKAVKAAYDLANGKYTAQDATTARKGLVQ +FT LSSATNSTSETLAATPKAVKTVMDETNKKAPLNSPALTGTPTTPTARQGTNNTQIANTA +FT FVMAAIAALVDSSPDALNTLNELAAALGNDPNFATTMTNALAGKQPKDATLTALAGLAT +FT AADRFPYFTGNDVASLATLTKVGRDILAKSTVAAVIEYLGLQETVNRAGNAVQKNGDTL +FT SGGLTFENDSILAWIRNTDWAKIGFKNDADGDTDSYMWFETGDNGNEYFKWRSRQSTTT +FT KDLMTLKWDALNILVNAVINGCFGVGTTNALGGSSIVLGDNDTGFKQNGDGILDVYANS +FT QRVFRFQNGVAIAFKNIQAGDSKKFSLSSSNTSTKNITFNLWGASTRPVVAELGDEAGW +FT HFYSQRNTDNSVIFAVNGQMQPSNWGNFDSRYVKDVRLGTRVVQLMARGGRYEKAGHTI +FT TGLRIIGEVDGDDEAIFRPIQKYINGTWYNVAQV" +FT variation 13994 +FT /note="Ham72 mutation" +FT /replace="t" +FT /gene="H" +FT variation 14336 +FT /note="Ham59 mutation" +FT /replace="t" +FT /gene="H" +FT CDS 14747..15274 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P26699" +FT /transl_table=11 +FT /gene="G" +FT /function="probable tail fiber assembly protein" +FT /product="gpG" +FT /protein_id="AAD03287.1" +FT /translation="MQHLKNIKSGNPKTKEQYQLTKNFDVIWLWSEDGKNWYEEVKNFQ +FT PDTIKIVYDENNIIVAITRDASTLNPEGFSVVEVPDITSNRRADDSGKWMFKDGAVVKR +FT IYTADEQQQQAESQKAALLSEAENVIQPLERAVRLNMATDEERARLESWERYSVLVSRV +FT DPANPEWPEMPQ" +FT variation 14879 +FT /note="Gam1 mutation" +FT /replace="t" +FT /gene="G" +FT variation 15294..17233 +FT /note="del2 deletion" +FT /replace="" +FT terminator 15639..15666 +FT /note="putative rho-independent terminator for V operon" +FT CDS complement(15675..17261) +FT /codon_start=1 +FT /db_xref="SPTREMBL:P79669" +FT /note="cloned gene blocks growth of T5" +FT /transl_table=11 +FT /gene="fun(Z)" +FT /function="nonessential; lysogenic conversion; confers +FT sensitivity to FUdR" +FT /product="Fun(Z)" +FT /protein_id="AAD03288.1" +FT /translation="MIPIKDLTLGYADAENYKRRENKELLNKVFIRDNHLSRLCEPNIS +FT FLVGEKGTGKTAYSIYLSNNNINNTLATTKYIRETEYQKFITLKSEKHLNLSDFSGIWK +FT VILYLLISKQVLDKEGKISKLLNYSKFSSLNDAIDEYYLKAFSPEIIQALSFVQESKVA +FT AELLHKHATLKGEERESLSFSESRFQINLFYIQKKFEEAFSQIRLSQNHILFIDGIDIR +FT PSSIPYDDYLECIKGLAHAVWEINNDFFPSIKGGKGRMKAVLLIRPDIFESIGLQNQNA +FT KIRDNSVFLDWRTEYVNHRSSQLFEVLDHLLRTQQDMALKKGQAWDHYFPWDSPNVHDN +FT YNHPTSFINFLRWSYYRPRDILRMLEIIKSHASGDDGKNQFSLDDFESPSMQRDYSNYL +FT LGEIKDHLSFYYGSEHYEIFLKFFEFLSGKDTFDYAEYLLAYKQLETHISSISTTKPKF +FT MTTANDFLQFLFGLNVICYIETTEDNNRFIRWCFRERSYANISPKIKTGMKYQIFYGLA +FT KSLNVGKALKK" +FT variation complement(15784) +FT /note="Z81su3 mutation" +FT /replace="a" +FT /gene="fun(Z)" +FT variation complement(15872) +FT /note="Z20 mutation" +FT /replace="t" +FT /gene="fun(Z)" +FT variation complement(15944) +FT /note="Z81 mutation" +FT /replace="t" +FT /gene="fun(Z)" +FT variation complement(15946) +FT /note="fun1 mutation" +FT /replace="t" +FT /gene="fun(Z)" +FT variation complement(16079) +FT /note="csZ150 mutation" +FT /replace="t" +FT /gene="fun(Z)" +FT variation complement(16266) +FT /note="fun99 mutation" +FT /replace="t" +FT /gene="fun(Z)" +FT variation 16267..17299 +FT /note="del5 deletion" +FT /replace="" +FT variation complement(16638) +FT /note="csZ150 mutation" +FT /replace="a" +FT /gene="fun(Z)" +FT misc_feature 17555..17583 +FT /evidence=EXPERIMENTAL +FT /note="activator binding site; activation of pF promoter" +FT misc_feature 17626..17628 +FT /evidence=EXPERIMENTAL +FT /note="transcription start site for F operon; encodes FI, +FT FII, E, E', T, U, D" +FT CDS 17652..18842 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P22501" +FT /transl_table=11 +FT /gene="FI" +FT /function="essential tail protein; tail sheath" +FT /product="gpFI" +FT /protein_id="AAD03289.1" +FT /translation="MSDYHHGVQVLEINEGTRVISTVSTAIVGMVCTASDADAETFPLN +FT KPVLITNVQSAISKAGKKGTLAASLQAIADQSKPVTVVMRVEDGTGDDEETKLAQTVSN +FT IIGTTDENGQYTGLKAMLAAESVTGVKPRILGVPGLDTKEVAVALASVCQKLRAFGYIS +FT AWGCKTISEVKAYRQNFSQRELMVIWPDFLAWDTVTSTTATAYATARALGLRAKIDQEQ +FT GWHKTLSNVGVNGVTGISASVFWDLQESGTDADLLNESGVTTLIRRDGFRFWGNRTCSD +FT DPLFLFENYTRTAQVVADTMAEAHMWAVDKPITATLIRDIVDGINAKFRELKTNGYIVD +FT ATCWFSEESNDAETLKAGKLYIDYDYTPVPPLENLTLRQRITDKYLANLVTSVNSN" +FT variation 18183 +FT /note="Fam4 mutation" +FT /replace="t" +FT /gene="FI" +FT CDS 18855..19373 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P22502" +FT /transl_table=11 +FT /gene="FII" +FT /function="essential tail protein; tail tube" +FT /product="gpFII" +FT /protein_id="AAD03290.1" +FT /translation="MAMPRKLKLMNVFLNGYSYQGVAKSVTLPKLTRKLENYRGAGMNG +FT SAPVDLGLDDDALSMEWSLGGFPDSVIWELYAATGVDAVPIRFAGSYQRDDTGETVAVE +FT VVMRGRQKEIDTGEGKQGEDTESKISVVCTYFRLTMDGKELVEIDTINMIEKVNGVDRL +FT EQHRRNIGL" +FT CDS join(19430..19684,19684..19857) +FT /codon_start=1 +FT /db_xref="SPTREMBL:O64312" +FT /note="shares amino terminus with gpE; -1 frameshift" +FT /transl_table=11 +FT /gene="E+E'" +FT /function="essential tail protein" +FT /product="gpE+E'" +FT /protein_id="AAD03292.1" +FT /translation="MNKENVITLDNPVKRGEQVIEQVTLMKPSAGTLRGVSLAAVANSE +FT VDALIKVLPRMTAPMLTEQEVAALELPDLVALAGKVVGFLVAELGAVTFPKNLSVDDLM +FT ADVAVIFHWPPSELYPMSLTELITWREKALRRSGNTNE" +FT CDS 19430..19705 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O64313" +FT /transl_table=11 +FT /gene="E" +FT /function="essential tail protein" +FT /product="gpE" +FT /protein_id="AAD03291.1" +FT /translation="MNKENVITLDNPVKRGEQVIEQVTLMKPSAGTLRGVSLAAVANSE +FT VDALIKVLPRMTAPMLTEQEVAALELPDLVALAGKVVGFLSPNSVQ" +FT variation 19473 +FT /note="Ets55 mutation" +FT /replace="a" +FT /gene="E" +FT variation 19619 +FT /note="Eam30 mutation" +FT /replace="t" +FT /gene="E" +FT misc_feature 19685 +FT /evidence=EXPERIMENTAL +FT /note="site of -1 translational frameshift" +FT /gene="E+E'" +FT CDS 19850..22297 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O64314" +FT /transl_table=11 +FT /gene="T" +FT /function="essential tail protein; putative tail length +FT determinator" +FT /product="gpT" +FT /protein_id="AAD03293.1" +FT /translation="MSNNVKLQVLLRAVDQASRPFKSIRTASKSLSGDIRETQKSLREL +FT NGHASRIEGFRKTSAQLAVTGHALEKARQEAEALATQFKNTERPTRAQAKVLESAKRAA +FT EDLQAKYNRLTDSVKRQQRELAAVGINTRNLAHDEQGLKNRISETTAQLNRQRDALVRV +FT SAQQAKLNAVKQRYQAGKELAGNMASVGAAGVGIAAAGTMAGVKLLMPGYEFAQKNSEL +FT QAVIGVAKDSAEMAALRKQARQLGDNTAASADDAAGAQIIIAKAGGDVDAIQAATPVTL +FT NMALANRRTMEENAALLMGMKSAFQLSNDKVAHIGDVLSMTMNKTAADFDGMSDALTYA +FT APVAKNAGVSIEETAAMVGALHDAKITGSMAGTGSRAVLSRLQAPTGKAWDALKELGVK +FT TSDSKGNTRPIFTILKEMQASFEKNRLGTAQQAEYMKTIFGEEASSAAAVLMTAASTGK +FT LDKLTAAFKASDGKTAELVNIMQDNLGGDFKAFQSAYEAVGTDLFDQQEGALRKLTQTA +FT TKYVLKLDGWIQKNKSLASTIGIIAGGALALTGIIGAIGLVAWPVITGINAIIAAAGAM +FT GAVFTTVGSAVMTAIGAISWPVVAVVAAIVAGALLIRKYWEPVSAFFGGVVEGLKAAFA +FT PVGELFTPLKPVFDWLGEKLQAAWQWFKNLIAPVKATQDTLNRCRDTGVMFGQALADAL +FT MLPLNAFNKLRSGIDWVLEKLGVINKESDTLDQTAARTHTATYGTGDYIPATSSYAGYQ +FT AYQPVTAPAGRSYVDQSKNEYHISLTGGTAPGTQLDRQLQDALEKYERDKRARARASMM +FT HDG" +FT variation 20669 +FT /note="Tam215 mutation" +FT /replace="t" +FT /gene="T" +FT variation 21101 +FT /note="Tam5 mutation" +FT /replace="t" +FT /gene="T" +FT variation 21528 +FT /note="Tam64 mutation" +FT /replace="a" +FT /gene="T" +FT CDS 22312..22791 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O64315" +FT /transl_table=11 +FT /gene="U" +FT /function="essential tail protein" +FT /product="gpU" +FT /protein_id="AAD03294.1" +FT /translation="MMLALGMFVFMRQTLPHQTMQRESDYRWPSNSRIGKRDAFQFLGV +FT GEENITLAGVLYPELTGGKLTMTTLRLMAEEGRAWPLLDGTGMIYGMYVISRVSETGSI +FT FFADGTPRKIDFTLSLTRVDESLAALYGDIGKQAESLIGKAGSMATRFTGMTGAG" +FT variation 22363 +FT /note="Uam25 mutation" +FT /replace="t" +FT /gene="U" +FT variation 22501 +FT /note="Uam77 and Uam92 mutations" +FT /replace="t" +FT /gene="U" +FT CDS 22791..23954 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P10312" +FT /transl_table=11 +FT /gene="D" +FT /function="essential tail protein" +FT /product="gpD" +FT /protein_id="AAD03295.1" +FT /translation="MLDALTFDAGSTLTPDYMLMLDSRDITGNISDRLMSMTLTDNRGF +FT EADQLDIELNDADGQVGLPVRGAVLTVYIGWKGFALVCKGKFTVDEVEHRGAPDVVTIR +FT ARSADFRGTLNSRREGSWHDTTLGAIVKAIATRNRLEASVAPSLAGIKIPHIDQSQESD +FT AKFLTRLAERNGGEVSVKMGKLLFLKAGQGVTASGKKIPQVTITRSDGDRHHFAIADRG +FT AYTGVTAKWLHTKDPKPQKQKVKLKRKKKEKHLRALEHPKAKPVRQKKAPKVPEAREGE +FT YMAGEADNVFALTTVYATKAQAMRAAQAKWDKLQRGVAEFSISLATGRADIYTETPVKV +FT SGFKRVIDEQDWTITKVTHFLNNSGFTTSLELEVRLSDVEYETEDDE" +FT variation 23592 +FT /note="Dam6 mutation" +FT /replace="t" +FT /gene="D" +FT -35_signal 23973..23975 +FT -10_signal 23996..24002 +FT prim_transcript 24008..24288 +FT /note="putative" +FT CDS 24036..24254 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P08762" +FT /transl_table=11 +FT /gene="ogr" +FT /product="Ogr" +FT /protein_id="AAD03296.1" +FT /translation="MFHCPLCQHAAHARTSRYITDTTKERYHQCQNVNCSATFITYESV +FT QRYIVKPGEVHAVRPHPLPSGQQIMWM" +FT variation 24148..25274 +FT /note="del15 deletion" +FT /replace="" +FT variation 24160 +FT /note="ogr1 and ogr52 mutations" +FT /replace="g" +FT /gene="ogr" +FT terminator 24265..24288 +FT /evidence=EXPERIMENTAL +FT /note="rho-independent terminator for ogr transcript and F +FT operon" +FT protein_bind 24293..24320 +FT /note="P arm" +FT /bound_moiety="Int" +FT protein_bind 24324..24357 +FT /bound_moiety="IHF" +FT misc_feature complement(24356..24382) +FT /note="attP" +FT protein_bind 24356..24383 +FT /note="attP core" +FT /bound_moiety="Int" +FT variation 24372 +FT /note="saf mutation; altered integration site specificity" +FT /replace="g" +FT variation 24376 +FT /note="left end del3 deletion/insertion" +FT variation 24378..25927 +FT /note="vir22 deletion/insertion" +FT variation 24378..25065 +FT /note="del6 deletion" +FT /replace="" +FT variation 24381..26340 +FT /note="vir94 deletion/insertion" +FT protein_bind 24399..24472 +FT /bound_moiety="Cox" +FT CDS complement(24462..25475) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P36932" +FT /transl_table=11 +FT /gene="int" +FT /function="integrase" +FT /product="Int" +FT /protein_id="AAD03297.1" +FT /translation="MAIKKLDDGRYEVDIRPTGRNGKRIRRKFDKKSEAVAFEKYTLYN +FT HHNKEWLSKPTDKRRLSELTQIWWDLKGKHEEHGKSNLGKIEIFTKITNDPCAFQITKS +FT LISQYCATRRSQGIKPSSINRDLTCISGMFTALIEAELFFGEHPIRGTKRLKEEKPETG +FT YLTQEEIALLLAALDGDNKKIAILCLSTGARWGEAARLKAENIIHNRVTFVKTKTNKPR +FT TVPISEAVAKMIADNKRGFLFPDADYPRFRRTMKAIKPDLPMGQATHALRHSFATHFMI +FT NGGSIITLQRILGHTRIEQTMVYAHFAPEYLQDAISLNPLRGGTEAESVHTVSTVE" +FT protein_bind 24470..24496 +FT /note="P' arm" +FT /gene="int" +FT /bound_moiety="Int" +FT variation complement(24539) +FT /note="intam150 mutation" +FT /replace="a" +FT /gene="int" +FT variation complement(25130) +FT /note="intam239 mutation" +FT /replace="a" +FT /gene="int" +FT variation complement(25454) +FT /note="nip1 mutation" +FT /replace="t" +FT /gene="int" +FT variation 25492..25839 +FT /note="vir 79 deletion" +FT /replace="" +FT CDS complement(25591..25890) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P04132" +FT /transl_table=11 +FT /gene="C" +FT /function="immunity repressor" +FT /product="gpC" +FT /protein_id="AAD03298.1" +FT /translation="MSNTISEKIVLMRKSEYLSRQQLADLTGVPYGTLSYYESGRSTPP +FT TDVMMNILQTPQFTKYTLWFMTNQIAPESGQIAPALAHFGQNETTSPHSGQKTG" +FT variation complement(25637) +FT /note="sly1 mutation" +FT /replace="t" +FT /gene="C" +FT variation complement(25682) +FT /note="cts7 mutation" +FT /replace="t" +FT /gene="C" +FT variation complement(25686..25702) +FT /note="cam11 and cam13 mutations" +FT /replace="a" +FT /gene="C" +FT variation complement(25702) +FT /note="cts6 mutation" +FT /replace="a" +FT /gene="C" +FT variation complement(25731) +FT /note="cam10 and cam12 mutations" +FT /replace="a" +FT /gene="C" +FT variation complement(25772) +FT /note="cts9 mutation" +FT /replace="t" +FT /gene="C" +FT variation complement(25802) +FT /note="vir1 mutation" +FT /replace="t" +FT /gene="C" +FT variation complement(25829) +FT /note="cts8 mutation" +FT /replace="g" +FT /gene="C" +FT variation complement(25844) +FT /note="cts5 mutation" +FT /replace="a" +FT /gene="C" +FT -35_signal 25884..25889 +FT /note="early promoter Pe" +FT misc_feature 25894..25901 +FT /note="O1 repressor binding site" +FT variation 25899..25955 +FT /note="vir24 deletion" +FT /replace="" +FT variation 25900..25916 +FT /note="vir3 deletion" +FT /replace="" +FT variation 25904..25920 +FT /note="vir65 deletion" +FT /replace="" +FT -10_signal 25907..25912 +FT /note="early promoter Pe" +FT variation 25909..25983 +FT /note="vir40 deletion" +FT /replace="" +FT variation 25913 +FT /note="c1 mutation" +FT /replace="c" +FT misc_feature 25916..25923 +FT /note="O2 repressor binding site" +FT variation 25922 +FT /note="vir6 mutation" +FT /replace="" +FT -10_signal complement(25962..25967) +FT /note="Pc promoter" +FT -35_signal complement(25982..25987) +FT /note="Pc promoter" +FT CDS 26005..26280 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P07695" +FT /transl_table=11 +FT /gene="cox" +FT /function="repressor of Pc; required for prophage excision; +FT inhibits integration; activates P11 promoter of satellite +FT phage P4" +FT /product="Cox" +FT /protein_id="AAD03299.1" +FT /translation="MSKQVTLMTDAIPYQEFAKLIGKSTGAVRRMIDKGKLPVIDMTDP +FT QSASGRAGEYWVYLPAWNNGLKLAYESRPKEIRDGWLMWLGLGEPR" +FT variation 26069 +FT /note="cox3 mutation" +FT /replace="a" +FT /gene="cox" +FT variation 26129 +FT /note="cox2 mutation" +FT /replace="c" +FT /gene="cox" +FT variation 26164 +FT /note="cox4 mutation" +FT /replace="a" +FT /gene="cox" +FT CDS 26291..26461 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q38498" +FT /transl_table=11 +FT /gene="orf78" +FT /product="Orf78" +FT /protein_id="AAD03300.1" +FT /translation="MNEPRCIAQLLRNESPRAIDFTITHGKGRKGIIIRTKKQSPLKKA +FT LTFLKSRRVWK" +FT CDS 26458..26958 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P07696" +FT /transl_table=11 +FT /gene="B" +FT /function="essential protein; DNA replication; required for +FT lagging strand synthesis" +FT /product="gpB" +FT /protein_id="AAD03301.1" +FT /translation="MTVMTLNLVEKQPAAMRRIIGKHLAVPRWQDTCDYYNQMMERERL +FT TVCFHAQLKQRHATMCFEEMNDVERERLVCAIDELRGAFSKRRQVGASEYAYISFLTVS +FT QRRTLFMHAGLTEKEFNQPYWRINEESCYWRDALFRALRELFSLFEYAPTILTSVKPEQ +FT YLH" +FT variation 26525 +FT /note="rlb1 mutation" +FT /replace="g" +FT /gene="B" +FT variation 26611 +FT /note="Bam213 mutation" +FT /replace="t" +FT /gene="B" +FT variation 26722 +FT /note="Bam116 mutation" +FT /replace="t" +FT /gene="B" +FT variation 26762 +FT /note="Bts6 mutation" +FT /replace="t" +FT /gene="B" +FT variation 26914 +FT /note="Bts40 mutation" +FT /replace="t" +FT /gene="B" +FT terminator 26980..27007 +FT /note="putative rho-independent terminator" +FT CDS 27022..27246 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06422" +FT /transl_table=11 +FT /gene="orf80" +FT /product="Orf80" +FT /protein_id="AAD03302.1" +FT /translation="MHTVSENQCGIYALLLQQARTEAQADAATRFSSHLDAMIRHITKA +FT ELSRVEIVELLSQESEKFHNIGLSRGEVL" +FT CDS 27246..27548 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06423" +FT /transl_table=11 +FT /gene="orf81" +FT /product="Orf81" +FT /protein_id="AAD03303.1" +FT /translation="MFCSRAVVLLNNALKIAVMKNGDLSLIQLGLDKEKREITESVIAI +FT YQSELNLLSDVVNLLVKRAVFHKQISSVDELTKLTTEIASYCADEFKKLNDKRNW" +FT CDS 27548..27772 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06424" +FT /transl_table=11 +FT /gene="orf82" +FT /product="Orf82" +FT /protein_id="AAD03304.1" +FT /translation="MPDNVDFIQEQQAELLERQINAARVKHCGASALVCEECDAPIPAA +FT RRAAYPSATRCVSCQSVFEAKNKHYRRTA" +FT CDS 27769..28044 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06425" +FT /transl_table=11 +FT /gene="orf83" +FT /product="Orf83" +FT /protein_id="AAD03305.1" +FT /translation="MSIRIEIGERYVVTSDSFQFILHEKKRAESGKNAGQEWLAVVGYY +FT PKLSQLVSGLMHHDILTGSAKSFADLNVQVEQLSKRCSEAFGSYGR" +FT CDS 28034..30319 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06419" +FT /transl_table=11 +FT /gene="A" +FT /function="essential protein; DNA replication; makes +FT site-specific nick at origin of replication" +FT /product="gpA" +FT /protein_id="AAD03306.1" +FT /translation="MAVKASGRFVPPSAFAAGTGKMFTGAYAWNAPREAVGRERPLTRD +FT EMRQMQGVLSTINRLPYFLRSLFTSRYDYIRRNKSPVHGFYFLTSTFQRRLWPRIERVN +FT QRHEMNTDASLLFLAERDHYARLPGMNDKELKKFAARISSQLFMMYEELSDAWVDAHGE +FT KESLFTDEAQAHLYGHVAGAARAFNISPLYWKKYRKGQMTTRQAYSAIARLFNDEWWTH +FT QLKGQRMRWHETLLIAVGEVNKDRSPYASKHAIRDVRARRQANLEFLKSCDLENRETGE +FT RIDLISKVMGSISNPEIRRMELMNTIAGIERYAAAEGDVGMFITLTAPSKYHPTRQVGK +FT GESKTVQLNHGWNDEAFNPKDAQRYLCHIWSLMRTAFKDNDLQVYGLRVVEPHHDGTPH +FT WHMMLFCNPRQRNQIIEIMRRYALKEDGDERGAARNRFQAKHLNQGGAAGYIAKYISKN +FT IDGYALDGQLDNDTGRPLKDTAAAVTAWASTWRIPQFKTVGLPTMGAYRELRKLPRGVS +FT IADEFDERVEAARAAADSGDFALYISAQGGANVPRDCQTVRVARSPSDEVNEYEEEVER +FT VVGIYAPHLGARHIHITRTTDWRIVPKVPVVEPLTLKSGIAAPRSPVNNCGKLTGGDTS +FT LPAPTPSEHAAAVLNLVDDGVIEWNEPEVVRALRGALKYDMRTPNRQQRNGSPLKPHEI +FT APSARLTRSERLQITRIRVDLAQNGIRPQRWELEALARGATVNYDGKKFTYPVADEWPG +FT FSTVMEWT" +FT variation 28649 +FT /note="Aam127 mutation" +FT /replace="t" +FT /gene="A" +FT variation 29528 +FT /note="Ats54 mutation" +FT /replace="a" +FT /gene="A" +FT rep_origin 29892 +FT /evidence=EXPERIMENTAL +FT /note="nick site at ori" +FT CDS 30316..30645 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:Q06426" +FT /transl_table=11 +FT /gene="orf91" +FT /product="Orf91" +FT /protein_id="AAD03307.1" +FT /translation="MMAKIHEVKLHAKYFDLVLEGKKRAEFRKKDRNYERGDTLILHEW +FT VQGVFTGRKVEARITDVTDLSDWLEDYVLLHRILGEILPLTVKLAVSSTFFINLRRRTV +FT AIYLL" +FT CDS complement(30684..31445) +FT /codon_start=1 +FT /db_xref="SPTREMBL:P79670" +FT /transl_table=11 +FT /gene="tin" +FT /function="nonessential protein; lysogenic conversion; +FT blocks growth of T-even phages" +FT /product="Tin" +FT /protein_id="AAD03308.1" +FT /translation="MNNMDIVKAVKDGMKKSADATYLMDFRSGAKINTEYVATVSIGLS +FT LLEIKSFRHGDYKVIFEYHTNKFINATVPLSKRSDPQKIFSKKTVRKNTNTTRSGRIDI +FT AILDSRPFFDIPICAIEVKGNAPCKSLLFSDIRRNLEYFKHTGPTGNSSLGLALNCSFH +FT SYNDSTKKNYCTTIHHKEDMIRKLKNKYKKYISELNEEIPDDISVTIDVFTAAEHLLSP +FT DADQYEYESHIDDLHLTLGVMVIFERKSILN" +FT variation 30992..33334 +FT /note="del4 deletion" +FT /replace="" +FT variation 31022..33454 +FT /note="del1 deletion" +FT /replace="" +FT CDS complement(31620..33380) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P13520" +FT /transl_table=11 +FT /gene="old" +FT /function="nonessential protein; lysogenic conversion; +FT exonuclease; blocks growth of phage lambda" +FT /product="Old" +FT /protein_id="AAD03309.1" +FT /translation="MTVRLASVSISNFRSCKSTSAILRPFTALVGYNNAGKSNIILAIK +FT WLLDGSLISESDVYDPTHPVSVEGVIQGITDDTLSLLTEENQQKIAPFIIDGTLTFARR +FT QEFNKETGKAKKSLDVYDGTTWKKNPGGIDGAISNIFPEPIHIPAMSDAVEDSTKCKNT +FT TTIGKILSAIVSEIKQEHEEKFSKNISEIGKYLSHNGENRLESLNKIDSGVNKKVNQFF +FT PDVSVKLHFPTPTLDEIFKSGTLKVFESREDEPVMRDISRFGHGTQRSIQMALIQYLAE +FT IKKENSESKKSNTLIFIDEPELYLHPSAINSVRESLVTLSESGYQVIISTHSASMLSAK +FT HAANAIQVCKDSNGTIARKTISEKIEELYKSSSPQLHSAFTLSNSSYLLFSEEVLLVEG +FT KTETNVLYALYKKINGHELNPSKICIVAVDGKGSLFKMSQIINAIGIKTRILADCDFLS +FT NILLTEHKDLLSTECDNLLTALIESINSGELSLNTKVTTFESFKSISSKDFIKICNHEK +FT TQKHIHEIHQKLKDNGIYIWKSGDIEAVYGFGKKQTEWDSLLDCLCDESKDVRAVIKKY +FT DEMEDFIKWI" +FT variation complement(31991) +FT /note="oldam11 mutation" +FT /replace="a" +FT /gene="old" +FT variation complement(32576) +FT /note="old1 mutation" +FT /replace="t" +FT /gene="old" +FT misc_feature complement(33424) +FT /note="transcript start 1; old-tin mRNA" +FT misc_feature complement(33426) +FT /note="transcript start 2; old-tin mRNA" +FT misc_feature 33575..33593 +FT /note="cosR; right cohesive end" +XX +SQ Sequence 33593 BP; 8398 A; 7983 C; 8870 G; 8342 T; 0 other; + ggcgaggcgg ggaaagcact gcgcgctgac ggtggtgctg attgtatttt ttcagcgtct 60 + cagcgcgtcg tgacggcact tagtctgccc gttgaggcgt tgtgtgtctg cggggtgttt 120 + tgtgcggtgg tgagcgtgtg aggggggatg acggggtgta aaaaagccgc ccgcaggcgg 180 + cgatgttcag tcgttgtcag tgtccagtga gtagttttta aagcggatga cctcctgacc 240 + gagccagccg tttatctcgc ggatcctgtc ctgtaacggg ataagctcat tgcggacaaa 300 + gacctttgcc actttctcaa tatcacccag cgacccgacg ttctccggct tgccacccat 360 + caactgaaag gggatgcggt gcgcgtccag caggtcagcg gcgctggctt ttttgatatt 420 + aaaaaaatcg tccttcgtcg ccacttcact gagggggata attttaatgc cgtcggcttt 480 + cccctgtggg gcatagagaa acaggttttt aaagttgttg cggcctttcg acttgaccat 540 + gttttcgcga agcatttcga tatcgttgcg atcctgcacg gcatcggtga catacatgat 600 + gtatccggca tgtgcgccat tttcgtaata cttgcggcgg aacaacgtgg ccgactcatt 660 + cagccaggca gagttaaggg cgctgagata ttccggcagg ccgtacagct cctgattaat 720 + atccggctcc agcaggtgaa acacggagcc gggcgcgaag gctgtcggct cgttgaagga 780 + cggcacccac cagtaaacat cctcttccac gccacggcgg gtatattttg ccggtgaggt 840 + ttccagtctg atgaccttac cggtggtgct gtaacgcttt tccagaaacg cattaccgaa 900 + caccagaaaa tccagcacaa agcggctgaa atcctgctgg gaaagccatg gatgcgggat 960 + aaatgtcgag gccagaatat tgcgtttgac gtaaatcggc gagctgtgat gcacggcagc 1020 + ccgcaggctt tttgccagac cggtaaagct gaccggtggc tcataccatc tgccgttact 1080 + gatgcactcg acgtaatcca gaatgtcacg gcggtcgagt accggcaccg gctcaccaaa 1140 + ggtgaatgcc tccattttcg ggccgctggc ggtcattgtt tttgccgcag gttgcggtgt 1200 + tttccctttt ttcttgctca tcagtaaaac tccagaatgg tggatgtcag cggggtgctg 1260 + ataccggcgg tgagtggctc atttaacagg gcgtgcatgg tcgcccaggc gaggtcggcg 1320 + tggctggctt cctcgctgcg gctggcctca taggtggcgc tgcgtccgct gctggtcatg 1380 + gtcttgcgga tagccataaa cgagctggtg atgtcggtgg cgctgacgtc gtattccaga 1440 + cagccacggc ggataacgtc ttttgccttg agcaccattg cggttttcat ttccggcgtg 1500 + tagcggatat cacgcgcggc gggatagaac gagcgcacga gctggaacac gccgacaccg 1560 + aggccggtgg catcaatacc gatgtattcg acgttgtatt tttcggtgag tttgcggatg 1620 + gattccgcct gggtggcaaa gtccatgcct ttccactggt gacgctcaag tattctgaat 1680 + ttgccaccgg ccaccaccgg cggtgccagt accacgcatc cggcgctgtc gccacggtgt 1740 + gacgggtcgt aaccaatcca taccgggcgg gagccgaacg gattggcggc aaacggcgca 1800 + tagtcttccc attcttccag cgtgtcgacc atgcagcgtt gcagctcctc gaacgggaac 1860 + accgatgcct tgtcgtcaac aaattcacac atgaacaggt ttttaaaatc gtcggcgctg 1920 + ttttcgcgtt tgagctgctc aatgtcgaac agcgtgcagc cgcctttcag ggcgtcctca 1980 + atggtgacaa tctgtcgcca ctggccgtcc gcacagagaa gcccaccggc aagggcgtta 2040 + tgactgacgt cgatttccac gcgttcggcg gcgctggcgc gtccccggtt aaacagttca 2100 + cccgaccaga acgggtaggc gtcgtgcgcc agcgtggacg gggtggagaa ataggtcgag 2160 + cgcaggtgac tctgtgaggc catacctgat gccaccttac gcagtacctg aaaattcggg 2220 + atccagaaaa tctcatcgac gtacaggtcg ccgttatgac tctgcgcggt gttggagttg 2280 + gtgccgagaa aaatcagttt tgcgccgtta ttgcccagga caatcgggtc accggtcagg 2340 + tcaacgtcaa ccagacgggc aaaggcgatg atgtattcgc ggaacacata cgcctgtgtt 2400 + ttactggccg acagaaaaat ctggttatga ccggttttca gggcacgcag cagcgcctcg 2460 + cgggaaaaat aaaacgtcgc gccaatctgg cgggatttca ggatatcgcg gatgcggtgc 2520 + tcaagcccgg cacgatacca gtgcagctga tagtcgaaag actgctcaaa gaaaatctgc 2580 + tccagctttt cgatggcctc gtcactgaaa aaattctttt tcggtttgcg ccgtccgcct 2640 + ttgttacggt tagcgacgtt cggattaagg tctgcctcgt tgccggtctg gctgtagcgg 2700 + ttgacccgtg ccagtcgttc aatctggcgt cccagcaggt caatttcctt gaagtcaccg 2760 + ccggttttct gtggtttgat gatgagctgg gtcagccgcg cttccagact catttcgaca 2820 + cggctgatgg gggcaacgct gtcccagccg tcgcgctgtt tccagctctg cactgtcggg 2880 + cgtttcatct gcaacatggc ggcaatctgc ggcacggaaa acccctgcca gtacagcagc 2940 + gccgcctgac gacgcgggtc gtgtaaaaga gtggtgtctg tggtgatggt catgaatacc 3000 + tcgccgtgat gaatacacgg caaggctact gagtcgcgcc ccgcgattcg ctaaggtgct 3060 + gttgtgtcag tgataagcca tccgggactg atggcggagg atgcgcatcg tcgggaaact 3120 + gatgccgaca tgtgactcct ctaatcacta ttcaggactc ctgacaatgg caaaaaaagt 3180 + ctcaaaattc tttcgtatcg gcgttgaggg tgacacctgt gacgggcgtg tcatcagtgc 3240 + gcaggatatt caggaaatgg ccgaaacctt tgacccgcgt gtctatggtt gccgcattaa 3300 + cctggaacat ctgcgcggca tcctgcctga cggtattttt aagcgttatg gcgatgtggc 3360 + cgaactgaag gccgaaaaga ttgacgatga ttcggcgctg aaaggcaaat gggcgctgtt 3420 + tgcgaaaatc accccgaccg atgaccttat cgcgatgaac aaggccgcgc agaaggtcta 3480 + cacctcaatg gaaattcagc cgaactttgc caacaccggc aaatgttatc tggtgggtct 3540 + ggccgtcacc gatgacccgg caagcctcgg cacggaatac ctggaattct gccgcacggc 3600 + aaaacacaac cccctgaacc gcttcaaatt aagccctgaa aacctgattt cagtggcaac 3660 + gcctgttgag ctggaatttg aagacctgcc tgaaaccgtg ttcaccgccc tgaccgaaaa 3720 + ggtgaagtcc atttttggcc gcaaacaggc cagcgatgat gcccgtctga atgacgtgca 3780 + tgaagcggtg accgctgttg ctgaacatgt gcaggaaaaa ctgagcgcca ctgagcagcg 3840 + cctcgctgag atggaaaccg ccttttctgc acttaagcag gaggtgactg acagggcgga 3900 + tgaaaccagc caggcattca cccgcctgaa aaacagtctc gaccacaccg aaagtctgac 3960 + ccagcagcgc cgcagcaaag ccaccggcgg tggcggtgac gccctgatga cgaactgctg 4020 + accggcgtca gtcagtccgg gaaaaccttc acgattaacc cttaatttca ggaaaaacta 4080 + tgcgccagga aacccgcttt aaatttaatg cctacctgtc ccgtgttgcc gaactgaacg 4140 + gcatcgacgc cggtgatgtg tcgaaaaaat tcaccgttga accgtcggtc acccagaccc 4200 + tgatgaacac catgcaggag tcctctgact ttctgacccg catcaatatt gtgccggtca 4260 + gcgaaatgaa aggggaaaaa attggtatcg gtgtcaccgg ctccatcgcc agcactaccg 4320 + acactgccgg tggtaccgag cgtcagccga aggacttctc gaagctggcg tcaaacaagt 4380 + acgaatgcga ccagattaac ttcgattttt atatccgcta caaaacgctg gacctgtggg 4440 + cgcgttatca ggatttccag ctccgtatcc gtaacgccat tatcaaacgc cagtcccttg 4500 + atttcatcat ggccggtttt aacggcgtga agcgtgccga aacctctgac cgcagcagca 4560 + atccgatgtt gcaggatgtg gcggtcggct ggctgcagaa ataccgcaat gaagcaccgg 4620 + cgcgcgtgat gagcaaggtc actgacgagg aaggccgcac cacctctgag gttatccgcg 4680 + tgggtaaggg cggtgattat gccagccttg atgcactggt gatggatgcg accaacaacc 4740 + tgattgaacc gtggtatcag gaagaccctg accttgtggt gattgtgggg cgtcagctac 4800 + tggcggacaa gtatttcccc atcgtcaaca aggagcagga caacagcgaa atgctggccg 4860 + ctgacgtcat catcagccag aaacgcatcg gtaacctacc agcggtacgc gtcccgtact 4920 + tcccggcgga tgcgatgctc atcacgaagc tggaaaacct gtccatctac tacatggatg 4980 + acagccatcg ccgcgtgatt gaggaaaacc cgaaactcga ccgcgtggag aactacgagt 5040 + caatgaacat tgattacgtg gtggaagact acgccgccgg ttgtctggtg gaaaaaatca 5100 + aggtcggtga cttctccaca ccggctaagg cgaccgcaga gccgggagcg taaccgatga 5160 + cgagtcccgc acagcgccac atgatgcggg tctcggcagc gatgaccgcg cagcgggaag 5220 + ccgccccgct gcgacatgca actgtctatg agcagatgct ggttaagctc gccgcagacc 5280 + agcgcacact gaaagcgatt tactcaaaag agctgaaggc cgcaaaaaaa cgcgaactgc 5340 + tgccgttctg gttgccgtgg gtgaacggcg tgctggagct gggcaaaggt gcacaggatg 5400 + acattctgat gacggtcatg ctgtggcgtc tggataccgg cgatattgcc ggtgcgctgg 5460 + agattgcccg ttatgccctg aagtacggtc tgaccatgcc gggtaaacac cgccgtaccc 5520 + cgccgtacat gttcaccgag gaggtagcgc ttgcggccat gcgcgctcac gctgccggtg 5580 + agtctgtgga tacccgcctg ctgacggaga cccttgaact gaccgccacg gctgacatgc 5640 + ctgatgaagt gcgcgcaaag ctgcacaaaa tcaccggtct gtttctgcgt gacggtggtg 5700 + atgccgccgg tgcgctggcg cacctgcaac gtgcgacaca gctcgactgt caggcaggcg 5760 + tcaaaaaaga gattgaacga ctggagcggg agctgaaacc gaagccggag ccgcagccca 5820 + aagcggccac ccgcgccccg cgtaagaccc ggagcgtgac accggcaaaa cgtggacgcc 5880 + cgaaaaagaa agccagttaa caaccgaatg cgccccgcgc cagggcggca cgccggtcag 5940 + tgacggtgaa tcacctgaca ctgcaccggc gtccaccgcc cgacttttca gaggtagtca 6000 + tgatgacgct gattattccg cgaaaggagg ctcccgtgtc cggtgagggt acggtggtca 6060 + tcccgcaacc ggcaggcgac gagccggtga ttaaaaacac gttctttttt cccgatatcg 6120 + acccgaagcg cgtccgggaa cgtatgcgcc ttgagcagac cgtcgccccc gcccgtctgc 6180 + gtgaggccat caagtcaggc atggctgaaa cgaatgcgga gctgtacgag taccgcgaac 6240 + agaaaattgc cgccggtttt acgcgtctgg ctgacgtccc ggcggacgat atcgacggtg 6300 + aaagcatcaa ggttttttac tacgagcgcg ccgtgtgtgc gatggcgacc gcgtcgcttt 6360 + atgagcgtta tcgcggtgtg gatgccagtg cgaaaggcga caagaaggct gacagcattg 6420 + acagcaccat tgatgagctg tggcgggata tgcgctgggc ggtggcgcgc atccagggca 6480 + agccgcgctg catcgtgagt caaatctgat gaagaccttt gcgctacagg gcgacacgct 6540 + cgacgccatt tgtgtccgct attacgggcg cactgagggc gtggttgaga ccgtgctcgc 6600 + cgcaaatccg ggactggctg aactgggggc ggtgctgcca cacggcaccg ccgtcgaact 6660 + gcccgacgtt cagaccgcgc ccgtggctga aactgtcaat ctgtgggagt aacgcatgac 6720 + agcagaagaa aaaagcgtcc tgtcgctttt catgattggg gtgctgattg ttgtcggcaa 6780 + ggtgcttgcc ggtggtgaac ctatcacccc gcgtctgttt atcgggcgca tgttgctcgg 6840 + tggttttgtc tcgatggttg ccggtgttgt tctggtgcag tttcctgacc tgtcactgcc 6900 + agcggtgtgc ggcatcggct ccatgctggg tatcgccggt tatcaggtga ttgagattgc 6960 + cattcagcgc cgctttaagg gcagggggaa acagtaatgc cggtaattaa cacgcatcag 7020 + aatatcgccg cctttctcga catgctggcc gtgtccgaag ggacggcgaa tcatccactg 7080 + acgaaaaacc ggggctatga cgtgatagtc accggactgg acgggaagcc ggaaattttc 7140 + accgactaca gtgaccaccc gttcgcacat ggccgaccgg cgaaggtgtt taaccgtcgc 7200 + ggtgaaaaat ccacggcctc cggtcgctat cagcagcttt acctgttctg gccgcattac 7260 + cgcaaacagc ttgccctgcc ggatttcagt ccgttgtcac aggacagact cgccattcag 7320 + ttgatccgcg aacgcggagc actggatgac atccgggcgg gacgcattga gcgcgccatt 7380 + tcacgctgtc gcaatatctg ggcgtccctg ccgggtgccg gttacggtca gcgtgagcat 7440 + tcactggaaa aactggtcac cgtctggcgt accgctggcg gcgtaccggc ttaaacggag 7500 + taaataccat gaagaaatta tccctttcac tgatgctgaa cgtgtcgctg gcgctgatgc 7560 + tggcactgtc cctgatttac ccgcagagcg tggccgtcaa ttttgtcgct gcctgggcga 7620 + ttctggcgac ggttatctgt gtggttgccg gtggtgtggg cgtgtatgcc actgagtatg 7680 + tgctggaacg ctacgggcgg gagctgccgc cggaatcgct ggccgtgaag attgtcacgt 7740 + cgctgttttt gcagccggtg ccgtggcgca gacgggcggc ggctctggta gtggtggtgg 7800 + cgacgtttat ctcgctggtc gctgccgggt ggatttttac cgcgctgatt tatcttgtgg 7860 + tgtcgctgtt tttccggctg atacgtaaag cctgtcgtca gcgtcttgag gggcgggaac 7920 + catgtcaagg ctgatgattg tgctggtcgt gttgttatcg ctggcggtgg ccggtctgtt 7980 + tctggtgaaa cacaaaaatg ccagcctgcg cgcctcgctg gacagggcga acaacgtcgc 8040 + cagcggtcag cagacgacca tcaccatgct gaaaaatcag cttcatgttg cgctcaccag 8100 + ggcagataaa aacgagctgg cgcaggtggc actgcgtcag gaactggaga acgccgcgaa 8160 + acgtgaagca cagcgcgaga aaaccatcac gaggttactt aatgagaacg aagattttcg 8220 + ccgctggtac ggtgctgacc tgcctgatgc tgtgcgccgg ttgcaccagc gccccgcctg 8280 + caccgacgcc agtgattgtc cccaacgcat gcccgaaagt gagcctttgc ccgatgccgg 8340 + gcagtgaccc gcagacgaac ggcgatttaa gtgccgatat ccggcagctt gagaacgcgc 8400 + tggcacgctg tgccagccag gtaaaaatga ttaaacactg tcaggacgaa aacgatgctc 8460 + aaacccgaca gcctgcgcag ggcgctgact gatgccgtca cggtgctgaa aactaacccc 8520 + gatatgctgc ggatattcgt ggataacggg agtattgcct ccacactggc ggcgtcgctg 8580 + tcattcgaaa agcgttacac gctcaatgtg attgtgaccg actttaccgg tgattttgac 8640 + ctgctcattg tgccggtgct ggcgtggctg cgggaaaatc agcccgacat catgaccacc 8700 + gacgaaggcc agaaaaaggg cttcacgttt tatgcagaca tcaacaatga cagcagcttt 8760 + gatatcagta tcagcctgat gctgaccgag cgcacgctgg tcagtgaggt ggacggcgca 8820 + ctgcatgtga agaatatctc ggaacccccg ccgccggagc cggtcacccg cccgatggag 8880 + ctgtatatca atggcgaact ggtgagtaag tgggatgaat gagtttaagc gttttgaaga 8940 + ccggctgacc ggactgattg aatcgctgtc accgtcaggg cgtcggcgac tgagtgccga 9000 + actggcgaaa cgtctgcggc agagtcagca gcgtcgggtg atggcacaga aagccccgga 9060 + cggcacaccc tacgcgccac gccagcagca gagcgtcaga aaaaagaccg gtcgcgttaa 9120 + gcgaaaaatg tttgcgaaac ttattaccag tcgttttttg catatccgtg ccagcccgga 9180 + gcaggcatca atggaatttt acggcgggaa gtcgccgaaa atcgccagtg tgcatcagtt 9240 + tggtctgtcg gaagaaaacc ggaaagacgg taagaaaatt gattatccgg cgcgtcccct 9300 + gctcggcttt accggtgagg atgtgcagat gattgaagag attatcctgg ctcaccttga 9360 + gcgttagttt tatccaggca gaggctgatg cgcaattaaa cattgagcgg ccatgctggt 9420 + cgctcaatgt ttagaggttt atgagtgatt tttatttgat gctttgtatt ctaaaacctt 9480 + cttattggcg taaaagaatt ttgtatatga caggaatata accagacctg aagtgaaata 9540 + gacgagggat agtattaata atgctttttt gtgactgtta ttatctttaa tctcctggct 9600 + taaccattcg gagtcctcct cgtttagctg taagagctta ttgcaggcga tctcaggaag 9660 + tgtgtctttt ataaatacgt tttgcagtct cttgcaatcg gcaaggctat aagttttatt 9720 + aaattcaact gctttatttt tgaaggataa aagaactttg tcactataaa catagtacat 9780 + catgttttta tatggtatgc ctgtggcatc ccttactata acggattgtt cgttgtgtat 9840 + gtaacatgcg aggagaatgt aaaaaatact ggccagaatt acaattattg ttttaattat 9900 + gtgtggtggt tttgttatgt caccccagat acgagtaagg aaaaaatacg atgtttttag 9960 + ttttccatca atcagtccct gctgtatcat tctcacattt tcaatgcctg atacattgat 10020 + tccgttaatt attttaaata gttgaatgtc gcgccactcg cggtcaagtc tttttaattt 10080 + tttgtctgaa tatccaaaat tgaaataatg tgcaataagc ctcataaggt tacttttacc 10140 + aaagctaaaa aatgctaata ctgcaaagct acaaaggaaa aaaacgatta gcccccacac 10200 + attagtcaca ttatagctga ccattacgct ctccttgaat gttgtctggt agttctacaa 10260 + atgaatccag atagcataac ttttatatat tgtgcaatct cacatgcatg aacactctcg 10320 + caaatattca ggaactcgcg cgcgcactgc gcaacatgat tcgcactggc attatcgtcg 10380 + aaaccgacct taacgccggt cgctgccgcg tgcagaccgg cggcatgtgc accgactggc 10440 + ttcagtggct gacccatcgc gcaggacgtt cgcgcacatg gtgggcacct tccgtggggg 10500 + aacaggtgct gattctggcc gtgggtggtg aactcgacac ggcgttcgtt ctgccgggga 10560 + tttattccgg cgataacccc tcgccgtctg tgtcggcgga tgccctgcat atccgtttcc 10620 + ctgacggggc ggtgattgaa tatgaacccg aaaccagtgc actcacggta agcggaatta 10680 + aaacggccag cgtgacggct tccggttctg ttactgccac ggtgccggtg gtcatggtga 10740 + aagcatcaac ccgcgtcacc ctggacaccc cggaggtggt ctgcaccaac aggctgatta 10800 + ccggcacgct ggaagtgcag aaaggcggga cgatgcgcgg caacattgaa cacaccggcg 10860 + gtgaactctc atcaaacggt aaggtactgc atacccataa acaccccggc gacagcggcg 10920 + gcacaaccgg gagtccttta tgacagcgcg ttatctcgga atgaatcgca gtgatggcct 10980 + gactgtcact gaccttgagc atatcagcca gagtatcggc gatatcctgc gcacaccggt 11040 + cggctcacgg gtgatgcgtc gtgattacgg ctcgttgctg gcgtcaatga ttgaccagcc 11100 + gcagaccccg gcgcttgagt tgcagattaa agtcgcctgt tacatggcag tgctgaaatg 11160 + ggaaccccgc gtcaccctgt catccgtcac cacggcgcgc agttttgacg ggcgaatgac 11220 + ggtcacgtta accggccagc acaacgacac cggccagcca ctttcattaa ccatccctgt 11280 + gagttgaaac catgccgatt atcgacctga accagctacc cgcaccggat gtggtcgagg 11340 + agctggactt tgaaagcatt ctcgctgaac gcaaggcgac actgatttcc ctttacccgg 11400 + aagatcagca ggaggcggtc gcccgtaccc tgacactgga atctgagcct ctcgtcaaac 11460 + tgctggaaga aaatgcttat cgtgagctta tctggcgtca gcgtgtgaat gaggccgcac 11520 + gggcggtgat gctggcctgt gccgccggta atgaccttga tgtgattggt gccaattaca 11580 + acaccacgcg cctgactatc accccggcag atgattcgac catcccgccg acaccggcag 11640 + tgatggaatc tgacaccgat tatcgtctgc gtattcagca ggcttttgag ggcttaagcg 11700 + tcgccgggtc agtgggagcc tatcagtatc atggtcgcag tgctgacggg cgtgtcgcgg 11760 + atatttctgt caccagtccg tctccggcct gtgtcaccat ctctgtgctg tcacgtgaaa 11820 + ataacggcgt cgcatccgaa gacctgctgg ctgtggtgcg taacgccctt aatggcgagg 11880 + acgtcaggcc ggtggccgac cgcgtgaccg tgcagtctgc cgccatcgtt gaataccaga 11940 + taaacgccac gctttacctt taccctggtc ccgaaagcga acccatccgc gctgccgctg 12000 + tgaaaaagct ggaagcgtat atcacggcac agcaccggct ggggcgcgac atccgtctgt 12060 + ctgccattta tgccgctttg catgtggaag gtgtgcagcg tgtcgaactg gctgcaccac 12120 + tggccgacat cgtgctcaac agtacgcagg cgtctttctg taccgaatac cgcgtcgtga 12180 + ccggaggctc ggatgagtga ttcgcgactg ctgccgaccg gctcatcacc gcttgaggtc 12240 + gccgccgcaa aagcctgtgc ggaaattgaa aaaacgccgg tcagtattcg tgaactgtgg 12300 + aacccggaca cctgtccggc aaatctgctg ccgtggctgg cgtgggcgtt ttcggtcgac 12360 + aggtgggatg aaaagtggcc ggaagcgaca aaacgcgccg ttatccgcga tgcctatttc 12420 + atccactgtc ataagggcac gataggtgca atccggcgtg tggtggagcc gctcggctat 12480 + ctcatcaacg tgacggagtg gtgggaaaac agtgacccgc ccggcacctt ccggcttgat 12540 + attggtgtac tggaaagcgg tatcacagag gcaatgtatc aggaaatgga acggctgatt 12600 + gctgatgcca aacctgcaag ccgtcacctt attggcctga acattacccg ggacattccc 12660 + ggctatctgt tcgccggtgg tgtggcttac gacggcgatg taattacggt ttaccccgga 12720 + taagtgagga ataatgagca taaaattcag aaccgttatc accactgccg gtgcagcaaa 12780 + gctggcagcg gcaaccgcgc cgggaaggcg gaaggtcggc attaccacga tggccgtcgg 12840 + ggatggcggt ggtaaattgc ctgtcccgga tgccggacag accgggctta tccatgaagt 12900 + ctggcgacat gcgctgaaca aaatcagcca ggacaaacga aacagtaatt atattatcgc 12960 + cgagctggtt attccgccgg aggtgggcgg tttctggatg cgtgagcttg gcctgtacga 13020 + tgatgcggga acgttaattg ccgtggcgaa catggccgaa agctataagc cagcccttgc 13080 + cgaaggctca ggacgttggc agacctgtcg catggtcatc atcgtcagca gtgtggcctc 13140 + agtggagctg accattgaca ccacaacggt gatggcgacg caggattacg ttgatgacaa 13200 + aattgcagag cacgaacagt cacgacgtca cccggacgcc tcgctgacag caaaaggttt 13260 + tactcagtta agcagtgcga ccaacagcac gtctgaaaca ctggccgcaa cgccgaaagc 13320 + ggtaaaggcc gcgtatgacc tggctaacgg gaaatatacc gcacaggacg ccaccacagc 13380 + gcgaaaaggc cttgtccagc ttagtagcgc caccaacagc acgtctgaaa cgctcgccgc 13440 + aacaccaaaa gccgttaaga cggtaatgga tgaaacgaac aaaaaagcgc cattaaacag 13500 + ccctgcactg accggaacgc caacgacgcc aactgcgcga cagggaacga ataatactca 13560 + gatcgcaaac acggctttcg ttatggccgc gattgccgcc cttgtagact cgtcgcctga 13620 + cgcactgaat acgctgaacg agctggcggc ggcgctgggc aatgacccga attttgctac 13680 + caccatgact aatgcgcttg cgggtaagca accgaaagat gctaccctga cggcgctggc 13740 + ggggcttgct actgcggcag acaggtttcc gtattttacg gggaatgatg ttgccagcct 13800 + ggcgaccctg acaaaagtcg ggcgggatat tctggctaaa tcgaccgttg ccgccgttat 13860 + cgaatatctc ggtttacagg aaacggtaaa ccgagccggg aacgccgtgc aaaaaaatgg 13920 + cgataccttg tccggtggac ttacttttga aaacgactca atccttgcct ggattcgaaa 13980 + tactgactgg gcgaagattg gatttaaaaa tgatgccgat ggtgacactg attcatacat 14040 + gtggtttgaa acgggggata acggcaatga atatttcaaa tggagaagcc gccagagtac 14100 + cacaacaaaa gacctgatga cgttgaaatg ggatgcacta aatattcttg ttaatgccgt 14160 + cattaatggc tgttttggag ttggtacgac gaatgcacta ggtggtagct ctattgttct 14220 + tggtgataat gataccggat ttaaacagaa tggagacggt attcttgatg tttatgctaa 14280 + cagtcagcgt gtattccgtt ttcagaatgg agtggctatt gcttttaaaa atattcaggc 14340 + aggtgatagt aaaaagttct cgctatccag ctctaataca tccacgaaga atattacctt 14400 + taatttatgg ggtgcttcca cccgtccagt ggttgcagag ttaggcgatg aggccggatg 14460 + gcatttctat agccagcgaa atacagataa ctcggtaata tttgctgtta acggtcagat 14520 + gcaacccagc aactggggaa attttgattc ccgctatgtg aaagatgttc gcctgggtac 14580 + gcgagttgtt caattgatgg cgcgaggtgg tcgttatgaa aaagccggac acacgattac 14640 + cggattaaga atcattggtg aagtagatgg cgatgatgaa gccatcttca ggccgataca 14700 + aaaatacatc aatggcacat ggtataacgt tgcgcaggtg taagttatgc agcatttaaa 14760 + gaacattaag tcaggtaatc caaaaacaaa agagcaatat cagctaacaa agaattttga 14820 + tgttatctgg ttatggtccg aagacggaaa aaactggtat gaggaagtga agaactttca 14880 + gccagacaca ataaagattg tttacgatga aaataatatt attgtcgcta tcaccagaga 14940 + tgcttcaacg cttaatcctg aaggttttag cgttgttgag gttcctgata ttacctccaa 15000 + ccgacgtgct gacgactcag gtaaatggat gtttaaggat ggtgctgtgg ttaaacggat 15060 + ttatacggca gatgaacagc aacaacaggc agaatcacaa aaggccgcgt tactttccga 15120 + agcggaaaac gttattcagc cactggaacg cgctgtcagg ctgaatatgg cgacggatga 15180 + ggaacgtgca cgactggagt catgggaacg ttacagcgtt ctggtcagcc gtgtggatcc 15240 + tgcaaatcct gaatggccgg aaatgccgca ataagttgta tgacctctgt tgtgaactta 15300 + catatctatg gcacagagta aagcctaatc tgaagtccac tctgtgccaa aagcggacct 15360 + tataaacaag aacaatggtc atatcagtgt gttttgattg catagctaac gtgcgtcttc 15420 + ctgtacagaa tcataagatg atagggcata ggagatgatt attatcgcgt gttttaaaaa 15480 + tagctttctg catcaagtgt cacttgcgaa gaggtattgg cgctatgatt ggcatcactc 15540 + agttcagata atattttaaa tatttggtaa atgttcagat tacacaattc ggtctgcgtc 15600 + ccgttaaaat tatctactat tagttattac tatgaggtga atggcaagtg ttttccactc 15660 + gccatttttg ttttttattt ttttaaagcc tttccgacgt ttaaggattt tgccaagcca 15720 + taaaatattt gatatttcat tcctgttttt atttttggtg agatatttgc gtaacttctt 15780 + tctctaaaac accaacgtat aaacctatta ttatcttcgg ttgtttctat atagcatatt 15840 + acattgagac caaaaagaaa ctgaaggaag tcatttgcag ttgtcatgaa ttttggtttt 15900 + gttgtggaaa tggaactaat atgagtttca agttgtttat atgctaagag gtattcagcg 15960 + taatcaaaag tatcttttcc agagaggaat tcaaagaact ttaaaaaaat ctcataatgt 16020 + tcacttccat aataaaatga taaatgatct tttatttctc caagtaaata gttagagtaa 16080 + tctctttgca tgctaggact ttcaaagtca tctagactaa attgattttt cccatcatca 16140 + ccgctggcgt gtgatttgat aatttcgagc atccgtaata tatctcttgg gcgataatat 16200 + gaccagcgaa ggaaattaat aaatgatgtg gggtggttat aattatcatg gacgttgggt 16260 + gaatcccaag ggaaataatg gtcccatgcc tgtccctttt taagggccat gtcttgctga 16320 + gtcctaagca gatgatctaa tacctcaaat aattgagagc tacggtggtt aacatattct 16380 + gtccgccagt ccaagaatac tgaattatct ctgatttttg cgttttgatt ttgtaatcct 16440 + atggattcaa atatatctgg cctgatcaag agaacggcct tcattctccc ttttcctccc 16500 + tttatacttg ggaagaaatc gttgttaatc tcccagactg cgtgagctaa tccttttata 16560 + cattctagat aatcatcgta tggaattgag gaagggcgga tatcaatacc atcgataaat 16620 + aaaatatgat tttgagataa acgtatttgg ctaaaggcct cttcaaattt tttttgtata 16680 + taaaataaat ttatctgaaa tctgctctca gaaaaagata aagactctct ttcttcacct 16740 + tttaaggttg catgcttatg aagtagttcg gctgcaactt ttgactcttg aacaaaactg 16800 + agggcttgaa ttatttctgg tgaaaatgcc ttaagataat actcatctat tgcatcatta 16860 + agtgatgaga attttgaata atttagtaac tttgaaattt tcccttcttt atctaatact 16920 + tgttttgata ttaataaata tagaataact ttccatatgc cagagaagtc agacaaattt 16980 + aaatgctttt cagatttaag agtgataaat ttttgatatt ctgtctctct tatatattta 17040 + gttgtagcta gcgtattgtt aatattgtta tttgagagat agatagagta tgcggtttta 17100 + ccagtacctt tctctcctac aagaaacgat atatttggtt cacataatct agataggtga 17160 + ttatcacgta tgaacacttt gttaagtaat tctttattct cccttctctt ataattttca 17220 + gcatcagcat agccaagagt tagatctttg attggtatca ttattacctc aactaaagca 17280 + attgaaaaac atatggttat aaaaacatag cgctgctctg tcgcatattg tggatatcaa 17340 + catatgaaat gtaaaggaac tatttgtgga tgaatgaacc gaatcgctgt agcttcggta 17400 + gtcatctttc agacttgtat aaatgaacaa cttccgcttc tcgctcaaag gaaactgtca 17460 + gatttgatag cttttgggct atgtaaactg tcagtcggaa aatgagtgag tacaaatcag 17520 + ggcaggtgag cgaattgccc gccttttctt taccggtggt tgtgctgtcg attagccaac 17580 + cgggacaaat agcctgacat ctccggcgca actgaaaata ccactcaccc attaaccacg 17640 + gagttaaacg gatgagtgac tatcatcacg gcgtgcaggt gctggagatt aacgagggca 17700 + cccgcgtcat ttccaccgta tccacggcca ttgtcggcat ggtctgcacg gccagcgatg 17760 + cagatgcgga aaccttcccc ctcaataaac ctgtgctgat taccaatgtg cagagcgcaa 17820 + tttcaaaggc cggtaaaaaa ggcacgctgg cggcatcgtt gcaggccatc gctgaccagt 17880 + caaaaccggt caccgttgtc atgcgcgtgg aagacggcac cggtgatgac gaggaaacga 17940 + aactcgcgca gaccgtttcc aatatcatcg gcaccaccga tgaaaacggt cagtacaccg 18000 + gactaaaagc catgctggcg gcggagtcgg taaccggtgt taaaccgcgt attctcggcg 18060 + tgccgggact ggataccaaa gaggtggctg ttgcactggc atcagtctgt cagaagctgc 18120 + gtgctttcgg gtatatcagc gcatggggct gtaaaaccat ttccgaggtg aaagcctatc 18180 + gtcagaattt cagccagcgt gagctgatgg tcatctggcc ggatttcctc gcatgggata 18240 + cggtcaccag taccaccgcc accgcgtatg ccaccgcccg tgcgctgggg ctgcgcgcta 18300 + aaatcgacca ggagcagggc tggcataaaa cgctgtccaa tgtcggggtg aacggtgtta 18360 + ccggcatcag cgcatctgta ttctgggatt tgcaggagtc cggcaccgat gctgacctgc 18420 + ttaacgagtc aggcgtcact acgctgattc gccgcgacgg tttccgcttc tggggtaacc 18480 + gtacctgctc tgatgacccg ctgttcctct ttgaaaacta cacccgcacc gcgcaggtcg 18540 + tggccgacac gatggctgag gcgcacatgt gggcggtgga caagcccatc actgcaacgc 18600 + tgattcgcga catcgttgac ggcatcaatg ccaaattccg tgagctgaaa acaaacggct 18660 + atatcgtgga tgcgacctgc tggttcagcg aagaatccaa cgatgcggaa accctcaagg 18720 + ccggaaaact gtatatcgac tacgactata caccggtgcc tcctctcgaa aacctgaccc 18780 + tgcgccagcg tattaccgat aaatacctgg caaatctggt cacctcggtt aacagcaatt 18840 + aaggagcctg accgatggca atgccgcgca aactcaagtt aatgaacgtc tttctgaacg 18900 + gctacagcta tcagggcgtt gcaaagtccg tcacgctgcc aaaactgacc cgtaagctcg 18960 + aaaactatcg cggtgcgggg atgaacggca gcgcaccggt agacctcggc cttgatgacg 19020 + atgcgctgtc aatggagtgg tcgctcggtg gcttcccgga ttcggttatc tgggagcttt 19080 + acgccgcaac cggtgtggat gccgtgccga ttcgttttgc aggctcttac cagcgcgacg 19140 + ataccggcga aacggtggcc gtcgaagtgg tcatgcgtgg acgtcagaaa gaaatcgaca 19200 + ccggcgaggg taaacaggga gaagacactg agtcgaaaat ctccgtggtc tgcacctatt 19260 + tccggctgac gatggacggt aaggagctgg tcgaaattga caccatcaac atgattgaga 19320 + aggtgaacgg cgtcgatcgg ctggagcaac accgccgcaa tatcggcctg tgattttcat 19380 + ccggtcagcc tggctggccg gttaaccctg attcagaagt gagaaaacca tgaacaaaga 19440 + aaatgtcatt accctggaca atccggtcaa acgtggtgag caggttatcg aacaggtcac 19500 + gctgatgaaa cccagtgccg ggacgctacg cggtgtcagt ctggctgcgg ttgcaaactc 19560 + cgaagtcgat gcactgatta aggtgctgcc gcgcatgacg gcaccgatgc tgaccgagca 19620 + ggaagtcgcc gcgctggaac tgcctgacct tgtggcgctg gccggtaagg tggtcggttt 19680 + tttgtcgccg aactcggtgc agtgacgttt ccgaaaaatc tctcggtcga tgacctgatg 19740 + gcggatgtgg cagtgatatt tcactggccg ccatcagaac tgtatcccat gagcctgacc 19800 + gaactcatca catggcgcga aaaggcgctc cggcgaagcg gaaacacgaa tgagtaacaa 19860 + tgtaaaatta caggtattgc tcagggctgt tgaccaggca tcccgcccgt ttaaatccat 19920 + ccgcacagcg agcaagtcgc tgtcggggga tatccgggaa acacaaaaat cactgcgcga 19980 + gctgaacggt cacgcatccc gtattgaggg attccgcaag accagtgcac agctcgccgt 20040 + gactggtcat gcacttgaaa aggcacggca ggaggccgaa gcccttgcca cacagtttaa 20100 + aaacaccgaa cgtccgaccc gtgctcaggc gaaagtcctg gaatccgcaa agcgtgcggc 20160 + ggaggactta caggcgaaat ataaccgcct gacagattcc gttaaacgcc agcagcggga 20220 + actggccgct gtgggaatta atacccgcaa tcttgcacat gatgagcagg gactgaaaaa 20280 + ccgtatcagt gaaaccaccg cacagcttaa ccgtcagcgt gatgcgctgg tgcgtgtcag 20340 + tgcgcaacag gcaaaactta acgcagtaaa acagcgttat caggccggaa aggaactggc 20400 + cggaaatatg gcctcagtgg gcgctgccgg tgtggggatt gcggcggcgg gaacgatggc 20460 + cggtgttaag ctactgatgc ccggttatga gtttgcgcag aaaaactcag aattacaggc 20520 + tgtgatcgga gtggcaaaag actccgccga aatggccgca ctccgcaagc aggcgcgcca 20580 + gctcggcgac aataccgccg cctcggcaga tgatgcagcc ggtgcgcaga ttattattgc 20640 + gaaagccggt ggggatgttg atgccattca ggcggcaacg ccggtcacgc tgaacatggc 20700 + gctggcgaac cgtcgcacaa tggaagaaaa cgccgccctg ctgatgggga tgaaatccgc 20760 + ctttcagctt tcaaacgata aggtcgctca tatcggggat gttctctcca tgacgatgaa 20820 + caaaaccgcc gccgattttg acggcatgag cgatgcgctg acctatgccg cacctgtggc 20880 + aaaaaatgcc ggtgtcagca ttgaagaaac cgccgcaatg gtcggggcgc tgcatgatgc 20940 + aaaaatcaca ggctcaatgg cggggacggg aagccgtgcc gtgttaagcc gcctgcaggc 21000 + accgacggga aaagcatggg atgcactcaa agagcttgga gtgaaaacct cagacagcaa 21060 + aggaaacacc cggccaatat ttaccattct gaaagaaatg caggccagtt ttgagaaaaa 21120 + ccggctcggt actgcccagc aggctgaata catgaaaact attttcgggg aggaggccag 21180 + ctcagccgct gccgtgctga tgactgccgc ctcaaccgga aagctggaca aactgaccgc 21240 + tgcgtttaaa gcctcagacg ggaagaccgc cgagctggta aatatcatgc aggacaacct 21300 + aggcggtgac tttaaagcgt ttcagtccgc ttatgaggcg gtggggactg acctgtttga 21360 + ccagcaggaa ggcgcgctgc gtaagctcac gcagacggcc acaaagtatg tgttaaaact 21420 + cgacggctgg atacagaaaa acaaatcact ggcgtcaacc atcggcatca ttgccggcgg 21480 + tgcactggcg cttactggca tcatcggtgc cattggcctc gtagcctggc cggttatcac 21540 + cggcatcaat gccatcatcg cggcagcagg cgcaatgggg gcagtcttca cgacggttgg 21600 + cagtgctgtt atgaccgcca tcggggctat tagctggccg gttgtggccg tggtggctgc 21660 + cattgtcgcc ggtgcgttgc ttatccgtaa atactgggag cctgtcagcg cattctttgg 21720 + tggtgtggtt gaagggctga aagcggcatt tgcgccggtg ggggaactgt tcacgccact 21780 + taaaccggtt tttgactggc tgggcgaaaa gttacaggcc gcgtggcagt ggtttaaaaa 21840 + cctgattgcc ccggtcaaag ccacccagga caccctgaac cgttgccgtg acacgggcgt 21900 + catgttcggg caggcactgg ctgacgcgtt gatgctgccg cttaatgcgt tcaacaaact 21960 + gcgcagtggt attgactggg tactggaaaa actcggtgtt atcaacaaag agtcagacac 22020 + acttgaccag accgccgcca gaactcatac cgccacgtat ggtaccggtg actatattcc 22080 + ggcgaccagc tcttatgcag gctatcaggc ttatcagccg gtcacggcac cggctggccg 22140 + ctcttatgta gaccagagta aaaacgaata tcacatcagc ctgacggggg ggactgcgcc 22200 + ggggacacag cttgaccgcc agttacagga tgcgctcgaa aaatacgagc gggataaacg 22260 + tgcgcgcgcc cgtgccagca tgatgcatga cggttaagga ggtgacgaaa aatgatgctc 22320 + gcgttaggta tgtttgtttt tatgcgccag acgctgccac accagaccat gcagcgtgaa 22380 + tcagattatc gctggccgtc aaattcccgt atcggtaaac gggatgcctt tcagtttctc 22440 + ggtgtgggtg aggaaaacat cacgctggcc ggtgtgcttt atcccgaact gaccggcggc 22500 + aagctgacga tgaccacgct caggctgatg gcagaggagg ggcgggcgtg gccgttgctg 22560 + gatggcaccg gcatgattta cggcatgtat gtcatcagca gggtgagtga aacagggagt 22620 + attttctttg cagacggcac accccggaaa attgatttta cgctgtcact cacccgcgtt 22680 + gatgaatcac tggccgcgct ttatggcgat atcggtaaac aggcggaatc gctcatcggt 22740 + aaggccggca gtatggcgac cagattcaca ggtatgacgg gggcgggata atgctggatg 22800 + cgctgacatt tgatgcaggc agtacgctga cgccggatta catgctgatg ctcgacagca 22860 + gggatattac cggcaatatc agcgaccgtc tgatgagcat gaccctgacg gataaccggg 22920 + gctttgaggc tgaccagctt gatattgaac tgaacgatgc cgacgggcag gtcgggctgc 22980 + cggttcgtgg cgctgtcctg acggtgtata tcggctggaa aggttttgcc ctggtatgca 23040 + aagggaaatt taccgttgat gaggttgaac accggggcgc accggatgta gtcaccatcc 23100 + gcgcccggag tgcagatttt cgcgggacgc tcaattcccg ccgggaaggc tcctggcatg 23160 + acaccacgct cggtgcgatt gttaaggcga tagccacccg taacaggctg gaagccagtg 23220 + tcgctccgtc actggccgga ataaaaattc cacacatcga ccagtcgcag gagtctgatg 23280 + cgaaattcct gacccgtctt gcagaacgca acggcggtga ggtgtcggta aaaatgggaa 23340 + aactgttgtt tctcaaagcg gggcagggag tgacggccag cggtaaaaaa atcccgcagg 23400 + tcaccataac ccgcagcgac ggcgaccgcc atcattttgc gattgctgac cgtggagcct 23460 + acaccggtgt aacggcaaaa tggctacaca ctaaagaccc gaagccgcaa aagcagaagg 23520 + taaaactgaa acgcaaaaag aaagagaaac acctgcgcgc actggagcac ccgaaagcga 23580 + aaccggtcag gcagaagaaa gcgcctaaag taccggaagc gcgtgaaggt gaatacatgg 23640 + ccggtgaggc tgacaacgtt tttgccctga ccacggtata tgccacgaaa gcgcaggcca 23700 + tgcgcgccgc tcaggcgaag tgggataaac tgcaacgggg cgttgcggag ttctctatca 23760 + gcctggctac cggtcgggca gatatttaca cggaaacacc ggtcaaagtg tctggcttta 23820 + agcgcgtcat agacgagcag gactggacaa tcactaaggt gacacatttt ctgaataata 23880 + gcggcttcac gacgtcctta gagcttgagg tcaggctttc tgatgtggag tacgaaacag 23940 + aagatgatga gtgatgtttt tgttttatct gtttgttttg taaggataaa ttaactaaaa 24000 + tggcaccatc aacaaaaccg gaagaggtgc tcgcgatgtt tcattgtcct ttatgccagc 24060 + atgccgcaca tgcgcgtaca agtcgctata tcactgacac gacaaaagag cgttatcatc 24120 + agtgccagaa cgtgaattgc agcgccacgt tcatcactta tgagtcggta cagcgataca 24180 + tcgtgaagcc gggagaagtc cacgccgtaa ggccgcaccc gttgccatca gggcagcaaa 24240 + ttatgtggat gtaattacaa acagaaagcc cctcagtcga ggggcttttt tgtcgatgtg 24300 + gtcaatgtgt ggacgtgacc agaaataaat ccttttattt caatttattg tacgtaaaaa 24360 + ataagcccgt gtaagggaga tttagggtgt caccagtagg ggctttcaac ggtacaatgc 24420 + gggtttgagc ggcataaatt accactgaaa gcccttaaac gttactctac tgtggacact 24480 + gtgtggacac tctcggcctc agtaccacct cttagcggat taagagaaat ggcgtcctga 24540 + aggtactctg gcgcaaaatg agcgtaaacc atagtttgct caatccgcgt gtgacctagt 24600 + atccgttgta gcgtgataat acttcctcca ttaatcatga aatgagtggc aaagctgtgc 24660 + cttagtgcat gtgtggcttg ccccattggc aaatccggtt ttattgcttt cattgttcgt 24720 + ctgaagcgag ggtaatcagc atcagggaat aaaaaacctc gtttgttatc cgcgatcatt 24780 + ttggcaacag cctctgagat cgggacggtg cgtggtttgt ttgttttcgt tttaacaaac 24840 + gtgacgcggt tatggatgat attttctgct ttcaaacgag ctgcttctcc ccaacgtgct 24900 + cctgtactca ggcaaagaat cgcaatcttt ttattgtcgc cgtcaagtgc tgcaagcagt 24960 + aaggcaattt cttcctgtgt tagatagcct gtttctggtt tttcctcctt aagccttttt 25020 + gtccctctga tagggtgctc accaaagaat aactccgctt caatcagggc tgtaaacatg 25080 + ccgctaatac atgttaaatc acgattgata ctcgaaggtt taataccctg acttcttcgg 25140 + gtggcgcagt actggctgat aagcgatttc gtaatttgaa atgcgcatgg gtcattcgtt 25200 + atttttgtga agatttcaat ttttccaaga ttagatttcc catgctcttc gtgtttaccc 25260 + tttaaatccc accagatctg tgtcagctcc gacagacgtc gcttgtctgt tggttttgat 25320 + agccattctt tattgtggtg gttgtacaac gtgtatttct cgaaagcgac agcttcgctt 25380 + ttcttatcaa acttcctacg gatgcgtttt ccattacgtc cagtagggcg gatgtccact 25440 + tcatatcgac catcatcgag ttttttgatt gccatcagaa aaccctccga gtggtgtgtt 25500 + tttttgcgac tactaatcgc ttttttcgtg gtggctgaaa tttagccacc aatagtaggc 25560 + acttgtgatg aatatattca cgatgaattg ttaaccagtc ttttgaccgg agtggggcga 25620 + cgttgtttcg ttttgcccaa agtgtgcgag agcgggcgca atttgcccgg actcaggagc 25680 + gatctgattg gtcatgaacc ataaagtgta tttggtgaat tgtggggtct gcaggatgtt 25740 + catcatgaca tctgttggag gtgttgaacg accactttca tagtaactca gcgtgccata 25800 + cggaacccct gttaaatcag caagttgttg tctgctcaaa tactctgatt ttcgcattaa 25860 + gactatcttc tcgcttatcg tgtttgacat ggtgtttaga tctcaatagt atttagttta 25920 + gatgtagatt gtttagtgct tggatgtggg cactaaaagg cattataaga cattaaacgc 25980 + aattcatgag ggctagagga cgacatgagc aagcaagtaa cactcatgac tgatgcgatt 26040 + ccttatcagg agttcgcaaa actaatagga aaatcgacag gagcggttcg tcggatgatc 26100 + gataaaggaa agctgcctgt aattgatatg accgatccac aatcagcttc aggtcgtgca 26160 + ggtgaatatt gggtatacct tccggcatgg aataacggac taaaactggc ttatgaaagc 26220 + cgccctaaag agattcgtga cggctggttg atgtggttag gtctcggtga accacgttaa 26280 + ggagaaccgt atgaatgagc ctcgttgtat tgctcagtta ctgcgtaacg aaagccccag 26340 + ggcgattgac ttcaccatca cccacggtaa ggggcgtaag ggaatcatta tccgcaccaa 26400 + aaaacagagt ccgttaaaaa aggctctgac ctttctgaaa agccggaggg tatggaaatg 26460 + acagtgatga cgctcaatct cgttgaaaaa cagccagcag ctatgcgccg gataattggt 26520 + aagcatcttg ccgttcctcg ctggcaggat acatgtgatt attataatca gatgatggag 26580 + cgcgaacggt taacggtttg cttccatgct cagttaaaac agcgtcacgc aacgatgtgt 26640 + tttgaagaaa tgaacgacgt cgaacgtgaa cgactggtat gtgcaattga tgaattgcgt 26700 + ggtgcattct caaaacgccg tcaggttggc gcaagtgagt atgcatatat tagtttttta 26760 + acagtcagtc agcgtcgtac tttatttatg catgccggat tgactgaaaa agaattcaac 26820 + cagccatact ggcgaattaa tgaagagtca tgttactggc gtgatgcttt attccgtgca 26880 + ttacgtgaat tattcagtct gtttgagtat gcaccgacaa ttctgacgtc ggtaaaaccg 26940 + gagcaatatc tgcattaagt aattaaccag agtttttaac gcacttaatt gtgcggggct 27000 + tctttttgcc tggagaaagt tatgcataca gtttctgaaa atcagtgcgg tatatacgca 27060 + ttactgctgc aacaggccag aaccgaagca caggccgacg ctgcgacgcg cttttcttct 27120 + catcttgatg ccatgattcg ccacatcaca aaggcggagt tatcccgcgt ggagatagtc 27180 + gagctgctca gtcaggagtc ggaaaaattt cacaatatcg gattgtctcg cggggaggtg 27240 + ctttgatgtt ctgttctcgt gcagttgtat tactgaataa cgccttaaaa atcgccgtta 27300 + tgaaaaatgg cgatttgtct cttattcaac ttggtcttga taaagaaaaa cgcgaaataa 27360 + ctgaatctgt tatcgcgatt tatcagagtg aattaaacct cctgtctgat gtggtcaatt 27420 + tacttgttaa acgcgctgta tttcacaagc aaatttcctc cgtggatgaa ctgacgaaat 27480 + taacgacaga aatcgccagc tattgcgctg atgaatttaa aaaactgaac gacaaaagga 27540 + actggtaatg ccggacaacg tagattttat tcaggaacaa caggctgaat tactggagcg 27600 + ccagattaac gcggcaaggg taaaacattg cggtgcttct gcgctggttt gcgaagagtg 27660 + tgacgcgcca atacctgctg cccgtcgtgc ggcttacccg tcagccacgc gttgtgtttc 27720 + ctgtcagtca gtctttgaag caaaaaacaa acattaccgg agaacggcat gagtattcgt 27780 + attgaaattg gcgaacgtta tgtcgttacc agtgacagct ttcagtttat tctccacgag 27840 + aaaaagagag cggaaagcgg taaaaacgcc ggtcaggaat ggctggcggt ggttggttat 27900 + tacccgaaat taagccagct cgtttcaggc ctgatgcatc acgatattct gaccggaagc 27960 + gcaaagtctt ttgctgattt aaacgtgcag gttgagcaac tcagcaagcg ttgttcagag 28020 + gcttttggct catatggccg ttaaagcctc cgggcgtttt gtccctccgt cagcatttgc 28080 + cgcaggcacc ggtaagatgt ttaccggtgc ttatgcatgg aacgcgccac gcgaggccgt 28140 + cgggcgcgaa agacccctta cacgtgacga gatgcgtcag atgcaaggtg ttttatccac 28200 + gattaaccgc ctgccttact ttttgcgctc gctgtttact tcacgctatg actacatccg 28260 + gcgcaataaa agcccggtgc acgggtttta tttcctcaca tccacttttc agcgtcgttt 28320 + atggccgcgc attgagcgtg tgaatcagcg ccatgaaatg aacaccgacg cgtcgttgct 28380 + gtttctggca gagcgtgacc actatgcgcg cctgccggga atgaatgaca aggagctgaa 28440 + aaagtttgcc gcccgtatct catcgcagct tttcatgatg tatgaggaac tcagcgatgc 28500 + ctgggtggat gcacatggcg aaaaagaatc gctgtttacg gatgaggcgc aggctcacct 28560 + ctatggtcat gttgctggcg ctgcacgtgc tttcaatatt tccccgcttt actggaaaaa 28620 + ataccgtaaa ggacagatga ccacgaggca ggcatattct gccattgccc gtctgtttaa 28680 + cgatgagtgg tggactcatc agctcaaagg ccagcgtatg cgctggcatg agacgttact 28740 + gattgctgtc ggggaggtga ataaagaccg ttctccttat gccagtaaac atgccattcg 28800 + tgatgtgcgt gcacgccgcc aagcaaatct ggaatttctt aaatcgtgtg accttgaaaa 28860 + cagggaaacc ggcgagcgca tcgaccttat cagtaaggtg atgggcagta tttctaatcc 28920 + tgaaattcgc cggatggagc tgatgaacac cattgccggt attgagcgtt acgccgccgc 28980 + agagggtgat gtggggatgt ttatcacgct taccgcgcct tcaaagtatc acccgacacg 29040 + tcaggtcgga aaaggcgaaa gtaaaaccgt ccagctaaat cacggctgga acgatgaggc 29100 + atttaatcca aaggatgcgc agcgttatct ctgccatatc tggagcctga tgcgcacggc 29160 + attcaaagat aatgatttac aggtctacgg tttgcgtgtc gtcgagccac accacgacgg 29220 + aacgccgcac tggcatatga tgcttttttg taatccacgc cagcgtaacc agattatcga 29280 + aatcatgcgt cgctatgcgc tcaaagagga tggcgacgaa agaggagccg cgcgaaaccg 29340 + ttttcaggca aaacacctta accagggcgg tgctgcgggg tatatcgcga aatacatctc 29400 + aaaaaacatc gatggctatg cactggatgg tcagctcgat aacgataccg gcagaccgct 29460 + gaaagacact gctgcggctg ttaccgcatg ggcgtcaacg tggcgcatcc cacaatttaa 29520 + aacggttggt ctgccgacaa tgggggctta ccgtgaacta cgcaaattgc ctcgcggcgt 29580 + cagcattgct gatgagtttg acgagcgcgt cgaggctgca cgcgccgccg cagacagtgg 29640 + tgattttgcg ttgtatatca gcgcgcaggg tggggcaaat gtcccgcgcg attgtcagac 29700 + tgtcagggtc gcccgtagtc cgtcggatga ggttaacgag tacgaggaag aagtcgagag 29760 + agtggtcggc atttacgcgc cgcatctcgg cgcgcgtcat attcatatca ccagaacgac 29820 + ggactggcgc attgtgccga aagttccggt cgttgagcct ctgactttaa aaagcggcat 29880 + cgccgcgcct cggagtcctg tcaataactg tggaaagctc accggtggtg atacttcgtt 29940 + accggctccc acaccttctg agcacgccgc agcagtgctt aatctggttg atgacggtgt 30000 + tattgaatgg aatgaaccgg aggtcgtgag ggcgctcagg ggcgcattaa aatacgacat 30060 + gagaacgcca aaccgtcagc aaagaaacgg aagcccgtta aaaccgcatg aaattgcacc 30120 + atctgccaga ctgaccaggt ctgaacgatt gcagatcacc cgtatccgcg ttgaccttgc 30180 + tcagaacggt atcaggcctc agcgatggga acttgaggcg ctggcgcgtg gagcaaccgt 30240 + aaattatgac gggaaaaaat tcacgtatcc ggtcgctgat gagtggccgg gattctcaac 30300 + agtaatggag tggacatgat ggcaaaaatt cacgaggtaa agctgcacgc aaaatatttc 30360 + gaccttgtac tggaaggaaa gaaacgcgca gagtttcgga aaaaagatcg taattatgag 30420 + cgcggggaca cgttgatttt gcatgaatgg gtgcagggtg tgtttacggg gcgaaaggtt 30480 + gaagcccgga taacagatgt tactgacctg tcagactggc tggaagatta tgtcttgctg 30540 + cacagaatac taggtgagat actgccgctg actgtcaagc tggcagtatc ctccacattt 30600 + tttataaatc taaggcgaag aacggtggca atatatttgc tttaaattgt aaataagcaa 30660 + attattctaa gccacaaatg atatcaattg agtatcgatt ttcgttcgaa tataaccata 30720 + acgccaagcg tcaaatgtaa gtcatctata tgtgattcgt attcatattg gtcagcatca 30780 + ggagatagta aatgctctgc tgctgtaaaa acatcaattg taacagatat atcgtctgga 30840 + atttcttcat ttaattcgga tatgtatttt ttatatttgt tttttaattt ccttatcatg 30900 + tcttccttat ggtggattgt agtgcagtaa ttttttttag ttgaatcatt gtatgaatgg 30960 + aatgaacagt ttaatgctag gccaagactt gaatttcctg tagggcctgt gtgtttaaag 31020 + tattcaagat ttcttcttat gtcagaaaat aaaagacttt tacagggggc atttccttta 31080 + acttctattg cacatattgg aatgtcgaaa aatggtctgc tgtccaatat ggcaatatca 31140 + attctgcctg atcttgttgt gtttgtgttt tttctgacag ttttttttga gaatattttt 31200 + tgggggtcag accgtttcga taaaggaact gttgcattaa tgaatttatt tgtatggtac 31260 + tcaaatataa ctttgtaatc accatggcga aaagatttta tttctaacaa cgatagacct 31320 + atagatacgg tagctacata ttcagtgttt atttttgcac cagacctgaa atccattaaa 31380 + taagttgcgt cggctgactt tttcattcca tcttttacag ctttcacaat atccatgtta 31440 + ttcatatcaa caccttttat attccagaat tataaatctt aatgattgat ttgtttgtgt 31500 + gtttaggtta ctagattgac gtacttatag cacattctga ttttgaaatc accatccttg 31560 + ggtaaagcac agcctatcac tattggttta gtactgtgct gtaatagtat cagattaagt 31620 + taaatccatt ttatgaaatc ttccatttca tcatattttt ttattactgc tctaacatct 31680 + ttgctttcat cacataaaca atctaaaaga ctatcccatt cagtttgttt tttaccaaat 31740 + ccataaacag cctctatatc accggatttc catatataga ttccgttatc tttcaatttt 31800 + tgatgtattt catgtatatg cttttgtgtt ttttcatggt tacatatttt gatgaagtct 31860 + ttgcttgaaa tgcttttgaa tgactcaaaa gtagtaactt ttgtatttaa actaagctct 31920 + cctgagttga ttgattcaat caaagcagtc aatagattat cacattcagt actaagtaag 31980 + tctttatgct ctgttaatag aatatttgat aagaaatcac aatcagctag aatccttgtt 32040 + tttatgccga tggcattgat gatttgtgac atcttaaata aactaccctt accgtcaacg 32100 + gcaacaatgc agattttact cgggttgagt tcatgtccgt taattttttt ataaagtgca 32160 + tatagaacgt ttgtctctgt tttcccttca acaagcaaaa cttcttcaga aaataaaagg 32220 + tatgatgaat tagaaagcgt gaatgctgag tgcaattgcg gtgatgaaga tttatataat 32280 + tcttcgattt tttcagatat agtcttcctt gctatggttc cattagaatc cttacaaacc 32340 + tgaatcgcat ttgctgcatg ctttgcagaa agcatactgg ctgagtgagt tgatattata 32400 + acctgatacc ctgattcact taatgtgaca agtgattctc tgacagaatt aatggctgaa 32460 + gggtgtaaat ataactcagg ttcatcaatg aaaatcaaag tgtttgattt ttttgattcg 32520 + ctgttttctt tttttatttc ggccaggtat tgaattaatg ccatttgaat ggaacgttgt 32580 + gttccgtgac caaatcggct gatatctctc attaccggtt catcttcccg agactcaaaa 32640 + actttcagag tgccggattt aaatatctca tctaatgtcg gtgtgggaaa gtgtaacttt 32700 + acacttacgt caggaaaaaa ttggtttact tttttattta cacctgagtc tattttatta 32760 + aggctttcta atctgttctc accgttgtga gaaagatatt tacctatttc tgatatgttt 32820 + tttgaaaatt tttcttcgtg ttcttgtttt atttcagaaa caattgcgga aagtatcttt 32880 + cctattgtgg tcgtgttttt gcattttgtt gagtcttcga cagcgtcaga cattgcaggg 32940 + atatgaattg gttccggaaa tatattggag attgcaccat ctatgccgcc agggtttttc 33000 + ttccacgtgg taccgtcata tacatccaga ctttttttgg cttttcctgt ttccttatta 33060 + aattcctgtc ttcttgcaaa ggtaagagtc ccgtcaatta taaacggagc tattttttgt 33120 + tgattctctt ctgttaacaa agacagagta tcatctgtta taccttgaat aacgccttca 33180 + acggatacgg ggtgtgtagg atcgtacaca tctgattctg aaatcaaaga gccatctaac 33240 + agccacttaa ttgctaagat aatatttgat tttcctgcgt tattataacc aactaaagca 33300 + gtgaaggggc gcaaaatagc cgatgttgac ttacaagaac gaaagttgct aattgaaact 33360 + gaagcaagac gtacagtcat tatttttcct taaatgtgct atttgtatgc aatgagttca 33420 + tacgaaacgc ttttttacat tttatagtcg ttgcattcaa gggtgcatga gattgcatta 33480 + agggaaactg tgatatggct tggcttttga ctggaaatac tgatggctca ttagttttat 33540 + taaggtgcat taaaaccgcc ccgtgaagcg ggcgggcgag gcggggaaag cac 33593 +// diff --git a/etc/af063097.fasta b/etc/af063097.fasta new file mode 100644 index 000000000..8ed33789e --- /dev/null +++ b/etc/af063097.fasta @@ -0,0 +1,561 @@ +>AF063097 AF063097 Bacteriophage P2, complete genome. +ggcgaggcggggaaagcactgcgcgctgacggtggtgctgattgtattttttcagcgtct +cagcgcgtcgtgacggcacttagtctgcccgttgaggcgttgtgtgtctgcggggtgttt +tgtgcggtggtgagcgtgtgaggggggatgacggggtgtaaaaaagccgcccgcaggcgg +cgatgttcagtcgttgtcagtgtccagtgagtagtttttaaagcggatgacctcctgacc +gagccagccgtttatctcgcggatcctgtcctgtaacgggataagctcattgcggacaaa +gacctttgccactttctcaatatcacccagcgacccgacgttctccggcttgccacccat +caactgaaaggggatgcggtgcgcgtccagcaggtcagcggcgctggcttttttgatatt +aaaaaaatcgtccttcgtcgccacttcactgagggggataattttaatgccgtcggcttt +cccctgtggggcatagagaaacaggtttttaaagttgttgcggcctttcgacttgaccat +gttttcgcgaagcatttcgatatcgttgcgatcctgcacggcatcggtgacatacatgat +gtatccggcatgtgcgccattttcgtaatacttgcggcggaacaacgtggccgactcatt +cagccaggcagagttaagggcgctgagatattccggcaggccgtacagctcctgattaat +atccggctccagcaggtgaaacacggagccgggcgcgaaggctgtcggctcgttgaagga +cggcacccaccagtaaacatcctcttccacgccacggcgggtatattttgccggtgaggt +ttccagtctgatgaccttaccggtggtgctgtaacgcttttccagaaacgcattaccgaa +caccagaaaatccagcacaaagcggctgaaatcctgctgggaaagccatggatgcgggat +aaatgtcgaggccagaatattgcgtttgacgtaaatcggcgagctgtgatgcacggcagc +ccgcaggctttttgccagaccggtaaagctgaccggtggctcataccatctgccgttact +gatgcactcgacgtaatccagaatgtcacggcggtcgagtaccggcaccggctcaccaaa +ggtgaatgcctccattttcgggccgctggcggtcattgtttttgccgcaggttgcggtgt +tttcccttttttcttgctcatcagtaaaactccagaatggtggatgtcagcggggtgctg +ataccggcggtgagtggctcatttaacagggcgtgcatggtcgcccaggcgaggtcggcg +tggctggcttcctcgctgcggctggcctcataggtggcgctgcgtccgctgctggtcatg +gtcttgcggatagccataaacgagctggtgatgtcggtggcgctgacgtcgtattccaga +cagccacggcggataacgtcttttgccttgagcaccattgcggttttcatttccggcgtg +tagcggatatcacgcgcggcgggatagaacgagcgcacgagctggaacacgccgacaccg +aggccggtggcatcaataccgatgtattcgacgttgtatttttcggtgagtttgcggatg +gattccgcctgggtggcaaagtccatgcctttccactggtgacgctcaagtattctgaat +ttgccaccggccaccaccggcggtgccagtaccacgcatccggcgctgtcgccacggtgt +gacgggtcgtaaccaatccataccgggcgggagccgaacggattggcggcaaacggcgca +tagtcttcccattcttccagcgtgtcgaccatgcagcgttgcagctcctcgaacgggaac +accgatgccttgtcgtcaacaaattcacacatgaacaggtttttaaaatcgtcggcgctg +ttttcgcgtttgagctgctcaatgtcgaacagcgtgcagccgcctttcagggcgtcctca +atggtgacaatctgtcgccactggccgtccgcacagagaagcccaccggcaagggcgtta +tgactgacgtcgatttccacgcgttcggcggcgctggcgcgtccccggttaaacagttca +cccgaccagaacgggtaggcgtcgtgcgccagcgtggacggggtggagaaataggtcgag +cgcaggtgactctgtgaggccatacctgatgccaccttacgcagtacctgaaaattcggg +atccagaaaatctcatcgacgtacaggtcgccgttatgactctgcgcggtgttggagttg +gtgccgagaaaaatcagttttgcgccgttattgcccaggacaatcgggtcaccggtcagg +tcaacgtcaaccagacgggcaaaggcgatgatgtattcgcggaacacatacgcctgtgtt +ttactggccgacagaaaaatctggttatgaccggttttcagggcacgcagcagcgcctcg +cgggaaaaataaaacgtcgcgccaatctggcgggatttcaggatatcgcggatgcggtgc +tcaagcccggcacgataccagtgcagctgatagtcgaaagactgctcaaagaaaatctgc +tccagcttttcgatggcctcgtcactgaaaaaattctttttcggtttgcgccgtccgcct +ttgttacggttagcgacgttcggattaaggtctgcctcgttgccggtctggctgtagcgg +ttgacccgtgccagtcgttcaatctggcgtcccagcaggtcaatttccttgaagtcaccg +ccggttttctgtggtttgatgatgagctgggtcagccgcgcttccagactcatttcgaca +cggctgatgggggcaacgctgtcccagccgtcgcgctgtttccagctctgcactgtcggg +cgtttcatctgcaacatggcggcaatctgcggcacggaaaacccctgccagtacagcagc +gccgcctgacgacgcgggtcgtgtaaaagagtggtgtctgtggtgatggtcatgaatacc +tcgccgtgatgaatacacggcaaggctactgagtcgcgccccgcgattcgctaaggtgct +gttgtgtcagtgataagccatccgggactgatggcggaggatgcgcatcgtcgggaaact +gatgccgacatgtgactcctctaatcactattcaggactcctgacaatggcaaaaaaagt +ctcaaaattctttcgtatcggcgttgagggtgacacctgtgacgggcgtgtcatcagtgc +gcaggatattcaggaaatggccgaaacctttgacccgcgtgtctatggttgccgcattaa +cctggaacatctgcgcggcatcctgcctgacggtatttttaagcgttatggcgatgtggc +cgaactgaaggccgaaaagattgacgatgattcggcgctgaaaggcaaatgggcgctgtt +tgcgaaaatcaccccgaccgatgaccttatcgcgatgaacaaggccgcgcagaaggtcta +cacctcaatggaaattcagccgaactttgccaacaccggcaaatgttatctggtgggtct +ggccgtcaccgatgacccggcaagcctcggcacggaatacctggaattctgccgcacggc +aaaacacaaccccctgaaccgcttcaaattaagccctgaaaacctgatttcagtggcaac +gcctgttgagctggaatttgaagacctgcctgaaaccgtgttcaccgccctgaccgaaaa +ggtgaagtccatttttggccgcaaacaggccagcgatgatgcccgtctgaatgacgtgca +tgaagcggtgaccgctgttgctgaacatgtgcaggaaaaactgagcgccactgagcagcg +cctcgctgagatggaaaccgccttttctgcacttaagcaggaggtgactgacagggcgga +tgaaaccagccaggcattcacccgcctgaaaaacagtctcgaccacaccgaaagtctgac +ccagcagcgccgcagcaaagccaccggcggtggcggtgacgccctgatgacgaactgctg +accggcgtcagtcagtccgggaaaaccttcacgattaacccttaatttcaggaaaaacta +tgcgccaggaaacccgctttaaatttaatgcctacctgtcccgtgttgccgaactgaacg +gcatcgacgccggtgatgtgtcgaaaaaattcaccgttgaaccgtcggtcacccagaccc +tgatgaacaccatgcaggagtcctctgactttctgacccgcatcaatattgtgccggtca +gcgaaatgaaaggggaaaaaattggtatcggtgtcaccggctccatcgccagcactaccg +acactgccggtggtaccgagcgtcagccgaaggacttctcgaagctggcgtcaaacaagt +acgaatgcgaccagattaacttcgatttttatatccgctacaaaacgctggacctgtggg +cgcgttatcaggatttccagctccgtatccgtaacgccattatcaaacgccagtcccttg +atttcatcatggccggttttaacggcgtgaagcgtgccgaaacctctgaccgcagcagca +atccgatgttgcaggatgtggcggtcggctggctgcagaaataccgcaatgaagcaccgg +cgcgcgtgatgagcaaggtcactgacgaggaaggccgcaccacctctgaggttatccgcg +tgggtaagggcggtgattatgccagccttgatgcactggtgatggatgcgaccaacaacc +tgattgaaccgtggtatcaggaagaccctgaccttgtggtgattgtggggcgtcagctac +tggcggacaagtatttccccatcgtcaacaaggagcaggacaacagcgaaatgctggccg +ctgacgtcatcatcagccagaaacgcatcggtaacctaccagcggtacgcgtcccgtact +tcccggcggatgcgatgctcatcacgaagctggaaaacctgtccatctactacatggatg +acagccatcgccgcgtgattgaggaaaacccgaaactcgaccgcgtggagaactacgagt +caatgaacattgattacgtggtggaagactacgccgccggttgtctggtggaaaaaatca +aggtcggtgacttctccacaccggctaaggcgaccgcagagccgggagcgtaaccgatga +cgagtcccgcacagcgccacatgatgcgggtctcggcagcgatgaccgcgcagcgggaag +ccgccccgctgcgacatgcaactgtctatgagcagatgctggttaagctcgccgcagacc +agcgcacactgaaagcgatttactcaaaagagctgaaggccgcaaaaaaacgcgaactgc +tgccgttctggttgccgtgggtgaacggcgtgctggagctgggcaaaggtgcacaggatg +acattctgatgacggtcatgctgtggcgtctggataccggcgatattgccggtgcgctgg +agattgcccgttatgccctgaagtacggtctgaccatgccgggtaaacaccgccgtaccc +cgccgtacatgttcaccgaggaggtagcgcttgcggccatgcgcgctcacgctgccggtg +agtctgtggatacccgcctgctgacggagacccttgaactgaccgccacggctgacatgc +ctgatgaagtgcgcgcaaagctgcacaaaatcaccggtctgtttctgcgtgacggtggtg +atgccgccggtgcgctggcgcacctgcaacgtgcgacacagctcgactgtcaggcaggcg +tcaaaaaagagattgaacgactggagcgggagctgaaaccgaagccggagccgcagccca +aagcggccacccgcgccccgcgtaagacccggagcgtgacaccggcaaaacgtggacgcc +cgaaaaagaaagccagttaacaaccgaatgcgccccgcgccagggcggcacgccggtcag +tgacggtgaatcacctgacactgcaccggcgtccaccgcccgacttttcagaggtagtca +tgatgacgctgattattccgcgaaaggaggctcccgtgtccggtgagggtacggtggtca +tcccgcaaccggcaggcgacgagccggtgattaaaaacacgttcttttttcccgatatcg +acccgaagcgcgtccgggaacgtatgcgccttgagcagaccgtcgcccccgcccgtctgc +gtgaggccatcaagtcaggcatggctgaaacgaatgcggagctgtacgagtaccgcgaac +agaaaattgccgccggttttacgcgtctggctgacgtcccggcggacgatatcgacggtg +aaagcatcaaggttttttactacgagcgcgccgtgtgtgcgatggcgaccgcgtcgcttt +atgagcgttatcgcggtgtggatgccagtgcgaaaggcgacaagaaggctgacagcattg +acagcaccattgatgagctgtggcgggatatgcgctgggcggtggcgcgcatccagggca +agccgcgctgcatcgtgagtcaaatctgatgaagacctttgcgctacagggcgacacgct +cgacgccatttgtgtccgctattacgggcgcactgagggcgtggttgagaccgtgctcgc +cgcaaatccgggactggctgaactgggggcggtgctgccacacggcaccgccgtcgaact +gcccgacgttcagaccgcgcccgtggctgaaactgtcaatctgtgggagtaacgcatgac +agcagaagaaaaaagcgtcctgtcgcttttcatgattggggtgctgattgttgtcggcaa +ggtgcttgccggtggtgaacctatcaccccgcgtctgtttatcgggcgcatgttgctcgg +tggttttgtctcgatggttgccggtgttgttctggtgcagtttcctgacctgtcactgcc +agcggtgtgcggcatcggctccatgctgggtatcgccggttatcaggtgattgagattgc +cattcagcgccgctttaagggcagggggaaacagtaatgccggtaattaacacgcatcag +aatatcgccgcctttctcgacatgctggccgtgtccgaagggacggcgaatcatccactg +acgaaaaaccggggctatgacgtgatagtcaccggactggacgggaagccggaaattttc +accgactacagtgaccacccgttcgcacatggccgaccggcgaaggtgtttaaccgtcgc +ggtgaaaaatccacggcctccggtcgctatcagcagctttacctgttctggccgcattac +cgcaaacagcttgccctgccggatttcagtccgttgtcacaggacagactcgccattcag +ttgatccgcgaacgcggagcactggatgacatccgggcgggacgcattgagcgcgccatt +tcacgctgtcgcaatatctgggcgtccctgccgggtgccggttacggtcagcgtgagcat +tcactggaaaaactggtcaccgtctggcgtaccgctggcggcgtaccggcttaaacggag +taaataccatgaagaaattatccctttcactgatgctgaacgtgtcgctggcgctgatgc +tggcactgtccctgatttacccgcagagcgtggccgtcaattttgtcgctgcctgggcga +ttctggcgacggttatctgtgtggttgccggtggtgtgggcgtgtatgccactgagtatg +tgctggaacgctacgggcgggagctgccgccggaatcgctggccgtgaagattgtcacgt +cgctgtttttgcagccggtgccgtggcgcagacgggcggcggctctggtagtggtggtgg +cgacgtttatctcgctggtcgctgccgggtggatttttaccgcgctgatttatcttgtgg +tgtcgctgtttttccggctgatacgtaaagcctgtcgtcagcgtcttgaggggcgggaac +catgtcaaggctgatgattgtgctggtcgtgttgttatcgctggcggtggccggtctgtt +tctggtgaaacacaaaaatgccagcctgcgcgcctcgctggacagggcgaacaacgtcgc +cagcggtcagcagacgaccatcaccatgctgaaaaatcagcttcatgttgcgctcaccag +ggcagataaaaacgagctggcgcaggtggcactgcgtcaggaactggagaacgccgcgaa +acgtgaagcacagcgcgagaaaaccatcacgaggttacttaatgagaacgaagattttcg +ccgctggtacggtgctgacctgcctgatgctgtgcgccggttgcaccagcgccccgcctg +caccgacgccagtgattgtccccaacgcatgcccgaaagtgagcctttgcccgatgccgg +gcagtgacccgcagacgaacggcgatttaagtgccgatatccggcagcttgagaacgcgc +tggcacgctgtgccagccaggtaaaaatgattaaacactgtcaggacgaaaacgatgctc +aaacccgacagcctgcgcagggcgctgactgatgccgtcacggtgctgaaaactaacccc +gatatgctgcggatattcgtggataacgggagtattgcctccacactggcggcgtcgctg +tcattcgaaaagcgttacacgctcaatgtgattgtgaccgactttaccggtgattttgac +ctgctcattgtgccggtgctggcgtggctgcgggaaaatcagcccgacatcatgaccacc +gacgaaggccagaaaaagggcttcacgttttatgcagacatcaacaatgacagcagcttt +gatatcagtatcagcctgatgctgaccgagcgcacgctggtcagtgaggtggacggcgca +ctgcatgtgaagaatatctcggaacccccgccgccggagccggtcacccgcccgatggag +ctgtatatcaatggcgaactggtgagtaagtgggatgaatgagtttaagcgttttgaaga +ccggctgaccggactgattgaatcgctgtcaccgtcagggcgtcggcgactgagtgccga +actggcgaaacgtctgcggcagagtcagcagcgtcgggtgatggcacagaaagccccgga +cggcacaccctacgcgccacgccagcagcagagcgtcagaaaaaagaccggtcgcgttaa +gcgaaaaatgtttgcgaaacttattaccagtcgttttttgcatatccgtgccagcccgga +gcaggcatcaatggaattttacggcgggaagtcgccgaaaatcgccagtgtgcatcagtt +tggtctgtcggaagaaaaccggaaagacggtaagaaaattgattatccggcgcgtcccct +gctcggctttaccggtgaggatgtgcagatgattgaagagattatcctggctcaccttga +gcgttagttttatccaggcagaggctgatgcgcaattaaacattgagcggccatgctggt +cgctcaatgtttagaggtttatgagtgatttttatttgatgctttgtattctaaaacctt +cttattggcgtaaaagaattttgtatatgacaggaatataaccagacctgaagtgaaata +gacgagggatagtattaataatgcttttttgtgactgttattatctttaatctcctggct +taaccattcggagtcctcctcgtttagctgtaagagcttattgcaggcgatctcaggaag +tgtgtcttttataaatacgttttgcagtctcttgcaatcggcaaggctataagttttatt +aaattcaactgctttatttttgaaggataaaagaactttgtcactataaacatagtacat +catgtttttatatggtatgcctgtggcatcccttactataacggattgttcgttgtgtat +gtaacatgcgaggagaatgtaaaaaatactggccagaattacaattattgttttaattat +gtgtggtggttttgttatgtcaccccagatacgagtaaggaaaaaatacgatgtttttag +ttttccatcaatcagtccctgctgtatcattctcacattttcaatgcctgatacattgat +tccgttaattattttaaatagttgaatgtcgcgccactcgcggtcaagtctttttaattt +tttgtctgaatatccaaaattgaaataatgtgcaataagcctcataaggttacttttacc +aaagctaaaaaatgctaatactgcaaagctacaaaggaaaaaaacgattagcccccacac +attagtcacattatagctgaccattacgctctccttgaatgttgtctggtagttctacaa +atgaatccagatagcataacttttatatattgtgcaatctcacatgcatgaacactctcg +caaatattcaggaactcgcgcgcgcactgcgcaacatgattcgcactggcattatcgtcg +aaaccgaccttaacgccggtcgctgccgcgtgcagaccggcggcatgtgcaccgactggc +ttcagtggctgacccatcgcgcaggacgttcgcgcacatggtgggcaccttccgtggggg +aacaggtgctgattctggccgtgggtggtgaactcgacacggcgttcgttctgccgggga +tttattccggcgataacccctcgccgtctgtgtcggcggatgccctgcatatccgtttcc +ctgacggggcggtgattgaatatgaacccgaaaccagtgcactcacggtaagcggaatta +aaacggccagcgtgacggcttccggttctgttactgccacggtgccggtggtcatggtga +aagcatcaacccgcgtcaccctggacaccccggaggtggtctgcaccaacaggctgatta +ccggcacgctggaagtgcagaaaggcgggacgatgcgcggcaacattgaacacaccggcg +gtgaactctcatcaaacggtaaggtactgcatacccataaacaccccggcgacagcggcg +gcacaaccgggagtcctttatgacagcgcgttatctcggaatgaatcgcagtgatggcct +gactgtcactgaccttgagcatatcagccagagtatcggcgatatcctgcgcacaccggt +cggctcacgggtgatgcgtcgtgattacggctcgttgctggcgtcaatgattgaccagcc +gcagaccccggcgcttgagttgcagattaaagtcgcctgttacatggcagtgctgaaatg +ggaaccccgcgtcaccctgtcatccgtcaccacggcgcgcagttttgacgggcgaatgac +ggtcacgttaaccggccagcacaacgacaccggccagccactttcattaaccatccctgt +gagttgaaaccatgccgattatcgacctgaaccagctacccgcaccggatgtggtcgagg +agctggactttgaaagcattctcgctgaacgcaaggcgacactgatttccctttacccgg +aagatcagcaggaggcggtcgcccgtaccctgacactggaatctgagcctctcgtcaaac +tgctggaagaaaatgcttatcgtgagcttatctggcgtcagcgtgtgaatgaggccgcac +gggcggtgatgctggcctgtgccgccggtaatgaccttgatgtgattggtgccaattaca +acaccacgcgcctgactatcaccccggcagatgattcgaccatcccgccgacaccggcag +tgatggaatctgacaccgattatcgtctgcgtattcagcaggcttttgagggcttaagcg +tcgccgggtcagtgggagcctatcagtatcatggtcgcagtgctgacgggcgtgtcgcgg +atatttctgtcaccagtccgtctccggcctgtgtcaccatctctgtgctgtcacgtgaaa +ataacggcgtcgcatccgaagacctgctggctgtggtgcgtaacgcccttaatggcgagg +acgtcaggccggtggccgaccgcgtgaccgtgcagtctgccgccatcgttgaataccaga +taaacgccacgctttacctttaccctggtcccgaaagcgaacccatccgcgctgccgctg +tgaaaaagctggaagcgtatatcacggcacagcaccggctggggcgcgacatccgtctgt +ctgccatttatgccgctttgcatgtggaaggtgtgcagcgtgtcgaactggctgcaccac +tggccgacatcgtgctcaacagtacgcaggcgtctttctgtaccgaataccgcgtcgtga +ccggaggctcggatgagtgattcgcgactgctgccgaccggctcatcaccgcttgaggtc +gccgccgcaaaagcctgtgcggaaattgaaaaaacgccggtcagtattcgtgaactgtgg +aacccggacacctgtccggcaaatctgctgccgtggctggcgtgggcgttttcggtcgac +aggtgggatgaaaagtggccggaagcgacaaaacgcgccgttatccgcgatgcctatttc +atccactgtcataagggcacgataggtgcaatccggcgtgtggtggagccgctcggctat +ctcatcaacgtgacggagtggtgggaaaacagtgacccgcccggcaccttccggcttgat +attggtgtactggaaagcggtatcacagaggcaatgtatcaggaaatggaacggctgatt +gctgatgccaaacctgcaagccgtcaccttattggcctgaacattacccgggacattccc +ggctatctgttcgccggtggtgtggcttacgacggcgatgtaattacggtttaccccgga +taagtgaggaataatgagcataaaattcagaaccgttatcaccactgccggtgcagcaaa +gctggcagcggcaaccgcgccgggaaggcggaaggtcggcattaccacgatggccgtcgg +ggatggcggtggtaaattgcctgtcccggatgccggacagaccgggcttatccatgaagt +ctggcgacatgcgctgaacaaaatcagccaggacaaacgaaacagtaattatattatcgc +cgagctggttattccgccggaggtgggcggtttctggatgcgtgagcttggcctgtacga +tgatgcgggaacgttaattgccgtggcgaacatggccgaaagctataagccagcccttgc +cgaaggctcaggacgttggcagacctgtcgcatggtcatcatcgtcagcagtgtggcctc +agtggagctgaccattgacaccacaacggtgatggcgacgcaggattacgttgatgacaa +aattgcagagcacgaacagtcacgacgtcacccggacgcctcgctgacagcaaaaggttt +tactcagttaagcagtgcgaccaacagcacgtctgaaacactggccgcaacgccgaaagc +ggtaaaggccgcgtatgacctggctaacgggaaatataccgcacaggacgccaccacagc +gcgaaaaggccttgtccagcttagtagcgccaccaacagcacgtctgaaacgctcgccgc +aacaccaaaagccgttaagacggtaatggatgaaacgaacaaaaaagcgccattaaacag +ccctgcactgaccggaacgccaacgacgccaactgcgcgacagggaacgaataatactca +gatcgcaaacacggctttcgttatggccgcgattgccgcccttgtagactcgtcgcctga +cgcactgaatacgctgaacgagctggcggcggcgctgggcaatgacccgaattttgctac +caccatgactaatgcgcttgcgggtaagcaaccgaaagatgctaccctgacggcgctggc +ggggcttgctactgcggcagacaggtttccgtattttacggggaatgatgttgccagcct +ggcgaccctgacaaaagtcgggcgggatattctggctaaatcgaccgttgccgccgttat +cgaatatctcggtttacaggaaacggtaaaccgagccgggaacgccgtgcaaaaaaatgg +cgataccttgtccggtggacttacttttgaaaacgactcaatccttgcctggattcgaaa +tactgactgggcgaagattggatttaaaaatgatgccgatggtgacactgattcatacat +gtggtttgaaacgggggataacggcaatgaatatttcaaatggagaagccgccagagtac +cacaacaaaagacctgatgacgttgaaatgggatgcactaaatattcttgttaatgccgt +cattaatggctgttttggagttggtacgacgaatgcactaggtggtagctctattgttct +tggtgataatgataccggatttaaacagaatggagacggtattcttgatgtttatgctaa +cagtcagcgtgtattccgttttcagaatggagtggctattgcttttaaaaatattcaggc +aggtgatagtaaaaagttctcgctatccagctctaatacatccacgaagaatattacctt +taatttatggggtgcttccacccgtccagtggttgcagagttaggcgatgaggccggatg +gcatttctatagccagcgaaatacagataactcggtaatatttgctgttaacggtcagat +gcaacccagcaactggggaaattttgattcccgctatgtgaaagatgttcgcctgggtac +gcgagttgttcaattgatggcgcgaggtggtcgttatgaaaaagccggacacacgattac +cggattaagaatcattggtgaagtagatggcgatgatgaagccatcttcaggccgataca +aaaatacatcaatggcacatggtataacgttgcgcaggtgtaagttatgcagcatttaaa +gaacattaagtcaggtaatccaaaaacaaaagagcaatatcagctaacaaagaattttga +tgttatctggttatggtccgaagacggaaaaaactggtatgaggaagtgaagaactttca +gccagacacaataaagattgtttacgatgaaaataatattattgtcgctatcaccagaga +tgcttcaacgcttaatcctgaaggttttagcgttgttgaggttcctgatattacctccaa +ccgacgtgctgacgactcaggtaaatggatgtttaaggatggtgctgtggttaaacggat +ttatacggcagatgaacagcaacaacaggcagaatcacaaaaggccgcgttactttccga +agcggaaaacgttattcagccactggaacgcgctgtcaggctgaatatggcgacggatga +ggaacgtgcacgactggagtcatgggaacgttacagcgttctggtcagccgtgtggatcc +tgcaaatcctgaatggccggaaatgccgcaataagttgtatgacctctgttgtgaactta +catatctatggcacagagtaaagcctaatctgaagtccactctgtgccaaaagcggacct +tataaacaagaacaatggtcatatcagtgtgttttgattgcatagctaacgtgcgtcttc +ctgtacagaatcataagatgatagggcataggagatgattattatcgcgtgttttaaaaa +tagctttctgcatcaagtgtcacttgcgaagaggtattggcgctatgattggcatcactc +agttcagataatattttaaatatttggtaaatgttcagattacacaattcggtctgcgtc +ccgttaaaattatctactattagttattactatgaggtgaatggcaagtgttttccactc +gccatttttgttttttatttttttaaagcctttccgacgtttaaggattttgccaagcca +taaaatatttgatatttcattcctgtttttatttttggtgagatatttgcgtaacttctt +tctctaaaacaccaacgtataaacctattattatcttcggttgtttctatatagcatatt +acattgagaccaaaaagaaactgaaggaagtcatttgcagttgtcatgaattttggtttt +gttgtggaaatggaactaatatgagtttcaagttgtttatatgctaagaggtattcagcg +taatcaaaagtatcttttccagagaggaattcaaagaactttaaaaaaatctcataatgt +tcacttccataataaaatgataaatgatcttttatttctccaagtaaatagttagagtaa +tctctttgcatgctaggactttcaaagtcatctagactaaattgatttttcccatcatca +ccgctggcgtgtgatttgataatttcgagcatccgtaatatatctcttgggcgataatat +gaccagcgaaggaaattaataaatgatgtggggtggttataattatcatggacgttgggt +gaatcccaagggaaataatggtcccatgcctgtccctttttaagggccatgtcttgctga +gtcctaagcagatgatctaatacctcaaataattgagagctacggtggttaacatattct +gtccgccagtccaagaatactgaattatctctgatttttgcgttttgattttgtaatcct +atggattcaaatatatctggcctgatcaagagaacggccttcattctcccttttcctccc +tttatacttgggaagaaatcgttgttaatctcccagactgcgtgagctaatccttttata +cattctagataatcatcgtatggaattgaggaagggcggatatcaataccatcgataaat +aaaatatgattttgagataaacgtatttggctaaaggcctcttcaaattttttttgtata +taaaataaatttatctgaaatctgctctcagaaaaagataaagactctctttcttcacct +tttaaggttgcatgcttatgaagtagttcggctgcaacttttgactcttgaacaaaactg +agggcttgaattatttctggtgaaaatgccttaagataatactcatctattgcatcatta +agtgatgagaattttgaataatttagtaactttgaaattttcccttctttatctaatact +tgttttgatattaataaatatagaataactttccatatgccagagaagtcagacaaattt +aaatgcttttcagatttaagagtgataaatttttgatattctgtctctcttatatattta +gttgtagctagcgtattgttaatattgttatttgagagatagatagagtatgcggtttta +ccagtacctttctctcctacaagaaacgatatatttggttcacataatctagataggtga +ttatcacgtatgaacactttgttaagtaattctttattctcccttctcttataattttca +gcatcagcatagccaagagttagatctttgattggtatcattattacctcaactaaagca +attgaaaaacatatggttataaaaacatagcgctgctctgtcgcatattgtggatatcaa +catatgaaatgtaaaggaactatttgtggatgaatgaaccgaatcgctgtagcttcggta +gtcatctttcagacttgtataaatgaacaacttccgcttctcgctcaaaggaaactgtca +gatttgatagcttttgggctatgtaaactgtcagtcggaaaatgagtgagtacaaatcag +ggcaggtgagcgaattgcccgccttttctttaccggtggttgtgctgtcgattagccaac +cgggacaaatagcctgacatctccggcgcaactgaaaataccactcacccattaaccacg +gagttaaacggatgagtgactatcatcacggcgtgcaggtgctggagattaacgagggca +cccgcgtcatttccaccgtatccacggccattgtcggcatggtctgcacggccagcgatg +cagatgcggaaaccttccccctcaataaacctgtgctgattaccaatgtgcagagcgcaa +tttcaaaggccggtaaaaaaggcacgctggcggcatcgttgcaggccatcgctgaccagt +caaaaccggtcaccgttgtcatgcgcgtggaagacggcaccggtgatgacgaggaaacga +aactcgcgcagaccgtttccaatatcatcggcaccaccgatgaaaacggtcagtacaccg +gactaaaagccatgctggcggcggagtcggtaaccggtgttaaaccgcgtattctcggcg +tgccgggactggataccaaagaggtggctgttgcactggcatcagtctgtcagaagctgc +gtgctttcgggtatatcagcgcatggggctgtaaaaccatttccgaggtgaaagcctatc +gtcagaatttcagccagcgtgagctgatggtcatctggccggatttcctcgcatgggata +cggtcaccagtaccaccgccaccgcgtatgccaccgcccgtgcgctggggctgcgcgcta +aaatcgaccaggagcagggctggcataaaacgctgtccaatgtcggggtgaacggtgtta +ccggcatcagcgcatctgtattctgggatttgcaggagtccggcaccgatgctgacctgc +ttaacgagtcaggcgtcactacgctgattcgccgcgacggtttccgcttctggggtaacc +gtacctgctctgatgacccgctgttcctctttgaaaactacacccgcaccgcgcaggtcg +tggccgacacgatggctgaggcgcacatgtgggcggtggacaagcccatcactgcaacgc +tgattcgcgacatcgttgacggcatcaatgccaaattccgtgagctgaaaacaaacggct +atatcgtggatgcgacctgctggttcagcgaagaatccaacgatgcggaaaccctcaagg +ccggaaaactgtatatcgactacgactatacaccggtgcctcctctcgaaaacctgaccc +tgcgccagcgtattaccgataaatacctggcaaatctggtcacctcggttaacagcaatt +aaggagcctgaccgatggcaatgccgcgcaaactcaagttaatgaacgtctttctgaacg +gctacagctatcagggcgttgcaaagtccgtcacgctgccaaaactgacccgtaagctcg +aaaactatcgcggtgcggggatgaacggcagcgcaccggtagacctcggccttgatgacg +atgcgctgtcaatggagtggtcgctcggtggcttcccggattcggttatctgggagcttt +acgccgcaaccggtgtggatgccgtgccgattcgttttgcaggctcttaccagcgcgacg +ataccggcgaaacggtggccgtcgaagtggtcatgcgtggacgtcagaaagaaatcgaca +ccggcgagggtaaacagggagaagacactgagtcgaaaatctccgtggtctgcacctatt +tccggctgacgatggacggtaaggagctggtcgaaattgacaccatcaacatgattgaga +aggtgaacggcgtcgatcggctggagcaacaccgccgcaatatcggcctgtgattttcat +ccggtcagcctggctggccggttaaccctgattcagaagtgagaaaaccatgaacaaaga +aaatgtcattaccctggacaatccggtcaaacgtggtgagcaggttatcgaacaggtcac +gctgatgaaacccagtgccgggacgctacgcggtgtcagtctggctgcggttgcaaactc +cgaagtcgatgcactgattaaggtgctgccgcgcatgacggcaccgatgctgaccgagca +ggaagtcgccgcgctggaactgcctgaccttgtggcgctggccggtaaggtggtcggttt +tttgtcgccgaactcggtgcagtgacgtttccgaaaaatctctcggtcgatgacctgatg +gcggatgtggcagtgatatttcactggccgccatcagaactgtatcccatgagcctgacc +gaactcatcacatggcgcgaaaaggcgctccggcgaagcggaaacacgaatgagtaacaa +tgtaaaattacaggtattgctcagggctgttgaccaggcatcccgcccgtttaaatccat +ccgcacagcgagcaagtcgctgtcgggggatatccgggaaacacaaaaatcactgcgcga +gctgaacggtcacgcatcccgtattgagggattccgcaagaccagtgcacagctcgccgt +gactggtcatgcacttgaaaaggcacggcaggaggccgaagcccttgccacacagtttaa +aaacaccgaacgtccgacccgtgctcaggcgaaagtcctggaatccgcaaagcgtgcggc +ggaggacttacaggcgaaatataaccgcctgacagattccgttaaacgccagcagcggga +actggccgctgtgggaattaatacccgcaatcttgcacatgatgagcagggactgaaaaa +ccgtatcagtgaaaccaccgcacagcttaaccgtcagcgtgatgcgctggtgcgtgtcag +tgcgcaacaggcaaaacttaacgcagtaaaacagcgttatcaggccggaaaggaactggc +cggaaatatggcctcagtgggcgctgccggtgtggggattgcggcggcgggaacgatggc +cggtgttaagctactgatgcccggttatgagtttgcgcagaaaaactcagaattacaggc +tgtgatcggagtggcaaaagactccgccgaaatggccgcactccgcaagcaggcgcgcca +gctcggcgacaataccgccgcctcggcagatgatgcagccggtgcgcagattattattgc +gaaagccggtggggatgttgatgccattcaggcggcaacgccggtcacgctgaacatggc +gctggcgaaccgtcgcacaatggaagaaaacgccgccctgctgatggggatgaaatccgc +ctttcagctttcaaacgataaggtcgctcatatcggggatgttctctccatgacgatgaa +caaaaccgccgccgattttgacggcatgagcgatgcgctgacctatgccgcacctgtggc +aaaaaatgccggtgtcagcattgaagaaaccgccgcaatggtcggggcgctgcatgatgc +aaaaatcacaggctcaatggcggggacgggaagccgtgccgtgttaagccgcctgcaggc +accgacgggaaaagcatgggatgcactcaaagagcttggagtgaaaacctcagacagcaa +aggaaacacccggccaatatttaccattctgaaagaaatgcaggccagttttgagaaaaa +ccggctcggtactgcccagcaggctgaatacatgaaaactattttcggggaggaggccag +ctcagccgctgccgtgctgatgactgccgcctcaaccggaaagctggacaaactgaccgc +tgcgtttaaagcctcagacgggaagaccgccgagctggtaaatatcatgcaggacaacct +aggcggtgactttaaagcgtttcagtccgcttatgaggcggtggggactgacctgtttga +ccagcaggaaggcgcgctgcgtaagctcacgcagacggccacaaagtatgtgttaaaact +cgacggctggatacagaaaaacaaatcactggcgtcaaccatcggcatcattgccggcgg +tgcactggcgcttactggcatcatcggtgccattggcctcgtagcctggccggttatcac +cggcatcaatgccatcatcgcggcagcaggcgcaatgggggcagtcttcacgacggttgg +cagtgctgttatgaccgccatcggggctattagctggccggttgtggccgtggtggctgc +cattgtcgccggtgcgttgcttatccgtaaatactgggagcctgtcagcgcattctttgg +tggtgtggttgaagggctgaaagcggcatttgcgccggtgggggaactgttcacgccact +taaaccggtttttgactggctgggcgaaaagttacaggccgcgtggcagtggtttaaaaa +cctgattgccccggtcaaagccacccaggacaccctgaaccgttgccgtgacacgggcgt +catgttcgggcaggcactggctgacgcgttgatgctgccgcttaatgcgttcaacaaact +gcgcagtggtattgactgggtactggaaaaactcggtgttatcaacaaagagtcagacac +acttgaccagaccgccgccagaactcataccgccacgtatggtaccggtgactatattcc +ggcgaccagctcttatgcaggctatcaggcttatcagccggtcacggcaccggctggccg +ctcttatgtagaccagagtaaaaacgaatatcacatcagcctgacgggggggactgcgcc +ggggacacagcttgaccgccagttacaggatgcgctcgaaaaatacgagcgggataaacg +tgcgcgcgcccgtgccagcatgatgcatgacggttaaggaggtgacgaaaaatgatgctc +gcgttaggtatgtttgtttttatgcgccagacgctgccacaccagaccatgcagcgtgaa +tcagattatcgctggccgtcaaattcccgtatcggtaaacgggatgcctttcagtttctc +ggtgtgggtgaggaaaacatcacgctggccggtgtgctttatcccgaactgaccggcggc +aagctgacgatgaccacgctcaggctgatggcagaggaggggcgggcgtggccgttgctg +gatggcaccggcatgatttacggcatgtatgtcatcagcagggtgagtgaaacagggagt +attttctttgcagacggcacaccccggaaaattgattttacgctgtcactcacccgcgtt +gatgaatcactggccgcgctttatggcgatatcggtaaacaggcggaatcgctcatcggt +aaggccggcagtatggcgaccagattcacaggtatgacgggggcgggataatgctggatg +cgctgacatttgatgcaggcagtacgctgacgccggattacatgctgatgctcgacagca +gggatattaccggcaatatcagcgaccgtctgatgagcatgaccctgacggataaccggg +gctttgaggctgaccagcttgatattgaactgaacgatgccgacgggcaggtcgggctgc +cggttcgtggcgctgtcctgacggtgtatatcggctggaaaggttttgccctggtatgca +aagggaaatttaccgttgatgaggttgaacaccggggcgcaccggatgtagtcaccatcc +gcgcccggagtgcagattttcgcgggacgctcaattcccgccgggaaggctcctggcatg +acaccacgctcggtgcgattgttaaggcgatagccacccgtaacaggctggaagccagtg +tcgctccgtcactggccggaataaaaattccacacatcgaccagtcgcaggagtctgatg +cgaaattcctgacccgtcttgcagaacgcaacggcggtgaggtgtcggtaaaaatgggaa +aactgttgtttctcaaagcggggcagggagtgacggccagcggtaaaaaaatcccgcagg +tcaccataacccgcagcgacggcgaccgccatcattttgcgattgctgaccgtggagcct +acaccggtgtaacggcaaaatggctacacactaaagacccgaagccgcaaaagcagaagg +taaaactgaaacgcaaaaagaaagagaaacacctgcgcgcactggagcacccgaaagcga +aaccggtcaggcagaagaaagcgcctaaagtaccggaagcgcgtgaaggtgaatacatgg +ccggtgaggctgacaacgtttttgccctgaccacggtatatgccacgaaagcgcaggcca +tgcgcgccgctcaggcgaagtgggataaactgcaacggggcgttgcggagttctctatca +gcctggctaccggtcgggcagatatttacacggaaacaccggtcaaagtgtctggcttta +agcgcgtcatagacgagcaggactggacaatcactaaggtgacacattttctgaataata +gcggcttcacgacgtccttagagcttgaggtcaggctttctgatgtggagtacgaaacag +aagatgatgagtgatgtttttgttttatctgtttgttttgtaaggataaattaactaaaa +tggcaccatcaacaaaaccggaagaggtgctcgcgatgtttcattgtcctttatgccagc +atgccgcacatgcgcgtacaagtcgctatatcactgacacgacaaaagagcgttatcatc +agtgccagaacgtgaattgcagcgccacgttcatcacttatgagtcggtacagcgataca +tcgtgaagccgggagaagtccacgccgtaaggccgcacccgttgccatcagggcagcaaa +ttatgtggatgtaattacaaacagaaagcccctcagtcgaggggcttttttgtcgatgtg +gtcaatgtgtggacgtgaccagaaataaatccttttatttcaatttattgtacgtaaaaa +ataagcccgtgtaagggagatttagggtgtcaccagtaggggctttcaacggtacaatgc +gggtttgagcggcataaattaccactgaaagcccttaaacgttactctactgtggacact +gtgtggacactctcggcctcagtaccacctcttagcggattaagagaaatggcgtcctga +aggtactctggcgcaaaatgagcgtaaaccatagtttgctcaatccgcgtgtgacctagt +atccgttgtagcgtgataatacttcctccattaatcatgaaatgagtggcaaagctgtgc +cttagtgcatgtgtggcttgccccattggcaaatccggttttattgctttcattgttcgt +ctgaagcgagggtaatcagcatcagggaataaaaaacctcgtttgttatccgcgatcatt +ttggcaacagcctctgagatcgggacggtgcgtggtttgtttgttttcgttttaacaaac +gtgacgcggttatggatgatattttctgctttcaaacgagctgcttctccccaacgtgct +cctgtactcaggcaaagaatcgcaatctttttattgtcgccgtcaagtgctgcaagcagt +aaggcaatttcttcctgtgttagatagcctgtttctggtttttcctccttaagccttttt +gtccctctgatagggtgctcaccaaagaataactccgcttcaatcagggctgtaaacatg +ccgctaatacatgttaaatcacgattgatactcgaaggtttaataccctgacttcttcgg +gtggcgcagtactggctgataagcgatttcgtaatttgaaatgcgcatgggtcattcgtt +atttttgtgaagatttcaatttttccaagattagatttcccatgctcttcgtgtttaccc +tttaaatcccaccagatctgtgtcagctccgacagacgtcgcttgtctgttggttttgat +agccattctttattgtggtggttgtacaacgtgtatttctcgaaagcgacagcttcgctt +ttcttatcaaacttcctacggatgcgttttccattacgtccagtagggcggatgtccact +tcatatcgaccatcatcgagttttttgattgccatcagaaaaccctccgagtggtgtgtt +tttttgcgactactaatcgcttttttcgtggtggctgaaatttagccaccaatagtaggc +acttgtgatgaatatattcacgatgaattgttaaccagtcttttgaccggagtggggcga +cgttgtttcgttttgcccaaagtgtgcgagagcgggcgcaatttgcccggactcaggagc +gatctgattggtcatgaaccataaagtgtatttggtgaattgtggggtctgcaggatgtt +catcatgacatctgttggaggtgttgaacgaccactttcatagtaactcagcgtgccata +cggaacccctgttaaatcagcaagttgttgtctgctcaaatactctgattttcgcattaa +gactatcttctcgcttatcgtgtttgacatggtgtttagatctcaatagtatttagttta +gatgtagattgtttagtgcttggatgtgggcactaaaaggcattataagacattaaacgc +aattcatgagggctagaggacgacatgagcaagcaagtaacactcatgactgatgcgatt +ccttatcaggagttcgcaaaactaataggaaaatcgacaggagcggttcgtcggatgatc +gataaaggaaagctgcctgtaattgatatgaccgatccacaatcagcttcaggtcgtgca +ggtgaatattgggtataccttccggcatggaataacggactaaaactggcttatgaaagc +cgccctaaagagattcgtgacggctggttgatgtggttaggtctcggtgaaccacgttaa +ggagaaccgtatgaatgagcctcgttgtattgctcagttactgcgtaacgaaagccccag +ggcgattgacttcaccatcacccacggtaaggggcgtaagggaatcattatccgcaccaa +aaaacagagtccgttaaaaaaggctctgacctttctgaaaagccggagggtatggaaatg +acagtgatgacgctcaatctcgttgaaaaacagccagcagctatgcgccggataattggt +aagcatcttgccgttcctcgctggcaggatacatgtgattattataatcagatgatggag +cgcgaacggttaacggtttgcttccatgctcagttaaaacagcgtcacgcaacgatgtgt +tttgaagaaatgaacgacgtcgaacgtgaacgactggtatgtgcaattgatgaattgcgt +ggtgcattctcaaaacgccgtcaggttggcgcaagtgagtatgcatatattagtttttta +acagtcagtcagcgtcgtactttatttatgcatgccggattgactgaaaaagaattcaac +cagccatactggcgaattaatgaagagtcatgttactggcgtgatgctttattccgtgca +ttacgtgaattattcagtctgtttgagtatgcaccgacaattctgacgtcggtaaaaccg +gagcaatatctgcattaagtaattaaccagagtttttaacgcacttaattgtgcggggct +tctttttgcctggagaaagttatgcatacagtttctgaaaatcagtgcggtatatacgca +ttactgctgcaacaggccagaaccgaagcacaggccgacgctgcgacgcgcttttcttct +catcttgatgccatgattcgccacatcacaaaggcggagttatcccgcgtggagatagtc +gagctgctcagtcaggagtcggaaaaatttcacaatatcggattgtctcgcggggaggtg +ctttgatgttctgttctcgtgcagttgtattactgaataacgccttaaaaatcgccgtta +tgaaaaatggcgatttgtctcttattcaacttggtcttgataaagaaaaacgcgaaataa +ctgaatctgttatcgcgatttatcagagtgaattaaacctcctgtctgatgtggtcaatt +tacttgttaaacgcgctgtatttcacaagcaaatttcctccgtggatgaactgacgaaat +taacgacagaaatcgccagctattgcgctgatgaatttaaaaaactgaacgacaaaagga +actggtaatgccggacaacgtagattttattcaggaacaacaggctgaattactggagcg +ccagattaacgcggcaagggtaaaacattgcggtgcttctgcgctggtttgcgaagagtg +tgacgcgccaatacctgctgcccgtcgtgcggcttacccgtcagccacgcgttgtgtttc +ctgtcagtcagtctttgaagcaaaaaacaaacattaccggagaacggcatgagtattcgt +attgaaattggcgaacgttatgtcgttaccagtgacagctttcagtttattctccacgag +aaaaagagagcggaaagcggtaaaaacgccggtcaggaatggctggcggtggttggttat +tacccgaaattaagccagctcgtttcaggcctgatgcatcacgatattctgaccggaagc +gcaaagtcttttgctgatttaaacgtgcaggttgagcaactcagcaagcgttgttcagag +gcttttggctcatatggccgttaaagcctccgggcgttttgtccctccgtcagcatttgc +cgcaggcaccggtaagatgtttaccggtgcttatgcatggaacgcgccacgcgaggccgt +cgggcgcgaaagaccccttacacgtgacgagatgcgtcagatgcaaggtgttttatccac +gattaaccgcctgccttactttttgcgctcgctgtttacttcacgctatgactacatccg +gcgcaataaaagcccggtgcacgggttttatttcctcacatccacttttcagcgtcgttt +atggccgcgcattgagcgtgtgaatcagcgccatgaaatgaacaccgacgcgtcgttgct +gtttctggcagagcgtgaccactatgcgcgcctgccgggaatgaatgacaaggagctgaa +aaagtttgccgcccgtatctcatcgcagcttttcatgatgtatgaggaactcagcgatgc +ctgggtggatgcacatggcgaaaaagaatcgctgtttacggatgaggcgcaggctcacct +ctatggtcatgttgctggcgctgcacgtgctttcaatatttccccgctttactggaaaaa +ataccgtaaaggacagatgaccacgaggcaggcatattctgccattgcccgtctgtttaa +cgatgagtggtggactcatcagctcaaaggccagcgtatgcgctggcatgagacgttact +gattgctgtcggggaggtgaataaagaccgttctccttatgccagtaaacatgccattcg +tgatgtgcgtgcacgccgccaagcaaatctggaatttcttaaatcgtgtgaccttgaaaa +cagggaaaccggcgagcgcatcgaccttatcagtaaggtgatgggcagtatttctaatcc +tgaaattcgccggatggagctgatgaacaccattgccggtattgagcgttacgccgccgc +agagggtgatgtggggatgtttatcacgcttaccgcgccttcaaagtatcacccgacacg +tcaggtcggaaaaggcgaaagtaaaaccgtccagctaaatcacggctggaacgatgaggc +atttaatccaaaggatgcgcagcgttatctctgccatatctggagcctgatgcgcacggc +attcaaagataatgatttacaggtctacggtttgcgtgtcgtcgagccacaccacgacgg +aacgccgcactggcatatgatgcttttttgtaatccacgccagcgtaaccagattatcga +aatcatgcgtcgctatgcgctcaaagaggatggcgacgaaagaggagccgcgcgaaaccg +ttttcaggcaaaacaccttaaccagggcggtgctgcggggtatatcgcgaaatacatctc +aaaaaacatcgatggctatgcactggatggtcagctcgataacgataccggcagaccgct +gaaagacactgctgcggctgttaccgcatgggcgtcaacgtggcgcatcccacaatttaa +aacggttggtctgccgacaatgggggcttaccgtgaactacgcaaattgcctcgcggcgt +cagcattgctgatgagtttgacgagcgcgtcgaggctgcacgcgccgccgcagacagtgg +tgattttgcgttgtatatcagcgcgcagggtggggcaaatgtcccgcgcgattgtcagac +tgtcagggtcgcccgtagtccgtcggatgaggttaacgagtacgaggaagaagtcgagag +agtggtcggcatttacgcgccgcatctcggcgcgcgtcatattcatatcaccagaacgac +ggactggcgcattgtgccgaaagttccggtcgttgagcctctgactttaaaaagcggcat +cgccgcgcctcggagtcctgtcaataactgtggaaagctcaccggtggtgatacttcgtt +accggctcccacaccttctgagcacgccgcagcagtgcttaatctggttgatgacggtgt +tattgaatggaatgaaccggaggtcgtgagggcgctcaggggcgcattaaaatacgacat +gagaacgccaaaccgtcagcaaagaaacggaagcccgttaaaaccgcatgaaattgcacc +atctgccagactgaccaggtctgaacgattgcagatcacccgtatccgcgttgaccttgc +tcagaacggtatcaggcctcagcgatgggaacttgaggcgctggcgcgtggagcaaccgt +aaattatgacgggaaaaaattcacgtatccggtcgctgatgagtggccgggattctcaac +agtaatggagtggacatgatggcaaaaattcacgaggtaaagctgcacgcaaaatatttc +gaccttgtactggaaggaaagaaacgcgcagagtttcggaaaaaagatcgtaattatgag +cgcggggacacgttgattttgcatgaatgggtgcagggtgtgtttacggggcgaaaggtt +gaagcccggataacagatgttactgacctgtcagactggctggaagattatgtcttgctg +cacagaatactaggtgagatactgccgctgactgtcaagctggcagtatcctccacattt +tttataaatctaaggcgaagaacggtggcaatatatttgctttaaattgtaaataagcaa +attattctaagccacaaatgatatcaattgagtatcgattttcgttcgaatataaccata +acgccaagcgtcaaatgtaagtcatctatatgtgattcgtattcatattggtcagcatca +ggagatagtaaatgctctgctgctgtaaaaacatcaattgtaacagatatatcgtctgga +atttcttcatttaattcggatatgtattttttatatttgttttttaatttccttatcatg +tcttccttatggtggattgtagtgcagtaattttttttagttgaatcattgtatgaatgg +aatgaacagtttaatgctaggccaagacttgaatttcctgtagggcctgtgtgtttaaag +tattcaagatttcttcttatgtcagaaaataaaagacttttacagggggcatttccttta +acttctattgcacatattggaatgtcgaaaaatggtctgctgtccaatatggcaatatca +attctgcctgatcttgttgtgtttgtgttttttctgacagttttttttgagaatattttt +tgggggtcagaccgtttcgataaaggaactgttgcattaatgaatttatttgtatggtac +tcaaatataactttgtaatcaccatggcgaaaagattttatttctaacaacgatagacct +atagatacggtagctacatattcagtgtttatttttgcaccagacctgaaatccattaaa +taagttgcgtcggctgactttttcattccatcttttacagctttcacaatatccatgtta +ttcatatcaacaccttttatattccagaattataaatcttaatgattgatttgtttgtgt +gtttaggttactagattgacgtacttatagcacattctgattttgaaatcaccatccttg +ggtaaagcacagcctatcactattggtttagtactgtgctgtaatagtatcagattaagt +taaatccattttatgaaatcttccatttcatcatatttttttattactgctctaacatct +ttgctttcatcacataaacaatctaaaagactatcccattcagtttgttttttaccaaat +ccataaacagcctctatatcaccggatttccatatatagattccgttatctttcaatttt +tgatgtatttcatgtatatgcttttgtgttttttcatggttacatattttgatgaagtct +ttgcttgaaatgcttttgaatgactcaaaagtagtaacttttgtatttaaactaagctct +cctgagttgattgattcaatcaaagcagtcaatagattatcacattcagtactaagtaag +tctttatgctctgttaatagaatatttgataagaaatcacaatcagctagaatccttgtt +tttatgccgatggcattgatgatttgtgacatcttaaataaactacccttaccgtcaacg +gcaacaatgcagattttactcgggttgagttcatgtccgttaatttttttataaagtgca +tatagaacgtttgtctctgttttcccttcaacaagcaaaacttcttcagaaaataaaagg +tatgatgaattagaaagcgtgaatgctgagtgcaattgcggtgatgaagatttatataat +tcttcgattttttcagatatagtcttccttgctatggttccattagaatccttacaaacc +tgaatcgcatttgctgcatgctttgcagaaagcatactggctgagtgagttgatattata +acctgataccctgattcacttaatgtgacaagtgattctctgacagaattaatggctgaa +gggtgtaaatataactcaggttcatcaatgaaaatcaaagtgtttgatttttttgattcg +ctgttttctttttttatttcggccaggtattgaattaatgccatttgaatggaacgttgt +gttccgtgaccaaatcggctgatatctctcattaccggttcatcttcccgagactcaaaa +actttcagagtgccggatttaaatatctcatctaatgtcggtgtgggaaagtgtaacttt +acacttacgtcaggaaaaaattggtttacttttttatttacacctgagtctattttatta +aggctttctaatctgttctcaccgttgtgagaaagatatttacctatttctgatatgttt +tttgaaaatttttcttcgtgttcttgttttatttcagaaacaattgcggaaagtatcttt +cctattgtggtcgtgtttttgcattttgttgagtcttcgacagcgtcagacattgcaggg +atatgaattggttccggaaatatattggagattgcaccatctatgccgccagggtttttc +ttccacgtggtaccgtcatatacatccagactttttttggcttttcctgtttccttatta +aattcctgtcttcttgcaaaggtaagagtcccgtcaattataaacggagctattttttgt +tgattctcttctgttaacaaagacagagtatcatctgttataccttgaataacgccttca +acggatacggggtgtgtaggatcgtacacatctgattctgaaatcaaagagccatctaac +agccacttaattgctaagataatatttgattttcctgcgttattataaccaactaaagca +gtgaaggggcgcaaaatagccgatgttgacttacaagaacgaaagttgctaattgaaact +gaagcaagacgtacagtcattatttttccttaaatgtgctatttgtatgcaatgagttca +tacgaaacgcttttttacattttatagtcgttgcattcaagggtgcatgagattgcatta +agggaaactgtgatatggcttggcttttgactggaaatactgatggctcattagttttat +taaggtgcattaaaaccgccccgtgaagcgggcgggcgaggcggggaaagcac diff --git a/etc/af063097_v_b132222.crunch b/etc/af063097_v_b132222.crunch new file mode 100644 index 000000000..b89fbf8e8 --- /dev/null +++ b/etc/af063097_v_b132222.crunch @@ -0,0 +1,199 @@ +76 50.00 207 440 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 201 434 AF063097 AF063097 Bacteriophage P2, complete genome. +373 52.00 208 1179 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 202 1173 AF063097 AF063097 Bacteriophage P2, complete genome. +423 65.00 224 1165 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 218 1159 AF063097 AF063097 Bacteriophage P2, complete genome. +90 71.00 999 1163 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 993 1157 AF063097 AF063097 Bacteriophage P2, complete genome. +46 29.00 1665 1958 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2328 2621 AF063097 AF063097 Bacteriophage P2, complete genome. +104 70.00 1978 2127 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1241 1390 AF063097 AF063097 Bacteriophage P2, complete genome. +666 77.00 2103 3284 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1366 2547 AF063097 AF063097 Bacteriophage P2, complete genome. +204 66.00 3360 3794 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2623 3057 AF063097 AF063097 Bacteriophage P2, complete genome. +571 81.00 3881 4750 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3152 4021 AF063097 AF063097 Bacteriophage P2, complete genome. +651 76.00 4814 5872 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4068 5126 AF063097 AF063097 Bacteriophage P2, complete genome. +214 82.00 5895 6236 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5154 5495 AF063097 AF063097 Bacteriophage P2, complete genome. +148 67.00 6243 6545 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5508 5810 AF063097 AF063097 Bacteriophage P2, complete genome. +525 58.00 2135 3361 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1398 2624 AF063097 AF063097 Bacteriophage P2, complete genome. +143 57.00 3446 3793 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2709 3056 AF063097 AF063097 Bacteriophage P2, complete genome. +210 69.00 3883 4326 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3154 3597 AF063097 AF063097 Bacteriophage P2, complete genome. +44 47.00 4378 4542 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3649 3813 AF063097 AF063097 Bacteriophage P2, complete genome. +54 53.00 4582 4722 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3853 3993 AF063097 AF063097 Bacteriophage P2, complete genome. +49 61.00 2173 2286 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1436 1549 AF063097 AF063097 Bacteriophage P2, complete genome. +271 53.00 2476 3234 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1739 2497 AF063097 AF063097 Bacteriophage P2, complete genome. +67 49.00 3640 3867 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2903 3130 AF063097 AF063097 Bacteriophage P2, complete genome. +226 54.00 3915 4544 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3186 3815 AF063097 AF063097 Bacteriophage P2, complete genome. +53 48.00 4581 4763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3852 4034 AF063097 AF063097 Bacteriophage P2, complete genome. +94 61.00 5178 5393 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4432 4647 AF063097 AF063097 Bacteriophage P2, complete genome. +91 35.00 5424 5879 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4678 5133 AF063097 AF063097 Bacteriophage P2, complete genome. +140 52.00 5860 6246 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5119 5505 AF063097 AF063097 Bacteriophage P2, complete genome. +45 36.00 6355 6555 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5620 5820 AF063097 AF063097 Bacteriophage P2, complete genome. +73 57.00 5182 5388 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4436 4642 AF063097 AF063097 Bacteriophage P2, complete genome. +68 52.00 5542 5727 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4796 4981 AF063097 AF063097 Bacteriophage P2, complete genome. +129 58.00 5885 6229 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5144 5488 AF063097 AF063097 Bacteriophage P2, complete genome. +290 65.00 6734 7306 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5997 6569 AF063097 AF063097 Bacteriophage P2, complete genome. +137 44.00 6792 7301 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6055 6564 AF063097 AF063097 Bacteriophage P2, complete genome. +59 54.00 6826 6993 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6089 6256 AF063097 AF063097 Bacteriophage P2, complete genome. +167 61.00 7078 7449 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6341 6712 AF063097 AF063097 Bacteriophage P2, complete genome. +188 90.00 7452 7721 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6716 6985 AF063097 AF063097 Bacteriophage P2, complete genome. +390 90.00 7699 8232 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6961 7494 AF063097 AF063097 Bacteriophage P2, complete genome. +130 63.00 7442 7714 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6706 6978 AF063097 AF063097 Bacteriophage P2, complete genome. +151 47.00 7725 8231 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6987 7493 AF063097 AF063097 Bacteriophage P2, complete genome. +131 66.00 7453 7713 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6717 6977 AF063097 AF063097 Bacteriophage P2, complete genome. +108 50.00 7721 8035 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6983 7297 AF063097 AF063097 Bacteriophage P2, complete genome. +58 60.00 8090 8224 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7352 7486 AF063097 AF063097 Bacteriophage P2, complete genome. +413 50.00 8286 9500 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7991 9205 AF063097 AF063097 Bacteriophage P2, complete genome. +177 72.00 8485 8775 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8190 8480 AF063097 AF063097 Bacteriophage P2, complete genome. +259 57.00 8573 9220 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8278 8925 AF063097 AF063097 Bacteriophage P2, complete genome. +71 43.00 9471 9659 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9179 9367 AF063097 AF063097 Bacteriophage P2, complete genome. +335 68.00 9720 10343 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10299 10922 AF063097 AF063097 Bacteriophage P2, complete genome. +161 63.00 10367 10681 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10940 11254 AF063097 AF063097 Bacteriophage P2, complete genome. +844 62.00 10778 12718 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11349 13289 AF063097 AF063097 Bacteriophage P2, complete genome. +66 44.00 9826 10089 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10405 10668 AF063097 AF063097 Bacteriophage P2, complete genome. +78 49.00 10138 10353 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10717 10932 AF063097 AF063097 Bacteriophage P2, complete genome. +54 45.00 10369 10590 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10942 11163 AF063097 AF063097 Bacteriophage P2, complete genome. +55 52.00 9968 10117 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10547 10696 AF063097 AF063097 Bacteriophage P2, complete genome. +53 42.00 10317 10553 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10890 11126 AF063097 AF063097 Bacteriophage P2, complete genome. +74 44.00 10725 10985 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11296 11556 AF063097 AF063097 Bacteriophage P2, complete genome. +64 49.00 11040 11255 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11611 11826 AF063097 AF063097 Bacteriophage P2, complete genome. +140 45.00 10735 11256 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11306 11827 AF063097 AF063097 Bacteriophage P2, complete genome. +506 68.00 11340 12266 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11911 12837 AF063097 AF063097 Bacteriophage P2, complete genome. +149 49.00 12378 12908 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12949 13479 AF063097 AF063097 Bacteriophage P2, complete genome. +650 66.00 11575 12915 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12146 13486 AF063097 AF063097 Bacteriophage P2, complete genome. +57 65.00 12664 12783 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13367 13486 AF063097 AF063097 Bacteriophage P2, complete genome. +50 49.00 12964 13080 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13859 13975 AF063097 AF063097 Bacteriophage P2, complete genome. +99 60.00 13794 14018 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 15011 15235 AF063097 AF063097 Bacteriophage P2, complete genome. +89 41.00 14145 14480 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17614 17949 AF063097 AF063097 Bacteriophage P2, complete genome. +89 49.00 14149 14415 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17618 17884 AF063097 AF063097 Bacteriophage P2, complete genome. +77 45.00 14442 14687 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17920 18165 AF063097 AF063097 Bacteriophage P2, complete genome. +210 79.00 14153 14488 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17622 17957 AF063097 AF063097 Bacteriophage P2, complete genome. +596 82.00 14468 15358 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17946 18836 AF063097 AF063097 Bacteriophage P2, complete genome. +290 68.00 15377 15892 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18855 19370 AF063097 AF063097 Bacteriophage P2, complete genome. +77 67.00 14617 14763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18095 18241 AF063097 AF063097 Bacteriophage P2, complete genome. +306 52.00 14814 15746 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18292 19224 AF063097 AF063097 Bacteriophage P2, complete genome. +46 57.00 15774 15893 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19252 19371 AF063097 AF063097 Bacteriophage P2, complete genome. +88 63.00 14881 15051 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18359 18529 AF063097 AF063097 Bacteriophage P2, complete genome. +137 58.00 15154 15495 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18632 18973 AF063097 AF063097 Bacteriophage P2, complete genome. +43 42.00 15637 15795 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19115 19273 AF063097 AF063097 Bacteriophage P2, complete genome. +197 53.00 16019 16588 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19429 19998 AF063097 AF063097 Bacteriophage P2, complete genome. +58 36.00 16685 17026 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20095 20436 AF063097 AF063097 Bacteriophage P2, complete genome. +262 55.00 17029 17754 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20442 21167 AF063097 AF063097 Bacteriophage P2, complete genome. +87 46.00 17794 18045 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21207 21458 AF063097 AF063097 Bacteriophage P2, complete genome. +176 69.00 16032 16367 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19442 19777 AF063097 AF063097 Bacteriophage P2, complete genome. +276 63.00 16401 16988 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19811 20398 AF063097 AF063097 Bacteriophage P2, complete genome. +602 78.00 17025 18032 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20438 21445 AF063097 AF063097 Bacteriophage P2, complete genome. +310 67.00 18108 18650 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21521 22063 AF063097 AF063097 Bacteriophage P2, complete genome. +141 78.00 18657 18875 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22073 22291 AF063097 AF063097 Bacteriophage P2, complete genome. +231 60.00 18891 19343 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22312 22764 AF063097 AF063097 Bacteriophage P2, complete genome. +477 75.00 19373 20152 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22791 23570 AF063097 AF063097 Bacteriophage P2, complete genome. +186 72.00 20213 20536 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23628 23951 AF063097 AF063097 Bacteriophage P2, complete genome. +133 63.00 20609 20827 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24036 24254 AF063097 AF063097 Bacteriophage P2, complete genome. +172 47.00 16231 16806 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19641 20216 AF063097 AF063097 Bacteriophage P2, complete genome. +47 43.00 16828 17016 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20238 20426 AF063097 AF063097 Bacteriophage P2, complete genome. +243 49.00 17153 17881 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20566 21294 AF063097 AF063097 Bacteriophage P2, complete genome. +186 44.00 17924 18643 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21337 22056 AF063097 AF063097 Bacteriophage P2, complete genome. +68 54.00 18664 18876 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22080 22292 AF063097 AF063097 Bacteriophage P2, complete genome. +108 45.00 19794 20204 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23212 23622 AF063097 AF063097 Bacteriophage P2, complete genome. +146 53.00 19798 20181 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23216 23599 AF063097 AF063097 Bacteriophage P2, complete genome. +49 54.00 20304 20447 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23719 23862 AF063097 AF063097 Bacteriophage P2, complete genome. +56 48.00 21451 21630 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24517 24696 AF063097 AF063097 Bacteriophage P2, complete genome. +85 49.00 24663 24875 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27545 27757 AF063097 AF063097 Bacteriophage P2, complete genome. +120 55.00 25471 25728 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27769 28026 AF063097 AF063097 Bacteriophage P2, complete genome. +88 39.00 27293 27568 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28592 28867 AF063097 AF063097 Bacteriophage P2, complete genome. +78 55.00 27563 27763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28865 29065 AF063097 AF063097 Bacteriophage P2, complete genome. +89 43.00 27776 27982 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29105 29311 AF063097 AF063097 Bacteriophage P2, complete genome. +106 52.00 28001 28255 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29315 29569 AF063097 AF063097 Bacteriophage P2, complete genome. +84 42.00 28298 28594 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29615 29911 AF063097 AF063097 Bacteriophage P2, complete genome. +42 34.00 27999 28259 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29313 29573 AF063097 AF063097 Bacteriophage P2, complete genome. +64 40.00 28249 27989 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29563 29303 AF063097 AF063097 Bacteriophage P2, complete genome. +46 53.00 27909 27775 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29238 29104 AF063097 AF063097 Bacteriophage P2, complete genome. +42 30.00 27997 27785 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 29326 29114 AF063097 AF063097 Bacteriophage P2, complete genome. +75 51.00 25724 25470 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 28022 27768 AF063097 AF063097 Bacteriophage P2, complete genome. +51 38.00 25650 25468 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27948 27766 AF063097 AF063097 Bacteriophage P2, complete genome. +58 56.00 24874 24719 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 27756 27601 AF063097 AF063097 Bacteriophage P2, complete genome. +56 45.00 22442 22284 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 25484 25326 AF063097 AF063097 Bacteriophage P2, complete genome. +69 41.00 21869 21672 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24938 24741 AF063097 AF063097 Bacteriophage P2, complete genome. +116 59.00 21668 21447 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24734 24513 AF063097 AF063097 Bacteriophage P2, complete genome. +51 38.00 20805 20563 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 24232 23990 AF063097 AF063097 Bacteriophage P2, complete genome. +123 52.00 20536 20192 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23951 23607 AF063097 AF063097 Bacteriophage P2, complete genome. +375 66.00 20190 19387 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23608 22805 AF063097 AF063097 Bacteriophage P2, complete genome. +142 53.00 19327 18890 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22748 22311 AF063097 AF063097 Bacteriophage P2, complete genome. +92 56.00 18881 18657 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22297 22073 AF063097 AF063097 Bacteriophage P2, complete genome. +225 61.00 18616 18107 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22029 21520 AF063097 AF063097 Bacteriophage P2, complete genome. +523 71.00 18046 17036 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21459 20449 AF063097 AF063097 Bacteriophage P2, complete genome. +408 63.00 16966 16007 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20376 19417 AF063097 AF063097 Bacteriophage P2, complete genome. +580 54.00 15892 14468 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19370 17946 AF063097 AF063097 Bacteriophage P2, complete genome. +153 78.00 14418 14149 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17887 17618 AF063097 AF063097 Bacteriophage P2, complete genome. +74 57.00 20516 20295 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23931 23710 AF063097 AF063097 Bacteriophage P2, complete genome. +95 75.00 20484 20305 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23899 23720 AF063097 AF063097 Bacteriophage P2, complete genome. +236 43.00 20194 19361 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23612 22779 AF063097 AF063097 Bacteriophage P2, complete genome. +82 47.00 20072 19797 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 23490 23215 AF063097 AF063097 Bacteriophage P2, complete genome. +68 52.00 18874 18656 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22290 22072 AF063097 AF063097 Bacteriophage P2, complete genome. +599 52.00 18650 17028 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22063 20441 AF063097 AF063097 Bacteriophage P2, complete genome. +149 42.00 17015 16431 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20425 19841 AF063097 AF063097 Bacteriophage P2, complete genome. +126 50.00 16388 16032 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19798 19442 AF063097 AF063097 Bacteriophage P2, complete genome. +66 50.00 18873 18664 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22289 22080 AF063097 AF063097 Bacteriophage P2, complete genome. +121 47.00 18651 18238 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 22064 21651 AF063097 AF063097 Bacteriophage P2, complete genome. +88 52.00 18141 17884 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21554 21297 AF063097 AF063097 Bacteriophage P2, complete genome. +98 51.00 17751 17458 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 21164 20871 AF063097 AF063097 Bacteriophage P2, complete genome. +121 56.00 17361 17038 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20774 20451 AF063097 AF063097 Bacteriophage P2, complete genome. +190 44.00 16947 16207 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 20357 19617 AF063097 AF063097 Bacteriophage P2, complete genome. +173 72.00 15888 15556 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19366 19034 AF063097 AF063097 Bacteriophage P2, complete genome. +251 56.00 15572 14904 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 19050 18382 AF063097 AF063097 Bacteriophage P2, complete genome. +302 78.00 15357 14824 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18835 18302 AF063097 AF063097 Bacteriophage P2, complete genome. +143 73.00 14748 14479 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18226 17957 AF063097 AF063097 Bacteriophage P2, complete genome. +125 52.00 14479 14144 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 17948 17613 AF063097 AF063097 Bacteriophage P2, complete genome. +67 59.00 14750 14574 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 18228 18052 AF063097 AF063097 Bacteriophage P2, complete genome. +50 45.00 12909 12763 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13480 13334 AF063097 AF063097 Bacteriophage P2, complete genome. +682 53.00 12694 10721 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13265 11292 AF063097 AF063097 Bacteriophage P2, complete genome. +123 55.00 10710 10366 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11283 10939 AF063097 AF063097 Bacteriophage P2, complete genome. +246 60.00 10297 9716 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10876 10295 AF063097 AF063097 Bacteriophage P2, complete genome. +127 77.00 12746 12513 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13317 13084 AF063097 AF063097 Bacteriophage P2, complete genome. +59 82.00 12413 12315 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12984 12886 AF063097 AF063097 Bacteriophage P2, complete genome. +437 45.00 12260 10731 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 12831 11302 AF063097 AF063097 Bacteriophage P2, complete genome. +83 40.00 10651 10367 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11224 10940 AF063097 AF063097 Bacteriophage P2, complete genome. +102 50.00 10280 10029 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10859 10608 AF063097 AF063097 Bacteriophage P2, complete genome. +61 36.00 9983 9714 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10562 10293 AF063097 AF063097 Bacteriophage P2, complete genome. +611 55.00 12696 11092 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 13267 11663 AF063097 AF063097 Bacteriophage P2, complete genome. +69 78.00 10935 10801 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 11506 11372 AF063097 AF063097 Bacteriophage P2, complete genome. +57 54.00 10116 9967 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 10695 10546 AF063097 AF063097 Bacteriophage P2, complete genome. +46 32.00 9500 9156 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9205 8861 AF063097 AF063097 Bacteriophage P2, complete genome. +358 46.00 9499 8228 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 9204 7933 AF063097 AF063097 Bacteriophage P2, complete genome. +199 58.00 9021 8485 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8726 8190 AF063097 AF063097 Bacteriophage P2, complete genome. +43 40.00 9011 8841 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8716 8546 AF063097 AF063097 Bacteriophage P2, complete genome. +155 46.00 8774 8229 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 8479 7934 AF063097 AF063097 Bacteriophage P2, complete genome. +156 49.00 8245 7724 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7507 6986 AF063097 AF063097 Bacteriophage P2, complete genome. +100 66.00 7713 7519 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6977 6783 AF063097 AF063097 Bacteriophage P2, complete genome. +264 74.00 8228 7731 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7490 6993 AF063097 AF063097 Bacteriophage P2, complete genome. +135 69.00 7714 7451 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6978 6715 AF063097 AF063097 Bacteriophage P2, complete genome. +243 53.00 7449 6727 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6712 5990 AF063097 AF063097 Bacteriophage P2, complete genome. +189 51.00 8223 7723 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 7485 6985 AF063097 AF063097 Bacteriophage P2, complete genome. +125 61.00 7715 7452 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6979 6716 AF063097 AF063097 Bacteriophage P2, complete genome. +144 52.00 7448 7050 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6711 6313 AF063097 AF063097 Bacteriophage P2, complete genome. +66 52.00 7007 6825 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6270 6088 AF063097 AF063097 Bacteriophage P2, complete genome. +170 47.00 7309 6791 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 6572 6054 AF063097 AF063097 Bacteriophage P2, complete genome. +66 40.00 6554 6258 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5819 5523 AF063097 AF063097 Bacteriophage P2, complete genome. +132 51.00 6236 5880 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5495 5139 AF063097 AF063097 Bacteriophage P2, complete genome. +351 45.00 5878 4817 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5132 4071 AF063097 AF063097 Bacteriophage P2, complete genome. +127 46.00 4751 4368 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4022 3639 AF063097 AF063097 Bacteriophage P2, complete genome. +241 61.00 4372 3881 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3643 3152 AF063097 AF063097 Bacteriophage P2, complete genome. +611 51.00 3876 2134 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3139 1397 AF063097 AF063097 Bacteriophage P2, complete genome. +98 52.00 6544 6245 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5809 5510 AF063097 AF063097 Bacteriophage P2, complete genome. +133 58.00 6235 5894 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5494 5153 AF063097 AF063097 Bacteriophage P2, complete genome. +301 68.00 5871 5245 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5125 4499 AF063097 AF063097 Bacteriophage P2, complete genome. +161 68.00 5154 4816 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4408 4070 AF063097 AF063097 Bacteriophage P2, complete genome. +401 66.00 4749 3880 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4020 3151 AF063097 AF063097 Bacteriophage P2, complete genome. +1286 85.00 3871 2000 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3134 1263 AF063097 AF063097 Bacteriophage P2, complete genome. +48 58.00 6228 6130 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5487 5389 AF063097 AF063097 Bacteriophage P2, complete genome. +72 58.00 6069 5884 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5328 5143 AF063097 AF063097 Bacteriophage P2, complete genome. +125 50.00 5840 5460 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 5094 4714 AF063097 AF063097 Bacteriophage P2, complete genome. +95 53.00 5393 5109 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4647 4363 AF063097 AF063097 Bacteriophage P2, complete genome. +44 59.00 4916 4815 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4170 4069 AF063097 AF063097 Bacteriophage P2, complete genome. +122 47.00 4750 4427 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 4021 3698 AF063097 AF063097 Bacteriophage P2, complete genome. +168 66.00 4319 3975 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3590 3246 AF063097 AF063097 Bacteriophage P2, complete genome. +128 52.00 3857 3486 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 3120 2749 AF063097 AF063097 Bacteriophage P2, complete genome. +199 58.00 3254 2778 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2517 2041 AF063097 AF063097 Bacteriophage P2, complete genome. +89 65.00 2729 2544 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1992 1807 AF063097 AF063097 Bacteriophage P2, complete genome. +63 52.00 2495 2346 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1758 1609 AF063097 AF063097 Bacteriophage P2, complete genome. +126 54.00 2285 1977 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1548 1240 AF063097 AF063097 Bacteriophage P2, complete genome. +84 44.00 1958 1665 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2621 2328 AF063097 AF063097 Bacteriophage P2, complete genome. +58 45.00 1391 1251 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 2021 1881 AF063097 AF063097 Bacteriophage P2, complete genome. +264 47.00 1222 362 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1216 356 AF063097 AF063097 Bacteriophage P2, complete genome. +645 78.00 1209 208 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1203 202 AF063097 AF063097 Bacteriophage P2, complete genome. +267 49.00 1145 303 big_blast_x_t_2_50000_af063097.fasta_b132222.fasta.00000001 1139 297 AF063097 AF063097 Bacteriophage P2, complete genome. diff --git a/etc/b132222.embl b/etc/b132222.embl new file mode 100644 index 000000000..4e4dcccab --- /dev/null +++ b/etc/b132222.embl @@ -0,0 +1,1512 @@ +ID B132222 standard; DNA; PHG; 30624 BP. +XX +AC U32222; U51471; X04449; X53318; +XX +SV U32222.1 +XX +DT 27-OCT-1995 (Rel. 45, Created) +DT 09-SEP-1998 (Rel. 56, Last updated, Version 6) +XX +DE Bacteriophage 186, complete sequence. +XX +KW . +XX +OS Enterobacteria phage 186 +OC Viruses; dsDNA viruses, no RNA stage; Caudovirales; Myoviridae; +OC P2-like Viruses. +XX +RN [1] +RP 20315-23876 +RX MEDLINE; 87112711. +RA Kalionis B., Dodd I.B., Egan J.B.; +RT "Control of gene expression in the P2-related template coliphages. III. DNA +RT sequence of the major control region of phage 186"; +RL J. Mol. Biol. 191(2):199-209(1986). +XX +RN [2] +RP 23435-24666 +RX MEDLINE; 89199647. +RA Richardson H., Puspurs A., Egan J.B.; +RT "Control of gene expression in the P2-related temperate coliphage 186. VI. +RT Sequence analysis of the early lytic region"; +RL J. Mol. Biol. 206(1):251-255(1989). +XX +RN [3] +RP 22430-23430 +RX MEDLINE; 90317829. +RA Dodd I.B., Kalionis B., Egan J.B.; +RT "Control of gene expression in the temperate coliphage 186. VIII. Control +RT of lysis and lysogeny by a transcriptional switch involving face-to-face +RT promoters"; +RL J. Mol. Biol. 214(1):27-37(1990). +XX +RN [4] +RP 12142-14054 +RX MEDLINE; 95407087. +RA Xue Q., Egan J.B.; +RT "DNA sequence of tail fiber genes of coliphage 186 and evidence for a +RT common ancestor shared by dsDNA phage fiber genes"; +RL Virology 212(1):128-133(1995). +XX +RN [5] +RP 14042-15941 +RX MEDLINE; 95407099. +RA Xue Q., Egan J.B.; +RT "Tail sheath and tail tube genes of the temperate coliphage 186"; +RL Virology 212(1):218-221(1995). +XX +RN [6] +RP 11442-18696 +RA Xue Q.; +RT "Studies on the tail region of the temperate coliphage 186 genome"; +RL Thesis (1993), University of Adelaide +XX +RN [7] +RP 1-20866 +RX MEDLINE; 98371265. +RA Portelli R., Dodd I.B., Xue Q., Egan J.B.; +RT "The late-expressed region of the temperate coliphage 186 genome"; +RL Virology 248(1):117-130(1998). +XX +RN [8] +RP 1-30624 +RA Dodd I.B., Egan J.B.; +RT "Bacteriophage 186 complete genome"; +RL Unpublished. +XX +RN [9] +RP 11442-18696 +RA Xue Q., Egan J.B.; +RT ; +RL Submitted (25-JUL-1995) to the EMBL/GenBank/DDBJ databases. +RL Department of Biochemistry, University of Adelaide, Adelaide, SA 5005, +RL Australia +XX +RN [10] +RP 1-30624 +RA Xue Q., Egan J.B.; +RT ; +RL Submitted (15-MAY-1998) to the EMBL/GenBank/DDBJ databases. +RL Department of Biochemistry, University of Adelaide, Adelaide, SA 5005, +RL Australia +XX +DR SPTREMBL; O80303; O80303. +DR SPTREMBL; O80304; O80304. +DR SPTREMBL; O80305; O80305. +DR SPTREMBL; O80306; O80306. +DR SPTREMBL; O80307; O80307. +DR SPTREMBL; O80308; O80308. +DR SPTREMBL; O80309; O80309. +DR SPTREMBL; O80310; O80310. +DR SPTREMBL; O80311; O80311. +DR SPTREMBL; O80312; O80312. +DR SPTREMBL; O80313; O80313. +DR SPTREMBL; O80314; O80314. +DR SPTREMBL; O80315; O80315. +DR SPTREMBL; O80316; O80316. +DR SPTREMBL; O80317; O80317. +DR SPTREMBL; Q01088; Q01088. +DR SPTREMBL; Q37840; Q37840. +DR SPTREMBL; Q37841; Q37841. +DR SPTREMBL; Q37842; Q37842. +DR SPTREMBL; Q37843; Q37843. +DR SPTREMBL; Q37844; Q37844. +DR SPTREMBL; Q37845; Q37845. +DR SPTREMBL; Q37846; Q37846. +DR SPTREMBL; Q37848; Q37848. +DR SPTREMBL; Q37850; Q37850. +DR SPTREMBL; Q37851; Q37851. +DR SPTREMBL; Q9T0R3; Q9T0R3. +DR SWISS-PROT; P06723; VINT_BP186. +DR SWISS-PROT; P08685; CP69_BP186. +DR SWISS-PROT; P08707; RPC1_BP186. +DR SWISS-PROT; P08711; VPB_BP186. +DR SWISS-PROT; P15236; VFIL_BP186. +DR SWISS-PROT; P21678; RPC2_BP186. +DR SWISS-PROT; P21679; VPD_BP186. +DR SWISS-PROT; P21680; VDHR_BP186. +DR SWISS-PROT; P21681; VAPL_BP186. +DR SWISS-PROT; P21682; CP79_BP186. +DR SWISS-PROT; P41059; CP80_BP186. +DR SWISS-PROT; P41060; CP81_BP186. +DR SWISS-PROT; P41061; CP83_BP186. +DR SWISS-PROT; P41062; CP84_BP186. +DR SWISS-PROT; P41063; TUM_BP186. +DR SWISS-PROT; P41064; VPA_BP186. +XX +CC On Jul 23, 1998 this sequence version replaced gi:14895 gi:15549 +CC gi:1262241 gi:974436. +XX +FH Key Location/Qualifiers +FH +FT source 1..30624 +FT /db_xref="taxon:29252" +FT /organism="Enterobacteria phage 186" +FT misc_recomb 1..19 +FT /evidence=EXPERIMENTAL +FT /note="cos; cohesive end; top strand cut at 5' end and +FT bottom strand cut at 3' end" +FT /organism="Enterobacteria phage 186" +FT terminator complement(164..187) +FT /evidence=NOT_EXPERIMENTAL +FT /note="tW" +FT /gene="W" +FT CDS complement(196..1218) +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37851" +FT /note="Orf2; P2 Q homolog" +FT /transl_table=11 +FT /gene="W" +FT /product="capsid portal protein" +FT /protein_id="AAC34146.1" +FT /translation="MSKRKPRKQVAMTASAPQKMEAFTFGEPVPVLDKRDILDYVECIS +FT NGKWYEPPVSFSGLAKSLRSAVHHSSPIYVKRNVLASTYIPHPLLSRQDFSRFALDYLV +FT FGNAFLEQRHSVTGQLIKLLASPAKYTRRGVDDSVFWFVENFTLPHEFAPDTVFHLLEP +FT DINQEIYGLPEYLSALNSAWLNESATLFRRKYYQNGAHAGYIMYVTDPAQSATDVESLR +FT EAMRNSKGLGNFKNLFFYAPNGKPDGIKIVPLSEVATKDDFFNIKKASAADLMDAHRVP +FT FQLMGGKPENIGSLGDVEKVAKVFVRNDLSPLQDRFREVNDWLGMEVIRFKEYTLDNPE +FT " +FT CDS complement(1215..1961) +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80303" +FT /note="similar to Orf12" +FT /transl_table=11 +FT /gene="W" +FT /product="W protein" +FT /protein_id="AAC34147.1" +FT /translation="MKNNVFSQSQIQAMADILHNDSFDYQATWLRVGKLNIDRSITKSR +FT QIGATQLFSREALLDALTTGDNHVWFAHTIEHARVALMYMSNLSARVGVSLTSNGHSLQ +FT LDDGAVISFVGEESHCAALAGNVYLDEFGWFNNPLRAAKVAAGIACHKRHSLTMFTSPS +FT DNYDAFRVWNGTTRRHRPSPLINTGDSVFCTDGVWRQSVTLDAACQRGCNLFAPDEIKH +FT EYSDDDYRLLFGCDWSFAVAAGEVAA" +FT CDS complement(1961..3730) +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q9T0R3" +FT /note="Orf12; P2 P homolog; contains putative +FT helix-turn-helix DNA-binding motif" +FT /transl_table=11 +FT /product="terminase subunit" +FT /protein_id="AAC34148.1" +FT /translation="MTISTDTTLLHDPRRQASLLYWQGFSVPQIAEMLQVKRPTVQSWK +FT QRDGWDGIAPISRVESSLEARLIQLIAKPQKSGGDFKEIDLLGRQIERLARVNRYSQTG +FT NEADLNPNVANRNKGERKKPKKNFFSDEAIEKLEELFFDQSFEYQLQWYRAGLAHRIRD +FT ILKSRQIGATFYFSREALLRALKTGHNQIFLSASKTQAYVFREYIIQFARLVDVDLTGD +FT PIVIGNNGAKLIFLGTNSNTAQSHNGDLYVDEIFWIPNFQKLRKVASGMASQKHLRSTY +FT FSTPSTLAHGAYPFWSGELFNKGRSRIADRIEIDISHRALAGGQLCDDGQWRQIVTIED +FT ALAGGCTLFDLDQLKRENSDEDFKNLFMCEFVDDKASVFPFEELQRCMVDVMEEWEDFA +FT PFADHPFGSRPVWIGYDPSHTGDSAGCVVLAPPVVSGGKFRMLERHQWKGMDFAAQADG +FT IRKLTEKYSVEYIGIDATGLGLGVFQLVRSFYPAARGIRYTPEMKTAMVLKAKDTIRRG +FT CLEYDAGATDVTQSFMSIRKTMTSSGRSATYEASRTEEASHADIAWATMHALLNEPLSA +FT GSGIQPKSILEFN" +FT promoter complement(3753..3790) +FT /evidence=EXPERIMENTAL +FT /note="p12" +FT /function="B-dependent transcription of orf12 operon" +FT protein_bind 3798..3817 +FT /evidence=EXPERIMENTAL +FT /bound_moiety="B protein" +FT /function="activation of pV and p12 promoters" +FT promoter 3828..3865 +FT /evidence=EXPERIMENTAL +FT /note="pV" +FT /gene="V" +FT /function="B-dependent transcription of V operon" +FT CDS 3896..4750 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q01088" +FT /note="presumed capsid scaffold; P2 O homolog" +FT /transl_table=11 +FT /gene="V" +FT /product="V protein" +FT /protein_id="AAC34149.1" +FT /translation="MAKKVSKFFRIGVEGDTCDGRIISASDIQEMAETYDPRVYGCRIN +FT LEHLRGLLPDGIFKRYGDVVELKAEKIDDDSALNGKWALFAKITPTDDLIAMNKAAQKV +FT YTSMEIQPNFANTGKCYLVGLAVTDDPASLGTEYLEFCRTAKHNPLQRFKAHPENVFSA +FT ATLAELEFEDVPDTVLNSLADKVKAIFSRKQVSDDARLNDVHEAVTAVSEHVQTNLTAQ +FT DKRLSDMETAFATFKQELTGKVEETSQAFSVLKTTLDKTESFSQPRRTKASGGGGDELL +FT TDC" +FT variation 3980 +FT /note="Vam38; glutamine to amber" +FT /replace="t" +FT /gene="V" +FT CDS 4826..5893 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80304" +FT /note="T protein; P2 N homolog" +FT /transl_table=11 +FT /gene="T" +FT /product="major capsid protein" +FT /protein_id="AAC34150.1" +FT /translation="MRQETRFKFNAYLTQLAKLNGISVDDVSKKFTVEPSVTQTLMNTV +FT QASSAFLQMINILPVAEMKGEKIGVGVTGTIASTTDTSGDKERQTADFTALESNKYECN +FT QINFDFHLTYKRLDLWARFQDFQRRIRDAIVQRQALDFIMAGFNGTTRADTSDRVKNPM +FT LQDVAVGWLQKYRNEAPARVMSNITDADGKVVSAVIRVGKNGDYENLDALVMDGTNTLI +FT DEIYQDDPKLVAIVGRKLLADKYFPLVNKQQENTESLAADIIISQKRIGNLPAVRVPYF +FT PANAVFVTTLENLSIYFMDESHRRSIDENPKKDRVENYESMNIDYVVEAYAAGCLLENI +FT TLGDFTAPAAPEGGE" +FT CDS 5898..6647 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80305" +FT /note="terminase subunit; P2 M homolog" +FT /transl_table=11 +FT /gene="R" +FT /product="R protein" +FT /protein_id="AAC34151.1" +FT /translation="MTSPAQRHMMRVSASQAAQREQAPLRHATAYEQMLVKLADDRRTL +FT KNIRSNERKAEKKRELLPFYAPWVAGVLTDGRGAQDDIVMTVMLWRLDAGDIAGALEIA +FT PYALKYGLTSDHRRTTPYMLVEEVALAAQRLRDAGESVDLSWLQATIDLTDGADVPDMV +FT RARLHKVTGLTLRDAGMNAEALAQFQRAMQLDRNAGVRKEIERLERALKPKTEAAPRKT +FT TKPRTRKPATKPAAKRGRPPKAAKTAG" +FT CDS 6740..7246 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80306" +FT /note="capsid completion protein; P2 L homolog" +FT /transl_table=11 +FT /gene="Q" +FT /product="Q protein" +FT /protein_id="AAC34152.1" +FT /translation="MTTVILNQPDEPQDVPGVVIPAPETGGAVIKNTFFFPDVDPKRVR +FT ELMRLEQTVSDARLRNAIKTGMAETNAELYDYRLRQTAAGFKQLADVPAEEIDGENVRV +FT FHYLSAVTAMATATLYERYRGVEATGKGDKKADSVETTIDDLWRDMRWSVARLQDKPRC +FT IVGQL" +FT CDS 7246..7449 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80307" +FT /note="Orf23; P2 X homolog; tail protein" +FT /transl_table=11 +FT /protein_id="AAC34153.1" +FT /translation="MKVRSMQGDTLDTICARYYGRTEGVVETVLQANPGLSELGVILPN +FT GTEIDLPDVASSPVTKTINLWE" +FT CDS 7452..7748 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80308" +FT /note="Orf24; P2 Y homolog; holin" +FT /transl_table=11 +FT /protein_id="AAC34154.1" +FT /translation="MTEGEKGVLSLFVIGVMIVVGKVLAGGEPITPRLFIGRMLLGGFV +FT SMVAGVVLVQFPDMSLPAVCGIGSMLGIAGYQVVEIAIQRRFKSQKGESDAGH" +FT CDS 7735..8232 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80309" +FT /note="endolysin; P2 K and lambda S homolog" +FT /transl_table=11 +FT /gene="P" +FT /product="P protein" +FT /protein_id="AAC34155.1" +FT /translation="MPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTGLDGRP +FT EIFTDYSDHPFAHGRPPKVFNRRGEKSTASGRYQQLYLFWPHYQKQLALPDFSPLSQDK +FT LAIQLIRERGALDDIRAGRIERAVSRCRNIWASLPGAGYGQREHGLEKLVTIWRTAGGV +FT VA" +FT variation 7999 +FT /note="Pam65" +FT /replace="t" +FT /gene="P" +FT CDS 8229..8642 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80310" +FT /note="Orf27; P2 LysB homolog; control of lysis" +FT /transl_table=11 +FT /protein_id="AAC34156.1" +FT /translation="MKVLITLLVMAVLGLLWLHHENGNLSRSFETANRVASEQKTTIGM +FT LKNQLSVAGQLARRNESAQVTLREQLAKASAEASRREQTITRLLNENEAFRRWYNAALP +FT DAVRRLHTRTACASAGDCGQRMPEGEPLPYAGK" +FT CDS 8497..8787 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80311" +FT /note="Orf28; homologs present in other phages, e.g. P2, +FT HP1" +FT /transl_table=11 +FT /product="unknown" +FT /protein_id="AAC34157.1" +FT /translation="MKMKPFAAGITLLCLMLCVGCTPEQPAPVPVIVVNGCPRVSLCPM +FT PGSDPKTNGDLSADIRRLEGALTACALQVKTVKHCQDELDAEAQKPAQSAD" +FT CDS 8750..9217 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80312" +FT /note="P2 R homolog; tail completion protein" +FT /transl_table=11 +FT /gene="N" +FT /product="N protein" +FT /protein_id="AAC34158.1" +FT /translation="MQKHKSLRKALINAVPQLRNNPDMLRLFADNGHTDSRLASSLSFE +FT KVYVLNVVVTDFTGDLDLIFVPVQAWLREHQPDIMTTDDGREKGFTWIIDINNDDSLDI +FT SISLRLTERTLVKEVGGALHVSYAPEPPLPELVKRPVAMYANGELVSQWDE" +FT variation 8877 +FT /note="Nam47" +FT /replace="a" +FT /gene="N" +FT CDS 9210..9659 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80313" +FT /note="P2 S homolog; tail completion protein" +FT /transl_table=11 +FT /gene="O" +FT /product="O protein" +FT /protein_id="AAC34159.1" +FT /translation="MSELTALQERLAGLIASLSPAARRKMAAEIAKKLRTSQQQRIKRQ +FT QAPDGTPYAARKRQPVRSKKGRIKREMFAKLRTSRFMKAKGSDSAAVVEFTGKVQRMAR +FT VHQYGLKDRPNRNSRDVQYEARPLLGFTRDDEQMIEDVIISHLGK" +FT variation 9324 +FT /note="Oam61" +FT /replace="t" +FT /gene="O" +FT variation 9345 +FT /note="Oam62" +FT /replace="t" +FT /gene="O" +FT CDS 9729..10370 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80314" +FT /note="Orf32; P2 V homolog; baseplate protein" +FT /transl_table=11 +FT /protein_id="AAC34160.1" +FT /translation="MNTLSTIQELARAIRNLIRSGVVTEVDTVQGLCRVQSGGIQTTWL +FT NWLTTRAGRSRTWWAPSLGEQVLLLAIGGELDTAFVLPGIFSDDNPAPSASADAWHVVF +FT PDGAVIEYEPETSALTVRGIKTADVTASESITATVPVVLVKAETRITLDTPEVVCTNKL +FT TTATLEVQKGGEMRGDIVHNGGTFKSNGVQLDDHGHGGVQRGGAWTEDTK" +FT CDS 10367..10714 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80315" +FT /note="P2 W homolog; putative baseplate protein" +FT /transl_table=11 +FT /gene="M" +FT /product="M protein" +FT /protein_id="AAC34161.1" +FT /translation="MTARYMGMNRNTGLGISDTEHISQSMRDILLTPVGSRVMRREYGS +FT LLSALIDMPQNPALRLQIMVACYSAIQKWEPRIRLTSISFETGDAGEMYVDITGMRTDT +FT GASVSTTVSLS" +FT CDS 10721..11629 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37840" +FT /note="P2 J homolog; baseplate or base of tail fibre" +FT /transl_table=11 +FT /gene="L" +FT /protein_id="AAC34162.1" +FT /translation="MATVDLSLLPVPDVVEELDFETILAERIATLISLYPEDQQEAVAR +FT TLALESEPIVKLLQENAYREVIWRQRVNEAARAGMLAYARDSDLDNLGANFNVERLVVR +FT PADDTTIPPTPAEMELDADFRLRIQQAFEGMSVAGSTGAYEFHGRSADGRVADISVISP +FT SPACVTISVLSRENNGAASDELQSIVRNALNAEDVRPVADRVTVQSAQIIDYQIRATLF +FT VYPGPENEPIRAAAEAKLKAYISAQHRLGRDIRLSAIYAALHVEGVQRVELAAPVADIV +FT LDKTQASFCTDYQIVIGGSDE" +FT variation 10818 +FT /note="Lam21" +FT /replace="a" +FT /gene="L" +FT CDS 11622..12152 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37841" +FT /note="Orf38; P2 I homolog; tail protein" +FT /transl_table=11 +FT /protein_id="AAC34163.1" +FT /translation="MSDVRLLPVGSSPLEVAAARACADIENTPVPLRRLWSPDTCPANL +FT LPWLAWAFSVDRWDENWPEKTKRDVIRSAYFTHCHKGTIGAVRRVIEPLGYIINVTEWW +FT ETGDPAGTFRLDIGVLESGITEEMYLEMERLIADAKPASRHLIGLNIIQDIPGYMYTGG +FT VSCDGDIITVYPG" +FT CDS 12163..13551 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37842" +FT /note="similar to P2 tail fiber protein H, PIR Accession +FT Number B42291" +FT /transl_table=11 +FT /gene="K" +FT /protein_id="AAC34164.1" +FT /translation="MSTKFKTIITTAGAEKLAAATVPGGKKVNITVMAVGDGGGKLPVP +FT DAGQVQLVNEVWRHALNKISQDNRNSNYIVAELVIPPEVGGFWMRELGLYDDEGTLIAV +FT ANMAESYKPELAEGSGRAQTCRMVIIVSSIASVELSIDSTMVMATQEYVDDRIAEHEKS +FT RRHPDATLKEKGFTQLSSATDSASEVLAATPKAVKAAYDLANAKYTAQDASTAQKGIVR +FT LSSAADSTSEAEAATPKAVKIAMDNANARLAKDRNGADIPNPPLFVQNIGLKPTVDKAA +FT NAVDKNGDTMNGNLTLKGDYRLSFIIQNEDGSIRAYIFKDKGGDGIRISNGDDGGGDFV +FT FGKNGQFYCPDIMHVGNTIVWGDGNIEGARWGGLLSDWLTAQLVARDNNINLRAPYEWV +FT NQNFVNRAQRGAQASMTMDGGLVEAPWGCFLTGGNGNEGNQVGVALYRPLQILRNNTWV +FT TIEN" +FT misc_recomb 12962..12987 +FT /note="Mu-like inversion crossover site" +FT /organism="Enterobacteria phage 186" +FT /gene="K" +FT CDS 13554..14054 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37843" +FT /note="unnamed protein product" +FT /transl_table=11 +FT /protein_id="AAC34165.1" +FT /translation="MKLINLQRYILMNYFLGDGIQYFIDATGKDWYKSLPKFTKKYSLA +FT IENDTGVIRSISEDASRLYPGGLTVVDVDSIPAGCDIFGGWVFDGEKVIPREYTLAEQQ +FT RQSDEKKKTLLAEAEATISTLERAVRLGMATGEEIRRLEAWERYSVLVSRVKQSDDWPQ +FT KPE" +FT terminator 14058..14081 +FT /evidence=NOT_EXPERIMENTAL +FT /note="t45" +FT protein_bind 14091..14110 +FT /evidence=NOT_EXPERIMENTAL +FT /bound_moiety="B protein" +FT /function="activation of transcription from pJ" +FT promoter 14122..14159 +FT /evidence=EXPERIMENTAL +FT /note="pJ" +FT /function="B-dependent transcription of J operon" +FT promoter 14159 +FT /note="initiation point of late promoter pJ" +FT CDS 14183..15361 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37844" +FT /note="similar to P2 tail sheath protein FI, Swiss-Prot +FT Accession Number P22501" +FT /transl_table=11 +FT /gene="J" +FT /protein_id="AAC34166.1" +FT /translation="MSDFHHGTKVIEINDGTRVISTVATAIVGMVWTASDADAETFPLN +FT EPVLITNVQSAIAKAGKKGTLSASLQAIADQSKPVTVVVRVAEGTGDDAEAQTTSNIIG +FT GTDENGKYTGIKALLTAEAVTGVKPRILGVPGLDTQEVATALASVCISLRAFGYVSAWG +FT CKTISEAMAYRENFSQRELMVIWPDFLAWDTTANATATAYATARALGLRAYIDQTIGWH +FT KTLSNVGVQGVTGISASVFWDLQASGTDADLLNEAGVTTLVRKDGFRFWGNRTCSDDPL +FT FLFENYTRTAQVLADTMAEAHMWAVDKPITASLIRDIVDGINAKFRELKSNGYIVDGEC +FT WFDEESNDKETLKAGKLYIDYDYTPVPPLESLTLRQRITDKYLVNLAESVNS" +FT CDS 15377..15898 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37845" +FT /note="similar to P2 tail tube protein FII, Swiss-Prot +FT Accession Number P22502" +FT /transl_table=11 +FT /gene="I" +FT /protein_id="AAC34167.1" +FT /translation="MALPRKLKYLNMFNDGLSYMGVVESVTLPKLTRKLENYRGGGMNG +FT AAAIDLGLDDDALTVEWSVGGLPDVALWAQYAAPGADAVPLRFAGSYQRDDTGEIVAVE +FT VVMRGRHKEIDGGENKQGENTSTKLSTVCTYYRLTIDGSDIIEIDTVNMVEKVNGVDRL +FT EQHRRAIGLL" +FT terminator 15906..15932 +FT /note="tI; partial terminator of pJ transcript" +FT CDS 15960..16295 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37846" +FT /note="Orf51; P2 E homolog; tail protein" +FT /transl_table=11 +FT /gene="H" +FT /protein_id="AAC34168.1" +FT /translation="MAKAPRKTPEFIDTAGNEIDTVNPNVVTLDKPIKRAGQTIEKVTL +FT IEPNAGTLRGVSLAAVAQSEVDALIKVLPRMTYPALTTQELTAMNLPDMLSLAAKVIGF +FT LSPASAE" +FT CDS <16271..16447 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80316" +FT /note="Orf52; tail protein; probably produced by a +FT translational frameshift from orf51 into orf52" +FT /transl_table=11 +FT /gene="H" +FT /protein_id="AAC34169.1" +FT /translation="FVTGFGGIDFPPGLSTDDLMADIAVIFHWPPSELYSLSLTELITW +FT REKALQRSGNHNE" +FT variation 16314 +FT /note="Ham50" +FT /replace="a" +FT /gene="H" +FT variation 16421 +FT /note="Ham56" +FT /replace="t" +FT /gene="H" +FT CDS 16440..18878 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37848" +FT /note="P2 T homolog; tail protein" +FT /transl_table=11 +FT /gene="G" +FT /product="G protein" +FT /protein_id="AAC34170.1" +FT /translation="MSNNLRLEVLLKAVDQATRPLKSIQTASKSLSGDIRDTQKGLRDL +FT NGQASKIDGFRKASAQLAVTSQALDKAKREAGELAVQFKNTTNPTRAQAQALEAARRAA +FT SELQTKYNSLRTSVQRQRSELMQAGINTRTLSADERRLKTSISETTAHVNRQREALARV +FT SAQQAKLSRVKERYKSGKELAGNMAAAGAAGSVSRHGTMAGVKLLMPGYDFTQKNSELQ +FT AVLGVDKQSPEMQALRKQARHVGDNTAASADDAASAQIIIAKSGGDAAAIQARRRVTLN +FT MALSNRRTMEENAALLTGMKSAFQLSNDKIAHIGDVLSMTMNKTAADFDGLSDALTYAA +FT PVAKNAGVSIEQTAAMVGALHDAKITGSMAGTGSRAILSRLQLPPEKAFEAIKELGVKT +FT SDSKGNTRPIFSILKEMQRSFEKNNLGTSQRGEYMKTIFGEEASSAAAVLMEAASSGKL +FT DRLTAAFKASDGKTEELVKVMQDNLGGDFKEFQSAYEAVGTDLFDQQEGSLRKLTQTAT +FT QYVLKLDGWIQKNKGLATTIGIIAGGALALIGIIGGIGLVAWPVVMGINAIIAAAGVLG +FT TVFTVTGSAIVTALGAITWPIVAVGAAIVAGALLIRKYWEPISAFFSGVIEGIMSAFAP +FT VAEMFAPLAPIFDGLGEKLRGVWQWFKDLIAPVKATQETLDSCKNVGVIFGQALASALM +FT RPLNVFNKLRSGVDWLLEKLGIINKESDNLDQTAAKTNAATQGNSYIPATSTYGGYQAY +FT QPVTAPAGRSYIDQSKSEYKITLPGGAAPGHQLDRQLRDTLEQIEREKRARQRASMSHD +FT " +FT CDS 18891..19376 +FT /codon_start=1 +FT /db_xref="SPTREMBL:O80317" +FT /note="P2 U homolog; tail protein" +FT /transl_table=11 +FT /gene="F" +FT /product="F protein" +FT /protein_id="AAC34171.1" +FT /translation="MMLALGMFVFERRTLPYQSMQHSKDYRWASNDRVGKPPAYQFLGE +FT GETSIQLAGTLYPAITGGWISLKAVEVMANEGRAWPLIEGTGNILGMYIVDKVSTTHAE +FT FFSDGAARKIDFTLSLKRVDESLTAMFGDLNKQASELLGSAGNLTDKLQSALGGLTA" +FT CDS 19373..20542 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P21679" +FT /note="P2 D homolog; tail protein" +FT /transl_table=11 +FT /gene="D" +FT /product="D protein" +FT /protein_id="AAC34172.1" +FT /translation="MITGMTIDAGTSLAPAFMLTLNSQDITSNFSDRLISLTMTDNRGF +FT EADQLDIELDDTDGKVELPLRGAVLTLWLGWQGSALLNKGDFTVDEIEHRGAPDILTIR +FT ARSADFRGTLNSRREESWHDTTIGELVSTIAKRNKLTASVADSLKKIPVPHIDQSQESD +FT AVFLTRLADRNGATVSVKAGKLLFLKAGSAMTASGKPVPQMTLTRNDGDRHQFAIADRG +FT AYTGVTAKWLHTKDPKPQKQKVTLKRKPKEKHLRALEHPKAKPVSKKTKAKKEPEAREG +FT EYMAGEADNVLALTTVYASKAQAMRAAQAKWDKLQRGVAEFSITLALGRADLFPETPVR +FT VSGFKRVIDEQAWLISKVTHNLNNSGFTTGLELEVKLSDVEYNAESDDE" +FT variation 20378 +FT /note="Dam23" +FT /replace="t" +FT /gene="D" +FT variation 20492 +FT /note="Dam14" +FT /replace="t" +FT /gene="D" +FT protein_bind 20548..20596 +FT /evidence=EXPERIMENTAL +FT /note="two CI binding sites for repression of pB" +FT /gene="B" +FT /bound_moiety="CI" +FT promoter 20549..20584 +FT /evidence=EXPERIMENTAL +FT /note="pB; repressed by CI" +FT /gene="B" +FT /function="transcription of B gene" +FT -35_signal 20549..20554 +FT /gene="B" +FT -10_signal 20572..20577 +FT /gene="B" +FT CDS 20609..20827 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P08711" +FT /note="C4 Zn finger protein; P2 Ogr and P4 Delta homolog" +FT /transl_table=11 +FT /gene="B" +FT /function="activate late gene promoters" +FT /product="B protein" +FT /protein_id="AAC34173.1" +FT /translation="MFHCPKCHHAAHARTSRYLTENTKERYHQCQNINCSCTFMTMETI +FT ERFIVTPGAIDPAPPHPTVGGQRPLWL" +FT variation 20690 +FT /note="Bam57" +FT /replace="t" +FT /gene="B" +FT variation 20744 +FT /note="Bam17" +FT /replace="t" +FT /gene="B" +FT terminator 20845..20866 +FT /note="tB; termination of transcription from pB and late +FT promoter" +FT protein_bind 20889..21147 +FT /note="predicted Int arm-type recognition sequences; +FT consensus = YAYCGCCAYTY; 3 sites to left of attP and 2 +FT sites to right" +FT /bound_moiety="Int" +FT terminator complement(20930..20957) +FT /note="predicted terminator of lysogenic operon" +FT protein_bind 20959..20985 +FT /evidence=EXPERIMENTAL +FT /note="IHF DNase I footprint location" +FT /bound_moiety="IHF" +FT tRNA 20985..21030 +FT /note="truncated" +FT /product="tRNA-Ile" +FT misc_feature 20995..21030 +FT /note="in common with attB in Escherichia coli, which is in +FT the 3' end of ileY" +FT misc_feature 21023..21029 +FT /note="attP; predicted crossover region with attB" +FT variation 21030..22865 +FT /note="del1 deletion" +FT protein_bind 21057..21086 +FT /evidence=EXPERIMENTAL +FT /note="IHF DNase I footprint location" +FT /bound_moiety="IHF" +FT protein_bind 21075..21121 +FT /note="five binding sites for Apl excisionase at attP" +FT /bound_moiety="Apl" +FT CDS complement(21157..21408) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P08685" +FT /note="Orf69" +FT /transl_table=11 +FT /protein_id="AAC34174.1" +FT /translation="MSVRLAPDGTYVYGQPMLAPNGTYVGGGAPRLAPDGTYVGGVPRL +FT APNGSYVAGRPTLAPDGTYVGGRYHLAPDGTYVGDGSE" +FT CDS complement(21423..22433) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P06723" +FT /note="integrase" +FT /transl_table=11 +FT /gene="int" +FT /product="Int" +FT /protein_id="AAC34175.1" +FT /translation="MTVRKNPAGGWICELYPNGAKGKRIRKKFATKGEALAFEQYTVQN +FT PWQEEKEDRRTLKELVDSWYSAHGITLKDGLKRQLAMHHAFECMGEPLARDFDAQMFSR +FT YREKRLKGEYARSNRVKEVSPRTLNLELAYFRAVFNELNRLGEWKGENPLKNMRPFRTE +FT EMEMTWLTHDQISQLLGECNRHDHPDLETVVRICLATGARWSEAESLRKSQLAKYKITY +FT TNTKGRKNRTVPISKELYESLPDDKKGRLFSDCYGAFRSALERTGIELPAGQLTHVLRH +FT TFASHFMMNGGNILVLQRVLGHTDIKMTMRYAHFAPDHLEDAVKLNPLVHITNSK" +FT CDS complement(22433..23011) +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P08707" +FT /note="immunity repressor; DNA-binding protein; has +FT positive and negative autoregulation by control of pL" +FT /transl_table=11 +FT /gene="cI" +FT /function="maintenance of lysogeny; repress pB and pR" +FT /product="CI repressor" +FT /protein_id="AAC34176.1" +FT /translation="MRIDSLGWSNVDVLDRICEAYGFSQKIQLANHFDIASSSLSNRYT +FT RGAISYDFAAHCALETGANLQWLLTGEGEAFVNNRESSDAKRIEGFTLSEEILKSDKQL +FT SVDAQFFTKPLTDGMAIRSEGKIYFVDKQASLSDGLWLVDIEGAISIRELTKLPGRKLH +FT VAGGKVPFECGIDDIKTLGRVVGVYSEVN" +FT variation 22684..22685 +FT /note="cI10" +FT /replace="g" +FT /gene="cI" +FT protein_bind 22726..22742 +FT /note="FL; unknown function" +FT /gene="cI" +FT /bound_moiety="CI" +FT variation 22989 +FT /note="cIam461" +FT /replace="t" +FT /gene="cI" +FT protein_bind 23011..23067 +FT /note="locus of vir mutations; 3 binding sites for CI +FT repressor" +FT /bound_moiety="CI" +FT /function="repression of pR" +FT -35_signal 23026..23031 +FT /note="pR" +FT promoter 23026..23063 +FT /evidence=EXPERIMENTAL +FT /note="pR; repressed by CI and Apl" +FT /function="transcription of early lytic operon" +FT -10_signal 23049..23054 +FT /note="pR" +FT protein_bind 23056..23123 +FT /note="7 binding sites for Apl; locus of goa mutations" +FT /bound_moiety="Apl" +FT /function="repression of pR and pL" +FT promoter complement(23125..23159) +FT /evidence=EXPERIMENTAL +FT /note="pL; repressed by Apl; inhibited by convergent pR +FT promoter; activated by CI repression of pR" +FT /function="transcription of lysogenic operon" +FT -10_signal complement(23131..23136) +FT /note="pL" +FT CDS 23141..23404 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P21681" +FT /note="contains putative helix-turn-helix DNA binding +FT motif" +FT /transl_table=11 +FT /gene="apl" +FT /function="excisionase; binds to attL" +FT /function="repressor: binds between and represses pR and +FT pL" +FT /function="appears to assist derepression during prophage +FT induction" +FT /product="Apl" +FT /protein_id="AAC34177.1" +FT /translation="MASEIAIIKVPAPIVTLQQFAELEGVSERTAYRWTTGDNPCVPIE +FT PRTIRKGCKKAGGPIRIYYARWKEEQLRKALGHSRFQLVIGA" +FT -35_signal complement(23154..23159) +FT /note="pL" +FT /gene="apl" +FT variation 23205..23219 +FT /note="apl11 deletion" +FT /gene="apl" +FT variation 23236 +FT /note="aplam" +FT /replace="g" +FT /gene="apl" +FT promoter complement(23400..23462) +FT /evidence=EXPERIMENTAL +FT /note="pE; activated by CII, allowing transcription of +FT lysogenic operon" +FT /function="transcript for establishment of lysogeny" +FT protein_bind 23404..23420 +FT /note="FR" +FT /bound_moiety="CI" +FT /function="probably responsible for CI repression of pE +FT promoter" +FT protein_bind 23435..23462 +FT /gene="cII" +FT /bound_moiety="CII" +FT /function="activate pE" +FT CDS 23435..23944 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P21678" +FT /note="DNA binding protein; has putative helix-turn-helix +FT motif" +FT /transl_table=11 +FT /gene="cII" +FT /function="required for establishment of lysogeny" +FT /function="activates pE, alternative lysogenic operon +FT promoter" +FT /product="CII" +FT /protein_id="AAC34178.1" +FT /translation="MFDFQVSKHPHYDEACRAFAQRHNMAKLAERAGMNVQTLRNKLNP +FT EQPHQFTPPELWLLTDLTEDSTLVDGFLAQIHCLPCVPVNELAKDKLQSYVMRAMSELG +FT ELASGAVSDERLTTARKHNMIESVNSGIRMLSLSALALHARLQTNPAMSSVVDTMSGIG +FT ASFGLI" +FT variation 23440 +FT /note="prevents CII binding to pE; cIV476" +FT /replace="a" +FT /gene="cII" +FT variation 23657 +FT /note="cIIam475" +FT /replace="t" +FT /gene="cII" +FT CDS 23952..24179 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P15236" +FT /evidence=EXPERIMENTAL +FT /note="overexpression blocks cell division" +FT /transl_table=11 +FT /gene="fil" +FT /product="Fil" +FT /protein_id="AAC34179.1" +FT /translation="MLKSEPSFASLLVKQSPGMHYGHGWIAGKDGKRWHPCRSQSELLK +FT GLKTKSPKSSGFLIIRIVHFVIKGVKHVTR" +FT variation 24112 +FT /note="CP77am; filam" +FT /replace="a" +FT /gene="fil" +FT CDS 24166..24366 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P21680" +FT /transl_table=11 +FT /gene="dhr" +FT /function="inhibits host DNA replication" +FT /product="Dhr" +FT /protein_id="AAC34180.1" +FT /translation="MSRDELRIVLGAMIPNMEEGFEIKTRDGAILRVDPEWECCKEFKD +FT GLKAEIIKQLKSKPAVVFGYS" +FT variation 24194 +FT /note="CP78am; dhram" +FT /replace="a" +FT /gene="dhr" +FT terminator 24384..24412 +FT /note="tR1; one of a number of transcription terminators in +FT this region that are anti-terminated during early lytic +FT development by an unknown mechanism" +FT CDS 24433..24666 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P21682" +FT /note="unknown function; not essential" +FT /transl_table=11 +FT /product="Orf79" +FT /protein_id="AAC34181.1" +FT /translation="MSRTIYLSTPSGAGDHLLESLFKEAKKEERKDRRLAVSIRLEDLA +FT VHITNSDMTGKEAAELLRREATRFENESQELH" +FT CDS 24666..24893 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41059" +FT /note="unknown function; not essential" +FT /transl_table=11 +FT /product="Orf80" +FT /protein_id="AAC34182.1" +FT /translation="MADAMDLAQLREQEDRERHISNARSRRHEVSAFICEECDAPIPEA +FT RRRAIPGVQCCVTCQEILELKSKHYNGGAL" +FT CDS 24890..25474 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41060" +FT /note="unknown function; not essential" +FT /transl_table=11 +FT /product="Orf81" +FT /protein_id="AAC34183.1" +FT /translation="MSITNATISQRAKKWLEDDRIFIDTETTGLGDDAEIVEICLIDSA +FT GFIMLNTLVKPTKPIPAEATAIHGITDEMVMYAPTWKDIHGAVASLFFEYGFVIYNADY +FT DTRLIYQTAKLYGLENDGFCYFLNERSACAMMLYAEYRGEPGRFKGYKWHKLVDAAAHE +FT GVSVEGKAHRALADCRMTLGIIDALAKGGAA" +FT CDS 25471..25746 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41061" +FT /note="unknown function; not essential" +FT /transl_table=11 +FT /product="Orf83" +FT /protein_id="AAC34184.1" +FT /translation="MSIRIEIGDKWVITSDQYQFILNEKKVVKTGNKAGEEWLDTIGYY +FT PKINQLISGLVHHHIHTAMIISLSAMAEEIEKLSFICEEAFKAVKK" +FT CDS 25743..26747 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41062" +FT /note="unknown function; not essential. translation to end +FT of orf84 appears necessary for translation of A protein" +FT /transl_table=11 +FT /product="Orf84" +FT /protein_id="AAC34185.1" +FT /translation="MIDSRCFAESTINIVSVSGGKDSLAQWILAVENDVPRTTVFADTG +FT HEHSQTMEYLDYLESRLGPVIRVKADFTRRIEGKRKFIAEKWPVSLVEECGMSHEQAAE +FT RIAKALEILKPTGNPFLDLCMWKGRFPSTKARFCSLELKHDSVRDKIVLPALEKYDEVI +FT LWQGVRAQESPARAALPMWEEDADNTPGLHVYRPILNWTHEDVFALAKRHGIKPNPLYQ +FT QGCSRVGCMPCIHARKSELAEIFARWPEEIARVAEWERLVAACSRRGNSTFFPSTHDPR +FT RAEKRIEVVTVEEYGIASYRDWAMTTRGGSQYDLLAATNDKTVCSSVYAGVCE" +FT variation 25803 +FT /note="am43" +FT /replace="t" +FT /phenotype="lethal due to polarity on A" +FT variation 25845..26288 +FT /note="del444" +FT /replace="" +FT variation 26460 +FT /note="am11" +FT /replace="t" +FT /phenotype="lethal due to polarity on A" +FT CDS 26744..28828 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41064" +FT /note="rolling circle replicase; putative endonuclease; +FT similar to P2 A protein" +FT /transl_table=11 +FT /gene="A" +FT /product="A protein" +FT /protein_id="AAC34186.1" +FT /translation="MTGVVYAFPWNAPRSAIASSYLTYDQQHRRDRMFAALLHARKVLF +FT LQPECVRFDVYRTAAVLEQNQGSQRANAFLISFCKKALPRLELVAKKYECSGINSNVSA +FT AVFDGHFDTQLMQYLASRMVNMVARFNRLPDMSRADIDLLAADIANFIRAELADIDDTG +FT FSELKTLYTWYMRAGFISLQFNVTPPKWERVTKKYFCEDEIAPAVMRMFNEVWWRGRLR +FT RIAAAWREHLQIAVGNVSKKRHAYASKNCVTDWREQKRRTREFLKGLDLEDEEGNRISL +FT IEKYDGSVANPAIRRCELMARIRGFENICNELGYVGEFYTLTAPSKYHATTKAGYRNSK +FT WNGASPSDTQSYLTGLWARIRAKLHREEIRIFGIRVAEPHHDGTPHWHMLMFMLPEDVE +FT RVRLIIRDYAWEEDHYELRSDKAKKARFHAEAIDPEKGSATGYVAKYISKNIDGYALDG +FT ETDDESGELLKETAPAVSAWAARWHIRQFQFIGGAPVTVYRELRRMADPETARALSVEF +FT AAVHDAAHYGRWADYVNAQGGPFVRRDDLQVRTLYEPRTEFNQYGEETVCIKGVYDASI +FT GAGSPILTRLTQWKIVPKRAVDLAVDVKGASAPSRSSVNNCTGSESDPPILDLTKPLSR +FT RERRELTNRLRKKKPTTRRKFIHGTDKQNVAITKTIDEIHSDNRHHNQPGRSPAPDGRW +FT " +FT terminator 26829..26856 +FT /note="tM1; expected terminator for lytic transcripts in +FT absence of translation of A gene" +FT /gene="A" +FT variation 27542 +FT /note="Aam24" +FT /replace="t" +FT /gene="A" +FT rep_origin 28576 +FT /note="located by similarity with P2; consistent with +FT electron microscopy mapping" +FT /gene="A" +FT -35_signal 29020..29025 +FT /note="p95" +FT promoter 29020..29056 +FT /evidence=EXPERIMENTAL +FT /note="p95" +FT /function="SOS-dependent transcription of SOS operon" +FT -10_signal 29044..29049 +FT /note="p95" +FT protein_bind 29044..29063 +FT /note="putative" +FT /bound_moiety="LexA" +FT variation 29053..29055 +FT /note="cIII" +FT /replace="tt" +FT variation 29074 +FT /note="tum9" +FT /replace="a" +FT CDS 29082..29522 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41063" +FT /note="expression repressed by LexA" +FT /transl_table=11 +FT /gene="tum" +FT /function="inhibits CI DNA binding" +FT /product="Tum" +FT /protein_id="AAC34187.1" +FT /translation="MDRELNEHVMIERVEMIARLTAEGTCQERDREIALNLIAEIARGN +FT LMKNNNFSVVFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFP +FT STRVTVKKGSMTGVELMGFDKDSDREALDSILQEVWEDESWR" +FT CDS 29109..29522 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41063" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="tum" +FT /function="modulates SOS induction" +FT /product="truncated Tum95.2" +FT /protein_id="AAC34188.1" +FT /translation="MIERVEMIARLTAEGTCQERDREIALNLIAEIARGNLMKNNNFSV +FT VFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFPSTRVTVKKG +FT SMTGVELMGFDKDSDREALDSILQEVWEDESWR" +FT variation 29115 +FT /note="tum16" +FT /replace="a" +FT /gene="tum" +FT variation 29182 +FT /note="tum13" +FT /replace="t" +FT /gene="tum" +FT variation 29199 +FT /note="tum17" +FT /replace="a" +FT /gene="tum" +FT CDS 29220..29522 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41063" +FT /evidence=EXPERIMENTAL +FT /transl_table=11 +FT /gene="tum" +FT /function="modulates SOS induction" +FT /product="truncated Tum95.4" +FT /protein_id="AAC34189.1" +FT /translation="MKNNNFSVVFSAPPVGETFAKEGKVKVNITLDKDQKIGQPVIDAF +FT QCELTKRIQSVFPSTRVTVKKGSMTGVELMGFDKDSDREALDSILQEVWEDESWR" +FT variation 29245..29251 +FT /note="tum14" +FT /replace="ttttt" +FT /gene="tum" +FT CDS 29292..29522 +FT /codon_start=1 +FT /db_xref="SWISS-PROT:P41063" +FT /evidence=EXPERIMENTAL +FT /note="truncated Tum - modulates SOS induction of 186 +FT prophage. GTG start codon." +FT /transl_table=11 +FT /gene="tum" +FT /product="bacteriophage 186 Tum95.5" +FT /protein_id="AAC34190.1" +FT /translation="MKVNITLDKDQKIGQPVIDAFQCELTKRIQSVFPSTRVTVKKGSM +FT TGVELMGFDKDSDREALDSILQEVWEDESWR" +FT variation 29391 +FT /note="tum2" +FT /replace="t" +FT /gene="tum" +FT terminator 29545..29576 +FT /evidence=EXPERIMENTAL +FT /note="t95a; partial termination of p95 transcript" +FT CDS 29604..30335 +FT /codon_start=1 +FT /db_xref="SPTREMBL:Q37850" +FT /note="expression from plasmid blocks 186 infection" +FT /transl_table=11 +FT /gene="orf97" +FT /product="Orf97" +FT /protein_id="AAC34191.1" +FT /translation="MDTVIAFLSLALFIAFIVGLIKPSLVRMPSRKRSSAVYLGGCLAL +FT GVIGSILWPTEKTQPVAKTDVPAVKAEPATPTFEYADKTLKEYRNEPKETRHEIVKDYV +FT GFKGVQASATDVFYACMSEYTFTKDDALKLSDVLGWCFNDFEKDPQSLNNKINLDEFQG +FT NFSGWDGSYRPLEKLIKASMNDDSSYKHVSTVYHLILNKDPHAVVKTTFRGTNAYGGVV +FT KQTVAARVNVRTGEVDSILDN" +FT variation 29691..30304 +FT /note="del97" +FT /replace="" +FT /gene="orf97" +FT terminator 30436..30463 +FT /note="t95b; p95 transcript terminator" +XX +SQ Sequence 30624 BP; 7461 A; 7801 C; 8456 G; 6906 T; 0 other; + ggcgtggcgg ggaaagcatt gcgcgccaga ggtggcgcgt gaatgataaa aattatcgtc 60 + tgagcgcctc gtaatggcgc tatcgtggtg ctgttggttc gttggtggtc gtgtgtgttt 120 + gtgcgcgtgt ggcgcgtctg agacgtgatg gtggcggggt atgaaaaagc cgccatgctg 180 + gcggcttgag agggattatt ccgggttgtc gagggtgtac tctttgaacc tgatgacctc 240 + catgccgagc cagtcgttta cctccctgaa cctgtcctgc agcggcgaca ggtcgttacg 300 + cacaaatacc tttgccactt tctcaacgtc accgagcgag ccgatattct cgggcttgcc 360 + gcccatgagc tggaacggta cgcggtgcgc gtccatcagg tcggcggcgc tggctttctt 420 + gatgttgaaa aagtcatcct ttgtggcgac ctcgctcagt ggcacgattt taatgccgtc 480 + cggttttcca ttgggagcgt agaaaaacag gtttttaaaa ttgccgagcc ctttcgagtt 540 + gcgcatcgcc tcgcgcagcg attcgacgtc ggtcgcgctc tgcgccgggt cggtcacata 600 + catgatgtaa cccgcatgcg cgccgttctg gtaatacttg cggcggaaca gcgttgcgga 660 + ttcattcagc caggcggaat taagcgcgct gagatattcg ggcaggccgt aaatctcctg 720 + attaatgtcg ggctccagca ggtgaaacac ggtatcaggc gcgaattcat gcggcagagt 780 + gaagttttcc acaaaccaga aaaccgaatc gtcgaccccg cggcgggtgt atttggccgg 840 + tgaggccagt agcttgatta gctggccggt aacgctgtgg cgctgctcaa gaaaggcgtt 900 + gccgaatacc agatagtcga gcgcaaagcg gctgaaatcc tgacgggaca gcagcgggtg 960 + cgggatgtag gtgctcgcga gcacgttgcg cttaacgtaa atcggtgagc tgtgatgtac 1020 + agcagagcgc aggctctttg ccagcccgga gaagctgacc ggcggctcgt accatttgcc 1080 + gttactgatg cactcgacat aatccagaat gtcgcgctta tcgagtaccg gcactggctc 1140 + gccaaaggtg aacgcctcca ttttttgcgg ggcgctggcg gtcatggcta cctgtttgcg 1200 + tggcttgcgc ttgctcatgc tgccacctca cccgctgcaa cagcgaaaga ccagtcgcag 1260 + ccaaacagca ggcgataatc atcgtcgctg tattcgtgtt taatttcatc gggcgcaaag 1320 + agattgcacc cgcgctggca tgctgcatcc agagtgaccg actgacgcca gacaccatct 1380 + gtacaaaata cgctgtcgcc ggtattgatg agcggtgacg gtcggtgcct gcgggttgtg 1440 + ccgttccata ccctgaaagc gtcataatta tcagagggcg aggtaaacat cgtcaggctg 1500 + tggcgtttat ggcaggcgat acccgccgcg actttcgcag ctcttagcgg gttattgaac 1560 + catccgaact catcaagata gacattaccc gccagtgcgg cgcaatggga ttcctcgccg 1620 + acaaagctga taaccgcacc gtcgtcgagc tgcaggctgt ggccgttact cgtaagactg 1680 + acgccgacgc gcgccgaaag gttactcatg tacatcagcg ccacgcgcgc atgctcaata 1740 + gtgtgagcaa accagacatg attatcgcct gttgtcagcg catcgagcag cgcctcacgg 1800 + ctaaagagct gcgttgcgcc aatctggcgc gatttggtga tgctgcggtc gatattgagt 1860 + ttcccgacac gcaaccatgt tgcctgatag tcaaagctgt cattgtgcag aatatcggcc 1920 + attgcctgaa tctggctttg tgagaaaacg ttatttttca ttaattaaac tccagaatgg 1980 + atttaggctg tatgccgcta ccggcggaaa gcggttcgtt taacagggcg tgcatggtcg 2040 + cccatgcaat atcggcgtga ctggcttcct cggtgcggct ggcctcgtag gtggcgctgc 2100 + gcccgctgct ggtcatggtt ttgcggatgg acataaacga ctgcgtgacg tcggttgctc 2160 + cggcgtcgta ctccagacag ccgcggcgaa tggtgtcttt tgccttgagt accattgcgg 2220 + ttttcatttc aggcgtgtaa cggatgccgc gtgcggccgg gtagaatgag cgcaccaact 2280 + ggaacacgcc gaggccgagg ccggttgcgt caatgccgat gtattcgacg ctgtatttct 2340 + cggtcagttt gcggatgcca tctgcctgcg cggcaaagtc catgcccttc cactggtggc 2400 + gctccagcat gcggaacttg ccaccagaaa ccaccggcgg cgcgagcacg acgcacccgg 2460 + cgctgtcgcc agtgtgtgac gggtcgtagc caatccagac ggggcgagag ccgaacggat 2520 + ggtcggcgaa cggggcgaag tcctcccatt cttccatcac gtcgaccatg cagcgctgca 2580 + gctcctcgaa cgggaatacc gacgctttat cgtcgacaaa ctcgcacata aacaggtttt 2640 + taaagtcctc atcactgttt tcgcgtttga gttggtcgag gtcgaacagg gtgcagccac 2700 + cggcaagggc gtcctcaatg gtgacaatct gccgccactg gccatcgtcg cagagctggc 2760 + caccggcgag cgcgcggtga ctgatgtcaa tttcgatgcg gtcggcaata cggctgcgcc 2820 + ccttgttgaa cagctcgcca gaccagaagg gataagcgcc gtgcgccagc gttgagggtg 2880 + tcgaaaagta ggttgagcgc agatgcttct gcgaggccat gcccgaggcg actttgcgca 2940 + gcttctgaaa attcgggatc cagaatattt catcgacata caggtcgccg ttatggctct 3000 + gagccgtgtt ggagttggta ccgagaaaaa tcagctttgc gccgttgttg ccaatgacaa 3060 + tcgggtcgcc ggtcaggtcg acgtcaacca gtcgcgcaaa ctgtatgatg tattcgcgga 3120 + acacgtaagc ctgcgtttta ctggccgaca gaaaaatctg gttatggccg gtcttgagtg 3180 + ctcgcagcag tgcctcacgg gaaaaataga acgtcgcgcc aatctggcgg gatttgagaa 3240 + tgtcgcgaat acggtgtgcc agtcctgcgc ggtaccactg caactggtac tcgaaagact 3300 + ggtcgaaaaa taattcctcc agcttttcga tagcctcgtc gctgaaaaaa ttctttttcg 3360 + gcttcttgcg ctcacccttg ttgcggttgg cgacgttggg gttaaggtcg gcctcgttgc 3420 + cggtctggct gtagcggtta acgcgtgcca gtcgttcaat ctgccgcccg agcaggtcaa 3480 + tctctttgaa gtcaccgcct gacttttgcg gcttggcgat gagctgaatc aggcgcgcct 3540 + caaggctgct ttcaacgcgg gaaatcggtg cgatgccatc ccagccgtcg cgctgtttcc 3600 + agctctgcac ggtcgggcgc ttgacctgca gcatttcggc aatctgcggc acggaaaaac 3660 + cctgccagta aagcagcgat gcctgtcgtc gcgggtcatg caacaaggtt gtatcggtgg 3720 + aaatggtcat tgatgcctcg ccgtaatgga ttcagggcaa ggctacttaa tggccgtcag 3780 + tgattcgcta aggtgctgtt gtgtgggcgg ttgtccagtc gtcattggtg gtctggcgtg 3840 + tcctgagtct ggaaactggc ggtgaccagt aaccccaacc tcaggactcc tgacaatggc 3900 + aaaaaaagtc tcaaaattct ttcgaatcgg cgtcgagggt gatacctgcg acgggcgcat 3960 + tatcagcgcc agtgatattc aggaaatggc cgaaacctat gacccgcgtg tttacggttg 4020 + ccgtatcaac cttgaacacc tgcgcggcct gttgcccgat ggcatattca agcgttacgg 4080 + cgatgtggtc gagctgaaag ccgagaagat tgacgacgat tctgcgctta acggcaagtg 4140 + ggcgttgttc gctaaaatca ccccgaccga tgaccttatc gcgatgaata aagccgcgca 4200 + gaaggtctac acctcaatgg aaattcagcc gaattttgcc aataccggca aatgctacct 4260 + cgtcggcctt gctgtcaccg atgacccggc gagcctcggc actgaatatc tcgaattctg 4320 + ccgcactgcg aagcacaacc cgctgcagcg ctttaaagcc caccctgaaa acgtcttttc 4380 + cgccgccacg ctggccgaac tggaatttga agacgttccc gacacggtgc tcaacagcct 4440 + ggccgataag gtgaaagcca ttttcagccg taagcaggtc agcgacgatg cgcgcctgaa 4500 + tgatgtacat gaagcggtga ccgccgtcag cgagcatgtg cagaccaacc tcactgcaca 4560 + ggataagcgt ctttccgata tggaaaccgc gtttgccacc ttcaaacagg aactgaccgg 4620 + caaggttgaa gaaaccagcc aggcattttc cgtcctgaaa accactctcg acaaaaccga 4680 + aagtttcagc cagccgcgac gcacgaaagc cagcggcggt ggtggcgatg agctgctgac 4740 + tgactgctga taaaccgcag accgaaaccg ggcggaaccc ccgcccgatg ctgtgactaa 4800 + ccgattaaat caaacaggaa atactatgcg tcaggaaacc cgttttaagt tcaatgccta 4860 + tctgacccag ctcgccaaac tgaacggcat cagcgttgat gacgtcagca aaaaattcac 4920 + cgtcgagccg tccgtcacgc aaacgctgat gaacaccgtg caggcgtcat ccgcgtttct 4980 + gcagatgatt aacattctgc cggtcgcaga aatgaagggt gagaaaatcg gtgtcggtgt 5040 + gaccggcacc atcgccagca cgaccgacac ctcgggcgac aaagagcgcc agaccgcaga 5100 + ttttaccgcg cttgagtcca acaagtacga gtgcaaccag attaactttg acttccacct 5160 + gacctataaa cgcctcgacc tgtgggcgcg ttttcaggac tttcagcgtc gtattcgcga 5220 + cgccattgtc cagcgtcagg cactggattt catcatggcc gggtttaacg gtaccacccg 5280 + cgctgacacc tctgaccgtg ttaaaaaccc gatgctgcag gatgtggccg ttggctggct 5340 + gcagaaatac cgcaatgaag ccccggcgcg tgtgatgagc aacatcaccg acgctgacgg 5400 + taaagtcgtt tcggcagtga ttcgcgtcgg taaaaacggc gactatgaga acctcgacgc 5460 + actggtgatg gatggtacca ataccctgat tgacgagatt tatcaggatg acccgaaact 5520 + cgttgccatc gttggccgta agctgctggc cgacaaatat tttccgctgg tcaacaaaca 5580 + gcaggaaaac accgagtcgc tcgcggcgga tatcatcatc agccagaagc gcatcggcaa 5640 + cctgccagcc gtacgtgtgc cgtacttccc ggcgaacgcg gtgttcgtga ccacgctgga 5700 + aaacctctct atctatttca tggatgagag ccaccgccgc agcattgatg aaaacccgaa 5760 + aaaagaccgc gtggaaaact acgagtcgat gaacatcgac tatgtggtcg aggcgtatgc 5820 + cgccgggtgc ctgctggaaa acatcaccct gggcgatttc accgcacctg cagcaccgga 5880 + aggcggagag taaacccatg acgagccccg cacagcgtca catgatgcgg gtctcggcct 5940 + ctcaagccgc gcagcgggaa caagccccgc tgcgccatgc aaccgcctat gagcagatgc 6000 + tggttaagct ggccgatgac cgccgcacgt taaaaaacat ccgttcaaac gaacgtaaag 6060 + ccgagaaaaa gcgcgagctg ctgccgttct atgcgccgtg ggtcgccggt gtgctgactg 6120 + atggtcgtgg tgcgcaggat gacattgtta tgaccgtcat gctgtggcgt ctcgatgccg 6180 + gtgatatcgc tggcgcgctg gaaattgccc cctacgcgct gaagtacggc ctcacctctg 6240 + accatcgccg cacgacacct tacatgctgg tcgaggaagt ggcacttgcc gcgcagcgcc 6300 + tgcgcgatgc cggtgagtct gtcgaccttt cctggctgca ggccactatc gacctgaccg 6360 + acggcgctga cgttcccgat atggtgcgcg cccgtctgca taaggtgaca ggcctgaccc 6420 + tgcgtgatgc cggtatgaat gcagaggcgc tggcgcagtt tcagcgcgcg atgcagctcg 6480 + accgcaatgc cggtgtgcgc aaggagattg agcgactgga acgggcattg aagccaaaga 6540 + cagaggccgc gccccgtaaa acgactaaac cgcgcacgcg taaacctgcc accaaaccgg 6600 + cagcaaagcg cgggcgtcca ccaaaggcgg caaaaaccgc cggttaactg aacgctcccc 6660 + gagccgggcg gcacgccggt caaagcaggc aaagacctga cggcgaccgg cgtccaccgc 6720 + ccaacctgat gaggttgtca tgacgacagt gatactgaac cagcccgacg aaccgcagga 6780 + cgtaccgggc gtggtgattc ccgcaccgga gacgggcggt gcagtgatta aaaacacgtt 6840 + ctttttccct gatgtggatc cgaagcgcgt gcgcgaactg atgcgccttg agcagacggt 6900 + ttccgatgcg cgcctgcgca atgccatcaa gaccggcatg gccgagacca atgcggagct 6960 + ttacgactac cggctgcgcc agactgccgc cgggtttaag caactggccg acgtgcctgc 7020 + cgaggaaatc gacggcgaga atgtacgtgt tttccactat ctgagtgctg tgacggcaat 7080 + ggcaaccgcc accctgtatg agcgctatcg cggcgttgag gccaccggca aaggtgacaa 7140 + aaaagccgac agcgtggaaa ccaccattga tgacctgtgg cgggatatgc gctggtcagt 7200 + tgcgcgtctg caggacaagc cgcgctgcat tgtggggcag ctctgatgaa agtcaggtcg 7260 + atgcagggcg ataccctcga cacgatttgc gccaggtatt acgggcgcac tgagggcgtg 7320 + gttgagacgg tgctgcaggc taatccgggt ctgtctgagc tgggtgtcat tctgccgaat 7380 + ggtacagaga ttgacctgcc cgatgtggca tcgtcacccg taactaaaac tatcaacctt 7440 + tgggagtaac catgacagaa ggtgaaaaag gcgtcctgtc actgtttgtg attggcgtga 7500 + tgattgttgt tgggaaagtg ctggcaggcg gtgaacccat caccccgcgt ctgtttattg 7560 + gccgcatgct gctcggtggt tttgtttcaa tggtcgccgg tgttgttctg gtgcagtttc 7620 + ctgacatgtc actgcccgcc gtgtgcggga ttggatccat gctcggtatt gccggttatc 7680 + aggtggttga aatcgccata cagcgccgct ttaagtcaca aaagggggaa agtgatgccg 7740 + gtcattaaca ctcaccagaa tatcgctgcg tttctggaca tgctggcgta ttccgaagga 7800 + acagcgaacc atccgctgac gaaaaatcgt ggctacgacg tcattgtcac tggccttgat 7860 + ggcagaccag agattttcac cgattacagc gaccaccctt tcgcgcatgg ccgaccaccg 7920 + aaagtgttta atcgccgtgg cgagaaatcc acagcctcgg gacgttacca gcagctttat 7980 + ctgttctggc cgcactatca gaaacagctc gcattgcctg atttcagccc actgtcgcag 8040 + gataagctcg cgatccagtt aatccgggag cgcggtgctc ttgacgatat ccgggcgggg 8100 + cgtattgagc gtgctgtttc acgttgtcgc aatatctggg cgtcattacc gggggccggt 8160 + tacggccagc gcgagcacgg tctcgaaaag ctggtcacca tctggcgcac ggctggcggg 8220 + gtggtggcat gaaagtcctg ataacgctgc ttgtgatggc cgtgctcggg ttgctgtggc 8280 + tgcaccatga gaacggcaat ttatcccgct catttgagac ggcaaaccgc gtcgcgagcg 8340 + agcaaaagac gacgattggg atgctgaaaa atcagctcag tgttgccggt cagctcgccc 8400 + gacgtaatga atccgcgcag gtgacactgc gcgaacagct cgcaaaggca agtgcagaag 8460 + ccagccgccg tgagcagacg ataacgaggt tacttaatga aaatgaagcc tttcgccgct 8520 + ggtataacgc tgctctgcct gatgctgtgc gtcggctgca cacccgaaca gcctgcgcca 8580 + gtgccggtga ttgtggtcaa cggatgcccg agggtgagcc tttgccctat gccgggaagt 8640 + gacccgaaaa ccaatggtga cctgagcgca gatatccgcc gtcttgaggg ggcgctgact 8700 + gcctgcgcgc tgcaggtcaa aaccgtcaaa cactgtcagg atgaactcga tgcagaagca 8760 + caaaagcctg cgcaaagcgc tgattaacgc cgtgccgcag ctccgaaata accccgatat 8820 + gctgcgcctt tttgccgaca acggccacac cgattcccga ctggcgagct cgctgtcgtt 8880 + tgaaaaggtg tatgtgctta acgtggtggt gaccgacttt actggcgacc tcgatttgat 8940 + attcgtgccg gtgcaggcat ggctgcgtga acatcagccg gacattatga ccaccgacga 9000 + cgggcgggaa aaaggattca cctggattat tgatatcaat aacgacgatt cgctcgatat 9060 + cagtatcagc ctgaggctca ccgagcgcac gctcgtcaaa gaggtcgggg gcgcgctgca 9120 + tgtcagttat gcaccagaac cgccactgcc tgagctggtg aagcgcccgg ttgctatgta 9180 + tgcaaacggt gaattagtga gccagtggga tgagtgaatt aaccgcgctg caggagcgcc 9240 + tcgccggtct gattgccagc ctgtcaccgg cggcacgtcg caaaatggcg gctgagattg 9300 + cgaaaaagct gcgtaccagt cagcagcagc gcatcaagcg ccagcaggca cccgacggca 9360 + ccccgtatgc cgcacgaaag cgccagccgg tacggagcaa gaaaggccgc attaagcgcg 9420 + aaatgttcgc caaactgcgc accagtcgct ttatgaaagc caaaggcagc gatagtgcgg 9480 + cggtggtgga gtttaccggc aaggtgcagc gcatggcgcg ggtgcatcag tacggcctca 9540 + aagaccgccc aaaccgcaac agccgggatg tgcagtacga ggcgcgcccg ttgctcggtt 9600 + tcacccgcga cgatgagcaa atgattgaag acgtcattat cagccacctc ggcaaataaa 9660 + tattgtgtga accaccaccg gaggcgcgtg atttggcgcg gctaaagacc agaggcattc 9720 + tttgcactat gaatacgtta tccacgatac aggagctcgc gcgtgcgatt cgtaacctca 9780 + tccgctcagg tgtggtgacg gaggtcgata ccgtgcaggg gctgtgccgc gtacaaagcg 9840 + gcgggatcca gacgacatgg ctgaactggc tgaccacccg cgccggtcgt tcgcgcacat 9900 + ggtgggctcc ctcgctcggt gagcaggtgc tgctgctggc aatcggtggc gagcttgata 9960 + ccgctttcgt gctgccgggg attttctccg acgataaccc cgctccgtct gcctcggcgg 10020 + atgcgtggca tgtggttttt cctgatggcg cggtcattga gtacgagccg gagaccagtg 10080 + cactgacggt cagaggcatc aaaactgctg acgtgaccgc gtcggaatcc atcacggcca 10140 + ctgtgcctgt ggtgctggtg aaagcagaaa cccgcatcac cctcgacacc ccggaggtgg 10200 + tatgcaccaa caaactgacg acggcaacgc ttgaggtgca gaaaggcggg gagatgagag 10260 + gcgacattgt ccacaacggc ggcacattta aatcaaacgg tgtgcagctc gacgaccacg 10320 + gtcacggtgg tgtgcaaaga ggcggtgcct ggacggagga caccaaatga cggcgcgcta 10380 + tatggggatg aaccgcaaca ccggtctcgg tatcagtgac actgaacaca tcagccagag 10440 + catgcgcgac attctgctga cgccggtcgg ctcgcgggtg atgcgtcgtg aatatggctc 10500 + gctcctgtct gcgctgattg atatgccgca aaacccggcg ctcaggctgc aaatcatggt 10560 + ggcgtgctat tcggccatcc agaagtggga gccgcgtatc aggcttacat ccatcagctt 10620 + tgagactggt gatgctggcg agatgtatgt cgatattacc gggatgcgta ccgatacggg 10680 + tgcgtcagtt tcaaccactg tttcactgag ttaaatcact atggcaactg ttgacctgag 10740 + cctgttaccc gttcccgatg tggttgagga actggatttt gaaaccatcc ttgcggaacg 10800 + cattgcgacg ctaatttcgc tataccccga agaccagcag gaagctgtag cccggacgct 10860 + cgcacttgag tctgaaccaa ttgttaaatt gctgcaggaa aacgcctacc gtgaggttat 10920 + ctggcgtcag cgtgttaatg aagctgctcg cgcaggcatg ctggcttatg ccagagatag 10980 + cgacctcgat aatctcgggg cgaatttcaa tgttgagcgc ctggtcgtca ggcctgctga 11040 + tgacaccacc atccccccga cccccgctga aatggagctt gatgccgatt ttcgtctgcg 11100 + tatacagcag gcatttgaag ggatgagcgt tgcgggatcc accggagctt atgaatttca 11160 + tggccgcagt gctgacgggc gtgtcgcaga tatttctgtt atcagccctt ccccagcatg 11220 + tgtcacgata tctgtgcttt cgcgtgagaa taacggtgcg gcgtctgatg agcttcagag 11280 + catcgtgcgc aatgcgctga atgctgagga cgtgaggccg gttgctgacc gggttacagt 11340 + gcagtcagct cagattattg actaccagat acgcgcaaca cttttcgttt atccggggcc 11400 + ggaaaatgag ccgattcgtg cggcggctga ggcgaagctc aaagcttata tcagtgcaca 11460 + gcacaggttg gggcgggata ttcgcctgtc agcaatttat gccgcgttgc atgttgaggg 11520 + ggtgcaacgt gtcgaactgg ctgcacctgt ggccgacatt gtgcttgata aaacgcaggc 11580 + atctttttgc acagactatc agatagtgat tggtggctcc gatgagtgat gtccgcctgt 11640 + tacctgtagg gtcatcacct cttgaggtgg ctgctgccag agcctgcgca gatattgaaa 11700 + atacacctgt tccgttacgc cgcctgtgga gtcctgacac ctgtcctgca aatcttttgc 11760 + cgtggctggc gtgggcgttt tccgttgacc gctgggatga gaactggccg gaaaaaacaa 11820 + agcgcgatgt tattcgcagc gcgtatttca ctcactgcca caaaggcacg ataggcgctg 11880 + tcaggcgagt tattgagccg ctcggataca taatcaacgt tacggaatgg tgggagacag 11940 + gtgacccggc gggaacgttt cgtcttgata tcggtgtgct ggaaagcggt attaccgaag 12000 + aaatgtattt agaaatggag cggttgattg ctgatgcgaa acctgcgagc cgtcatttga 12060 + ttggcctgaa tattatccag gatattcccg gttatatgta tacaggtggt gtgagctgtg 12120 + acggcgacat tattacagtt taccccggat aagtgaggaa taatgagcac gaaatttaaa 12180 + actattatca ccactgccgg agccgaaaaa ctggcagcgg ctactgtgcc gggtggtaaa 12240 + aaagtgaata tcaccgtgat ggccgttggt gacggaggcg gaaaactgcc agtgccggac 12300 + gccggtcagg tgcagctcgt gaatgaggtc tggcgccatg ccctgaataa aatcagccag 12360 + gacaaccgga acagcaatta cattgtagcc gagctggtta ttccgcccga ggtgggagga 12420 + ttctggatgc gcgagttggg tctttatgat gacgagggca ctctcattgc tgttgccaat 12480 + atggcagaaa gctacaagcc agaacttgcc gagggctcag gccgtgcgca gacatgtcgc 12540 + atggtcatta ttgtcagcag tattgcctca gttgaattat ccattgattc gacaatggta 12600 + atggcgacgc aggaatatgt tgatgacagg attgcggaac atgagaagtc acgtcgacat 12660 + cctgacgcca cactgaaaga aaaaggcttt actcaactca gtagcgcaac agacagcgcg 12720 + tctgaggtgc ttgcggcgac gccgaaagcg gttaaagcgg cgtatgacct tgctaatgct 12780 + aaatataccg ctcaggacgc gagcacagcg caaaaaggca ttgtgaggct gagtagtgcg 12840 + gcagacagta ccagtgaagc tgaggccgca acaccgaaag ctgtcaaaat tgcgatggat 12900 + aatgcgaatg cgaggctggc aaaagaccgg aacggcgctg atattccgaa tccgccgttg 12960 + tttgtccaga atatcggttt aaaacccacg gtcgataaag ctgctaatgc cgttgataaa 13020 + aatggcgaca cgatgaacgg aaacctgaca ctcaagggtg attaccggct gagttttatt 13080 + atccagaatg aagacggttc tattcgtgct tatatcttca aggacaaagg tggcgacggt 13140 + attcgcatca gtaatggcga tgacggcggc ggtgattttg tttttggtaa aaatggacag 13200 + ttttactgcc cggatattat gcatgttggt aatacgattg tatggggtga cggaaatatc 13260 + gagggggcgc gatggggcgg tttgttgagc gactggttaa ctgctcaact ggttgcccgt 13320 + gacaataata ttaacttgcg agcaccctat gaatgggtta accaaaactt tgtcaaccgt 13380 + gcacagcgcg gcgcacaggc cagcatgact atggacggcg gacttgtaga ggctccatgg 13440 + ggatgttttc ttacgggggg gaacggtaac gagggtaatc aggttggagt ggctttatac 13500 + cgtccattgc agattcttcg caataatact tgggtaacga tagagaactg aaaatgaaac 13560 + tgattaattt gcaacgctac attctgatga attatttttt aggtgatggc attcagtatt 13620 + ttatagatgc cacaggtaag gactggtata aatcactgcc caaattcaca aagaaataca 13680 + gccttgctat cgaaaatgat acgggcgtta ttcgtagtat cagcgaagat gcatcccggc 13740 + tttatcccgg tggtttgacc gttgttgatg ttgacagtat tccggcaggt tgtgacattt 13800 + tcggcggatg ggtatttgac ggagagaaag tcattcctcg tgagtacaca ttggccgaac 13860 + agcaacgcca gtcagatgaa aagaaaaaaa cacttcttgc tgaggcggag gcaacaattt 13920 + ccacgcttga gcgtgcggta aggttaggca tggctaccgg ggaagaaata aggcgactcg 13980 + aagcatggga gcgttacagc gtattggtga gcagggttaa gcagtcagat gactggccgc 14040 + aaaaacctga ataacccggc ggcatttgcc cgcttctttc tcatccatta gttgtgccag 14100 + acatcatcca gccctgacaa atagcccctc acaagaccag ccaggacaat aacactcgcc 14160 + cactaactac ggagttaacc ggatgagtga ttttcaccac ggcacgaagg tcatcgaaat 14220 + aaatgacggt acgcgtgtta tttccacggt cgcaaccgca atcgtcggca tggtctggac 14280 + agccagcgat gcggatgccg agacatttcc cctcaacgag ccggtactga ttaccaatgt 14340 + gcagagcgcc attgcgaaag ccggtaaaaa aggcactctg tcagcttccc tgcaggccat 14400 + cgccgaccag tcaaagcctg tcaccgttgt cgtgcgcgtt gccgaaggta ccggagacga 14460 + tgcagaagcg cagaccacgt ccaacattat cggcggcacg gatgagaacg gtaaatacac 14520 + cggtatcaag gcgctgctaa ctgccgaagc ggtcaccggc gttaagccgc gcattctcgg 14580 + tgtgccgggt ctcgatacgc aggaagtcgc aaccgcactt gcatcggtct gtatcagcct 14640 + gcgtgcgttt ggttacgtca gcgcatgggg ctgtaagacc atttccgagg cgatggcata 14700 + tcgcgagaat ttcagccagc gcgagctgat ggtcatctgg cctgatttcc tcgcatggga 14760 + taccaccgcg aacgccaccg ccacggcata cgccaccgcc cgcgcactcg gtctgcgtgc 14820 + ctacatcgac cagactatcg gctggcacaa aacgctgtct aacgttggcg tgcagggcgt 14880 + taccggcatc agcgcctcag tcttttggga tttgcaggca tccggcacag atgctgacct 14940 + gctcaacgag gccggagtca ccacgctggt gcgcaaggat ggtttccgtt tttgggggaa 15000 + ccgcacatgc tctgatgacc cgcttttcct gtttgagaac tacacccgaa ccgcgcaggt 15060 + gctggccgac acaatggctg aggcgcacat gtgggcggtc gataagccca tcaccgcatc 15120 + gctcatccgt gacattgtcg acggcattaa cgccaaattc cgcgagctga aatcaaatgg 15180 + ctacatcgtg gacggtgaat gctggttcga cgaggaatcg aacgataagg aaaccctcaa 15240 + ggccgggaaa ctgtatatcg actacgacta tacaccggtt cccccactgg aaagcctgac 15300 + cctgcgccag cgtatcaccg ataaatatct ggtgaatctg gctgaatcgg tcaacagcta 15360 + aggagcctga aacaacatgg cactaccccg caaacttaaa tatctgaaca tgttcaatga 15420 + cggccttagc tacatgggcg ttgttgaatc cgtgacgctg ccgaagctga cccgcaagct 15480 + cgaaaactat cgcggcggcg gtatgaatgg cgctgcagcg attgacctcg gcctcgacga 15540 + tgatgcgctt actgtcgaat ggtctgtcgg tggcctgcct gatgtggcgc tgtgggcgca 15600 + gtatgccgcg ccgggggctg atgccgtgcc gctgcgtttt gctggctctt accagcgtga 15660 + cgacactggc gaaatcgttg cggtcgaggt ggtcatgcgt ggccgtcata aagaaatcga 15720 + cggcggcgaa aataagcagg gtgaaaatac ctcgaccaaa ctgtcgaccg tttgcaccta 15780 + ttaccgcctc acgattgatg gtagcgacat tatcgaaatc gacaccgtca acatggtcga 15840 + gaaggtgaac ggcgtcgacc gtctggaaca gcaccgccgc gcaatcgggc tgctgtaatt 15900 + ccctgaccgg tcagcactgc tggccggtta ttacccccat tcagagcaga gaaaaaatca 15960 + tggcaaaagc accacgcaaa acccctgaat ttattgatac ggctggcaat gaaattgaca 16020 + ccgtaaaccc gaatgtcgtg accctcgaca agccgattaa acgcgccggt cagacaattg 16080 + aaaaggtcac gctgattgaa ccgaacgcag gcaccctgcg cggcgtcagt ctggcggcgg 16140 + tggcgcagtc cgaggtcgat gcgctgatta aggtgctgcc ccgcatgacc tacccggcac 16200 + tcaccacgca ggagctcacc gcaatgaacc tgcccgatat gctgtcgctg gccgctaagg 16260 + tgattggttt tttgtcaccg gcttcggcgg aatagacttc ccgcccggcc tgtcgaccga 16320 + tgacctgatg gcggatatcg cagtgatatt ccactggccg ccatcagagc tctattccct 16380 + gagcctgacc gagctcatca catggcgcga aaaggcgctg cagcgtagcg gaaaccacaa 16440 + tgagtaataa cctgaggctt gaggtattgc tgaaagcggt cgaccaggcg acccgaccgc 16500 + ttaaatccat ccagaccgcg agtaaaagcc tgtcgggcga tattcgcgac acacaaaaag 16560 + ggctgcgtga cctgaatggt caggcgtcga aaatcgacgg ctttcgtaag gcaagcgcgc 16620 + aactggccgt aaccagtcag gcgcttgata aggcgaaacg cgaggccggt gagctggccg 16680 + tgcagtttaa aaacaccacc aatccgaccc gcgcgcaggc gcaggcactt gaagcggcaa 16740 + ggcgtgccgc ctctgagttg cagacgaaat acaacagcct gagaacgtcg gtacagcgcc 16800 + agcgctccga gctgatgcag gccggtatta atacccgcac tctctctgca gatgagcgtc 16860 + ggctcaaaac ctccatcagc gaaacaactg cgcacgttaa tcgacaacgt gaggcactgg 16920 + cgcgcgtcag tgcgcagcag gcgaaattaa gccgggtgaa agagcgatat aaatcaggca 16980 + aggagcttgc cggtaacatg gccgcagcag gcgctgcggg gtcggtatcg cgacacggaa 17040 + cgatggccgg ggttaaatta ctgatgcccg gttatgactt tacgcagaaa aattccgagc 17100 + tgcaggctgt gctcggggtc gataagcagt cgccagaaat gcaggcgtta cgcaaacagg 17160 + cgcgccacgt cggcgacaat actgcagcct ctgcagatga tgcagcaagc gcgcaaatca 17220 + tcattgcgaa aagcggcggt gatgcagctg ccattcaggc gcgacgccga gtcacgctga 17280 + atatggcgct gtcaaaccgg cgcacgatgg aggaaaacgc agcgctgctg accgggatga 17340 + aatcagcgtt tcagctttca aacgacaaga ttgcgcacat tggcgacgtt ctctcgatga 17400 + cgatgaacaa aaccgccgcc gattttgacg gactgagcga cgcgctgacc tatgccgcac 17460 + cggtggcaaa aaatgccggg gtgagcatcg agcaaaccgc cgcaatggtc ggtgcactgc 17520 + acgatgccaa aatcaccggg tcaatggcgg gcacgggtag ccgcgccatt ctcagccgcc 17580 + tgcagctccc accggaaaaa gcgtttgagg ccattaagga gctcggcgtc aaaacgtcag 17640 + acagcaaggg gaacacgcgc ccgatattct ccatcctgaa agaaatgcag cgcagctttg 17700 + agaaaaacaa cctcgggaca agccagcgcg gcgagtatat gaaaaccatt ttcggcgagg 17760 + aggccagctc ggcggcggcg gtactgatgg aagccgcctc aagcggcaaa cttgaccggc 17820 + tcaccgctgc gtttaaagcc tcggacggta aaaccgagga actggttaag gttatgcagg 17880 + ataacctcgg cggcgacttt aaagagttcc agtctgctta tgaggcagtc ggtactgacc 17940 + tttttgacca gcaagagggc tcgctgcgta aactcaccca aaccgccacg caatacgtgt 18000 + taaagctcga cggctggatc cagaagaaca aagggctggc gacaaccatt ggcatcatcg 18060 + ccggtggcgc tctagctctg attggtatca tcggcggtat tggcctcgtt gcgtggccgg 18120 + ttgttatggg gattaacgcc attatcgctg ctgctggcgt gctgggtacg gtctttactg 18180 + ttaccggtag tgccattgtg accgcacttg gcgcgattac ctggccgatt gtcgcagtgg 18240 + gggcggctat tgtggctggt gcgttactca tccgtaaata ttgggagccc atcagcgcat 18300 + ttttctcggg ggtgattgag ggcatcatga gtgcctttgc accggtcgca gaaatgttcg 18360 + ctccactggc acccattttt gacggtctcg gtgagaaact gcgcggcgtc tggcagtggt 18420 + ttaaagacct gatagcaccg gtcaaagcca cgcaggaaac gctcgatagc tgcaaaaatg 18480 + tcggcgtcat atttggtcag gcgctggcct ctgctttgat gcgtccgctc aatgtattta 18540 + acaagttgcg cagcggtgtc gactggcttc tcgaaaagct cggtatcatc aacaaagagt 18600 + cagacaacct cgaccagact gccgccaaaa ccaacgccgc cacgcagggt aattcctaca 18660 + tcccggcaac cagcacatat ggcggctatc aagcttacca gccagttacc gcaccggcgg 18720 + gacgctctta cattgaccag agtaaaagcg aatacaaaat cactctgccg ggaggtgctg 18780 + cgccggggca tcagcttgac agacagctac gcgacacgct cgaacagatt gagcgcgaaa 18840 + agcgtgcgcg tcagcgtgcc agtatgagcc atgactgaga ggaataaacg atgatgcttg 18900 + cgcttggaat gtttgtgttt gaacgtcgca ccctgcctta tcagtcgatg cagcactcga 18960 + aggattaccg ctgggcgtct aatgaccggg tgggtaagcc gcctgcttat cagtttctcg 19020 + gcgaggggga aacgtcgata cagcttgccg gtacactgta cccagccatc accggcggct 19080 + ggatctcact aaaggctgta gaggtaatgg ctaacgaggg cagagcgtgg ccgttgattg 19140 + agggaactgg aaacatttta gggatgtata tcgtcgataa ggtgtcgacc acgcacgccg 19200 + agtttttcag cgacggcgct gccagaaaga ttgatttcac cctttcgctt aaacgggtcg 19260 + acgaatcact gacggcaatg tttggcgacc tgaataagca ggccagcgag cttctaggct 19320 + ctgccggaaa tctgactgat aagctgcaga gtgcgctcgg aggactgacc gcatgattac 19380 + gggcatgact attgacgccg gaactagcct tgcaccggca tttatgttaa cgctgaacag 19440 + ccaggacatt accagcaatt ttagtgaccg gctgatttct ctcaccatga cagacaaccg 19500 + gggctttgag gctgaccagc tcgacattga gctcgacgac accgacggca aagtcgaatt 19560 + accactgcgc ggggcggtgc tgacgttgtg gcttggctgg cagggttcgg cgcttctgaa 19620 + taagggcgat ttcacggtcg atgagattga gcaccggggc gcgcctgata tcctgaccat 19680 + ccgcgcgcgt agtgcagact ttcgcggaac gctcaattca cggcgtgaag aatcatggca 19740 + cgatactacc atcggtgagt tggtcagcac cattgcaaag cgcaataaac tgacggccag 19800 + tgtcgcggat tcactgaaaa aaattccggt accgcatatc gaccagtcgc aggagtccga 19860 + cgccgtattt ctgacccgac tggctgaccg caatggggcg acggtgtcag tgaaagcggg 19920 + gaaactcctg tttctgaaag ccggtagtgc gatgacggcc agcggcaagc ccgtcccgca 19980 + aatgacacta actcgcaacg atggtgaccg tcatcagttt gctattgccg accgtggggc 20040 + ttacaccggc gtaaccgcaa aatggttgca caccaaagac ccgaagccgc aaaagcagaa 20100 + agtaacactg aaacgcaagc caaaagagaa gcacctgcgc gcactggagc acccgaaagc 20160 + aaagccagtc agcaaaaaga caaaggccaa aaaagagccg gaagcgcgcg agggtgagta 20220 + tatggccggt gaggccgata acgtgctggc gctgacgacg gtctacgctt ctaaggcgca 20280 + ggcgatgcgt gccgctcagg ctaagtggga taagctgcag cgaggcgttg cggagttttc 20340 + aattacgctg gcgcttggta gggctgattt attccctgag acaccggtgc gcgtatcagg 20400 + ctttaagcgc gtcatagatg agcaggcatg gttaatcagt aaggtaactc acaatctgaa 20460 + taatagcggc ttcacgacgg gcttagagct tgaggttaaa ctctctgatg tggagtacaa 20520 + cgcggaatcg gatgatgaat aaaatgtatt cacaaaaagt gaatttatga ttatcattta 20580 + ttcacgaatt gagaataaag ggtgggttat gtttcattgt ccgaagtgcc atcatgccgc 20640 + acatgcgcga acaagccgct atctaaccga aaacacgaaa gaacgctacc accagtgcca 20700 + gaacatcaac tgtagttgta cgtttatgac aatggaaacg atagagcgct ttattgttac 20760 + tccgggagcc attgacccgg caccgcctca cccgactgtc ggtggtcagc ggccattgtg 20820 + gctctgataa atttccgcta aatgcccgcc gcgtgcgggt ttttttatgc actcaggaaa 20880 + gtggcggtaa aaaatccacc gccattctat cgccactcga aaacgaggca acaaaaaggc 20940 + cactcgagag agtggcctaa ctgtatgtat ttactactta aatttggtgg cccctgctgg 21000 + acttgaacca gcgaccaagc gattatgagt tcctacaaga acaaccgaaa atcaatagta 21060 + tgcgttattt atcattgaca tagattgcca ttgtttgcca ataattacct attattcgcc 21120 + atttctaccg ccactttatc gccattctat tatctgttac tcagaaccat cgccgacata 21180 + ggttccatca ggtgcgagat gatatcttcc accaacataa gtcccatctg gggcaagtgt 21240 + tgggcggcca gcaacataac ttccatttgg cgctaagcgt ggaacgccac cgacataagt 21300 + tccatcgggt gcaaggcgtg gtgctcctcc tccaacataa gtcccattag gggcaagcat 21360 + aggttgtccg taaacatagg taccatcagg tgctaatcga actgacatac aacctccata 21420 + acttatttgc tgttagtaat gtgaactaaa ggatttagtt taactgcatc ctctaaatgg 21480 + tcgggtgcaa agtgcgcata tcgcatggtc atttttatat ctgtatggcc gagtacgcgc 21540 + tgcaacacca aaatattacc gccattcatc ataaagtgac tagcgaaggt gtgacgtaaa 21600 + acgtgggtaa gttgtcctgc cggtagttcg atacctgttc tttccaaagc tgaccggaac 21660 + gcgccataac aatcactgaa caaccggccc tttttatcat caggcagaga ctcatagagc 21720 + tctttgctga ttgggacggt gcgatttttt ctacctttcg tgttggtgta tgtgattttg 21780 + tatttcgcga gttggctttt tctcagactc tcggcctcag accaccgtgc gccagttgcg 21840 + agacagattc ttaccacggt ttctaaatca gggtggtcat gtcggttaca ctctccgagc 21900 + agttgcgaaa tttggtcgtg agttagccaa gtcatttcca tttcttctgt gcggaatggg 21960 + cgcatatttt ttagtgggtt ttcacccttc cattctccga ggcggtttag ctcattgaac 22020 + accgcccgga agtaggccag ctcaagatta agcgtgcgag gcgatacctc tttcactctg 22080 + tttgaacggg catactcacc ttttaaccgt ttttctcggt agcgggaaaa catctgcgca 22140 + tcgaaatcgc gtgcgagtgg ttcgcccata cactcaaaag catggtgcat ggctaactgg 22200 + cgtttcaaac catctttcag tgtaatgcca tgagcgctat accatgaatc aaccagctct 22260 + tttaacgtgc gcctgtcttc cttttcttcc tgccacgggt tttgaacggt gtactgctca 22320 + aacgccagag cctcgccttt agtagcgaat ttctttctga tacgtttgcc ttttgcaccg 22380 + tttgggtaga gttcacaaat ccaaccgcca gccggatttt tacggacggt cattagttaa 22440 + cctcgctgta tacacccacc acacgcccca acgttttaat atcatcaatg ccgcattcga 22500 + aaggaacctt cccgcctgca acatgtagtt ttctacccgg tagttttgtt aactctcgaa 22560 + tgcttattgc tccctcaatg tcgactagcc ataagccgtc agacaatgat gcttgcttgt 22620 + ccacaaaata aattttcccc tcggaacgga tagccatccc atctgtgagc ggttttgtga 22680 + aaaattgggc atcaacactc aattgtttat cggatttgag gatttcttca cttaatgtga 22740 + atccctcaat cctttttgcg tcgctcgatt ctctgttatt tacaaatgct tctccttctc 22800 + cggtaagtaa ccactggaga ttagcacctg tttcaagggc acagtgagcc gcaaagtcat 22860 + aggagatagc gcctcgggtg tacctgtttg acaatgagct ggacgcgata tcgaagtggt 22920 + tagctaattg aattttctgc gaaaatccgt acgcctcgca gatgcggtca agtacatcca 22980 + cgttgctcca tcctaaagaa tctattctca tttcgataaa acctatttac tatctctcaa 23040 + ttgggagata tattttggct aaacccacgc aattgatggc aagtgttggc aaacagagtc 23100 + aaatcaattg caaactttgg ctaataggga atcatgcaat atggcttctg aaatcgcaat 23160 + catcaaagtg cctgcaccta tcgttactct gcaacaattc gcagagcttg agggtgtttc 23220 + tgaacgcacc gcctaccgct ggacaaccgg cgacaaccct tgtgtaccaa tcgaaccccg 23280 + cacaatccgt aaaggctgca agaaagcagg tggcccgatt cgcatttatt acgcacgctg 23340 + gaaagaagag cagttgcgta aggcgttggg acattcccgt tttcaactcg tcatcggtgc 23400 + ttaattcact ttatgtgaat tgtaaggatg caacatgttt gattttcagg tttccaaaca 23460 + tccccactat gacgaagcgt gccgggcttt tgcgcagcgt cacaacatgg cgaagctggc 23520 + cgagcgtgcg ggtatgaatg ttcaaacgtt acgtaacaag ctcaacccag aacagcctca 23580 + ccagttcacg ccgcctgaat tgtggctgct gactgacctg accgaagact caaccctcgt 23640 + tgatggtttt ctggcgcaga ttcattgtct gccatgcgtg ccggttaatg agctggctaa 23700 + agataaattg cagtcttacg tcatgcgcgc aatgagtgaa ctcggtgaac tggcgagcgg 23760 + tgcggtatct gatgagcgtc tgaccactgc ccgtaagcac aacatgattg aaagcgttaa 23820 + ctccggcatt cgcatgttgt cattgtcggc tctggcgctg catgcacgtc tgcagactaa 23880 + tcccgctatg tcgagcgtgg tcgataccat gagcggtatt ggcgcatcgt ttggtctgat 23940 + ttgaggtgcg tatgctgaaa agtgaaccgt catttgcgtc tctgctcgtt aagcaaagcc 24000 + ccggtatgca ttacggccac ggctggatcg caggtaagga cggcaagcgc tggcacccgt 24060 + gccgctcaca gtccgaatta ttaaaagggc tgaaaacaaa gtcgccgaaa tcgtcaggtt 24120 + ttttaattat tcgtattgtc cactttgtaa ttaaaggagt gaaacatgtc acgcgatgaa 24180 + ttaagaattg ttttgggtgc catgattcca aatatggagg aaggttttga aattaaaacc 24240 + cgcgacggcg caatacttcg cgttgaccct gagtgggagt gctgcaaaga atttaaggat 24300 + ggattaaaag ccgaaatcat caagcagtta aaaagcaaac ctgctgttgt atttggatat 24360 + agttaattaa ttaaacgtaa ttacttggcg taaacccgcc gggcattctt ttgccaaaaa 24420 + acaggaggat atatgagtcg aactatttat ttatcaacgc cgagtggtgc tggcgaccac 24480 + ttgctggagt ctttgtttaa agaagccaaa aaagaagagc gcaaagaccg ccgtctcgcc 24540 + gtttcaatcc gtctcgaaga tctggccgtt cacattacca attcagatat gacaggcaaa 24600 + gaagcggccg agctactgcg ccgcgaagcc actcgctttg agaacgaatc acaggagctt 24660 + cactaatggc cgacgcaatg gatttagcac aactgcgcga gcaggaagac cgcgaacgcc 24720 + acataagcaa cgcgcgcagc cgtcgccatg aggtttctgc atttatctgt gaggaatgcg 24780 + atgcacctat cccggaagcg cgccgccgag ccataccggg cgtgcagtgc tgcgttacct 24840 + gtcaggaaat cttagagctg aaaagtaaac attataacgg aggtgcttta tgagcattac 24900 + caatgcaact attagccagc gtgcaaaaaa atggcttgaa gatgaccgta tatttattga 24960 + caccgaaact acgggtttgg gtgatgatgc ggaaatagta gaaatctgtt taatagatag 25020 + cgctggtttt atcatgctaa atacattggt taaaccaact aaaccaattc cagcagaggc 25080 + tacggccatt catggaataa ctgatgaaat ggttatgtat gcgccaacgt ggaaagatat 25140 + tcacggcgca gtagcttctt tattttttga gtatggcttt gttatttata acgccgatta 25200 + cgacacaaga cttatatatc aaactgcgaa attatatggg cttgagaatg acggcttttg 25260 + ttatttttta aatgagcgtt cggcctgcgc catgatgcta tatgcagagt atcgcggcga 25320 + gccagggcga tttaaaggtt ataaatggca caaattagtt gatgccgctg cacatgaagg 25380 + ggttagcgtt gaaggaaagg cacaccgtgc attagcagat tgccggatga ctcttggcat 25440 + tatcgacgct ttggcaaaag gcggtgcagc atgagtatcc gtatcgaaat aggtgataaa 25500 + tgggtaatca ccagcgacca atatcaattc atcctgaatg aaaaaaaagt cgttaagacc 25560 + ggcaataaag ctggcgagga atggctcgac accatcggtt attacccgaa gattaatcag 25620 + ctcatttctg gtctggtaca tcaccacatt catacggcaa tgattatttc ccttagtgca 25680 + atggcagagg aaatagagaa gttatctttt atctgtgaag aagcatttaa ggcggttaaa 25740 + aaatgattga ttcccgctgc tttgctgaaa gcacaataaa tattgtttct gtttctggtg 25800 + gaaaggacag ccttgctcaa tggattcttg cggtagagaa cgacgtaccg cgcaccactg 25860 + tttttgcaga taccgggcat gagcattccc aaacaatgga gtatctggat tatcttgaat 25920 + ccagactcgg cccggttatt cgagtgaaag ccgattttac tcggcggatt gaaggcaaac 25980 + ggaaattcat tgctgaaaaa tggcctgtct ctctcgttga agaatgcgga atgtctcatg 26040 + agcaggctgc agaacgaatc gcaaaggcac tggaaatcct taagccaacc ggtaatccgt 26100 + ttctcgattt gtgcatgtgg aaaggacggt tcccgagcac gaaagcaagg ttttgttcac 26160 + tggaactgaa acatgactca gtacgggaca agattgtact cccagcgctg gagaaatatg 26220 + acgaagtaat tctatggcag ggtgttcgtg ctcaggagtc accagcccgc gctgcgttac 26280 + ctatgtggga ggaggatgca gataataccc ccggtttgca tgtgtatcgc ccaattctta 26340 + actggacaca tgaagacgta tttgccttag ctaaacgaca cggaattaaa ccgaacccac 26400 + tctatcagca aggttgtagc agagttggct gcatgccatg tattcatgca agaaaatctg 26460 + agctggcaga gatttttgct cgctggccgg aggagattgc gcgcgttgca gagtgggaac 26520 + gtcttgttgc tgcctgttca cgtcggggaa actcaacatt tttcccttcg actcacgacc 26580 + cgcggcgagc agaaaaacgt attgaagttg ttaccgtaga agaatatggg atagcttcat 26640 + atcgtgactg ggcgatgact acgcgtggcg gttctcagta cgatttgctc gctgctacaa 26700 + acgacaaaac tgtgtgcagt agcgtttatg ccggtgtatg tgaatgacgg gtgtcgttta 26760 + cgcgtttccg tggaatgccc cacggtcggc aatagccagc tcatatctta cctatgacca 26820 + acagcatcgc cgcgaccgta tgttcgcggc tttgctgcat gcgagaaagg tgctttttct 26880 + ccagccagaa tgtgtgcgct ttgacgttta tcgcaccgct gcagttctgg agcaaaatca 26940 + gggcagtcaa cgagccaatg cctttttaat cagcttctgc aaaaaggcat taccacgtct 27000 + tgaactggtc gcaaaaaaat acgagtgctc gggcatcaac agcaatgtat cagccgctgt 27060 + tttcgatggt cattttgata cccagcttat gcaatatctg gcgtcacgca tggtcaatat 27120 + ggtcgccaga tttaaccgcc tcccggatat gtcgcgcgcc gatattgacc tgctggccgc 27180 + ggatatcgct aattttattc gcgctgaact ggccgacatt gatgacaccg gatttagcga 27240 + actcaaaacg ctgtacactt ggtacatgcg cgccggtttt atttccctgc aattcaacgt 27300 + tacaccgccg aaatgggagc gtgtgactaa aaaatatttt tgtgaggatg aaatcgcacc 27360 + ggcagtaatg cgcatgttta atgaggtttg gtggcgcggc cgcttgcgac gcattgcggc 27420 + tgcatggcgc gaacatctgc aaattgcagt cggcaacgta agcaagaaac gacacgcata 27480 + cgcgagtaaa aactgcgtca ccgactggcg cgagcagaag cgccgcacgc gcgaatttct 27540 + caaggggctg gatctcgaag acgaagaagg caaccgcatc agtctgattg aaaaatacga 27600 + cggctcggtc gctaatccag caatacgccg ctgtgagctg atggcccgca ttcgtgggtt 27660 + tgaaaatatc tgtaatgagc tcggttatgt cggggagttc tatactctga ctgcaccgtc 27720 + taaatatcac gccaccacca aagcgggcta ccgtaacagc aaatggaacg gtgcaagccc 27780 + gtcagacacg cagagctatc tcacaggcct ttgggcacgc atacgcgcca agctgcaccg 27840 + ggaagaaatc cgcattttcg gaatacgcgt cgctgaaccg catcacgatg gaacgccgca 27900 + ctggcatatg cttatgttca tgttgccgga agatgtcgag cgtgtgcgac tcatcatccg 27960 + agattatgcg tgggaggaag accactacga actgagaagc gataaagcca aaaaggcgcg 28020 + cttccatgct gaggccattg acccggaaaa aggcagtgct actggctatg tcgctaaata 28080 + catttccaaa aatatcgacg gttatgctct cgatggtgaa accgatgacg aaagtggtga 28140 + gttgttaaaa gagactgcac ccgccgtttc agcatgggcg gcgcgctggc acatccgtca 28200 + gtttcaattt atcggcggtg cgccggtgac ggtatacagg gagctacgca gaatggctga 28260 + ccctgaaaca gccagggcgc tcagtgttga attcgccgca gtgcatgatg ctgctcacta 28320 + tggacgctgg gctgattatg tgaatgctca aggcggacca ttcgttcgcc gtgacgattt 28380 + acaggtacgt acattgtatg aacctcgaac tgaatttaat cagtatggcg aagaaactgt 28440 + gtgcatcaaa ggtgtctacg atgcctcgat aggtgctggc tctcctattc taacccggtt 28500 + aacgcagtgg aagattgttc caaagcgtgc cgttgatttg gccgttgacg ttaagggcgc 28560 + ttctgcgccc tctcggagtt ctgtcaataa ctgtacggga agcgaaagcg atccaccgat 28620 + actcgattta acaaaaccgc tgagtcggcg tgaaagacga gagttgacga accgactcag 28680 + gaagaaaaag ccaacaacac ggcgaaaatt catccacgga acggataagc aaaacgtcgc 28740 + tataacgaaa actatcgacg agatacactc tgacaaccgg catcacaatc agccggggcg 28800 + aagccctgca cctgatggcc ggtggtaaaa gttgttttaa cggtcgatgg gtgcgcggaa 28860 + cgtcaaaagg tgaaatcttt gctgcagctc cttcacatca ggcgagacgc ggaaaatcct 28920 + taatcgtgtt gcagatttag ctgagctggc aacgaaaatg taaccgctaa tattcatcca 28980 + tatcatgtac atacagtgta tttaactgtg atttttttct tcacaccttt tgccaatacg 29040 + tgctactgta tgtttataca gtatctcgta gtggaggttg tgtggataga gagctaaatg 29100 + agcacgttat gattgagcgg gtcgaaatga ttgcgcgtct gactgctgaa ggtacttgtc 29160 + aggaaagaga ccgtgaaatc gcattgaatc taattgcgga aatagcaaga ggcaacctaa 29220 + tgaaaaataa taatttttct gttgtttttt ccgcaccgcc tgttggtgaa acatttgcaa 29280 + aggagggcaa agtgaaagta aatatcacgt tggataaaga ccaaaaaatc ggccagccgg 29340 + taattgatgc ttttcagtgc gaattgacca agcgaataca gtccgttttc ccgtcaacgc 29400 + gcgttactgt taaaaaggga tccatgaccg gtgtcgagct gatggggttc gataaagatt 29460 + cagaccgcga agcgctggat agcatccttc aggaagtgtg ggaagatgag agctggcgtt 29520 + aatccctgaa aaatgtgcaa ccatcgaccc catgtttgat agcatggggt tgttttgtat 29580 + gggattacac acaaaggaaa atcatggata ccgtaatagc atttttatct ctggctctct 29640 + ttattgcttt tatcgtcggg ttaatcaagc cgtcgctggt tcgaatgccg agccgtaagc 29700 + gctccagtgc tgtttatctc ggtggctgtc tggcgctggg cgttattggc tcaatcttat 29760 + ggccgactga aaaaactcag ccggtggcaa aaactgacgt accggcggtt aaagcggaac 29820 + cggctacgcc aacgtttgag tacgcagata aaaccctcaa agaatatcgc aacgagccaa 29880 + aagaaacccg gcacgaaatc gttaaagact atgttggatt caaaggtgtg caggccagcg 29940 + ctaccgatgt tttttatgcc tgtatgagcg agtacacttt taccaaagat gatgcgttaa 30000 + agctcagtga tgtgttgggg tggtgtttca acgacttcga gaaagatcca caatctctga 30060 + ataataaaat caaccttgac gaatttcagg gtaattttag cggttgggat ggctcttatc 30120 + gcccgttaga gaagctgata aaagccagta tgaatgatga ttcctcttat aaacatgttt 30180 + caacggtcta ccatctgatt ttgaataaag acccgcatgc cgttgtaaaa acaacgtttc 30240 + gcggcactaa tgcttatggt ggcgtggtca aacagaccgt agcagcacgc gtcaacgtgc 30300 + gaacgggcga ggtcgattca atactcgaca attaaacatg acaaacgccg ccggtgctga 30360 + aactcgcttt cagtgctggc ggggttgaac aacgagcccc gcgaggcgtt agcctacccc 30420 + tgagcaaccg cccaagaccg gtactattaa agccggtttt tttatgccac ttttccacga 30480 + atttcccgtt tttttagccg tgcatgcaac aggtgcattg ttttgcatgc gtcaggcttg 30540 + cccgttctgg ttgtgcgtcg ccagagctgg cgcggctcca gagtggtcat gcaactgcat 30600 + taaaaccgac ccataaagtg ggca 30624 +// diff --git a/etc/b132222.fasta b/etc/b132222.fasta new file mode 100644 index 000000000..03a6c6251 --- /dev/null +++ b/etc/b132222.fasta @@ -0,0 +1,512 @@ +>B132222 U32222 Bacteriophage 186, complete sequence. +ggcgtggcggggaaagcattgcgcgccagaggtggcgcgtgaatgataaaaattatcgtc +tgagcgcctcgtaatggcgctatcgtggtgctgttggttcgttggtggtcgtgtgtgttt +gtgcgcgtgtggcgcgtctgagacgtgatggtggcggggtatgaaaaagccgccatgctg +gcggcttgagagggattattccgggttgtcgagggtgtactctttgaacctgatgacctc +catgccgagccagtcgtttacctccctgaacctgtcctgcagcggcgacaggtcgttacg +cacaaatacctttgccactttctcaacgtcaccgagcgagccgatattctcgggcttgcc +gcccatgagctggaacggtacgcggtgcgcgtccatcaggtcggcggcgctggctttctt +gatgttgaaaaagtcatcctttgtggcgacctcgctcagtggcacgattttaatgccgtc +cggttttccattgggagcgtagaaaaacaggtttttaaaattgccgagccctttcgagtt +gcgcatcgcctcgcgcagcgattcgacgtcggtcgcgctctgcgccgggtcggtcacata +catgatgtaacccgcatgcgcgccgttctggtaatacttgcggcggaacagcgttgcgga +ttcattcagccaggcggaattaagcgcgctgagatattcgggcaggccgtaaatctcctg +attaatgtcgggctccagcaggtgaaacacggtatcaggcgcgaattcatgcggcagagt +gaagttttccacaaaccagaaaaccgaatcgtcgaccccgcggcgggtgtatttggccgg +tgaggccagtagcttgattagctggccggtaacgctgtggcgctgctcaagaaaggcgtt +gccgaataccagatagtcgagcgcaaagcggctgaaatcctgacgggacagcagcgggtg +cgggatgtaggtgctcgcgagcacgttgcgcttaacgtaaatcggtgagctgtgatgtac +agcagagcgcaggctctttgccagcccggagaagctgaccggcggctcgtaccatttgcc +gttactgatgcactcgacataatccagaatgtcgcgcttatcgagtaccggcactggctc +gccaaaggtgaacgcctccattttttgcggggcgctggcggtcatggctacctgtttgcg +tggcttgcgcttgctcatgctgccacctcacccgctgcaacagcgaaagaccagtcgcag +ccaaacagcaggcgataatcatcgtcgctgtattcgtgtttaatttcatcgggcgcaaag +agattgcacccgcgctggcatgctgcatccagagtgaccgactgacgccagacaccatct +gtacaaaatacgctgtcgccggtattgatgagcggtgacggtcggtgcctgcgggttgtg +ccgttccataccctgaaagcgtcataattatcagagggcgaggtaaacatcgtcaggctg +tggcgtttatggcaggcgatacccgccgcgactttcgcagctcttagcgggttattgaac +catccgaactcatcaagatagacattacccgccagtgcggcgcaatgggattcctcgccg +acaaagctgataaccgcaccgtcgtcgagctgcaggctgtggccgttactcgtaagactg +acgccgacgcgcgccgaaaggttactcatgtacatcagcgccacgcgcgcatgctcaata +gtgtgagcaaaccagacatgattatcgcctgttgtcagcgcatcgagcagcgcctcacgg +ctaaagagctgcgttgcgccaatctggcgcgatttggtgatgctgcggtcgatattgagt +ttcccgacacgcaaccatgttgcctgatagtcaaagctgtcattgtgcagaatatcggcc +attgcctgaatctggctttgtgagaaaacgttatttttcattaattaaactccagaatgg +atttaggctgtatgccgctaccggcggaaagcggttcgtttaacagggcgtgcatggtcg +cccatgcaatatcggcgtgactggcttcctcggtgcggctggcctcgtaggtggcgctgc +gcccgctgctggtcatggttttgcggatggacataaacgactgcgtgacgtcggttgctc +cggcgtcgtactccagacagccgcggcgaatggtgtcttttgccttgagtaccattgcgg +ttttcatttcaggcgtgtaacggatgccgcgtgcggccgggtagaatgagcgcaccaact +ggaacacgccgaggccgaggccggttgcgtcaatgccgatgtattcgacgctgtatttct +cggtcagtttgcggatgccatctgcctgcgcggcaaagtccatgcccttccactggtggc +gctccagcatgcggaacttgccaccagaaaccaccggcggcgcgagcacgacgcacccgg +cgctgtcgccagtgtgtgacgggtcgtagccaatccagacggggcgagagccgaacggat +ggtcggcgaacggggcgaagtcctcccattcttccatcacgtcgaccatgcagcgctgca +gctcctcgaacgggaataccgacgctttatcgtcgacaaactcgcacataaacaggtttt +taaagtcctcatcactgttttcgcgtttgagttggtcgaggtcgaacagggtgcagccac +cggcaagggcgtcctcaatggtgacaatctgccgccactggccatcgtcgcagagctggc +caccggcgagcgcgcggtgactgatgtcaatttcgatgcggtcggcaatacggctgcgcc +ccttgttgaacagctcgccagaccagaagggataagcgccgtgcgccagcgttgagggtg +tcgaaaagtaggttgagcgcagatgcttctgcgaggccatgcccgaggcgactttgcgca +gcttctgaaaattcgggatccagaatatttcatcgacatacaggtcgccgttatggctct +gagccgtgttggagttggtaccgagaaaaatcagctttgcgccgttgttgccaatgacaa +tcgggtcgccggtcaggtcgacgtcaaccagtcgcgcaaactgtatgatgtattcgcgga +acacgtaagcctgcgttttactggccgacagaaaaatctggttatggccggtcttgagtg +ctcgcagcagtgcctcacgggaaaaatagaacgtcgcgccaatctggcgggatttgagaa +tgtcgcgaatacggtgtgccagtcctgcgcggtaccactgcaactggtactcgaaagact +ggtcgaaaaataattcctccagcttttcgatagcctcgtcgctgaaaaaattctttttcg +gcttcttgcgctcacccttgttgcggttggcgacgttggggttaaggtcggcctcgttgc +cggtctggctgtagcggttaacgcgtgccagtcgttcaatctgccgcccgagcaggtcaa +tctctttgaagtcaccgcctgacttttgcggcttggcgatgagctgaatcaggcgcgcct +caaggctgctttcaacgcgggaaatcggtgcgatgccatcccagccgtcgcgctgtttcc +agctctgcacggtcgggcgcttgacctgcagcatttcggcaatctgcggcacggaaaaac +cctgccagtaaagcagcgatgcctgtcgtcgcgggtcatgcaacaaggttgtatcggtgg +aaatggtcattgatgcctcgccgtaatggattcagggcaaggctacttaatggccgtcag +tgattcgctaaggtgctgttgtgtgggcggttgtccagtcgtcattggtggtctggcgtg +tcctgagtctggaaactggcggtgaccagtaaccccaacctcaggactcctgacaatggc +aaaaaaagtctcaaaattctttcgaatcggcgtcgagggtgatacctgcgacgggcgcat +tatcagcgccagtgatattcaggaaatggccgaaacctatgacccgcgtgtttacggttg +ccgtatcaaccttgaacacctgcgcggcctgttgcccgatggcatattcaagcgttacgg +cgatgtggtcgagctgaaagccgagaagattgacgacgattctgcgcttaacggcaagtg +ggcgttgttcgctaaaatcaccccgaccgatgaccttatcgcgatgaataaagccgcgca +gaaggtctacacctcaatggaaattcagccgaattttgccaataccggcaaatgctacct +cgtcggccttgctgtcaccgatgacccggcgagcctcggcactgaatatctcgaattctg +ccgcactgcgaagcacaacccgctgcagcgctttaaagcccaccctgaaaacgtcttttc +cgccgccacgctggccgaactggaatttgaagacgttcccgacacggtgctcaacagcct +ggccgataaggtgaaagccattttcagccgtaagcaggtcagcgacgatgcgcgcctgaa +tgatgtacatgaagcggtgaccgccgtcagcgagcatgtgcagaccaacctcactgcaca +ggataagcgtctttccgatatggaaaccgcgtttgccaccttcaaacaggaactgaccgg +caaggttgaagaaaccagccaggcattttccgtcctgaaaaccactctcgacaaaaccga +aagtttcagccagccgcgacgcacgaaagccagcggcggtggtggcgatgagctgctgac +tgactgctgataaaccgcagaccgaaaccgggcggaacccccgcccgatgctgtgactaa +ccgattaaatcaaacaggaaatactatgcgtcaggaaacccgttttaagttcaatgccta +tctgacccagctcgccaaactgaacggcatcagcgttgatgacgtcagcaaaaaattcac +cgtcgagccgtccgtcacgcaaacgctgatgaacaccgtgcaggcgtcatccgcgtttct +gcagatgattaacattctgccggtcgcagaaatgaagggtgagaaaatcggtgtcggtgt +gaccggcaccatcgccagcacgaccgacacctcgggcgacaaagagcgccagaccgcaga +ttttaccgcgcttgagtccaacaagtacgagtgcaaccagattaactttgacttccacct +gacctataaacgcctcgacctgtgggcgcgttttcaggactttcagcgtcgtattcgcga +cgccattgtccagcgtcaggcactggatttcatcatggccgggtttaacggtaccacccg +cgctgacacctctgaccgtgttaaaaacccgatgctgcaggatgtggccgttggctggct +gcagaaataccgcaatgaagccccggcgcgtgtgatgagcaacatcaccgacgctgacgg +taaagtcgtttcggcagtgattcgcgtcggtaaaaacggcgactatgagaacctcgacgc +actggtgatggatggtaccaataccctgattgacgagatttatcaggatgacccgaaact +cgttgccatcgttggccgtaagctgctggccgacaaatattttccgctggtcaacaaaca +gcaggaaaacaccgagtcgctcgcggcggatatcatcatcagccagaagcgcatcggcaa +cctgccagccgtacgtgtgccgtacttcccggcgaacgcggtgttcgtgaccacgctgga +aaacctctctatctatttcatggatgagagccaccgccgcagcattgatgaaaacccgaa +aaaagaccgcgtggaaaactacgagtcgatgaacatcgactatgtggtcgaggcgtatgc +cgccgggtgcctgctggaaaacatcaccctgggcgatttcaccgcacctgcagcaccgga +aggcggagagtaaacccatgacgagccccgcacagcgtcacatgatgcgggtctcggcct +ctcaagccgcgcagcgggaacaagccccgctgcgccatgcaaccgcctatgagcagatgc +tggttaagctggccgatgaccgccgcacgttaaaaaacatccgttcaaacgaacgtaaag +ccgagaaaaagcgcgagctgctgccgttctatgcgccgtgggtcgccggtgtgctgactg +atggtcgtggtgcgcaggatgacattgttatgaccgtcatgctgtggcgtctcgatgccg +gtgatatcgctggcgcgctggaaattgccccctacgcgctgaagtacggcctcacctctg +accatcgccgcacgacaccttacatgctggtcgaggaagtggcacttgccgcgcagcgcc +tgcgcgatgccggtgagtctgtcgacctttcctggctgcaggccactatcgacctgaccg +acggcgctgacgttcccgatatggtgcgcgcccgtctgcataaggtgacaggcctgaccc +tgcgtgatgccggtatgaatgcagaggcgctggcgcagtttcagcgcgcgatgcagctcg +accgcaatgccggtgtgcgcaaggagattgagcgactggaacgggcattgaagccaaaga +cagaggccgcgccccgtaaaacgactaaaccgcgcacgcgtaaacctgccaccaaaccgg +cagcaaagcgcgggcgtccaccaaaggcggcaaaaaccgccggttaactgaacgctcccc +gagccgggcggcacgccggtcaaagcaggcaaagacctgacggcgaccggcgtccaccgc +ccaacctgatgaggttgtcatgacgacagtgatactgaaccagcccgacgaaccgcagga +cgtaccgggcgtggtgattcccgcaccggagacgggcggtgcagtgattaaaaacacgtt +ctttttccctgatgtggatccgaagcgcgtgcgcgaactgatgcgccttgagcagacggt +ttccgatgcgcgcctgcgcaatgccatcaagaccggcatggccgagaccaatgcggagct +ttacgactaccggctgcgccagactgccgccgggtttaagcaactggccgacgtgcctgc +cgaggaaatcgacggcgagaatgtacgtgttttccactatctgagtgctgtgacggcaat +ggcaaccgccaccctgtatgagcgctatcgcggcgttgaggccaccggcaaaggtgacaa +aaaagccgacagcgtggaaaccaccattgatgacctgtggcgggatatgcgctggtcagt +tgcgcgtctgcaggacaagccgcgctgcattgtggggcagctctgatgaaagtcaggtcg +atgcagggcgataccctcgacacgatttgcgccaggtattacgggcgcactgagggcgtg +gttgagacggtgctgcaggctaatccgggtctgtctgagctgggtgtcattctgccgaat +ggtacagagattgacctgcccgatgtggcatcgtcacccgtaactaaaactatcaacctt +tgggagtaaccatgacagaaggtgaaaaaggcgtcctgtcactgtttgtgattggcgtga +tgattgttgttgggaaagtgctggcaggcggtgaacccatcaccccgcgtctgtttattg +gccgcatgctgctcggtggttttgtttcaatggtcgccggtgttgttctggtgcagtttc +ctgacatgtcactgcccgccgtgtgcgggattggatccatgctcggtattgccggttatc +aggtggttgaaatcgccatacagcgccgctttaagtcacaaaagggggaaagtgatgccg +gtcattaacactcaccagaatatcgctgcgtttctggacatgctggcgtattccgaagga +acagcgaaccatccgctgacgaaaaatcgtggctacgacgtcattgtcactggccttgat +ggcagaccagagattttcaccgattacagcgaccaccctttcgcgcatggccgaccaccg +aaagtgtttaatcgccgtggcgagaaatccacagcctcgggacgttaccagcagctttat +ctgttctggccgcactatcagaaacagctcgcattgcctgatttcagcccactgtcgcag +gataagctcgcgatccagttaatccgggagcgcggtgctcttgacgatatccgggcgggg +cgtattgagcgtgctgtttcacgttgtcgcaatatctgggcgtcattaccgggggccggt +tacggccagcgcgagcacggtctcgaaaagctggtcaccatctggcgcacggctggcggg +gtggtggcatgaaagtcctgataacgctgcttgtgatggccgtgctcgggttgctgtggc +tgcaccatgagaacggcaatttatcccgctcatttgagacggcaaaccgcgtcgcgagcg +agcaaaagacgacgattgggatgctgaaaaatcagctcagtgttgccggtcagctcgccc +gacgtaatgaatccgcgcaggtgacactgcgcgaacagctcgcaaaggcaagtgcagaag +ccagccgccgtgagcagacgataacgaggttacttaatgaaaatgaagcctttcgccgct +ggtataacgctgctctgcctgatgctgtgcgtcggctgcacacccgaacagcctgcgcca +gtgccggtgattgtggtcaacggatgcccgagggtgagcctttgccctatgccgggaagt +gacccgaaaaccaatggtgacctgagcgcagatatccgccgtcttgagggggcgctgact +gcctgcgcgctgcaggtcaaaaccgtcaaacactgtcaggatgaactcgatgcagaagca +caaaagcctgcgcaaagcgctgattaacgccgtgccgcagctccgaaataaccccgatat +gctgcgcctttttgccgacaacggccacaccgattcccgactggcgagctcgctgtcgtt +tgaaaaggtgtatgtgcttaacgtggtggtgaccgactttactggcgacctcgatttgat +attcgtgccggtgcaggcatggctgcgtgaacatcagccggacattatgaccaccgacga +cgggcgggaaaaaggattcacctggattattgatatcaataacgacgattcgctcgatat +cagtatcagcctgaggctcaccgagcgcacgctcgtcaaagaggtcgggggcgcgctgca +tgtcagttatgcaccagaaccgccactgcctgagctggtgaagcgcccggttgctatgta +tgcaaacggtgaattagtgagccagtgggatgagtgaattaaccgcgctgcaggagcgcc +tcgccggtctgattgccagcctgtcaccggcggcacgtcgcaaaatggcggctgagattg +cgaaaaagctgcgtaccagtcagcagcagcgcatcaagcgccagcaggcacccgacggca +ccccgtatgccgcacgaaagcgccagccggtacggagcaagaaaggccgcattaagcgcg +aaatgttcgccaaactgcgcaccagtcgctttatgaaagccaaaggcagcgatagtgcgg +cggtggtggagtttaccggcaaggtgcagcgcatggcgcgggtgcatcagtacggcctca +aagaccgcccaaaccgcaacagccgggatgtgcagtacgaggcgcgcccgttgctcggtt +tcacccgcgacgatgagcaaatgattgaagacgtcattatcagccacctcggcaaataaa +tattgtgtgaaccaccaccggaggcgcgtgatttggcgcggctaaagaccagaggcattc +tttgcactatgaatacgttatccacgatacaggagctcgcgcgtgcgattcgtaacctca +tccgctcaggtgtggtgacggaggtcgataccgtgcaggggctgtgccgcgtacaaagcg +gcgggatccagacgacatggctgaactggctgaccacccgcgccggtcgttcgcgcacat +ggtgggctccctcgctcggtgagcaggtgctgctgctggcaatcggtggcgagcttgata +ccgctttcgtgctgccggggattttctccgacgataaccccgctccgtctgcctcggcgg +atgcgtggcatgtggtttttcctgatggcgcggtcattgagtacgagccggagaccagtg +cactgacggtcagaggcatcaaaactgctgacgtgaccgcgtcggaatccatcacggcca +ctgtgcctgtggtgctggtgaaagcagaaacccgcatcaccctcgacaccccggaggtgg +tatgcaccaacaaactgacgacggcaacgcttgaggtgcagaaaggcggggagatgagag +gcgacattgtccacaacggcggcacatttaaatcaaacggtgtgcagctcgacgaccacg +gtcacggtggtgtgcaaagaggcggtgcctggacggaggacaccaaatgacggcgcgcta +tatggggatgaaccgcaacaccggtctcggtatcagtgacactgaacacatcagccagag +catgcgcgacattctgctgacgccggtcggctcgcgggtgatgcgtcgtgaatatggctc +gctcctgtctgcgctgattgatatgccgcaaaacccggcgctcaggctgcaaatcatggt +ggcgtgctattcggccatccagaagtgggagccgcgtatcaggcttacatccatcagctt +tgagactggtgatgctggcgagatgtatgtcgatattaccgggatgcgtaccgatacggg +tgcgtcagtttcaaccactgtttcactgagttaaatcactatggcaactgttgacctgag +cctgttacccgttcccgatgtggttgaggaactggattttgaaaccatccttgcggaacg +cattgcgacgctaatttcgctataccccgaagaccagcaggaagctgtagcccggacgct +cgcacttgagtctgaaccaattgttaaattgctgcaggaaaacgcctaccgtgaggttat +ctggcgtcagcgtgttaatgaagctgctcgcgcaggcatgctggcttatgccagagatag +cgacctcgataatctcggggcgaatttcaatgttgagcgcctggtcgtcaggcctgctga +tgacaccaccatccccccgacccccgctgaaatggagcttgatgccgattttcgtctgcg +tatacagcaggcatttgaagggatgagcgttgcgggatccaccggagcttatgaatttca +tggccgcagtgctgacgggcgtgtcgcagatatttctgttatcagcccttccccagcatg +tgtcacgatatctgtgctttcgcgtgagaataacggtgcggcgtctgatgagcttcagag +catcgtgcgcaatgcgctgaatgctgaggacgtgaggccggttgctgaccgggttacagt +gcagtcagctcagattattgactaccagatacgcgcaacacttttcgtttatccggggcc +ggaaaatgagccgattcgtgcggcggctgaggcgaagctcaaagcttatatcagtgcaca +gcacaggttggggcgggatattcgcctgtcagcaatttatgccgcgttgcatgttgaggg +ggtgcaacgtgtcgaactggctgcacctgtggccgacattgtgcttgataaaacgcaggc +atctttttgcacagactatcagatagtgattggtggctccgatgagtgatgtccgcctgt +tacctgtagggtcatcacctcttgaggtggctgctgccagagcctgcgcagatattgaaa +atacacctgttccgttacgccgcctgtggagtcctgacacctgtcctgcaaatcttttgc +cgtggctggcgtgggcgttttccgttgaccgctgggatgagaactggccggaaaaaacaa +agcgcgatgttattcgcagcgcgtatttcactcactgccacaaaggcacgataggcgctg +tcaggcgagttattgagccgctcggatacataatcaacgttacggaatggtgggagacag +gtgacccggcgggaacgtttcgtcttgatatcggtgtgctggaaagcggtattaccgaag +aaatgtatttagaaatggagcggttgattgctgatgcgaaacctgcgagccgtcatttga +ttggcctgaatattatccaggatattcccggttatatgtatacaggtggtgtgagctgtg +acggcgacattattacagtttaccccggataagtgaggaataatgagcacgaaatttaaa +actattatcaccactgccggagccgaaaaactggcagcggctactgtgccgggtggtaaa +aaagtgaatatcaccgtgatggccgttggtgacggaggcggaaaactgccagtgccggac +gccggtcaggtgcagctcgtgaatgaggtctggcgccatgccctgaataaaatcagccag +gacaaccggaacagcaattacattgtagccgagctggttattccgcccgaggtgggagga +ttctggatgcgcgagttgggtctttatgatgacgagggcactctcattgctgttgccaat +atggcagaaagctacaagccagaacttgccgagggctcaggccgtgcgcagacatgtcgc +atggtcattattgtcagcagtattgcctcagttgaattatccattgattcgacaatggta +atggcgacgcaggaatatgttgatgacaggattgcggaacatgagaagtcacgtcgacat +cctgacgccacactgaaagaaaaaggctttactcaactcagtagcgcaacagacagcgcg +tctgaggtgcttgcggcgacgccgaaagcggttaaagcggcgtatgaccttgctaatgct +aaatataccgctcaggacgcgagcacagcgcaaaaaggcattgtgaggctgagtagtgcg +gcagacagtaccagtgaagctgaggccgcaacaccgaaagctgtcaaaattgcgatggat +aatgcgaatgcgaggctggcaaaagaccggaacggcgctgatattccgaatccgccgttg +tttgtccagaatatcggtttaaaacccacggtcgataaagctgctaatgccgttgataaa +aatggcgacacgatgaacggaaacctgacactcaagggtgattaccggctgagttttatt +atccagaatgaagacggttctattcgtgcttatatcttcaaggacaaaggtggcgacggt +attcgcatcagtaatggcgatgacggcggcggtgattttgtttttggtaaaaatggacag +ttttactgcccggatattatgcatgttggtaatacgattgtatggggtgacggaaatatc +gagggggcgcgatggggcggtttgttgagcgactggttaactgctcaactggttgcccgt +gacaataatattaacttgcgagcaccctatgaatgggttaaccaaaactttgtcaaccgt +gcacagcgcggcgcacaggccagcatgactatggacggcggacttgtagaggctccatgg +ggatgttttcttacgggggggaacggtaacgagggtaatcaggttggagtggctttatac +cgtccattgcagattcttcgcaataatacttgggtaacgatagagaactgaaaatgaaac +tgattaatttgcaacgctacattctgatgaattattttttaggtgatggcattcagtatt +ttatagatgccacaggtaaggactggtataaatcactgcccaaattcacaaagaaataca +gccttgctatcgaaaatgatacgggcgttattcgtagtatcagcgaagatgcatcccggc +tttatcccggtggtttgaccgttgttgatgttgacagtattccggcaggttgtgacattt +tcggcggatgggtatttgacggagagaaagtcattcctcgtgagtacacattggccgaac +agcaacgccagtcagatgaaaagaaaaaaacacttcttgctgaggcggaggcaacaattt +ccacgcttgagcgtgcggtaaggttaggcatggctaccggggaagaaataaggcgactcg +aagcatgggagcgttacagcgtattggtgagcagggttaagcagtcagatgactggccgc +aaaaacctgaataacccggcggcatttgcccgcttctttctcatccattagttgtgccag +acatcatccagccctgacaaatagcccctcacaagaccagccaggacaataacactcgcc +cactaactacggagttaaccggatgagtgattttcaccacggcacgaaggtcatcgaaat +aaatgacggtacgcgtgttatttccacggtcgcaaccgcaatcgtcggcatggtctggac +agccagcgatgcggatgccgagacatttcccctcaacgagccggtactgattaccaatgt +gcagagcgccattgcgaaagccggtaaaaaaggcactctgtcagcttccctgcaggccat +cgccgaccagtcaaagcctgtcaccgttgtcgtgcgcgttgccgaaggtaccggagacga +tgcagaagcgcagaccacgtccaacattatcggcggcacggatgagaacggtaaatacac +cggtatcaaggcgctgctaactgccgaagcggtcaccggcgttaagccgcgcattctcgg +tgtgccgggtctcgatacgcaggaagtcgcaaccgcacttgcatcggtctgtatcagcct +gcgtgcgtttggttacgtcagcgcatggggctgtaagaccatttccgaggcgatggcata +tcgcgagaatttcagccagcgcgagctgatggtcatctggcctgatttcctcgcatggga +taccaccgcgaacgccaccgccacggcatacgccaccgcccgcgcactcggtctgcgtgc +ctacatcgaccagactatcggctggcacaaaacgctgtctaacgttggcgtgcagggcgt +taccggcatcagcgcctcagtcttttgggatttgcaggcatccggcacagatgctgacct +gctcaacgaggccggagtcaccacgctggtgcgcaaggatggtttccgtttttgggggaa +ccgcacatgctctgatgacccgcttttcctgtttgagaactacacccgaaccgcgcaggt +gctggccgacacaatggctgaggcgcacatgtgggcggtcgataagcccatcaccgcatc +gctcatccgtgacattgtcgacggcattaacgccaaattccgcgagctgaaatcaaatgg +ctacatcgtggacggtgaatgctggttcgacgaggaatcgaacgataaggaaaccctcaa +ggccgggaaactgtatatcgactacgactatacaccggttcccccactggaaagcctgac +cctgcgccagcgtatcaccgataaatatctggtgaatctggctgaatcggtcaacagcta +aggagcctgaaacaacatggcactaccccgcaaacttaaatatctgaacatgttcaatga +cggccttagctacatgggcgttgttgaatccgtgacgctgccgaagctgacccgcaagct +cgaaaactatcgcggcggcggtatgaatggcgctgcagcgattgacctcggcctcgacga +tgatgcgcttactgtcgaatggtctgtcggtggcctgcctgatgtggcgctgtgggcgca +gtatgccgcgccgggggctgatgccgtgccgctgcgttttgctggctcttaccagcgtga +cgacactggcgaaatcgttgcggtcgaggtggtcatgcgtggccgtcataaagaaatcga +cggcggcgaaaataagcagggtgaaaatacctcgaccaaactgtcgaccgtttgcaccta +ttaccgcctcacgattgatggtagcgacattatcgaaatcgacaccgtcaacatggtcga +gaaggtgaacggcgtcgaccgtctggaacagcaccgccgcgcaatcgggctgctgtaatt +ccctgaccggtcagcactgctggccggttattacccccattcagagcagagaaaaaatca +tggcaaaagcaccacgcaaaacccctgaatttattgatacggctggcaatgaaattgaca +ccgtaaacccgaatgtcgtgaccctcgacaagccgattaaacgcgccggtcagacaattg +aaaaggtcacgctgattgaaccgaacgcaggcaccctgcgcggcgtcagtctggcggcgg +tggcgcagtccgaggtcgatgcgctgattaaggtgctgccccgcatgacctacccggcac +tcaccacgcaggagctcaccgcaatgaacctgcccgatatgctgtcgctggccgctaagg +tgattggttttttgtcaccggcttcggcggaatagacttcccgcccggcctgtcgaccga +tgacctgatggcggatatcgcagtgatattccactggccgccatcagagctctattccct +gagcctgaccgagctcatcacatggcgcgaaaaggcgctgcagcgtagcggaaaccacaa +tgagtaataacctgaggcttgaggtattgctgaaagcggtcgaccaggcgacccgaccgc +ttaaatccatccagaccgcgagtaaaagcctgtcgggcgatattcgcgacacacaaaaag +ggctgcgtgacctgaatggtcaggcgtcgaaaatcgacggctttcgtaaggcaagcgcgc +aactggccgtaaccagtcaggcgcttgataaggcgaaacgcgaggccggtgagctggccg +tgcagtttaaaaacaccaccaatccgacccgcgcgcaggcgcaggcacttgaagcggcaa +ggcgtgccgcctctgagttgcagacgaaatacaacagcctgagaacgtcggtacagcgcc +agcgctccgagctgatgcaggccggtattaatacccgcactctctctgcagatgagcgtc +ggctcaaaacctccatcagcgaaacaactgcgcacgttaatcgacaacgtgaggcactgg +cgcgcgtcagtgcgcagcaggcgaaattaagccgggtgaaagagcgatataaatcaggca +aggagcttgccggtaacatggccgcagcaggcgctgcggggtcggtatcgcgacacggaa +cgatggccggggttaaattactgatgcccggttatgactttacgcagaaaaattccgagc +tgcaggctgtgctcggggtcgataagcagtcgccagaaatgcaggcgttacgcaaacagg +cgcgccacgtcggcgacaatactgcagcctctgcagatgatgcagcaagcgcgcaaatca +tcattgcgaaaagcggcggtgatgcagctgccattcaggcgcgacgccgagtcacgctga +atatggcgctgtcaaaccggcgcacgatggaggaaaacgcagcgctgctgaccgggatga +aatcagcgtttcagctttcaaacgacaagattgcgcacattggcgacgttctctcgatga +cgatgaacaaaaccgccgccgattttgacggactgagcgacgcgctgacctatgccgcac +cggtggcaaaaaatgccggggtgagcatcgagcaaaccgccgcaatggtcggtgcactgc +acgatgccaaaatcaccgggtcaatggcgggcacgggtagccgcgccattctcagccgcc +tgcagctcccaccggaaaaagcgtttgaggccattaaggagctcggcgtcaaaacgtcag +acagcaaggggaacacgcgcccgatattctccatcctgaaagaaatgcagcgcagctttg +agaaaaacaacctcgggacaagccagcgcggcgagtatatgaaaaccattttcggcgagg +aggccagctcggcggcggcggtactgatggaagccgcctcaagcggcaaacttgaccggc +tcaccgctgcgtttaaagcctcggacggtaaaaccgaggaactggttaaggttatgcagg +ataacctcggcggcgactttaaagagttccagtctgcttatgaggcagtcggtactgacc +tttttgaccagcaagagggctcgctgcgtaaactcacccaaaccgccacgcaatacgtgt +taaagctcgacggctggatccagaagaacaaagggctggcgacaaccattggcatcatcg +ccggtggcgctctagctctgattggtatcatcggcggtattggcctcgttgcgtggccgg +ttgttatggggattaacgccattatcgctgctgctggcgtgctgggtacggtctttactg +ttaccggtagtgccattgtgaccgcacttggcgcgattacctggccgattgtcgcagtgg +gggcggctattgtggctggtgcgttactcatccgtaaatattgggagcccatcagcgcat +ttttctcgggggtgattgagggcatcatgagtgcctttgcaccggtcgcagaaatgttcg +ctccactggcacccatttttgacggtctcggtgagaaactgcgcggcgtctggcagtggt +ttaaagacctgatagcaccggtcaaagccacgcaggaaacgctcgatagctgcaaaaatg +tcggcgtcatatttggtcaggcgctggcctctgctttgatgcgtccgctcaatgtattta +acaagttgcgcagcggtgtcgactggcttctcgaaaagctcggtatcatcaacaaagagt +cagacaacctcgaccagactgccgccaaaaccaacgccgccacgcagggtaattcctaca +tcccggcaaccagcacatatggcggctatcaagcttaccagccagttaccgcaccggcgg +gacgctcttacattgaccagagtaaaagcgaatacaaaatcactctgccgggaggtgctg +cgccggggcatcagcttgacagacagctacgcgacacgctcgaacagattgagcgcgaaa +agcgtgcgcgtcagcgtgccagtatgagccatgactgagaggaataaacgatgatgcttg +cgcttggaatgtttgtgtttgaacgtcgcaccctgccttatcagtcgatgcagcactcga +aggattaccgctgggcgtctaatgaccgggtgggtaagccgcctgcttatcagtttctcg +gcgagggggaaacgtcgatacagcttgccggtacactgtacccagccatcaccggcggct +ggatctcactaaaggctgtagaggtaatggctaacgagggcagagcgtggccgttgattg +agggaactggaaacattttagggatgtatatcgtcgataaggtgtcgaccacgcacgccg +agtttttcagcgacggcgctgccagaaagattgatttcaccctttcgcttaaacgggtcg +acgaatcactgacggcaatgtttggcgacctgaataagcaggccagcgagcttctaggct +ctgccggaaatctgactgataagctgcagagtgcgctcggaggactgaccgcatgattac +gggcatgactattgacgccggaactagccttgcaccggcatttatgttaacgctgaacag +ccaggacattaccagcaattttagtgaccggctgatttctctcaccatgacagacaaccg +gggctttgaggctgaccagctcgacattgagctcgacgacaccgacggcaaagtcgaatt +accactgcgcggggcggtgctgacgttgtggcttggctggcagggttcggcgcttctgaa +taagggcgatttcacggtcgatgagattgagcaccggggcgcgcctgatatcctgaccat +ccgcgcgcgtagtgcagactttcgcggaacgctcaattcacggcgtgaagaatcatggca +cgatactaccatcggtgagttggtcagcaccattgcaaagcgcaataaactgacggccag +tgtcgcggattcactgaaaaaaattccggtaccgcatatcgaccagtcgcaggagtccga +cgccgtatttctgacccgactggctgaccgcaatggggcgacggtgtcagtgaaagcggg +gaaactcctgtttctgaaagccggtagtgcgatgacggccagcggcaagcccgtcccgca +aatgacactaactcgcaacgatggtgaccgtcatcagtttgctattgccgaccgtggggc +ttacaccggcgtaaccgcaaaatggttgcacaccaaagacccgaagccgcaaaagcagaa +agtaacactgaaacgcaagccaaaagagaagcacctgcgcgcactggagcacccgaaagc +aaagccagtcagcaaaaagacaaaggccaaaaaagagccggaagcgcgcgagggtgagta +tatggccggtgaggccgataacgtgctggcgctgacgacggtctacgcttctaaggcgca +ggcgatgcgtgccgctcaggctaagtgggataagctgcagcgaggcgttgcggagttttc +aattacgctggcgcttggtagggctgatttattccctgagacaccggtgcgcgtatcagg +ctttaagcgcgtcatagatgagcaggcatggttaatcagtaaggtaactcacaatctgaa +taatagcggcttcacgacgggcttagagcttgaggttaaactctctgatgtggagtacaa +cgcggaatcggatgatgaataaaatgtattcacaaaaagtgaatttatgattatcattta +ttcacgaattgagaataaagggtgggttatgtttcattgtccgaagtgccatcatgccgc +acatgcgcgaacaagccgctatctaaccgaaaacacgaaagaacgctaccaccagtgcca +gaacatcaactgtagttgtacgtttatgacaatggaaacgatagagcgctttattgttac +tccgggagccattgacccggcaccgcctcacccgactgtcggtggtcagcggccattgtg +gctctgataaatttccgctaaatgcccgccgcgtgcgggtttttttatgcactcaggaaa +gtggcggtaaaaaatccaccgccattctatcgccactcgaaaacgaggcaacaaaaaggc +cactcgagagagtggcctaactgtatgtatttactacttaaatttggtggcccctgctgg +acttgaaccagcgaccaagcgattatgagttcctacaagaacaaccgaaaatcaatagta +tgcgttatttatcattgacatagattgccattgtttgccaataattacctattattcgcc +atttctaccgccactttatcgccattctattatctgttactcagaaccatcgccgacata +ggttccatcaggtgcgagatgatatcttccaccaacataagtcccatctggggcaagtgt +tgggcggccagcaacataacttccatttggcgctaagcgtggaacgccaccgacataagt +tccatcgggtgcaaggcgtggtgctcctcctccaacataagtcccattaggggcaagcat +aggttgtccgtaaacataggtaccatcaggtgctaatcgaactgacatacaacctccata +acttatttgctgttagtaatgtgaactaaaggatttagtttaactgcatcctctaaatgg +tcgggtgcaaagtgcgcatatcgcatggtcatttttatatctgtatggccgagtacgcgc +tgcaacaccaaaatattaccgccattcatcataaagtgactagcgaaggtgtgacgtaaa +acgtgggtaagttgtcctgccggtagttcgatacctgttctttccaaagctgaccggaac +gcgccataacaatcactgaacaaccggccctttttatcatcaggcagagactcatagagc +tctttgctgattgggacggtgcgattttttctacctttcgtgttggtgtatgtgattttg +tatttcgcgagttggctttttctcagactctcggcctcagaccaccgtgcgccagttgcg +agacagattcttaccacggtttctaaatcagggtggtcatgtcggttacactctccgagc +agttgcgaaatttggtcgtgagttagccaagtcatttccatttcttctgtgcggaatggg +cgcatattttttagtgggttttcacccttccattctccgaggcggtttagctcattgaac +accgcccggaagtaggccagctcaagattaagcgtgcgaggcgatacctctttcactctg +tttgaacgggcatactcaccttttaaccgtttttctcggtagcgggaaaacatctgcgca +tcgaaatcgcgtgcgagtggttcgcccatacactcaaaagcatggtgcatggctaactgg +cgtttcaaaccatctttcagtgtaatgccatgagcgctataccatgaatcaaccagctct +tttaacgtgcgcctgtcttccttttcttcctgccacgggttttgaacggtgtactgctca +aacgccagagcctcgcctttagtagcgaatttctttctgatacgtttgccttttgcaccg +tttgggtagagttcacaaatccaaccgccagccggatttttacggacggtcattagttaa +cctcgctgtatacacccaccacacgccccaacgttttaatatcatcaatgccgcattcga +aaggaaccttcccgcctgcaacatgtagttttctacccggtagttttgttaactctcgaa +tgcttattgctccctcaatgtcgactagccataagccgtcagacaatgatgcttgcttgt +ccacaaaataaattttcccctcggaacggatagccatcccatctgtgagcggttttgtga +aaaattgggcatcaacactcaattgtttatcggatttgaggatttcttcacttaatgtga +atccctcaatcctttttgcgtcgctcgattctctgttatttacaaatgcttctccttctc +cggtaagtaaccactggagattagcacctgtttcaagggcacagtgagccgcaaagtcat +aggagatagcgcctcgggtgtacctgtttgacaatgagctggacgcgatatcgaagtggt +tagctaattgaattttctgcgaaaatccgtacgcctcgcagatgcggtcaagtacatcca +cgttgctccatcctaaagaatctattctcatttcgataaaacctatttactatctctcaa +ttgggagatatattttggctaaacccacgcaattgatggcaagtgttggcaaacagagtc +aaatcaattgcaaactttggctaatagggaatcatgcaatatggcttctgaaatcgcaat +catcaaagtgcctgcacctatcgttactctgcaacaattcgcagagcttgagggtgtttc +tgaacgcaccgcctaccgctggacaaccggcgacaacccttgtgtaccaatcgaaccccg +cacaatccgtaaaggctgcaagaaagcaggtggcccgattcgcatttattacgcacgctg +gaaagaagagcagttgcgtaaggcgttgggacattcccgttttcaactcgtcatcggtgc +ttaattcactttatgtgaattgtaaggatgcaacatgtttgattttcaggtttccaaaca +tccccactatgacgaagcgtgccgggcttttgcgcagcgtcacaacatggcgaagctggc +cgagcgtgcgggtatgaatgttcaaacgttacgtaacaagctcaacccagaacagcctca +ccagttcacgccgcctgaattgtggctgctgactgacctgaccgaagactcaaccctcgt +tgatggttttctggcgcagattcattgtctgccatgcgtgccggttaatgagctggctaa +agataaattgcagtcttacgtcatgcgcgcaatgagtgaactcggtgaactggcgagcgg +tgcggtatctgatgagcgtctgaccactgcccgtaagcacaacatgattgaaagcgttaa +ctccggcattcgcatgttgtcattgtcggctctggcgctgcatgcacgtctgcagactaa +tcccgctatgtcgagcgtggtcgataccatgagcggtattggcgcatcgtttggtctgat +ttgaggtgcgtatgctgaaaagtgaaccgtcatttgcgtctctgctcgttaagcaaagcc +ccggtatgcattacggccacggctggatcgcaggtaaggacggcaagcgctggcacccgt +gccgctcacagtccgaattattaaaagggctgaaaacaaagtcgccgaaatcgtcaggtt +ttttaattattcgtattgtccactttgtaattaaaggagtgaaacatgtcacgcgatgaa +ttaagaattgttttgggtgccatgattccaaatatggaggaaggttttgaaattaaaacc +cgcgacggcgcaatacttcgcgttgaccctgagtgggagtgctgcaaagaatttaaggat +ggattaaaagccgaaatcatcaagcagttaaaaagcaaacctgctgttgtatttggatat +agttaattaattaaacgtaattacttggcgtaaacccgccgggcattcttttgccaaaaa +acaggaggatatatgagtcgaactatttatttatcaacgccgagtggtgctggcgaccac +ttgctggagtctttgtttaaagaagccaaaaaagaagagcgcaaagaccgccgtctcgcc +gtttcaatccgtctcgaagatctggccgttcacattaccaattcagatatgacaggcaaa +gaagcggccgagctactgcgccgcgaagccactcgctttgagaacgaatcacaggagctt +cactaatggccgacgcaatggatttagcacaactgcgcgagcaggaagaccgcgaacgcc +acataagcaacgcgcgcagccgtcgccatgaggtttctgcatttatctgtgaggaatgcg +atgcacctatcccggaagcgcgccgccgagccataccgggcgtgcagtgctgcgttacct +gtcaggaaatcttagagctgaaaagtaaacattataacggaggtgctttatgagcattac +caatgcaactattagccagcgtgcaaaaaaatggcttgaagatgaccgtatatttattga +caccgaaactacgggtttgggtgatgatgcggaaatagtagaaatctgtttaatagatag +cgctggttttatcatgctaaatacattggttaaaccaactaaaccaattccagcagaggc +tacggccattcatggaataactgatgaaatggttatgtatgcgccaacgtggaaagatat +tcacggcgcagtagcttctttattttttgagtatggctttgttatttataacgccgatta +cgacacaagacttatatatcaaactgcgaaattatatgggcttgagaatgacggcttttg +ttattttttaaatgagcgttcggcctgcgccatgatgctatatgcagagtatcgcggcga +gccagggcgatttaaaggttataaatggcacaaattagttgatgccgctgcacatgaagg +ggttagcgttgaaggaaaggcacaccgtgcattagcagattgccggatgactcttggcat +tatcgacgctttggcaaaaggcggtgcagcatgagtatccgtatcgaaataggtgataaa +tgggtaatcaccagcgaccaatatcaattcatcctgaatgaaaaaaaagtcgttaagacc +ggcaataaagctggcgaggaatggctcgacaccatcggttattacccgaagattaatcag +ctcatttctggtctggtacatcaccacattcatacggcaatgattatttcccttagtgca +atggcagaggaaatagagaagttatcttttatctgtgaagaagcatttaaggcggttaaa +aaatgattgattcccgctgctttgctgaaagcacaataaatattgtttctgtttctggtg +gaaaggacagccttgctcaatggattcttgcggtagagaacgacgtaccgcgcaccactg +tttttgcagataccgggcatgagcattcccaaacaatggagtatctggattatcttgaat +ccagactcggcccggttattcgagtgaaagccgattttactcggcggattgaaggcaaac +ggaaattcattgctgaaaaatggcctgtctctctcgttgaagaatgcggaatgtctcatg +agcaggctgcagaacgaatcgcaaaggcactggaaatccttaagccaaccggtaatccgt +ttctcgatttgtgcatgtggaaaggacggttcccgagcacgaaagcaaggttttgttcac +tggaactgaaacatgactcagtacgggacaagattgtactcccagcgctggagaaatatg +acgaagtaattctatggcagggtgttcgtgctcaggagtcaccagcccgcgctgcgttac +ctatgtgggaggaggatgcagataatacccccggtttgcatgtgtatcgcccaattctta +actggacacatgaagacgtatttgccttagctaaacgacacggaattaaaccgaacccac +tctatcagcaaggttgtagcagagttggctgcatgccatgtattcatgcaagaaaatctg +agctggcagagatttttgctcgctggccggaggagattgcgcgcgttgcagagtgggaac +gtcttgttgctgcctgttcacgtcggggaaactcaacatttttcccttcgactcacgacc +cgcggcgagcagaaaaacgtattgaagttgttaccgtagaagaatatgggatagcttcat +atcgtgactgggcgatgactacgcgtggcggttctcagtacgatttgctcgctgctacaa +acgacaaaactgtgtgcagtagcgtttatgccggtgtatgtgaatgacgggtgtcgttta +cgcgtttccgtggaatgccccacggtcggcaatagccagctcatatcttacctatgacca +acagcatcgccgcgaccgtatgttcgcggctttgctgcatgcgagaaaggtgctttttct +ccagccagaatgtgtgcgctttgacgtttatcgcaccgctgcagttctggagcaaaatca +gggcagtcaacgagccaatgcctttttaatcagcttctgcaaaaaggcattaccacgtct +tgaactggtcgcaaaaaaatacgagtgctcgggcatcaacagcaatgtatcagccgctgt +tttcgatggtcattttgatacccagcttatgcaatatctggcgtcacgcatggtcaatat +ggtcgccagatttaaccgcctcccggatatgtcgcgcgccgatattgacctgctggccgc +ggatatcgctaattttattcgcgctgaactggccgacattgatgacaccggatttagcga +actcaaaacgctgtacacttggtacatgcgcgccggttttatttccctgcaattcaacgt +tacaccgccgaaatgggagcgtgtgactaaaaaatatttttgtgaggatgaaatcgcacc +ggcagtaatgcgcatgtttaatgaggtttggtggcgcggccgcttgcgacgcattgcggc +tgcatggcgcgaacatctgcaaattgcagtcggcaacgtaagcaagaaacgacacgcata +cgcgagtaaaaactgcgtcaccgactggcgcgagcagaagcgccgcacgcgcgaatttct +caaggggctggatctcgaagacgaagaaggcaaccgcatcagtctgattgaaaaatacga +cggctcggtcgctaatccagcaatacgccgctgtgagctgatggcccgcattcgtgggtt +tgaaaatatctgtaatgagctcggttatgtcggggagttctatactctgactgcaccgtc +taaatatcacgccaccaccaaagcgggctaccgtaacagcaaatggaacggtgcaagccc +gtcagacacgcagagctatctcacaggcctttgggcacgcatacgcgccaagctgcaccg +ggaagaaatccgcattttcggaatacgcgtcgctgaaccgcatcacgatggaacgccgca +ctggcatatgcttatgttcatgttgccggaagatgtcgagcgtgtgcgactcatcatccg +agattatgcgtgggaggaagaccactacgaactgagaagcgataaagccaaaaaggcgcg +cttccatgctgaggccattgacccggaaaaaggcagtgctactggctatgtcgctaaata +catttccaaaaatatcgacggttatgctctcgatggtgaaaccgatgacgaaagtggtga +gttgttaaaagagactgcacccgccgtttcagcatgggcggcgcgctggcacatccgtca +gtttcaatttatcggcggtgcgccggtgacggtatacagggagctacgcagaatggctga +ccctgaaacagccagggcgctcagtgttgaattcgccgcagtgcatgatgctgctcacta +tggacgctgggctgattatgtgaatgctcaaggcggaccattcgttcgccgtgacgattt +acaggtacgtacattgtatgaacctcgaactgaatttaatcagtatggcgaagaaactgt +gtgcatcaaaggtgtctacgatgcctcgataggtgctggctctcctattctaacccggtt +aacgcagtggaagattgttccaaagcgtgccgttgatttggccgttgacgttaagggcgc +ttctgcgccctctcggagttctgtcaataactgtacgggaagcgaaagcgatccaccgat +actcgatttaacaaaaccgctgagtcggcgtgaaagacgagagttgacgaaccgactcag +gaagaaaaagccaacaacacggcgaaaattcatccacggaacggataagcaaaacgtcgc +tataacgaaaactatcgacgagatacactctgacaaccggcatcacaatcagccggggcg +aagccctgcacctgatggccggtggtaaaagttgttttaacggtcgatgggtgcgcggaa +cgtcaaaaggtgaaatctttgctgcagctccttcacatcaggcgagacgcggaaaatcct +taatcgtgttgcagatttagctgagctggcaacgaaaatgtaaccgctaatattcatcca +tatcatgtacatacagtgtatttaactgtgatttttttcttcacaccttttgccaatacg +tgctactgtatgtttatacagtatctcgtagtggaggttgtgtggatagagagctaaatg +agcacgttatgattgagcgggtcgaaatgattgcgcgtctgactgctgaaggtacttgtc +aggaaagagaccgtgaaatcgcattgaatctaattgcggaaatagcaagaggcaacctaa +tgaaaaataataatttttctgttgttttttccgcaccgcctgttggtgaaacatttgcaa +aggagggcaaagtgaaagtaaatatcacgttggataaagaccaaaaaatcggccagccgg +taattgatgcttttcagtgcgaattgaccaagcgaatacagtccgttttcccgtcaacgc +gcgttactgttaaaaagggatccatgaccggtgtcgagctgatggggttcgataaagatt +cagaccgcgaagcgctggatagcatccttcaggaagtgtgggaagatgagagctggcgtt +aatccctgaaaaatgtgcaaccatcgaccccatgtttgatagcatggggttgttttgtat +gggattacacacaaaggaaaatcatggataccgtaatagcatttttatctctggctctct +ttattgcttttatcgtcgggttaatcaagccgtcgctggttcgaatgccgagccgtaagc +gctccagtgctgtttatctcggtggctgtctggcgctgggcgttattggctcaatcttat +ggccgactgaaaaaactcagccggtggcaaaaactgacgtaccggcggttaaagcggaac +cggctacgccaacgtttgagtacgcagataaaaccctcaaagaatatcgcaacgagccaa +aagaaacccggcacgaaatcgttaaagactatgttggattcaaaggtgtgcaggccagcg +ctaccgatgttttttatgcctgtatgagcgagtacacttttaccaaagatgatgcgttaa +agctcagtgatgtgttggggtggtgtttcaacgacttcgagaaagatccacaatctctga +ataataaaatcaaccttgacgaatttcagggtaattttagcggttgggatggctcttatc +gcccgttagagaagctgataaaagccagtatgaatgatgattcctcttataaacatgttt +caacggtctaccatctgattttgaataaagacccgcatgccgttgtaaaaacaacgtttc +gcggcactaatgcttatggtggcgtggtcaaacagaccgtagcagcacgcgtcaacgtgc +gaacgggcgaggtcgattcaatactcgacaattaaacatgacaaacgccgccggtgctga +aactcgctttcagtgctggcggggttgaacaacgagccccgcgaggcgttagcctacccc +tgagcaaccgcccaagaccggtactattaaagccggtttttttatgccacttttccacga +atttcccgtttttttagccgtgcatgcaacaggtgcattgttttgcatgcgtcaggcttg +cccgttctggttgtgcgtcgccagagctggcgcggctccagagtggtcatgcaactgcat +taaaaccgacccataaagtgggca diff --git a/etc/c1215.blastn.crunch b/etc/c1215.blastn.crunch new file mode 100644 index 000000000..13215ee94 --- /dev/null +++ b/etc/c1215.blastn.crunch @@ -0,0 +1,126 @@ +9583 99.00 1474 6490 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1474 6490 SPBC1215 AL096846 S.pombe chromosome II cosmid c1215. +2712 98.00 1 1437 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 1437 SPBC1215 AL096846 S.pombe chromosome II cosmid c1215. +276 99.00 429 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 7588 7734 SPAC1142 AL159951 S.pombe chromosome I cosmid c1142. +274 99.00 429 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 174 319 SPRG5SC K00770 yeast (s.pombe) 5s rrna gene and flanks, clone pspr36. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 48 169 SPRG5S K00569 yeast (s.pombe) 5s rrna gene, clone pym3. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21075 20954 SPCC63 AL049522 S.pombe chromosome III cosmid c63. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 33755 33876 SPCC417 AL035076 S.pombe chromosome III cosmid c417. +228 99.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 22579 22697 SPCC417 AL035076 S.pombe chromosome III cosmid c417. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 31087 30966 SPCC338 AL023781 S.pombe chromosome III cosmid c338. +129 97.00 35 107 big_blast_2_50000_embl_other_c1215.seq.00000001.out 22094 22022 SPCC338 AL023781 S.pombe chromosome III cosmid c338. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6258 6379 SPBC17A3 AL109652 S.pombe chromosome II cosmid c17A3. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3214 3335 SPAC5H10 Z49811 S.pombe chromosome I cosmid c5H10. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 8450 8571 SPAC4H3 Z69380 S.pombe chromosome I cosmid c4H3. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 30828 30707 SPAC25B8 AL133225 S.pombe chromosome I cosmid c25B8. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24568 24447 SPAC1F7 Z67998 S.pombe chromosome I cosmid c1F7. +242 100.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 17220 17099 SPAB4537 AB004537 Schizosaccharomyces pombe 37 kb genomic DNA, clone c213. +240 100.00 453 573 big_blast_2_50000_embl_other_c1215.seq.00000001.out 7867 7747 SPAC926 AL110469 S.pombe chromosome I cosmid c926. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 29615 29496 SPCC965 AL023590 S.pombe chromosome III cosmid c965. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24228 24347 SPCC24B10 AL157991 S.pombe chromosome III cosmid c24B10. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5316 5435 SPCC10H11 AL162771 S.pombe chromosome III cosmid c10H11. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 23752 23871 SPBC428 AL034382 S.pombe chromosome II cosmid c428. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 15895 16014 SPBC4 AL121863 S.pombe chromosome II cosmid c4. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9473 9354 SPBC342 AL096809 S.pombe chromosome II cosmid c342. +238 100.00 456 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9665 9546 SPBC21H7 AL023286 S.pombe chromosome II cosmid c21H7. +238 100.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24026 24145 SPBC1685 AL031154 S.pombe chromosome II cosmid c1685. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 202 320 SPRG5SE K00570 yeast (s.pombe) 5s rrna and asp-trna genes, clone pym116. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 34701 34819 SPBP23A10 AL136535 S.pombe chromosome II p1 p23A10. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 31520 31638 SPBC577 AL110506 S.pombe chromosome II cosmid c577. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6163 6281 SPBC1677 AL035581 S.pombe chromosome II cosmid c1677. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 18162 18044 SPAC3G9 AL021046 S.pombe chromosome I cosmid c3G9. +236 100.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 119 SPA K01049 Yeast (S.pombe) 5S ribosomal RNA. +234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1664 1543 SPCC188 AL049662 S.pombe chromosome III cosmid c188. +234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 20839 20718 SPCC11E10 AL121783 S.pombe chromosome III cosmid c11E10. +234 99.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 23408 23287 SPBC21D10 AL031536 S.pombe chromosome II cosmid c21D10. +232 99.00 455 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3099 3219 SPBC24C6 AL031786 S.pombe chromosome II cosmid c24C6. +230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 200 319 SPRG5SA K00768 yeast (s.pombe) 5s rrna gene and flanks, clone pspr1. +230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 24833 24952 SPBC354 AL022071 S.pombe chromosome II cosmid c354. +230 99.00 455 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14612 14731 SPAC167 AL035248 S.pombe chromosome I cosmid c167. +228 99.00 456 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 201 319 SPRG5SD K00771 yeast (s.pombe) 5s rrna gene and flanks, clone pspr41. +226 98.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 198 319 SPRG5SB K00769 yeast (s.pombe) 5s rrna gene and flanks, clone pspr11. +226 99.00 455 572 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2544 2661 SPAC24H6 Z54142 S.pombe chromosome I cosmid c24H6. +226 98.00 453 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 13105 12984 SPAC1B1 Z98532 S.pombe chromosome I cosmid c1B1. +222 99.00 457 572 big_blast_2_50000_embl_other_c1215.seq.00000001.out 9084 8969 SPAC1687 AL035064 S.pombe chromosome I cosmid c1687. +220 100.00 454 564 big_blast_2_50000_embl_other_c1215.seq.00000001.out 11460 11350 SPBC14F5 AL023780 S.pombe chromosome II cosmid c14F5. +206 100.00 6387 6490 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 104 SPBC83 AL035536 S.pombe chromosome II cosmid c83. +163 100.00 1 82 big_blast_2_50000_embl_other_c1215.seq.00000001.out 82 1 SPAB4534 AB004534 Schizosaccharomyces pombe 38 kb genomic DNA, clone 1750. +157 100.00 496 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 79 SPBC725 AL034352 S.pombe chromosome II cosmid c725. +157 100.00 496 574 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 79 SPBC530 AL023634 S.pombe chromosome II cosmid c530. +103 100.00 455 506 big_blast_2_50000_embl_other_c1215.seq.00000001.out 52 1 SPRHP9 Y09431 S.pombe rhp9 gene +93 85.00 463 575 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14821 14716 SPBC609 AL035226 S.pombe chromosome II cosmid c609. +65 89.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 UURNA1 X00998 Urechis unicinctus 5S rRNA sequence +58 95.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PGRNA01 X00994 Phascolopsis gouldii 5S rRNA sequence +58 95.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 904 868 CFRRN285 X06056 Calanus finmarchicus DNA for 23S and 5S rRNA +56 93.00 477 516 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1113 1074 SPBC1778 AL049489 S.pombe chromosome II cosmid c1778. +52 100.00 6059 6084 big_blast_2_50000_embl_other_c1215.seq.00000001.out 233479 233504 AE003531 AE003531 Drosophila melanogaster genomic scaffold 142000013386050 section 37 of 54, complete sequence. +50 92.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PRRRN5S X01550 Planocera reticulata 5S ribosomal RNA +50 92.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 EGRN01 X00022 Ribbon worm Emplectonema gracile 5S rRNA (Short) +50 94.00 480 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 25 57 AMRRN5S X01518 Acyrthosiphon magnoliae (aphid) 5S ribosomal RNA +50 89.00 461 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6 58 CR1619 D10528 Candida rugosa 5S rRNA. +50 88.00 521 569 big_blast_2_50000_embl_other_c1215.seq.00000001.out 66 114 AERRA K03161 Agaricus edulis 5S ribosomal RNA (5S rRNA). +48 96.00 2466 2493 big_blast_2_50000_embl_other_c1215.seq.00000001.out 10841 10814 AC010292 AC010292 Homo sapiens chromosome 5 clone CTB-131H22, complete sequence. +46 85.00 458 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5564 5510 PDHISTCL X53330 P.dumerilii histone gene cluster for core histones H2A, H2B, H3 and H4 +46 100.00 4802 4824 big_blast_2_50000_embl_other_c1215.seq.00000001.out 28075 28053 HSU165H7 Z70225 Human DNA sequence from cosmid U165H7, between markers DXS366 and DXS87 on chromosome X. +46 88.00 526 568 big_blast_2_50000_embl_other_c1215.seq.00000001.out 72 114 TDRRA M58385 Taphrina deformans 5S ribosomal RNA. +46 96.00 487 513 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3 29 SPRRAAS M19951 Schizosaccharomyces pombe 5S ribosomal RNA gene, partial sequence. +44 100.00 4816 4837 big_blast_2_50000_embl_other_c1215.seq.00000001.out 88073 88052 AC084760 AC084760 Gallus gallus clone 65N20, complete sequence. +44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 69197 69238 CHPTTRPG D17510 Pinus thunbergii chloroplast DNA, complete sequence. +44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 48563 48522 CHNTXX Z00044 Nicotiana tabacum chloroplast genome DNA +44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 138 97 CHNTTB2 M16897 Tobacco Thr-tRNA gene. +44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 14879 14920 AP002983 AP002983 Lotus japonicus chloroplast DNA, complete genome. +44 88.00 57 98 big_blast_2_50000_embl_other_c1215.seq.00000001.out 46263 46222 AP000423 AP000423 Arabidopsis thaliana chloroplast genomic DNA, complete sequence, strain:Columbia. +44 100.00 893 914 big_blast_2_50000_embl_other_c1215.seq.00000001.out 49861 49882 HSEVMHC X87344 H.sapiens DMA, DMB, HLA-Z1, IPP2, LMP2, TAP1, LMP7, TAP2, DOB, DQB2 and RING8, 9, 13 and 14 genes +44 100.00 6061 6082 big_blast_2_50000_embl_other_c1215.seq.00000001.out 143317 143296 HS377H14 AL022723 Human DNA sequence from clone 377H14 on chromosome 6p21.32-22.1. Contains the HLA-G gene for major histocompatibility complex, class I, G (HLA 6.0) two MHC class I pseudogenes, an RPL7A (60S Ribosomal Protein L7A) pseudogene, a gene for a novel MHC class 1 protein, an interferon-inducible protein 1-8U pseudogene, an RPL23A (60S Ribosomal Protein L23A) pseudogene, an HCGIX pseudogene, an MICB or PERB11.1 pseudogene,the HLA-F gene for major histocompatibility complex, class I, F (CDA12), and four P5-1 pseudogenes. Contains EST, STSs, GSS and six putative CpG islands. +44 100.00 1237 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 3149 3128 AP001207 AP001207 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1562D12. +44 100.00 1237 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 201930 201909 AP000426 AP000426 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1107E3. +44 93.00 2454 2483 big_blast_2_50000_embl_other_c1215.seq.00000001.out 75294 75323 AC023426 AC023426 Homo sapiens 12 BAC RP11-396L8 (Roswell Park Cancer Institute Human BAC Library) complete sequence. +44 100.00 6061 6082 big_blast_2_50000_embl_other_c1215.seq.00000001.out 34756 34735 AC004213 AC004213 Homo sapiens clone UWGC:y19c060 from 6p21, complete sequence. +44 86.00 521 570 big_blast_2_50000_embl_other_c1215.seq.00000001.out 364 413 AI5SRRNA2 X99089 A.immersus 5S rRNA gene, b2-type +42 100.00 1245 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 12979 12959 BBU43414 U43414 Borrelia burgdorferi linear plasmid lp16 DNA, complete sequence. +42 100.00 2454 2474 big_blast_2_50000_embl_other_c1215.seq.00000001.out 278691 278671 AP001119 AP001119 Buchnera sp. APS genomic DNA, complete sequence, segment 2/2. +42 100.00 1245 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 12951 12931 AE000793 AE000793 Borrelia burgdorferi plasmid lp17, complete plasmid sequence. +42 100.00 818 838 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2471 2451 OSU77637 U77637 Oryza sativa class III ADH enzyme (AdhIII) gene, complete cds. +42 96.00 1241 1265 big_blast_2_50000_embl_other_c1215.seq.00000001.out 79773 79797 H0505A02 AL512543 Oryza sativa genomic DNA, chromosome 4, BAC clone: H0505A02, complete sequence +42 93.00 343 371 big_blast_2_50000_embl_other_c1215.seq.00000001.out 29118 29146 AB018121 AB018121 Arabidopsis thaliana genomic DNA, chromosome 3, P1 clone: MXE2. +42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 SSRRAB K02349 Jellyfish (Spirocodon saltatrix) 5S ribosomal RNA. +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PCRN5SA X13039 Philosamia cynthia ricini 5S rRNA +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 PCRN5S K02354 Philosamia cythia ricini (silkworm) 5S ribosomal RNA. +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 OV5SRRN X06835 Octopus vulgaris 5S rRNA +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 ME5SRNA J01869 Mussel (Mytilus edulis) 5S ribosomal RNA. +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 LGRNO1 X00020 Ribbon worm Lineus geniculatus 5S rRNA +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 HSRRN5S X01535 Hymeniacidon sanguinea 5S ribosomal RNA +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 HJRN01 V00475 Halichondria japonica 5S ribosomal RNA (complete sequence). +42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 EARRN5S X03911 Enchytraeus albidus 5S rRNA +42 100.00 6340 6360 big_blast_2_50000_embl_other_c1215.seq.00000001.out 25954 25974 CEK02B12 Z75711 Caenorhabditis elegans cosmid K02B12 +42 100.00 1213 1233 big_blast_2_50000_embl_other_c1215.seq.00000001.out 5436 5456 CEF14B8 U28737 Caenorhabditis elegans cosmid F14B8. +42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 CED132199 AJ132199 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 4 +42 84.00 456 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 1 57 CED132198 AJ132198 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 3 +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 BN5SRRN X06834 Bugula neritina (moss-animal) 5S rRNA +42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2219 2239 BMU86876 U86876 Bombyx mori chitinase-like protein mRNA, complete cds. +42 89.00 476 512 big_blast_2_50000_embl_other_c1215.seq.00000001.out 21 57 APRN5SA X13035 Antheraea pernyi 5S rRNA +42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2256 2276 AF326596 AF326596 Bombyx mandarina chitinase mRNA, complete cds. +42 100.00 136 156 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6370 6350 AC084626 AC084626 Caenorhabditis briggsae cosmid G45C20, complete sequence. +42 100.00 6091 6111 big_blast_2_50000_embl_other_c1215.seq.00000001.out 27211 27231 AC006830 AC006830 Caenorhabditis elegans cosmid ZK105, complete sequence. +42 100.00 5756 5776 big_blast_2_50000_embl_other_c1215.seq.00000001.out 2225 2245 AB052914 AB052914 Bombyx mori chiB mRNA for chitinase precursor, complete cds. +42 100.00 1395 1415 big_blast_2_50000_embl_other_c1215.seq.00000001.out 145576 145596 HSMX1A AL442166 Homo sapiens chromosome 21 from 5 PACs and 5 Cosmids map 21q22.2,D21S349-MX1; segment 1/2 +42 100.00 6065 6085 big_blast_2_50000_embl_other_c1215.seq.00000001.out 70745 70765 HS994L9 AL034554 Human DNA sequence from clone 994L9 on chromosome 20p12.3-13 Contains STS and GSSs. +42 100.00 1395 1415 big_blast_2_50000_embl_other_c1215.seq.00000001.out 173941 173961 HS21C084 AL163284 Homo sapiens chromosome 21 segment HS21C084. +42 100.00 5172 5192 big_blast_2_50000_embl_other_c1215.seq.00000001.out 8899 8879 HS21C013 AL163213 Homo sapiens chromosome 21 segment HS21C013. +42 96.00 3691 3715 big_blast_2_50000_embl_other_c1215.seq.00000001.out 222756 222780 AP001732 AP001732 Homo sapiens genomic DNA, chromosome 21q, section 76/105. +42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 234259 234235 AP001677 AP001677 Homo sapiens genomic DNA, chromosome 21q, section 21/105. +42 96.00 3691 3715 big_blast_2_50000_embl_other_c1215.seq.00000001.out 97170 97194 AP001038 AP001038 Homo sapiens genomic DNA, chromosome 21, clone:P178O22, ERG-ETS2 region. +42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 117565 117541 AP000946 AP000946 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B335N5, LL56-APP region. +42 100.00 6106 6126 big_blast_2_50000_embl_other_c1215.seq.00000001.out 179419 179439 AP000810 AP000810 Homo sapiens genomic DNA, chromosome 11q, clone:RP11-765H23. +42 100.00 5172 5192 big_blast_2_50000_embl_other_c1215.seq.00000001.out 94404 94384 AP000473 AP000473 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B291N6, LL56-APP region. +42 96.00 1801 1825 big_blast_2_50000_embl_other_c1215.seq.00000001.out 6090 6114 AL355365 AL355365 Human DNA sequence from clone RP11-361F15 on chromosome 6 +42 96.00 5531 5555 big_blast_2_50000_embl_other_c1215.seq.00000001.out 79645 79669 AL354861 AL354861 Human DNA sequence from clone RP11-180I4 on chromosome 9 +42 100.00 1 21 big_blast_2_50000_embl_other_c1215.seq.00000001.out 28666 28686 AL139378 AL139378 Human DNA sequence from clone RP11-271B5 on chromosome 13 Contains a gene for a protein similar to ribosomal protein S7, the FGF9 (fibroblast growth factor 9 (glia-activating factor)) gene, ESTs, STSs, GSSs and CpG islands. +42 100.00 5783 5803 big_blast_2_50000_embl_other_c1215.seq.00000001.out 15259 15279 AL139163 AL139163 Human DNA sequence from clone RP11-523O15 on chromosome 20 Contains GSSs and STSs. +42 100.00 3803 3823 big_blast_2_50000_embl_other_c1215.seq.00000001.out 20782 20802 AL136301 AL136301 Human DNA sequence from clone RP11-195L15 on chromosome 13 +42 91.00 5752 5784 big_blast_2_50000_embl_other_c1215.seq.00000001.out 74511 74543 AL133462 AL133462 Human DNA sequence from clone RP11-108A16 on chromosome 20 Contains ESTs, STSs and GSSs. +42 96.00 334 358 big_blast_2_50000_embl_other_c1215.seq.00000001.out 119422 119446 AF238375 AF238375 Homo sapiens chromosome 21 clone BAC 49B5 map 21q21, complete sequence. +42 100.00 1242 1262 big_blast_2_50000_embl_other_c1215.seq.00000001.out 42069 42089 AF130342 AF130342 Homo sapiens chromosome 8 clone PAC 87.1 map 8q24.1, complete sequence. +42 91.00 5752 5784 big_blast_2_50000_embl_other_c1215.seq.00000001.out 49339 49371 AC012380 AC012380 Genomic Sequence For Homo sapiens Clone 125H5, Chromosome 20, complete sequence. +42 93.00 1230 1258 big_blast_2_50000_embl_other_c1215.seq.00000001.out 135503 135475 AC007392 AC007392 Homo sapiens BAC clone RP11-444B4 from 2, complete sequence. +42 100.00 1414 1434 big_blast_2_50000_embl_other_c1215.seq.00000001.out 4290 4310 PCAROMX L18918 Pneumocystis carinii pentafunctional enzyme (arom) gene, complete cds. +42 87.00 521 565 big_blast_2_50000_embl_other_c1215.seq.00000001.out 66 110 CH1457 D10531 Cryptococcus humicolus 5S rRNA. diff --git a/etc/c1215.blastn.tab b/etc/c1215.blastn.tab new file mode 100644 index 000000000..e2113c439 --- /dev/null +++ b/etc/c1215.blastn.tab @@ -0,0 +1,630 @@ +FT BLASTN_HIT 1474..6490 +FT /note="match to SPBC1215 1474..6490 blast score 9583 percent identity 99 AL096846 S.pombe chromosome II cosmid c1215." +FT /label=SPBC1215 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 1..1437 +FT /note="match to SPBC1215 1..1437 blast score 2712 percent identity 98 AL096846 S.pombe chromosome II cosmid c1215." +FT /label=SPBC1215 +FT /score=98 +FT /colour=255 5 5 +FT BLASTN_HIT 429..574 +FT /note="match to SPAC1142 7588..7734 blast score 276 percent identity 99 AL159951 S.pombe chromosome I cosmid c1142." +FT /label=SPAC1142 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 429..574 +FT /note="match to SPRG5SC 174..319 blast score 274 percent identity 99 K00770 yeast (s.pombe) 5s rrna gene and flanks, clone pspr36." +FT /label=SPRG5SC +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPRG5S 48..169 blast score 242 percent identity 100 K00569 yeast (s.pombe) 5s rrna gene, clone pym3." +FT /label=SPRG5S +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPCC63 20954..21075 blast score 242 percent identity 100 AL049522 S.pombe chromosome III cosmid c63." +FT /label=SPCC63 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPCC417 33755..33876 blast score 242 percent identity 100 AL035076 S.pombe chromosome III cosmid c417." +FT /label=SPCC417 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPCC417 22579..22697 blast score 228 percent identity 99 AL035076 S.pombe chromosome III cosmid c417." +FT /label=SPCC417 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPCC338 30966..31087 blast score 242 percent identity 100 AL023781 S.pombe chromosome III cosmid c338." +FT /label=SPCC338 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 35..107 +FT /note="match to SPCC338 22022..22094 blast score 129 percent identity 97 AL023781 S.pombe chromosome III cosmid c338." +FT /label=SPCC338 +FT /score=97 +FT /colour=255 7 7 +FT BLASTN_HIT 453..574 +FT /note="match to SPBC17A3 6258..6379 blast score 242 percent identity 100 AL109652 S.pombe chromosome II cosmid c17A3." +FT /label=SPBC17A3 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPAC5H10 3214..3335 blast score 242 percent identity 100 Z49811 S.pombe chromosome I cosmid c5H10." +FT /label=SPAC5H10 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPAC4H3 8450..8571 blast score 242 percent identity 100 Z69380 S.pombe chromosome I cosmid c4H3." +FT /label=SPAC4H3 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPAC25B8 30707..30828 blast score 242 percent identity 100 AL133225 S.pombe chromosome I cosmid c25B8." +FT /label=SPAC25B8 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPAC1F7 24447..24568 blast score 242 percent identity 100 Z67998 S.pombe chromosome I cosmid c1F7." +FT /label=SPAC1F7 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPAB4537 17099..17220 blast score 242 percent identity 100 AB004537 Schizosaccharomyces pombe 37 kb genomic DNA, clone c213." +FT /label=SPAB4537 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..573 +FT /note="match to SPAC926 7747..7867 blast score 240 percent identity 100 AL110469 S.pombe chromosome I cosmid c926." +FT /label=SPAC926 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPCC965 29496..29615 blast score 238 percent identity 100 AL023590 S.pombe chromosome III cosmid c965." +FT /label=SPCC965 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPCC24B10 24228..24347 blast score 238 percent identity 100 AL157991 S.pombe chromosome III cosmid c24B10." +FT /label=SPCC24B10 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPCC10H11 5316..5435 blast score 238 percent identity 100 AL162771 S.pombe chromosome III cosmid c10H11." +FT /label=SPCC10H11 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPBC428 23752..23871 blast score 238 percent identity 100 AL034382 S.pombe chromosome II cosmid c428." +FT /label=SPBC428 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPBC4 15895..16014 blast score 238 percent identity 100 AL121863 S.pombe chromosome II cosmid c4." +FT /label=SPBC4 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPBC342 9354..9473 blast score 238 percent identity 100 AL096809 S.pombe chromosome II cosmid c342." +FT /label=SPBC342 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..575 +FT /note="match to SPBC21H7 9546..9665 blast score 238 percent identity 100 AL023286 S.pombe chromosome II cosmid c21H7." +FT /label=SPBC21H7 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..574 +FT /note="match to SPBC1685 24026..24145 blast score 238 percent identity 100 AL031154 S.pombe chromosome II cosmid c1685." +FT /label=SPBC1685 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPRG5SE 202..320 blast score 236 percent identity 100 K00570 yeast (s.pombe) 5s rrna and asp-trna genes, clone pym116." +FT /label=SPRG5SE +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPBP23A10 34701..34819 blast score 236 percent identity 100 AL136535 S.pombe chromosome II p1 p23A10." +FT /label=SPBP23A10 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPBC577 31520..31638 blast score 236 percent identity 100 AL110506 S.pombe chromosome II cosmid c577." +FT /label=SPBC577 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPBC1677 6163..6281 blast score 236 percent identity 100 AL035581 S.pombe chromosome II cosmid c1677." +FT /label=SPBC1677 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPAC3G9 18044..18162 blast score 236 percent identity 100 AL021046 S.pombe chromosome I cosmid c3G9." +FT /label=SPAC3G9 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..574 +FT /note="match to SPA 1..119 blast score 236 percent identity 100 K01049 Yeast (S.pombe) 5S ribosomal RNA." +FT /label=SPA +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 453..574 +FT /note="match to SPCC188 1543..1664 blast score 234 percent identity 99 AL049662 S.pombe chromosome III cosmid c188." +FT /label=SPCC188 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPCC11E10 20718..20839 blast score 234 percent identity 99 AL121783 S.pombe chromosome III cosmid c11E10." +FT /label=SPCC11E10 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPBC21D10 23287..23408 blast score 234 percent identity 99 AL031536 S.pombe chromosome II cosmid c21D10." +FT /label=SPBC21D10 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 455..575 +FT /note="match to SPBC24C6 3099..3219 blast score 232 percent identity 99 AL031786 S.pombe chromosome II cosmid c24C6." +FT /label=SPBC24C6 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 455..574 +FT /note="match to SPRG5SA 200..319 blast score 230 percent identity 99 K00768 yeast (s.pombe) 5s rrna gene and flanks, clone pspr1." +FT /label=SPRG5SA +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 455..574 +FT /note="match to SPBC354 24833..24952 blast score 230 percent identity 99 AL022071 S.pombe chromosome II cosmid c354." +FT /label=SPBC354 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 455..574 +FT /note="match to SPAC167 14612..14731 blast score 230 percent identity 99 AL035248 S.pombe chromosome I cosmid c167." +FT /label=SPAC167 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 456..574 +FT /note="match to SPRG5SD 201..319 blast score 228 percent identity 99 K00771 yeast (s.pombe) 5s rrna gene and flanks, clone pspr41." +FT /label=SPRG5SD +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPRG5SB 198..319 blast score 226 percent identity 98 K00769 yeast (s.pombe) 5s rrna gene and flanks, clone pspr11." +FT /label=SPRG5SB +FT /score=98 +FT /colour=255 5 5 +FT BLASTN_HIT 455..572 +FT /note="match to SPAC24H6 2544..2661 blast score 226 percent identity 99 Z54142 S.pombe chromosome I cosmid c24H6." +FT /label=SPAC24H6 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 453..574 +FT /note="match to SPAC1B1 12984..13105 blast score 226 percent identity 98 Z98532 S.pombe chromosome I cosmid c1B1." +FT /label=SPAC1B1 +FT /score=98 +FT /colour=255 5 5 +FT BLASTN_HIT 457..572 +FT /note="match to SPAC1687 8969..9084 blast score 222 percent identity 99 AL035064 S.pombe chromosome I cosmid c1687." +FT /label=SPAC1687 +FT /score=99 +FT /colour=255 2 2 +FT BLASTN_HIT 454..564 +FT /note="match to SPBC14F5 11350..11460 blast score 220 percent identity 100 AL023780 S.pombe chromosome II cosmid c14F5." +FT /label=SPBC14F5 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 6387..6490 +FT /note="match to SPBC83 1..104 blast score 206 percent identity 100 AL035536 S.pombe chromosome II cosmid c83." +FT /label=SPBC83 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1..82 +FT /note="match to SPAB4534 1..82 blast score 163 percent identity 100 AB004534 Schizosaccharomyces pombe 38 kb genomic DNA, clone 1750." +FT /label=SPAB4534 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 496..574 +FT /note="match to SPBC725 1..79 blast score 157 percent identity 100 AL034352 S.pombe chromosome II cosmid c725." +FT /label=SPBC725 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 496..574 +FT /note="match to SPBC530 1..79 blast score 157 percent identity 100 AL023634 S.pombe chromosome II cosmid c530." +FT /label=SPBC530 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 455..506 +FT /note="match to SPRHP9 1..52 blast score 103 percent identity 100 Y09431 S.pombe rhp9 gene" +FT /label=SPRHP9 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 463..575 +FT /note="match to SPBC609 14716..14821 blast score 93.7 percent identity 85 AL035226 S.pombe chromosome II cosmid c609." +FT /label=SPBC609 +FT /score=85 +FT /colour=255 38 38 +FT BLASTN_HIT 456..512 +FT /note="match to UURNA1 1..57 blast score 65.9 percent identity 89 X00998 Urechis unicinctus 5S rRNA sequence" +FT /label=UURNA1 +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to PGRNA01 21..57 blast score 58.0 percent identity 95 X00994 Phascolopsis gouldii 5S rRNA sequence" +FT /label=PGRNA01 +FT /score=95 +FT /colour=255 12 12 +FT BLASTN_HIT 476..512 +FT /note="match to CFRRN285 868..904 blast score 58.0 percent identity 95 X06056 Calanus finmarchicus DNA for 23S and 5S rRNA" +FT /label=CFRRN285 +FT /score=95 +FT /colour=255 12 12 +FT BLASTN_HIT 477..516 +FT /note="match to SPBC1778 1074..1113 blast score 56.0 percent identity 93 AL049489 S.pombe chromosome II cosmid c1778." +FT /label=SPBC1778 +FT /score=93 +FT /colour=255 17 17 +FT BLASTN_HIT 6059..6084 +FT /note="match to AE003531 233479..233504 blast score 52.0 percent identity 100 AE003531 Drosophila melanogaster genomic scaffold 142000013386050 section 37 of 54, complete sequence." +FT /label=AE003531 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 476..512 +FT /note="match to PRRRN5S 21..57 blast score 50.1 percent identity 92 X01550 Planocera reticulata 5S ribosomal RNA" +FT /label=PRRRN5S +FT /score=92 +FT /colour=255 20 20 +FT BLASTN_HIT 476..512 +FT /note="match to EGRN01 21..57 blast score 50.1 percent identity 92 X00022 Ribbon worm Emplectonema gracile 5S rRNA (Short)" +FT /label=EGRN01 +FT /score=92 +FT /colour=255 20 20 +FT BLASTN_HIT 480..512 +FT /note="match to AMRRN5S 25..57 blast score 50.1 percent identity 94 X01518 Acyrthosiphon magnoliae (aphid) 5S ribosomal RNA" +FT /label=AMRRN5S +FT /score=94 +FT /colour=255 15 15 +FT BLASTN_HIT 461..512 +FT /note="match to CR1619 6..58 blast score 50.1 percent identity 89 D10528 Candida rugosa 5S rRNA." +FT /label=CR1619 +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 521..569 +FT /note="match to AERRA 66..114 blast score 50.1 percent identity 88 K03161 Agaricus edulis 5S ribosomal RNA (5S rRNA)." +FT /label=AERRA +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 2466..2493 +FT /note="match to AC010292 10814..10841 blast score 48.1 percent identity 96 AC010292 Homo sapiens chromosome 5 clone CTB-131H22, complete sequence." +FT /label=AC010292 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 458..512 +FT /note="match to PDHISTCL 5510..5564 blast score 46.1 percent identity 85 X53330 P.dumerilii histone gene cluster for core histones H2A, H2B, H3 and H4" +FT /label=PDHISTCL +FT /score=85 +FT /colour=255 38 38 +FT BLASTN_HIT 4802..4824 +FT /note="match to HSU165H7 28053..28075 blast score 46.1 percent identity 100 Z70225 Human DNA sequence from cosmid U165H7, between markers DXS366 and DXS87 on chromosome X." +FT /label=HSU165H7 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 526..568 +FT /note="match to TDRRA 72..114 blast score 46.1 percent identity 88 M58385 Taphrina deformans 5S ribosomal RNA." +FT /label=TDRRA +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 487..513 +FT /note="match to SPRRAAS 3..29 blast score 46.1 percent identity 96 M19951 Schizosaccharomyces pombe 5S ribosomal RNA gene, partial sequence." +FT /label=SPRRAAS +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 4816..4837 +FT /note="match to AC084760 88052..88073 blast score 44.1 percent identity 100 AC084760 Gallus gallus clone 65N20, complete sequence." +FT /label=AC084760 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 57..98 +FT /note="match to CHPTTRPG 69197..69238 blast score 44.1 percent identity 88 D17510 Pinus thunbergii chloroplast DNA, complete sequence." +FT /label=CHPTTRPG +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 57..98 +FT /note="match to CHNTXX 48522..48563 blast score 44.1 percent identity 88 Z00044 Nicotiana tabacum chloroplast genome DNA" +FT /label=CHNTXX +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 57..98 +FT /note="match to CHNTTB2 97..138 blast score 44.1 percent identity 88 M16897 Tobacco Thr-tRNA gene." +FT /label=CHNTTB2 +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 57..98 +FT /note="match to AP002983 14879..14920 blast score 44.1 percent identity 88 AP002983 Lotus japonicus chloroplast DNA, complete genome." +FT /label=AP002983 +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 57..98 +FT /note="match to AP000423 46222..46263 blast score 44.1 percent identity 88 AP000423 Arabidopsis thaliana chloroplast genomic DNA, complete sequence, strain:Columbia." +FT /label=AP000423 +FT /score=88 +FT /colour=255 30 30 +FT BLASTN_HIT 893..914 +FT /note="match to HSEVMHC 49861..49882 blast score 44.1 percent identity 100 X87344 H.sapiens DMA, DMB, HLA-Z1, IPP2, LMP2, TAP1, LMP7, TAP2, DOB, DQB2 and RING8, 9, 13 and 14 genes" +FT /label=HSEVMHC +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 6061..6082 +FT /note="match to HS377H14 143296..143317 blast score 44.1 percent identity 100 AL022723 Human DNA sequence from clone 377H14 on chromosome 6p21.32-22.1. Contains the HLA-G gene for major histocompatibility complex, class I, G (HLA 6.0) two MHC class I pseudogenes, an RPL7A (60S Ribosomal Protein L7A) pseudogene, a gene for a novel MHC class 1 protein, an interferon-inducible protein 1-8U pseudogene, an RPL23A (60S Ribosomal Protein L23A) pseudogene, an HCGIX pseudogene, an MICB or PERB11.1 pseudogene,the HLA-F gene for major histocompatibility complex, class I, F (CDA12), and four P5-1 pseudogenes. Contains EST, STSs, GSS and six putative CpG islands." +FT /label=HS377H14 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1237..1258 +FT /note="match to AP001207 3128..3149 blast score 44.1 percent identity 100 AP001207 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1562D12." +FT /label=AP001207 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1237..1258 +FT /note="match to AP000426 201909..201930 blast score 44.1 percent identity 100 AP000426 Homo sapiens genomic DNA, chromosome 8q23, clone:KB1107E3." +FT /label=AP000426 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 2454..2483 +FT /note="match to AC023426 75294..75323 blast score 44.1 percent identity 93 AC023426 Homo sapiens 12 BAC RP11-396L8 (Roswell Park Cancer Institute Human BAC Library) complete sequence." +FT /label=AC023426 +FT /score=93 +FT /colour=255 17 17 +FT BLASTN_HIT 6061..6082 +FT /note="match to AC004213 34735..34756 blast score 44.1 percent identity 100 AC004213 Homo sapiens clone UWGC:y19c060 from 6p21, complete sequence." +FT /label=AC004213 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 521..570 +FT /note="match to AI5SRRNA2 364..413 blast score 44.1 percent identity 86 X99089 A.immersus 5S rRNA gene, b2-type" +FT /label=AI5SRRNA2 +FT /score=86 +FT /colour=255 35 35 +FT BLASTN_HIT 1245..1265 +FT /note="match to BBU43414 12959..12979 blast score 42.1 percent identity 100 U43414 Borrelia burgdorferi linear plasmid lp16 DNA, complete sequence." +FT /label=BBU43414 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 2454..2474 +FT /note="match to AP001119 278671..278691 blast score 42.1 percent identity 100 AP001119 Buchnera sp. APS genomic DNA, complete sequence, segment 2/2." +FT /label=AP001119 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1245..1265 +FT /note="match to AE000793 12931..12951 blast score 42.1 percent identity 100 AE000793 Borrelia burgdorferi plasmid lp17, complete plasmid sequence." +FT /label=AE000793 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 818..838 +FT /note="match to OSU77637 2451..2471 blast score 42.1 percent identity 100 U77637 Oryza sativa class III ADH enzyme (AdhIII) gene, complete cds." +FT /label=OSU77637 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1241..1265 +FT /note="match to H0505A02 79773..79797 blast score 42.1 percent identity 96 AL512543 Oryza sativa genomic DNA, chromosome 4, BAC clone: H0505A02, complete sequence" +FT /label=H0505A02 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 343..371 +FT /note="match to AB018121 29118..29146 blast score 42.1 percent identity 93 AB018121 Arabidopsis thaliana genomic DNA, chromosome 3, P1 clone: MXE2." +FT /label=AB018121 +FT /score=93 +FT /colour=255 17 17 +FT BLASTN_HIT 456..512 +FT /note="match to SSRRAB 1..57 blast score 42.1 percent identity 84 K02349 Jellyfish (Spirocodon saltatrix) 5S ribosomal RNA." +FT /label=SSRRAB +FT /score=84 +FT /colour=255 40 40 +FT BLASTN_HIT 476..512 +FT /note="match to PCRN5SA 21..57 blast score 42.1 percent identity 89 X13039 Philosamia cynthia ricini 5S rRNA" +FT /label=PCRN5SA +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to PCRN5S 21..57 blast score 42.1 percent identity 89 K02354 Philosamia cythia ricini (silkworm) 5S ribosomal RNA." +FT /label=PCRN5S +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to OV5SRRN 21..57 blast score 42.1 percent identity 89 X06835 Octopus vulgaris 5S rRNA" +FT /label=OV5SRRN +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to ME5SRNA 21..57 blast score 42.1 percent identity 89 J01869 Mussel (Mytilus edulis) 5S ribosomal RNA." +FT /label=ME5SRNA +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to LGRNO1 21..57 blast score 42.1 percent identity 89 X00020 Ribbon worm Lineus geniculatus 5S rRNA" +FT /label=LGRNO1 +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to HSRRN5S 21..57 blast score 42.1 percent identity 89 X01535 Hymeniacidon sanguinea 5S ribosomal RNA" +FT /label=HSRRN5S +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 476..512 +FT /note="match to HJRN01 21..57 blast score 42.1 percent identity 89 V00475 Halichondria japonica 5S ribosomal RNA (complete sequence)." +FT /label=HJRN01 +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 456..512 +FT /note="match to EARRN5S 1..57 blast score 42.1 percent identity 84 X03911 Enchytraeus albidus 5S rRNA" +FT /label=EARRN5S +FT /score=84 +FT /colour=255 40 40 +FT BLASTN_HIT 6340..6360 +FT /note="match to CEK02B12 25954..25974 blast score 42.1 percent identity 100 Z75711 Caenorhabditis elegans cosmid K02B12" +FT /label=CEK02B12 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1213..1233 +FT /note="match to CEF14B8 5436..5456 blast score 42.1 percent identity 100 U28737 Caenorhabditis elegans cosmid F14B8." +FT /label=CEF14B8 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 456..512 +FT /note="match to CED132199 1..57 blast score 42.1 percent identity 84 AJ132199 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 4" +FT /label=CED132199 +FT /score=84 +FT /colour=255 40 40 +FT BLASTN_HIT 456..512 +FT /note="match to CED132198 1..57 blast score 42.1 percent identity 84 AJ132198 Cerastoderma edule 5S rRNA gene and nontranscribed spacer, clone 3" +FT /label=CED132198 +FT /score=84 +FT /colour=255 40 40 +FT BLASTN_HIT 476..512 +FT /note="match to BN5SRRN 21..57 blast score 42.1 percent identity 89 X06834 Bugula neritina (moss-animal) 5S rRNA" +FT /label=BN5SRRN +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 5756..5776 +FT /note="match to BMU86876 2219..2239 blast score 42.1 percent identity 100 U86876 Bombyx mori chitinase-like protein mRNA, complete cds." +FT /label=BMU86876 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 476..512 +FT /note="match to APRN5SA 21..57 blast score 42.1 percent identity 89 X13035 Antheraea pernyi 5S rRNA" +FT /label=APRN5SA +FT /score=89 +FT /colour=255 28 28 +FT BLASTN_HIT 5756..5776 +FT /note="match to AF326596 2256..2276 blast score 42.1 percent identity 100 AF326596 Bombyx mandarina chitinase mRNA, complete cds." +FT /label=AF326596 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 136..156 +FT /note="match to AC084626 6350..6370 blast score 42.1 percent identity 100 AC084626 Caenorhabditis briggsae cosmid G45C20, complete sequence." +FT /label=AC084626 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 6091..6111 +FT /note="match to AC006830 27211..27231 blast score 42.1 percent identity 100 AC006830 Caenorhabditis elegans cosmid ZK105, complete sequence." +FT /label=AC006830 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5756..5776 +FT /note="match to AB052914 2225..2245 blast score 42.1 percent identity 100 AB052914 Bombyx mori chiB mRNA for chitinase precursor, complete cds." +FT /label=AB052914 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1395..1415 +FT /note="match to HSMX1A 145576..145596 blast score 42.1 percent identity 100 AL442166 Homo sapiens chromosome 21 from 5 PACs and 5 Cosmids map 21q22.2,D21S349-MX1; segment 1/2" +FT /label=HSMX1A +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 6065..6085 +FT /note="match to HS994L9 70745..70765 blast score 42.1 percent identity 100 AL034554 Human DNA sequence from clone 994L9 on chromosome 20p12.3-13 Contains STS and GSSs." +FT /label=HS994L9 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1395..1415 +FT /note="match to HS21C084 173941..173961 blast score 42.1 percent identity 100 AL163284 Homo sapiens chromosome 21 segment HS21C084." +FT /label=HS21C084 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5172..5192 +FT /note="match to HS21C013 8879..8899 blast score 42.1 percent identity 100 AL163213 Homo sapiens chromosome 21 segment HS21C013." +FT /label=HS21C013 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 3691..3715 +FT /note="match to AP001732 222756..222780 blast score 42.1 percent identity 96 AP001732 Homo sapiens genomic DNA, chromosome 21q, section 76/105." +FT /label=AP001732 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 334..358 +FT /note="match to AP001677 234235..234259 blast score 42.1 percent identity 96 AP001677 Homo sapiens genomic DNA, chromosome 21q, section 21/105." +FT /label=AP001677 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 3691..3715 +FT /note="match to AP001038 97170..97194 blast score 42.1 percent identity 96 AP001038 Homo sapiens genomic DNA, chromosome 21, clone:P178O22, ERG-ETS2 region." +FT /label=AP001038 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 334..358 +FT /note="match to AP000946 117541..117565 blast score 42.1 percent identity 96 AP000946 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B335N5, LL56-APP region." +FT /label=AP000946 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 6106..6126 +FT /note="match to AP000810 179419..179439 blast score 42.1 percent identity 100 AP000810 Homo sapiens genomic DNA, chromosome 11q, clone:RP11-765H23." +FT /label=AP000810 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5172..5192 +FT /note="match to AP000473 94384..94404 blast score 42.1 percent identity 100 AP000473 Homo sapiens genomic DNA, chromosome 21q21.1-q21.2, clone:B291N6, LL56-APP region." +FT /label=AP000473 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 1801..1825 +FT /note="match to AL355365 6090..6114 blast score 42.1 percent identity 96 AL355365 Human DNA sequence from clone RP11-361F15 on chromosome 6" +FT /label=AL355365 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 5531..5555 +FT /note="match to AL354861 79645..79669 blast score 42.1 percent identity 96 AL354861 Human DNA sequence from clone RP11-180I4 on chromosome 9" +FT /label=AL354861 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 1..21 +FT /note="match to AL139378 28666..28686 blast score 42.1 percent identity 100 AL139378 Human DNA sequence from clone RP11-271B5 on chromosome 13 Contains a gene for a protein similar to ribosomal protein S7, the FGF9 (fibroblast growth factor 9 (glia-activating factor)) gene, ESTs, STSs, GSSs and CpG islands." +FT /label=AL139378 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5783..5803 +FT /note="match to AL139163 15259..15279 blast score 42.1 percent identity 100 AL139163 Human DNA sequence from clone RP11-523O15 on chromosome 20 Contains GSSs and STSs." +FT /label=AL139163 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 3803..3823 +FT /note="match to AL136301 20782..20802 blast score 42.1 percent identity 100 AL136301 Human DNA sequence from clone RP11-195L15 on chromosome 13" +FT /label=AL136301 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5752..5784 +FT /note="match to AL133462 74511..74543 blast score 42.1 percent identity 91 AL133462 Human DNA sequence from clone RP11-108A16 on chromosome 20 Contains ESTs, STSs and GSSs." +FT /label=AL133462 +FT /score=91 +FT /colour=255 22 22 +FT BLASTN_HIT 334..358 +FT /note="match to AF238375 119422..119446 blast score 42.1 percent identity 96 AF238375 Homo sapiens chromosome 21 clone BAC 49B5 map 21q21, complete sequence." +FT /label=AF238375 +FT /score=96 +FT /colour=255 10 10 +FT BLASTN_HIT 1242..1262 +FT /note="match to AF130342 42069..42089 blast score 42.1 percent identity 100 AF130342 Homo sapiens chromosome 8 clone PAC 87.1 map 8q24.1, complete sequence." +FT /label=AF130342 +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 5752..5784 +FT /note="match to AC012380 49339..49371 blast score 42.1 percent identity 91 AC012380 Genomic Sequence For Homo sapiens Clone 125H5, Chromosome 20, complete sequence." +FT /label=AC012380 +FT /score=91 +FT /colour=255 22 22 +FT BLASTN_HIT 1230..1258 +FT /note="match to AC007392 135475..135503 blast score 42.1 percent identity 93 AC007392 Homo sapiens BAC clone RP11-444B4 from 2, complete sequence." +FT /label=AC007392 +FT /score=93 +FT /colour=255 17 17 +FT BLASTN_HIT 1414..1434 +FT /note="match to PCAROMX 4290..4310 blast score 42.1 percent identity 100 L18918 Pneumocystis carinii pentafunctional enzyme (arom) gene, complete cds." +FT /label=PCAROMX +FT /score=100 +FT /colour=255 0 0 +FT BLASTN_HIT 521..565 +FT /note="match to CH1457 66..110 blast score 42.1 percent identity 87 D10531 Cryptococcus humicolus 5S rRNA." +FT /label=CH1457 +FT /score=87 +FT /colour=255 33 33 diff --git a/etc/c1215.embl b/etc/c1215.embl new file mode 100644 index 000000000..5acb69e99 --- /dev/null +++ b/etc/c1215.embl @@ -0,0 +1,258 @@ +ID SPBC1215 standard; DNA; FUN; 6490 BP. +XX +AC AL096846; +XX +DE S.pombe chromosome II cosmid c1215. +XX +KW SURF-family protein; COX complex biogenesis; DEC1 homologue; +KW mitochondrial inheritance; actin cytoskeleton organisation. +XX +OS Schizosaccharomyces pombe (yeast) +OC Eukaryota; Plantae; Thallobionta; Eumycota; Hemiascomycetes; +OC Endomycetales; Saccharomycetaceae. +XX +RN [1] +RP 1-6490 +RA Lyne M.H., Rajandream M.A., Barrell B.G., Seeger K., Quail M., Harris D.; +RT ; +RL Submitted (16-JUL-1999) to the EMBL/GenBank/DDBJ databases. +RL European Schizosaccharomyces genome sequencing project, +RL Sanger Centre, The Wellcome Trust Genome Campus, Hinxton, +RL Cambridge CB10 1SA, E-mail: barrell@sanger.ac.uk and +XX +CC Notes: +CC +CC Details of yeast sequencing at the Sanger Centre are available on +CC the World Wide Web. +CC (URL, http://www.sanger.ac.uk/Projects/S_pombe/) +CC During 1995 to 1996 about 66% of S. pombe chromosome 1 was sequenced +CC by the Sanger Centre. The sequencing of the S. pombe genome is now +CC being continued with funding from The European Commission. +CC Fourteen European sequencing laboratories, including the Sanger Centre, +CC are participating in the project. +CC +CC Protein coding regions (CDS) have been predicted with the help +CC of computer analysis using the Genefinder program in PomBase +CC (an ACEDB database) with additional predictions for the +CC branch-acceptor sites supplied by the program Sp3splice. +CC CAUTION: It is possible that for any individual CDS we may have +CC underestimated or overestimated the number of introns/exons or +CC we may not have chosen the correct splice donor/acceptor sites. +CC +CC CDS are numbered using the following system eg SPBC25H2.01c. +CC SP (S. pombe), B (chromosome 2), c25H2 (cosmid name), +CC .01 (first CDS), c (complementary strand). +CC +CC The more significant matches with motifs in the PROSITE +CC database are also included but some of these may be fortuitous. +CC +CC The length in codons is given for each CDS. +CC +CC IMPORTANT: This sequence MAY NOT be the entire insert of +CC the sequenced clone. It may be shorter because we only +CC sequence overlapping sections once, or longer, because we +CC arrange for a small overlap between neighbouring submissions. +CC +CC Cosmid c1215 is overlapped at the 5' end by cosmid c1750, +CC EMBL entry SPAB4534, accession number AB004534, and at the 3' +CC end by cosmid c83, EMBL entry SPBC83, accession number AL035536. +XX +XX +FH Key Location/Qualifiers +FH +FT source 1..6490 +FT /organism="Schizosaccharomyces pombe" +FT /strain="972h-" +FT /chromosome="II" +FT /clone="cosmid c1215" +FT /map="IIL" +FT misc_feature complement(1..82) +FT /note="nominal overlap with cosmid SPAB4534 (c1750) S. +FT pombe chromosome 2" +FT tRNA 36..107 +FT /note="tRNA Thr anticodon TGT, Cove score 78.51" +FT rRNA 415..581 +FT /note="SPRG5SD K00771 Yeast (s.pombe) 5s rrna gene and +FT flanks" +FT CDS join(1501..1760,1844..2456) +FT /fasta_file="fasta/gf.tab.seq.00001.out" +FT /note="SPBC1215.01, len:290, SIMILARITY:Saccharomyces +FT cerevisiae, YG2X_YEAST, hypothetical 45.1 kd protein in +FT clb6-spt6 intergenic region, (389 aa), fasta scores: opt: +FT 385, E():2.8e-19, (29.0% identity in 314 aa)" +FT /gene="SPBC1215.01" +FT /product="putative SURF-family protein" +FT /colour=7 +FT /label=SPBC1215.01 +FT misc_feature 1761..1766 +FT /note="gtacgt, splice donor sequence" +FT /colour=6 +FT misc_feature 1827..1843 +FT /note="ctaacataatcacttag, splice branch and acceptor" +FT /colour=6 +FT CDS complement(join(2495..2602,2663..2881,2953..4071,4111..4372,4413..4849,4889..5007,5251..5389,5434..5466)) +FT /fasta_file="fasta/gf.tab.seq.00002.out" +FT /note="SPBC1215.02c, len:811, SIMILARITY:Saccharomyces +FT cerevisiae, DEC1_YEAST, dec1 protein, (796 aa), fasta +FT scores: opt: 184, E():0.00014, (23.4% identity in 577 aa)" +FT /gene="SPBC1215.02c" +FT /product="similar to yeast DEC1 mitochondrial inheritance +FT and actin cytoskeleton organisation protein" +FT /colour=7 +FT /label=SPBC1215.02c +FT misc_feature complement(2603..2612) +FT /note="ctaataatag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(2657..2662) +FT /note="gtacgt, splice donor sequence" +FT /colour=6 +FT misc_feature complement(2882..2896) +FT /note="ctaaccgaattatag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(2947..2952) +FT /note="gtaagt, splice donor sequence" +FT /colour=6 +FT misc_feature complement(4072..4085) +FT /note="ttaactcgtcgtag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(4105..4110) +FT /note="gtaagt, splice donor sequence" +FT /colour=6 +FT misc_feature complement(4373..4387) +FT /note="ctaacttctccatag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(4407..4412) +FT /note="gtaagt, splice donor sequence" +FT /colour=6 +FT misc_feature complement(4850..4861) +FT /note="ctaactcctcag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(4883..4888) +FT /note="gtaaga, splice donor sequence" +FT /colour=6 +FT misc_feature complement(5008..5021) +FT /note="ttaactatttgaag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(5245..5250) +FT /note="gtaagt, splice donor sequence" +FT /colour=6 +FT misc_feature complement(5390..5405) +FT /note="ttaacatcctttttag, splice branch and acceptor" +FT /colour=6 +FT misc_feature complement(5428..5433) +FT /note="gtaagt, splice donor sequence" +FT /colour=6 +FT misc_feature 6387..6490 +FT /note="nominal overlap with cosmid SPBC83 S. pombe +FT chromosome 2" +SQ Sequence 6490 BP; 2097 A; 1138 C; 1138 G; 2117 T; 0 other; + tatatataat ttaataaata cattccgacg atactgcctc tatggcttag tggtacagca 60 + tcgcacttgt aatgcgaaga tccttggttc gattccgagt ggaggcatat acattatatt 120 + atattctttt tcatgcggaa aaaagatttc aaatttttgg gtatgatatt aatatgactg 180 + taacgttaat agcaaagtga gtgttaataa tgataaaata gcagcaaaat ctcttttccg 240 + agtaagacgt tttccagtct aaatttggag tctgcagttg tttcgcaatt cttaatgtat 300 + ggttatacta aatacaaact ttaaagctct gatttatgtt tgcaataaac taaaataaaa 360 + gcacaaaaac ctttacccat taatttcaaa caacttataa actaccggta aacttttttt 420 + ctaaccttta taatttataa actagaatgt ttaatgtcta cggccatacc taggcgaaaa 480 + caccagttcc cgtccgatca ctgcagttaa gcgtctgagg gcctcgttag tactatggtt 540 + ggagacaaca tgggaatccg gggtgctgta ggctattttt ttatatccgt ctttcttact 600 + acttgcctaa caagtcatga tgtactctca aaatatgttt gcatgccttg taatattggt 660 + tatggatagc tccttctgga cttgatcttt tgtagccaag aacaatgggt atagactctg 720 + accttgtgat gttgtagcca cagattataa taggtatttt caagtacagt aacaaaaatc 780 + ttctagtttt tttttagaaa ggatacacca agtataagca aattcaggaa ttgttgatta 840 + aactgtcaac ttcggtaaaa ctttgggcat aagtagtgtg ggagcaagtt taactaaaat 900 + tctattcaga tgtcgaatcc aaaccgctaa ttttgctcaa ctagcttttc ataaaaacca 960 + attcatagtt tcatactaat aaagacgatt gtttacttta aaacatacgt cgtaagaaca 1020 + tatattgctt tatcgaaaga taacaaatgt taagctatta tattatttaa ctatagcgca 1080 + gatttcgctt cctttactta aaaaagacat gtgacttgta gaagcttgga gtgaatacgc 1140 + aaaggtacct acttagacat tcgcgtctct cttagctgtc aacatcaaca aactggcccc 1200 + gtattgaaca gtatcttact tgtcgaagga tttgactaag aaaattttat ttctttatag 1260 + caatattccg ttttcgctta gaagattcta gtcaattgcc ctattctact tacgctttac 1320 + agtagtatca gaagacctga gtgggatttt gctgctagta gaggccattc aagttaactc 1380 + cgttttgcaa cattttaaaa gtttttgaat tgaatataaa tatcaattgt ttgattcctt 1440 + ttaggattta atcttttctt tttatttttg tttcgattga atcttggatt cctgtctatc 1500 + atgttttggt ggaaaagtgc tactaaattc acattctcaa agcgtggacc gtgtgtcttt 1560 + cgctatttga gtactcttga aggaacaact gtgaggccta aaaaaaataa atttttagtt 1620 + ggattgcttt ctgccgttcc aattgtcacg tttgctttag gaacttggca ggtaaagcga 1680 + cgagaatgga aaatgggtat catcaataca ctcacggaaa ggcttcaaca gcccgcaatt 1740 + ttattaccga aaactgttac gtacgttaag ttaacatata cacaaattgc acgttttgca 1800 + attgaactgt cgttttttac attaagctaa cataatcact tagagagcaa gatacaaaaa 1860 + aacttgagtg gactagggtt ttgcttcgtg gtgtgttttg tcacgaccaa gaaatgttgg 1920 + tcggtccaag aacgaaggaa ggccaacctg gctatcacgt agtaacccca tttattttag 1980 + acgatgggcg tcgaatttta gtcaacagag gatggattgc tcgatcattt gctgaacagt 2040 + cttctcgaga tcctagttct ttacctaaag gtccagtggt cattgaaggt cttttgagac 2100 + aacatactga taagccaaga tttatgatga agaatgagcc tgaaaaaaat tctttttact 2160 + tcttaaatgt tcgtgagttt gcacaattga aaggaactct ccccattttg ataacagaac 2220 + tacaaccatc gcttacaccg ttgcaagaag ccgatcatgt taagagaggc ttgcctcttg 2280 + gtcatcctct aaaagttgaa attttcaaca gtcatacaga atatattatc acttggtatt 2340 + ctctaagtgt ggtatcagct ataatgcttt acgtctattt taagagaggt tcaggcacat 2400 + cttctctgaa ttctgcatac gaaagaagca agattctaaa caacaaacga ttataaaaaa 2460 + ttttcatatt tataagtttc taaatattat ctacctaaaa ttttacaaat tttggaagct 2520 + tgcttactgc gtccgtcgtt tgaatgtatg aatcgatcat tccttcacca acttgttttg 2580 + caaacttcgg atcgtaagga acctattatt aggaagttag ttctcatgcc tataatttta 2640 + atgctctata atcatcacgt acctgagttt cagataaatt gctcagccaa gagtttgaca 2700 + acaattctga tacatatttt ctggcggcct tctttttatg cttcgtaatt ccagagatac 2760 + ttcctaattt gttactgctg atgtttttaa gaagttggta ttgtctggta aattcttttt 2820 + tcttggtagc tgacacgtga tataggaagc tgtttagaca agtgataagg tcatttatga 2880 + tctataattc ggttagttta gaaattttta tatcattttt tttaaaaaaa aaaaccagtt 2940 + tggtaaactt acttcagtgt actttgtcaa ttgacttaaa ggcgtggagt tctcataatc 3000 + gaatgactca attaaatttt caatcgtttc gaacgaggaa ttttcgtagt ctccgttctt 3060 + gacctttacc gaaagtaatc ccagttggat caataatttc atatgaacaa tttcttccga 3120 + agttaattgc ttcgataaat cattgttttc gcacaaaact tccatttcct tagcacttaa 3180 + aacggccttt tcaaaatcgc cgtttactat gctgtcttga acgagagaat gaccaatgac 3240 + agtcaaatgg atccaaagcg tgtccggttt aggcgaattt cttaaacttt cttcaactgt 3300 + tggcaattta tcagatccat aatctgcaaa gacctttaaa tctcgattat ctttcggaga 3360 + tgaacatttg ggaagatact gtttgggtgg tttaaaagcg gtaagataat gtatcctagc 3420 + ccgctcgacc aaagaaatgc ttttccaggt actgtggtct aaacgggatc ggaaattacg 3480 + catatcttcg atttgagagt aagcaccatc ttcataagcc atagaaatca tctctggtgt 3540 + ttcaaactca ttcgaaccat atattttgag acttgagtta atatagtgag aagtaacaga 3600 + agatggataa taggtagtag cacgagtcaa gagataatga tcaagggtat cgttttgaat 3660 + ttgcttaatg gacatagtgt cgtaaacttt agcagcagca gggaagcctc catcaagaag 3720 + aagatataaa cgaataaggg gtagctttaa atgaaagtta tgttgactat aagtaatgcc 3780 + tttttctaaa agacagattg cgtcaaaaat taaagcttgt ttttcggcag gttttaaatc 3840 + cttattcccc tcccacatat atatcaatga atgaactgct aataacaaag cttcataacc 3900 + gtgcgtaaag tcagtgggta ataagccttt acttaaagac aaaccctttt caaatgcgac 3960 + gaagcatcta cgcacgtaat cgacaaccga ttctgcagta aacgactcaa agagcaaaaa 4020 + atggatcttc agaagcaaaa cctcagcata taatttatcg actttttgag actacgacga 4080 + gttaatattg aaagatgaat aaatacttac ttcattggat tcacctagat cagccaactt 4140 + aaatgcatct aataaccggt gttgtgcatc aacattcagc ttcaatagat aaggtctcaa 4200 + atcttcaaaa acaattggtt tcatatacag ctttttgata tagccaagta atgctgattc 4260 + gtgttcttca ggaaaaaacc gtgcgctggc ttcaatccaa agtaaatgaa gatttctttt 4320 + tgtgctgctg gttgacaacg ctttcaatat acaatccttt aatgggacta atctatggag 4380 + aagttagtaa taatgcaaaa aaaaaaactt actttgaatc atcattggaa gcactatcca 4440 + gcaaagcttt gcaaaccttc caatcagtat tcccagtttg gaaaagagaa agcgaaaacg 4500 + tgaataaaga atcccaacgc gcacaggaag caagcaattc aagcttcctc aaaagaaggt 4560 + cggcgtcagc atcaacaaag cgatcagcat cttgatgtat taaagcatct aacgctctgt 4620 + ccttgtctcc cactaaaagc aacacgtcta aataaagatg aaactcctca caagaatcga 4680 + tataacctgt tggtttttcg aaaatgagtt tagcagtttt ttcagctagt gctttcagca 4740 + aacgttgttc aacctcattt tccgactttt tggacaaaag atacaaagat gagataaccc 4800 + ataaggtatg tttcctagaa ggaaagttct tttgcaattc tacagcagcc tgaggagtta 4860 + gtaaaaaaaa aacaaattaa gatcttacct ttctttggtg agacaatgat ttgatgcgaa 4920 + tagatgcttt gaagtaagct aataagtttt tttcctgctt tccataagtt tgcaagaact 4980 + tttcccaaaa tacaaacgat tcttctcctt caaatagtta ataacttaaa agtaagaggg 5040 + taaaaacaag tccattgaga aataaaacgt tgcacttgaa tcatcaagct acgaaaagaa 5100 + caaagatcgt ttttcttaag caaagtttaa ccgatcaaat aactaaagcc tttatctcaa 5160 + ggaaatagta gaatattcaa aataaaaaat acgaccaaag tgctatcaac atttatgttc 5220 + atctgttcaa tagaacctaa ttatacttac ccttcttttg atcatcataa acagcttgta 5280 + taatgtctaa aagttccaag ctgttgatgg gagtcgattt taacggttct aaaagtgcta 5340 + gagcctcggg accacgtcct gcctgagcca aggataacgc tgaataaacc taaaaaggat 5400 + gttaacagct aaaaacataa ctcgattact tacaattgtt gattctttac tcccagaacg 5460 + acgcattgta gtaggcaatg aaattaaagc ccaaacagta gtcagaagtt ggtaggtgtt 5520 + gcagtcaaat tattattcta cagaggagaa tattatagcc agcgtggtag aatctggata 5580 + tatatctact gcaaaagtgt aattgcattg gtttaaaggg tatactatgg ttaagtaata 5640 + tattcacagc tgtacaattt acagtcataa ctaaaacttc cttaagccgt aaagaaatac 5700 + ctggtgttgt aaaatttgtt gtatatccac ggcatggtca tataatgtga ttttgtgctc 5760 + aaataaatat aaaatatgca taatttttgt acatttaatt tgagaaaccc atcttttgtt 5820 + gagaggctgt caatgaatag cagtttcatt gaaaagcagc gggatgacca gaaaagtatt 5880 + ttacaatggc aagggagtag aaagctagcg taatattcag aaagctaggt aattgagcaa 5940 + tcctttaatt cattgctaag catgctaggt aaacgcagta aacctttcag ttttcattta 6000 + ggtataaggc tgtttaatga gtatctccac taaatttaaa gatcaaaact cagtatcaat 6060 + tcttaaaagt tttattttat ttaataatca tatacttctc ataatctttc aattttttcc 6120 + ccattttgat gatattttta ttaatcctac agtaagctct atgatatcgt tattcttcaa 6180 + ataggctggt cagcacgtgg acggtgttac ttatcgttaa ataaatcgta ctaaggaggt 6240 + gcgatgtaaa tgatatgctt gtcaagtatt aactgctctc caccaaccgc cggtttaact 6300 + gattattgtt gaaaagcgca gacgaagttt agagaattac tagcgtattt taaatttaat 6360 + caacggacta ttttttattc ctttgagatc cgactttatc gctttgcttc taattttcca 6420 + aaattcagtc tatctacgcg atccagccct gtttgcgtaa atttcatatt atttttcttt 6480 + aaacgtttgg 6490 +// diff --git a/etc/c1215.genbank b/etc/c1215.genbank new file mode 100644 index 000000000..9e3c3d873 --- /dev/null +++ b/etc/c1215.genbank @@ -0,0 +1,277 @@ +LOCUS SPBC1215 6490 bp DNA PLN 16-JUL-1999 +DEFINITION S.pombe chromosome II cosmid c1215. +ACCESSION AL096846 +VERSION AL096846.1 GI:5531459 +KEYWORDS actin cytoskeleton organisation; COX complex biogenesis; DEC1 + homologue; mitochondrial inheritance; SURF-family protein. +SOURCE fission yeast. + ORGANISM Schizosaccharomyces pombe + Eukaryota; Fungi; Ascomycota; Schizosaccharomycetes; + Schizosaccharomycetales; Schizosaccharomycetaceae; + Schizosaccharomyces. +REFERENCE 1 (bases 1 to 6490) + AUTHORS Lyne,M.H., Rajandream,M.A., Barrell,B.G., Seeger,K., Quail,M. and + Harris,D. + TITLE Direct Submission + JOURNAL Submitted (16-JUL-1999) European Schizosaccharomyces genome + sequencing project, Sanger Centre, The Wellcome Trust Genome + Campus, Hinxton, Cambridge CB10 1SA, E-mail: barrell@sanger.ac.uk + and +COMMENT Notes: + Details of yeast sequencing at the Sanger Centre are available on + the World Wide Web. + (URL, http://www.sanger.ac.uk/Projects/S_pombe/) + During 1995 to 1996 about 66% of S. pombe chromosome 1 was + sequenced by the Sanger Centre. The sequencing of the S. pombe + genome is now being continued with funding from The European + Commission. Fourteen European sequencing laboratories, including + the Sanger Centre, are participating in the project. + Protein coding regions (CDS) have been predicted with the help of + computer analysis using the Genefinder program in PomBase (an ACEDB + database) with additional predictions for the branch-acceptor sites + supplied by the program Sp3splice. CAUTION: It is possible that for + any individual CDS we may have underestimated or overestimated the + number of introns/exons or we may not have chosen the correct + splice donor/acceptor sites. + CDS are numbered using the following system eg SPBC25H2.01c. SP (S. + pombe), B (chromosome 2), c25H2 (cosmid name), .01 (first CDS), c + (complementary strand). + The more significant matches with motifs in the PROSITE database + are also included but some of these may be fortuitous. + The length in codons is given for each CDS. + IMPORTANT: This sequence MAY NOT be the entire insert of the + sequenced clone. It may be shorter because we only sequence + overlapping sections once, or longer, because we arrange for a + small overlap between neighbouring submissions. + Cosmid c1215 is overlapped at the 5' end by cosmid c1750, EMBL + entry SPAB4534, accession number AB004534, and at the 3' end by + cosmid c83, EMBL entry SPBC83, accession number AL035536. +FEATURES Location/Qualifiers + source 1..6490 + /organism="Schizosaccharomyces pombe" + /strain="972h-" + /db_xref="taxon:4896" + /chromosome="II" + /map="IIL" + /clone="cosmid c1215" + misc_feature complement(1..82) + /note="nominal overlap with cosmid SPAB4534 (c1750) S. + pombe chromosome 2" + tRNA 36..107 + /note="tRNA Thr anticodon TGT, Cove score 78.51" + /product="tRNA-Thr" + rRNA 415..581 + /note="SPRG5SD K00771 Yeast (s.pombe) 5s rrna gene and + flanks" + gene join(1501..1760,1844..2456) + /gene="SPBC1215.01" + CDS join(1501..1760,1844..2456) + /gene="SPBC1215.01" + /note="SPBC1215.01, len:290, SIMILARITY:Saccharomyces + cerevisiae, YG2X_YEAST, hypothetical 45.1 kd protein in + clb6-spt6 intergenic region, (389 aa), fasta scores: opt: + 385, E():2.8e-19, (29.0% identity in 314 aa)" + /codon_start=1 + /label=SPBC1215.01 + /product="putative SURF-family protein" + /protein_id="CAB50922.1" + /db_xref="GI:5531460" + /translation="MFWWKSATKFTFSKRGPCVFRYLSTLEGTTVRPKKNKFLVGLLS + AVPIVTFALGTWQVKRREWKMGIINTLTERLQQPAILLPKTVTEQDTKKLEWTRVLLR + GVFCHDQEMLVGPRTKEGQPGYHVVTPFILDDGRRILVNRGWIARSFAEQSSRDPSSL + PKGPVVIEGLLRQHTDKPRFMMKNEPEKNSFYFLNVREFAQLKGTLPILITELQPSLT + PLQEADHVKRGLPLGHPLKVEIFNSHTEYIITWYSLSVVSAIMLYVYFKRGSGTSSLN + SAYERSKILNNKRL" + misc_feature 1761..1766 + /gene="SPBC1215.01" + /note="gtacgt, splice donor sequence" + misc_feature 1827..1843 + /gene="SPBC1215.01" + /note="ctaacataatcacttag, splice branch and acceptor" + gene complement(join(2495..2602,2663..2881,2953..4071, + 4111..4372,4413..4849,4889..5007,5251..5389,5434..5466)) + /gene="SPBC1215.02c" + CDS complement(join(2495..2602,2663..2881,2953..4071, + 4111..4372,4413..4849,4889..5007,5251..5389,5434..5466)) + /gene="SPBC1215.02c" + /note="SPBC1215.02c, len:811, SIMILARITY:Saccharomyces + cerevisiae, DEC1_YEAST, dec1 protein, (796 aa), fasta + scores: opt: 184, E():0.00014, (23.4% identity in 577 aa)" + /codon_start=1 + /label=SPBC1215.02c + /product="similar to yeast DEC1 mitochondrial inheritance + and actin cytoskeleton organisation protein" + /protein_id="CAB50923.1" + /db_xref="GI:5531461" + /translation="MRRSGSKESTIVYSALSLAQAGRGPEALALLEPLKSTPINSLEL + LDIIQAVYDDQKKGEESFVFWEKFLQTYGKQEKNLLAYFKASIRIKSLSHQRKAAVEL + QKNFPSRKHTLWVISSLYLLSKKSENEVEQRLLKALAEKTAKLIFEKPTGYIDSCEEF + HLYLDVLLLVGDKDRALDALIHQDADRFVDADADLLLRKLELLASCARWDSLFTFSLS + LFQTGNTDWKVCKALLDSASNDDSKLVPLKDCILKALSTSSTKRNLHLLWIEASARFF + PEEHESALLGYIKKLYMKPIVFEDLRPYLLKLNVDAQHRLLDAFKLADLGESNESQKV + DKLYAEVLLLKIHFLLFESFTAESVVDYVRRCFVAFEKGLSLSKGLLPTDFTHGYEAL + LLAVHSLIYMWEGNKDLKPAEKQALIFDAICLLEKGITYSQHNFHLKLPLIRLYLLLD + GGFPAAAKVYDTMSIKQIQNDTLDHYLLTRATTYYPSSVTSHYINSSLKIYGSNEFET + PEMISMAYEDGAYSQIEDMRNFRSRLDHSTWKSISLVERARIHYLTAFKPPKQYLPKC + SSPKDNRDLKVFADYGSDKLPTVEESLRNSPKPDTLWIHLTVIGHSLVQDSIVNGDFE + KAVLSAKEMEVLCENNDLSKQLTSEEIVHMKLLIQLGLLSVKVKNGDYENSSFETIEN + LIESFDYENSTPLSQLTKYTEIINDLITCLNSFLYHVSATKKKEFTRQYQLLKNISSN + KLGSISGITKHKKKAARKYVSELLSNSWLSNLSETQVPYDPKFAKQVGEGMIDSYIQT + TDAVSKLPKFVKF" + misc_feature complement(2603..2612) + /gene="SPBC1215.02c" + /note="ctaataatag, splice branch and acceptor" + misc_feature complement(2657..2662) + /gene="SPBC1215.02c" + /note="gtacgt, splice donor sequence" + misc_feature complement(2882..2896) + /gene="SPBC1215.02c" + /note="ctaaccgaattatag, splice branch and acceptor" + misc_feature complement(2947..2952) + /gene="SPBC1215.02c" + /note="gtaagt, splice donor sequence" + misc_feature complement(4072..4085) + /gene="SPBC1215.02c" + /note="ttaactcgtcgtag, splice branch and acceptor" + misc_feature complement(4105..4110) + /gene="SPBC1215.02c" + /note="gtaagt, splice donor sequence" + misc_feature complement(4373..4387) + /gene="SPBC1215.02c" + /note="ctaacttctccatag, splice branch and acceptor" + misc_feature complement(4407..4412) + /gene="SPBC1215.02c" + /note="gtaagt, splice donor sequence" + misc_feature complement(4850..4861) + /gene="SPBC1215.02c" + /note="ctaactcctcag, splice branch and acceptor" + misc_feature complement(4883..4888) + /gene="SPBC1215.02c" + /note="gtaaga, splice donor sequence" + misc_feature complement(5008..5021) + /gene="SPBC1215.02c" + /note="ttaactatttgaag, splice branch and acceptor" + misc_feature complement(5245..5250) + /gene="SPBC1215.02c" + /note="gtaagt, splice donor sequence" + misc_feature complement(5390..5405) + /gene="SPBC1215.02c" + /note="ttaacatcctttttag, splice branch and acceptor" + misc_feature complement(5428..5433) + /gene="SPBC1215.02c" + /note="gtaagt, splice donor sequence" + misc_feature 6387..6490 + /note="nominal overlap with cosmid SPBC83 S. pombe + chromosome 2" +BASE COUNT 2097 a 1138 c 1138 g 2117 t +ORIGIN + 1 tatatataat ttaataaata cattccgacg atactgcctc tatggcttag tggtacagca + 61 tcgcacttgt aatgcgaaga tccttggttc gattccgagt ggaggcatat acattatatt + 121 atattctttt tcatgcggaa aaaagatttc aaatttttgg gtatgatatt aatatgactg + 181 taacgttaat agcaaagtga gtgttaataa tgataaaata gcagcaaaat ctcttttccg + 241 agtaagacgt tttccagtct aaatttggag tctgcagttg tttcgcaatt cttaatgtat + 301 ggttatacta aatacaaact ttaaagctct gatttatgtt tgcaataaac taaaataaaa + 361 gcacaaaaac ctttacccat taatttcaaa caacttataa actaccggta aacttttttt + 421 ctaaccttta taatttataa actagaatgt ttaatgtcta cggccatacc taggcgaaaa + 481 caccagttcc cgtccgatca ctgcagttaa gcgtctgagg gcctcgttag tactatggtt + 541 ggagacaaca tgggaatccg gggtgctgta ggctattttt ttatatccgt ctttcttact + 601 acttgcctaa caagtcatga tgtactctca aaatatgttt gcatgccttg taatattggt + 661 tatggatagc tccttctgga cttgatcttt tgtagccaag aacaatgggt atagactctg + 721 accttgtgat gttgtagcca cagattataa taggtatttt caagtacagt aacaaaaatc + 781 ttctagtttt tttttagaaa ggatacacca agtataagca aattcaggaa ttgttgatta + 841 aactgtcaac ttcggtaaaa ctttgggcat aagtagtgtg ggagcaagtt taactaaaat + 901 tctattcaga tgtcgaatcc aaaccgctaa ttttgctcaa ctagcttttc ataaaaacca + 961 attcatagtt tcatactaat aaagacgatt gtttacttta aaacatacgt cgtaagaaca + 1021 tatattgctt tatcgaaaga taacaaatgt taagctatta tattatttaa ctatagcgca + 1081 gatttcgctt cctttactta aaaaagacat gtgacttgta gaagcttgga gtgaatacgc + 1141 aaaggtacct acttagacat tcgcgtctct cttagctgtc aacatcaaca aactggcccc + 1201 gtattgaaca gtatcttact tgtcgaagga tttgactaag aaaattttat ttctttatag + 1261 caatattccg ttttcgctta gaagattcta gtcaattgcc ctattctact tacgctttac + 1321 agtagtatca gaagacctga gtgggatttt gctgctagta gaggccattc aagttaactc + 1381 cgttttgcaa cattttaaaa gtttttgaat tgaatataaa tatcaattgt ttgattcctt + 1441 ttaggattta atcttttctt tttatttttg tttcgattga atcttggatt cctgtctatc + 1501 atgttttggt ggaaaagtgc tactaaattc acattctcaa agcgtggacc gtgtgtcttt + 1561 cgctatttga gtactcttga aggaacaact gtgaggccta aaaaaaataa atttttagtt + 1621 ggattgcttt ctgccgttcc aattgtcacg tttgctttag gaacttggca ggtaaagcga + 1681 cgagaatgga aaatgggtat catcaataca ctcacggaaa ggcttcaaca gcccgcaatt + 1741 ttattaccga aaactgttac gtacgttaag ttaacatata cacaaattgc acgttttgca + 1801 attgaactgt cgttttttac attaagctaa cataatcact tagagagcaa gatacaaaaa + 1861 aacttgagtg gactagggtt ttgcttcgtg gtgtgttttg tcacgaccaa gaaatgttgg + 1921 tcggtccaag aacgaaggaa ggccaacctg gctatcacgt agtaacccca tttattttag + 1981 acgatgggcg tcgaatttta gtcaacagag gatggattgc tcgatcattt gctgaacagt + 2041 cttctcgaga tcctagttct ttacctaaag gtccagtggt cattgaaggt cttttgagac + 2101 aacatactga taagccaaga tttatgatga agaatgagcc tgaaaaaaat tctttttact + 2161 tcttaaatgt tcgtgagttt gcacaattga aaggaactct ccccattttg ataacagaac + 2221 tacaaccatc gcttacaccg ttgcaagaag ccgatcatgt taagagaggc ttgcctcttg + 2281 gtcatcctct aaaagttgaa attttcaaca gtcatacaga atatattatc acttggtatt + 2341 ctctaagtgt ggtatcagct ataatgcttt acgtctattt taagagaggt tcaggcacat + 2401 cttctctgaa ttctgcatac gaaagaagca agattctaaa caacaaacga ttataaaaaa + 2461 ttttcatatt tataagtttc taaatattat ctacctaaaa ttttacaaat tttggaagct + 2521 tgcttactgc gtccgtcgtt tgaatgtatg aatcgatcat tccttcacca acttgttttg + 2581 caaacttcgg atcgtaagga acctattatt aggaagttag ttctcatgcc tataatttta + 2641 atgctctata atcatcacgt acctgagttt cagataaatt gctcagccaa gagtttgaca + 2701 acaattctga tacatatttt ctggcggcct tctttttatg cttcgtaatt ccagagatac + 2761 ttcctaattt gttactgctg atgtttttaa gaagttggta ttgtctggta aattcttttt + 2821 tcttggtagc tgacacgtga tataggaagc tgtttagaca agtgataagg tcatttatga + 2881 tctataattc ggttagttta gaaattttta tatcattttt tttaaaaaaa aaaaccagtt + 2941 tggtaaactt acttcagtgt actttgtcaa ttgacttaaa ggcgtggagt tctcataatc + 3001 gaatgactca attaaatttt caatcgtttc gaacgaggaa ttttcgtagt ctccgttctt + 3061 gacctttacc gaaagtaatc ccagttggat caataatttc atatgaacaa tttcttccga + 3121 agttaattgc ttcgataaat cattgttttc gcacaaaact tccatttcct tagcacttaa + 3181 aacggccttt tcaaaatcgc cgtttactat gctgtcttga acgagagaat gaccaatgac + 3241 agtcaaatgg atccaaagcg tgtccggttt aggcgaattt cttaaacttt cttcaactgt + 3301 tggcaattta tcagatccat aatctgcaaa gacctttaaa tctcgattat ctttcggaga + 3361 tgaacatttg ggaagatact gtttgggtgg tttaaaagcg gtaagataat gtatcctagc + 3421 ccgctcgacc aaagaaatgc ttttccaggt actgtggtct aaacgggatc ggaaattacg + 3481 catatcttcg atttgagagt aagcaccatc ttcataagcc atagaaatca tctctggtgt + 3541 ttcaaactca ttcgaaccat atattttgag acttgagtta atatagtgag aagtaacaga + 3601 agatggataa taggtagtag cacgagtcaa gagataatga tcaagggtat cgttttgaat + 3661 ttgcttaatg gacatagtgt cgtaaacttt agcagcagca gggaagcctc catcaagaag + 3721 aagatataaa cgaataaggg gtagctttaa atgaaagtta tgttgactat aagtaatgcc + 3781 tttttctaaa agacagattg cgtcaaaaat taaagcttgt ttttcggcag gttttaaatc + 3841 cttattcccc tcccacatat atatcaatga atgaactgct aataacaaag cttcataacc + 3901 gtgcgtaaag tcagtgggta ataagccttt acttaaagac aaaccctttt caaatgcgac + 3961 gaagcatcta cgcacgtaat cgacaaccga ttctgcagta aacgactcaa agagcaaaaa + 4021 atggatcttc agaagcaaaa cctcagcata taatttatcg actttttgag actacgacga + 4081 gttaatattg aaagatgaat aaatacttac ttcattggat tcacctagat cagccaactt + 4141 aaatgcatct aataaccggt gttgtgcatc aacattcagc ttcaatagat aaggtctcaa + 4201 atcttcaaaa acaattggtt tcatatacag ctttttgata tagccaagta atgctgattc + 4261 gtgttcttca ggaaaaaacc gtgcgctggc ttcaatccaa agtaaatgaa gatttctttt + 4321 tgtgctgctg gttgacaacg ctttcaatat acaatccttt aatgggacta atctatggag + 4381 aagttagtaa taatgcaaaa aaaaaaactt actttgaatc atcattggaa gcactatcca + 4441 gcaaagcttt gcaaaccttc caatcagtat tcccagtttg gaaaagagaa agcgaaaacg + 4501 tgaataaaga atcccaacgc gcacaggaag caagcaattc aagcttcctc aaaagaaggt + 4561 cggcgtcagc atcaacaaag cgatcagcat cttgatgtat taaagcatct aacgctctgt + 4621 ccttgtctcc cactaaaagc aacacgtcta aataaagatg aaactcctca caagaatcga + 4681 tataacctgt tggtttttcg aaaatgagtt tagcagtttt ttcagctagt gctttcagca + 4741 aacgttgttc aacctcattt tccgactttt tggacaaaag atacaaagat gagataaccc + 4801 ataaggtatg tttcctagaa ggaaagttct tttgcaattc tacagcagcc tgaggagtta + 4861 gtaaaaaaaa aacaaattaa gatcttacct ttctttggtg agacaatgat ttgatgcgaa + 4921 tagatgcttt gaagtaagct aataagtttt tttcctgctt tccataagtt tgcaagaact + 4981 tttcccaaaa tacaaacgat tcttctcctt caaatagtta ataacttaaa agtaagaggg + 5041 taaaaacaag tccattgaga aataaaacgt tgcacttgaa tcatcaagct acgaaaagaa + 5101 caaagatcgt ttttcttaag caaagtttaa ccgatcaaat aactaaagcc tttatctcaa + 5161 ggaaatagta gaatattcaa aataaaaaat acgaccaaag tgctatcaac atttatgttc + 5221 atctgttcaa tagaacctaa ttatacttac ccttcttttg atcatcataa acagcttgta + 5281 taatgtctaa aagttccaag ctgttgatgg gagtcgattt taacggttct aaaagtgcta + 5341 gagcctcggg accacgtcct gcctgagcca aggataacgc tgaataaacc taaaaaggat + 5401 gttaacagct aaaaacataa ctcgattact tacaattgtt gattctttac tcccagaacg + 5461 acgcattgta gtaggcaatg aaattaaagc ccaaacagta gtcagaagtt ggtaggtgtt + 5521 gcagtcaaat tattattcta cagaggagaa tattatagcc agcgtggtag aatctggata + 5581 tatatctact gcaaaagtgt aattgcattg gtttaaaggg tatactatgg ttaagtaata + 5641 tattcacagc tgtacaattt acagtcataa ctaaaacttc cttaagccgt aaagaaatac + 5701 ctggtgttgt aaaatttgtt gtatatccac ggcatggtca tataatgtga ttttgtgctc + 5761 aaataaatat aaaatatgca taatttttgt acatttaatt tgagaaaccc atcttttgtt + 5821 gagaggctgt caatgaatag cagtttcatt gaaaagcagc gggatgacca gaaaagtatt + 5881 ttacaatggc aagggagtag aaagctagcg taatattcag aaagctaggt aattgagcaa + 5941 tcctttaatt cattgctaag catgctaggt aaacgcagta aacctttcag ttttcattta + 6001 ggtataaggc tgtttaatga gtatctccac taaatttaaa gatcaaaact cagtatcaat + 6061 tcttaaaagt tttattttat ttaataatca tatacttctc ataatctttc aattttttcc + 6121 ccattttgat gatattttta ttaatcctac agtaagctct atgatatcgt tattcttcaa + 6181 ataggctggt cagcacgtgg acggtgttac ttatcgttaa ataaatcgta ctaaggaggt + 6241 gcgatgtaaa tgatatgctt gtcaagtatt aactgctctc caccaaccgc cggtttaact + 6301 gattattgtt gaaaagcgca gacgaagttt agagaattac tagcgtattt taaatttaat + 6361 caacggacta ttttttattc ctttgagatc cgactttatc gctttgcttc taattttcca + 6421 aaattcagtc tatctacgcg atccagccct gtttgcgtaa atttcatatt atttttcttt + 6481 aaacgtttgg +// diff --git a/etc/c1215.seq b/etc/c1215.seq new file mode 100644 index 000000000..94d788aba --- /dev/null +++ b/etc/c1215.seq @@ -0,0 +1,110 @@ +>all bases +tatatataatttaataaatacattccgacgatactgcctctatggcttagtggtacagca +tcgcacttgtaatgcgaagatccttggttcgattccgagtggaggcatatacattatatt +atattctttttcatgcggaaaaaagatttcaaatttttgggtatgatattaatatgactg +taacgttaatagcaaagtgagtgttaataatgataaaatagcagcaaaatctcttttccg +agtaagacgttttccagtctaaatttggagtctgcagttgtttcgcaattcttaatgtat +ggttatactaaatacaaactttaaagctctgatttatgtttgcaataaactaaaataaaa +gcacaaaaacctttacccattaatttcaaacaacttataaactaccggtaaacttttttt +ctaacctttataatttataaactagaatgtttaatgtctacggccatacctaggcgaaaa +caccagttcccgtccgatcactgcagttaagcgtctgagggcctcgttagtactatggtt +ggagacaacatgggaatccggggtgctgtaggctatttttttatatccgtctttcttact +acttgcctaacaagtcatgatgtactctcaaaatatgtttgcatgccttgtaatattggt +tatggatagctccttctggacttgatcttttgtagccaagaacaatgggtatagactctg +accttgtgatgttgtagccacagattataataggtattttcaagtacagtaacaaaaatc +ttctagtttttttttagaaaggatacaccaagtataagcaaattcaggaattgttgatta +aactgtcaacttcggtaaaactttgggcataagtagtgtgggagcaagtttaactaaaat +tctattcagatgtcgaatccaaaccgctaattttgctcaactagcttttcataaaaacca +attcatagtttcatactaataaagacgattgtttactttaaaacatacgtcgtaagaaca +tatattgctttatcgaaagataacaaatgttaagctattatattatttaactatagcgca +gatttcgcttcctttacttaaaaaagacatgtgacttgtagaagcttggagtgaatacgc +aaaggtacctacttagacattcgcgtctctcttagctgtcaacatcaacaaactggcccc +gtattgaacagtatcttacttgtcgaaggatttgactaagaaaattttatttctttatag +caatattccgttttcgcttagaagattctagtcaattgccctattctacttacgctttac +agtagtatcagaagacctgagtgggattttgctgctagtagaggccattcaagttaactc +cgttttgcaacattttaaaagtttttgaattgaatataaatatcaattgtttgattcctt +ttaggatttaatcttttctttttatttttgtttcgattgaatcttggattcctgtctatc +atgttttggtggaaaagtgctactaaattcacattctcaaagcgtggaccgtgtgtcttt +cgctatttgagtactcttgaaggaacaactgtgaggcctaaaaaaaataaatttttagtt +ggattgctttctgccgttccaattgtcacgtttgctttaggaacttggcaggtaaagcga +cgagaatggaaaatgggtatcatcaatacactcacggaaaggcttcaacagcccgcaatt +ttattaccgaaaactgttacgtacgttaagttaacatatacacaaattgcacgttttgca +attgaactgtcgttttttacattaagctaacataatcacttagagagcaagatacaaaaa +aacttgagtggactagggttttgcttcgtggtgtgttttgtcacgaccaagaaatgttgg +tcggtccaagaacgaaggaaggccaacctggctatcacgtagtaaccccatttattttag +acgatgggcgtcgaattttagtcaacagaggatggattgctcgatcatttgctgaacagt +cttctcgagatcctagttctttacctaaaggtccagtggtcattgaaggtcttttgagac +aacatactgataagccaagatttatgatgaagaatgagcctgaaaaaaattctttttact +tcttaaatgttcgtgagtttgcacaattgaaaggaactctccccattttgataacagaac +tacaaccatcgcttacaccgttgcaagaagccgatcatgttaagagaggcttgcctcttg +gtcatcctctaaaagttgaaattttcaacagtcatacagaatatattatcacttggtatt +ctctaagtgtggtatcagctataatgctttacgtctattttaagagaggttcaggcacat +cttctctgaattctgcatacgaaagaagcaagattctaaacaacaaacgattataaaaaa +ttttcatatttataagtttctaaatattatctacctaaaattttacaaattttggaagct +tgcttactgcgtccgtcgtttgaatgtatgaatcgatcattccttcaccaacttgttttg +caaacttcggatcgtaaggaacctattattaggaagttagttctcatgcctataatttta +atgctctataatcatcacgtacctgagtttcagataaattgctcagccaagagtttgaca +acaattctgatacatattttctggcggccttctttttatgcttcgtaattccagagatac +ttcctaatttgttactgctgatgtttttaagaagttggtattgtctggtaaattcttttt +tcttggtagctgacacgtgatataggaagctgtttagacaagtgataaggtcatttatga +tctataattcggttagtttagaaatttttatatcattttttttaaaaaaaaaaaccagtt +tggtaaacttacttcagtgtactttgtcaattgacttaaaggcgtggagttctcataatc +gaatgactcaattaaattttcaatcgtttcgaacgaggaattttcgtagtctccgttctt +gacctttaccgaaagtaatcccagttggatcaataatttcatatgaacaatttcttccga +agttaattgcttcgataaatcattgttttcgcacaaaacttccatttccttagcacttaa +aacggccttttcaaaatcgccgtttactatgctgtcttgaacgagagaatgaccaatgac +agtcaaatggatccaaagcgtgtccggtttaggcgaatttcttaaactttcttcaactgt +tggcaatttatcagatccataatctgcaaagacctttaaatctcgattatctttcggaga +tgaacatttgggaagatactgtttgggtggtttaaaagcggtaagataatgtatcctagc +ccgctcgaccaaagaaatgcttttccaggtactgtggtctaaacgggatcggaaattacg +catatcttcgatttgagagtaagcaccatcttcataagccatagaaatcatctctggtgt +ttcaaactcattcgaaccatatattttgagacttgagttaatatagtgagaagtaacaga +agatggataataggtagtagcacgagtcaagagataatgatcaagggtatcgttttgaat +ttgcttaatggacatagtgtcgtaaactttagcagcagcagggaagcctccatcaagaag +aagatataaacgaataaggggtagctttaaatgaaagttatgttgactataagtaatgcc +tttttctaaaagacagattgcgtcaaaaattaaagcttgtttttcggcaggttttaaatc +cttattcccctcccacatatatatcaatgaatgaactgctaataacaaagcttcataacc +gtgcgtaaagtcagtgggtaataagcctttacttaaagacaaacccttttcaaatgcgac +gaagcatctacgcacgtaatcgacaaccgattctgcagtaaacgactcaaagagcaaaaa +atggatcttcagaagcaaaacctcagcatataatttatcgactttttgagactacgacga +gttaatattgaaagatgaataaatacttacttcattggattcacctagatcagccaactt +aaatgcatctaataaccggtgttgtgcatcaacattcagcttcaatagataaggtctcaa +atcttcaaaaacaattggtttcatatacagctttttgatatagccaagtaatgctgattc +gtgttcttcaggaaaaaaccgtgcgctggcttcaatccaaagtaaatgaagatttctttt +tgtgctgctggttgacaacgctttcaatatacaatcctttaatgggactaatctatggag +aagttagtaataatgcaaaaaaaaaaacttactttgaatcatcattggaagcactatcca +gcaaagctttgcaaaccttccaatcagtattcccagtttggaaaagagaaagcgaaaacg +tgaataaagaatcccaacgcgcacaggaagcaagcaattcaagcttcctcaaaagaaggt +cggcgtcagcatcaacaaagcgatcagcatcttgatgtattaaagcatctaacgctctgt +ccttgtctcccactaaaagcaacacgtctaaataaagatgaaactcctcacaagaatcga +tataacctgttggtttttcgaaaatgagtttagcagttttttcagctagtgctttcagca +aacgttgttcaacctcattttccgactttttggacaaaagatacaaagatgagataaccc +ataaggtatgtttcctagaaggaaagttcttttgcaattctacagcagcctgaggagtta +gtaaaaaaaaaacaaattaagatcttacctttctttggtgagacaatgatttgatgcgaa +tagatgctttgaagtaagctaataagtttttttcctgctttccataagtttgcaagaact +tttcccaaaatacaaacgattcttctccttcaaatagttaataacttaaaagtaagaggg +taaaaacaagtccattgagaaataaaacgttgcacttgaatcatcaagctacgaaaagaa +caaagatcgtttttcttaagcaaagtttaaccgatcaaataactaaagcctttatctcaa +ggaaatagtagaatattcaaaataaaaaatacgaccaaagtgctatcaacatttatgttc +atctgttcaatagaacctaattatacttacccttcttttgatcatcataaacagcttgta +taatgtctaaaagttccaagctgttgatgggagtcgattttaacggttctaaaagtgcta +gagcctcgggaccacgtcctgcctgagccaaggataacgctgaataaacctaaaaaggat +gttaacagctaaaaacataactcgattacttacaattgttgattctttactcccagaacg +acgcattgtagtaggcaatgaaattaaagcccaaacagtagtcagaagttggtaggtgtt +gcagtcaaattattattctacagaggagaatattatagccagcgtggtagaatctggata +tatatctactgcaaaagtgtaattgcattggtttaaagggtatactatggttaagtaata +tattcacagctgtacaatttacagtcataactaaaacttccttaagccgtaaagaaatac +ctggtgttgtaaaatttgttgtatatccacggcatggtcatataatgtgattttgtgctc +aaataaatataaaatatgcataatttttgtacatttaatttgagaaacccatcttttgtt +gagaggctgtcaatgaatagcagtttcattgaaaagcagcgggatgaccagaaaagtatt +ttacaatggcaagggagtagaaagctagcgtaatattcagaaagctaggtaattgagcaa +tcctttaattcattgctaagcatgctaggtaaacgcagtaaacctttcagttttcattta +ggtataaggctgtttaatgagtatctccactaaatttaaagatcaaaactcagtatcaat +tcttaaaagttttattttatttaataatcatatacttctcataatctttcaattttttcc +ccattttgatgatatttttattaatcctacagtaagctctatgatatcgttattcttcaa +ataggctggtcagcacgtggacggtgttacttatcgttaaataaatcgtactaaggaggt +gcgatgtaaatgatatgcttgtcaagtattaactgctctccaccaaccgccggtttaact +gattattgttgaaaagcgcagacgaagtttagagaattactagcgtattttaaatttaat +caacggactattttttattcctttgagatccgactttatcgctttgcttctaattttcca +aaattcagtctatctacgcgatccagccctgtttgcgtaaatttcatattatttttcttt +aaacgtttgg diff --git a/etc/feature_keys b/etc/feature_keys new file mode 100644 index 000000000..67d773c1d --- /dev/null +++ b/etc/feature_keys @@ -0,0 +1,72 @@ +# All feature keys and qualifiers for EMBL/GenBank feature tables + +# From: http://www.ebi.ac.uk/~faruque/art/keyqual.txt + +# key Qualifiers (@=mandatory) +# ======= ======================== +- EC_number PCR_conditions allele anticodon bound_moiety cell_line cell_type chromosome citation clone clone_lib codon codon_start cons_splice country cultivar db_xref dev_stage direction ecotype environmental_sa evidence exception focus frequency function gene germline haplotype insertion_seq isolate isolation_source lab_host label locus_tag macronuclear map mod_base mol_type note number organelle organism partial phenotype plasmid pop_variant product protein_id proviral pseudo rearranged replace rpt_family rpt_type rpt_unit segment sequenced_mol serotype serovar sex specific_host specimen_voucher standard_name strain sub_clone sub_species sub_strain tissue_lib tissue_type transgenic transl_except transl_table translation transposon usedin variety virion +-10_signal allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin +-35_signal allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin +3'UTR allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +3'clip allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +5'UTR allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +5'clip allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +CAAT_signal allele citation db_xref evidence gene label locus_tag map note partial usedin +CDS EC_number allele citation codon codon_start db_xref evidence exception function gene label locus_tag map note number operon partial product protein_id pseudo standard_name transl_except transl_table translation usedin +C_region allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +D-loop allele citation db_xref evidence gene label locus_tag map note partial usedin +D_segment allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +GC_signal allele citation db_xref evidence gene label locus_tag map note partial usedin +J_segment allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +LTR allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +N_region allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +RBS allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin +STS allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin +S_region allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +TATA_signal allele citation db_xref evidence gene label locus_tag map note partial usedin +V_region allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +V_segment allele citation codon codon_start db_xref evidence gene label locus_tag map note partial product pseudo standard_name transl_except translation usedin +attenuator allele citation db_xref evidence gene label locus_tag map note operon partial phenotype usedin +conflict @citation allele db_xref evidence gene label locus_tag map note replace usedin +enhancer allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin +exon EC_number allele citation codon codon_start db_xref evidence function gene label locus_tag map note number partial product pseudo standard_name transl_except usedin +gap @estimated_length +gene allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype product pseudo standard_name usedin +iDNA allele citation db_xref evidence function gene label locus_tag map note number partial standard_name usedin +intron allele citation cons_splice db_xref evidence function gene label locus_tag map note number partial standard_name usedin +mRNA allele citation db_xref evidence exception function gene label locus_tag map note operon partial product pseudo standard_name transcript_id usedin +mat_peptide EC_number allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin +misc_RNA allele citation db_xref evidence function gene label locus_tag map note operon partial product standard_name usedin +misc_binding @bound_moiety allele citation db_xref evidence function gene label locus_tag map note partial usedin +misc_difference allele citation clone db_xref evidence gene label locus_tag map note partial phenotype replace standard_name usedin +misc_feature allele citation db_xref evidence function gene label locus_tag map note number partial phenotype product pseudo standard_name usedin +misc_recomb allele citation db_xref evidence gene label locus_tag map note organism partial standard_name usedin +misc_signal allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype standard_name usedin +misc_structure allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +modified_base @mod_base allele citation db_xref evidence frequency gene label locus_tag map note usedin +old_sequence @citation allele db_xref evidence gene label locus_tag map note partial replace usedin +operon @operon allele citation db_xref evidence function label map note phenotype pseudo standard_name usedin +oriT allele bound_moiety citation db_xref direction evidence gene label locus_tag map note rpt_family rpt_type rpt_unit standard_name usedin +polyA_signal allele citation db_xref evidence gene label locus_tag map note partial usedin +polyA_site allele citation db_xref evidence gene label locus_tag map note usedin +precursor_RNA allele citation db_xref evidence function gene label locus_tag map note operon partial product standard_name usedin +prim_transcript allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin +primer_bind PCR_conditions allele citation db_xref evidence gene label locus_tag map note partial standard_name usedin +promoter allele citation db_xref evidence function gene label locus_tag map note operon partial phenotype pseudo standard_name usedin +protein_bind @bound_moiety allele citation db_xref evidence function gene label locus_tag map note partial standard_name usedin +rRNA allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin +rep_origin allele citation db_xref direction evidence gene label locus_tag map note partial standard_name usedin +repeat_region allele citation db_xref evidence function gene insertion_seq label locus_tag map note partial rpt_family rpt_type rpt_unit standard_name transposon usedin +repeat_unit allele citation db_xref evidence function gene label locus_tag map note partial rpt_family rpt_type rpt_unit usedin +satellite allele citation db_xref evidence gene label locus_tag map note partial rpt_family rpt_type rpt_unit standard_name usedin +scRNA allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin +sig_peptide allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin +snRNA allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin +snoRNA allele citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin +source @organism cell_line cell_type chloroplast chromoplast chromosome citation clone clone_lib country cultivar cyanelle db_xref dev_stage ecotype environmental_sample evidence focus frequency germline haplotype insertion_seq isolate isolation_source kinetoplast lab_host label macronuclear map mitochondrion mol_type note organelle plasmid pop_variant proviral rearranged segment sequenced_mol serotype serovar sex specific_host specimen_voucher strain sub_clone sub_species sub_strain tissue_lib tissue_type transgenic transposon usedin variety virion +stem_loop allele citation db_xref evidence function gene label locus_tag map note operon partial standard_name usedin +tRNA allele anticodon citation db_xref evidence function gene label locus_tag map note partial product pseudo standard_name usedin +terminator allele citation db_xref evidence gene label locus_tag map note operon partial standard_name usedin +transit_peptide allele citation codon codon_start db_xref evidence function gene label locus_tag map note partial product pseudo standard_name transl_except usedin +unsure allele citation db_xref evidence gene label locus_tag map note replace usedin +variation allele citation db_xref evidence frequency gene label locus_tag map note partial phenotype product replace standard_name usedin diff --git a/etc/options b/etc/options new file mode 100644 index 000000000..d19294923 --- /dev/null +++ b/etc/options @@ -0,0 +1,508 @@ +# The standard options file for Artemis + +# (Note that comment lines start with a hash (#) symbol) + +# $Header: //tmp/pathsoft/artemis/etc/options,v 1.1 2004-06-09 10:02:52 tjc Exp $ + +# This file should contain option settings that look like this: +# +# option_name = option_value +# +# If the value of an options is too long to fit on one line it can be split +# over several lines by ending each line with a backslash like this: +# +# option_name = option_value another_option_value \ +# a_third_option_value a_forth_option_value + + +# This option will set the font size for all the Artemis windows. + +font_size = 12 + + +# Set the name of the font to use in Artemis. These possibilites are +# available on all platforms: +# Dialog, DialogInput, Monospaced, Serif, SansSerif, Symbol. + +font_name = Monospaced + +# This option is used to set the default minimum size (in amino acids) +# of a "large" open reading frame, which controls which ORFS are +# marked by the "Mark Open Reading Frames" menu item. + +minimum_orf_size = 100 + +# Set the default value for the direct edit option (see +# http://www.sanger.ac.uk/Software/Artemis/stable/manual/launch-window.html#LAUNCH-WINDOW-OPTIONS-DIRECT-EDIT +# for more) +direct_edit = yes + +# This setting controls which set of codons will be used for start codons. +# This can be changed from the options menu. +# There are two possible settings: eukaryote or prokaryote +organism_type = eukaryote + +# This option gives the bases of the possible start codons +eukaryotic_start_codons = atg +prokaryotic_start_codons = atg gtg ttg + + +# The translation_table option is used to lookup codon translations. The +# table must have exactly 64 entries, and there is one entry for each codon. +# The entries should appear in this order: +# TTT, TTC, TTA, TTG, +# TCT, TCC, ..., +# ... + +# this is the default table: +# +# translation_table = \ +# f f l l \ +# s s s s \ +# y y # + \ +# c c * w \ +# \ +# l l l l \ +# p p p p \ +# h h q q \ +# r r r r \ +# \ +# i i i m \ +# t t t t \ +# n n k k \ +# s s r r \ +# \ +# v v v v \ +# a a a a \ +# d d e e \ +# g g g g + +# this is the eukaryotic mitochondrial table: +# +# translation_table = \ +# f f l l \ +# s s s s \ +# y y * * \ +# c c w w \ +# \ +# l l l l \ +# p p p p \ +# h h q q \ +# r r r r \ +# \ +# i i m m \ +# t t t t \ +# n n k k \ +# s s * * \ +# \ +# v v v v \ +# a a a a \ +# d d e e \ +# g g g g + + +# the sequence of colour numbers must not have any gaps - if for example +# colour_5 is missing then all colours with higher numbers will be ignored + +# the three numbers for each colour correspond to red, green and blue +# respectively. each number is an intensity from 0 to 255 + +# white +colour_0 = 255 255 255 +# dark grey +colour_1 = 100 100 100 +# red +colour_2 = 255 0 0 +# green +colour_3 = 0 255 0 +# blue +colour_4 = 0 0 255 +# cyan +colour_5 = 0 255 255 +# magenta +colour_6 = 255 0 255 +# yellow +colour_7 = 245 245 0 +# pale green +colour_8 = 152 251 152 +# light sky blue +colour_9 = 135 206 250 +# orange +colour_10 = 255 165 0 +# brown +colour_11 = 200 150 100 +# pink +colour_12 = 255 200 200 +# light grey +colour_13 = 170 170 170 +# black +colour_14 = 0 0 0 +# reds: +colour_15 = 255 63 63 +colour_16 = 255 127 127 +colour_17 = 255 191 191 + +colour_of_CDS = 5 +colour_of_cds? = 7 +colour_of_BLASTCDS = 2 +colour_of_BLASTN_HIT = 6 +colour_of_CRUNCH_D = 2 +colour_of_CRUNCH_X = 15 +colour_of_source = 0 +colour_of_prim_tran = 0 +colour_of_stem_loop = 2 +colour_of_misc_feature = 3 +colour_of_misc_RNA = 12 +colour_of_delta = 3 +colour_of_LTR = 4 +colour_of_repeat_region = 9 +colour_of_repeat_unit = 9 +colour_of_terminator = 3 +colour_of_promoter = 3 +colour_of_intron = 1 +colour_of_exon = 7 +colour_of_mRNA = 1 +colour_of_tRNA = 8 +colour_of_TATA = 3 +colour_of_bldA = 2 +colour_of_GFF = 11 + +colour_of_start_codon = 6 + +# suffixes used on files that contain features - used in file requesters +feature_file_suffixes = tab embl gbk genbank tab_embl gff feature feat \ + art artemis + +# suffixes used on files that contain sequence - used in file requesters +sequence_file_suffixes = embl gbk genbank tab_embl seq dna \ + art artemis + +# this is the URL that contains the IOR of the EMBL server +embl_ior_url = http://corba.ebi.ac.uk/EMBL/IOR/Embl.IOR + +# this is the URL that contains the IOR of the EnsEMBL server +# ensembl_ior_url = file:///nfs/disk12/kmr/powmap/db.ior + + +# the default height for the base plot window +base_plot_height = 150 + + +# the default height for the feature plot window +feature_plot_height = 160 + + +# if this option is no then the feature labels in the overview will be off at +# startup (the default is yes) +# overview_feature_labels = no + + +# if this option is yes then the overview will start in one line per entry +# mode (the default is no) +# overview_one_line_per_entry = yes + + +# if this option is "yes" then the feature list will be displayed on startup +# (this is the default) +show_list = yes + + +# if this option is "yes" then the base view will be displayed on startup +# (this is the default) +show_base_view = yes + + +# if this option is "yes" then the entry buttons will be displayed on +# startup +show_entry_buttons = yes + + +# if this option is "yes" then artemis will offer to show the results of a +# search when it finishes +show_results = no + + +# if this option is "yes" the "all features on frame lines" option will +# default to true on start up +features_on_frame_lines = no + + +# if this option is "yes" the "feature labels" option will +# default to true on start up +feature_labels = yes + + +# if this option is "yes" the "one line per entry" option will default to +# true on start up +one_line_per_entry = no + + +# if this option is "yes" Sanger specific menu items and functions will be +# visible in the display +sanger_options = no + + +# the full path to the editor used for editing the qualifiers +#external_editor = emacs + + +# if set to yes, borders will be drawn around each feature and each exon. if +# set to no borders will only be drawn around the selected features. +draw_feature_borders = yes + + +# if set to yes, a direction arrow will be drawn around at the end of each +# feature. if set to no, no arrows will be drawn. +draw_feature_arrows = yes + + +# the number of levels of undo to save or 0 if undo is disabled. more undo +# levels will require more memory. +undo_levels = 20 + + +# this list is added to the keys from the feature_keys file +extra_keys = \ + BLASTN_HIT CDS_BEFORE CDS_AFTER CDS_before CDS_after \ + CDS_motif BLASTCDS polymorphism GFF WUBLASTN_HIT \ + WUBLASTX_HIT BLASTX_HIT TBLASTX_HIT BLASTN_HIT \ + CRUNCH_D CRUNCH_X fasta_record allele mutation splicesite \ + TMM signalP + +# Names of qualifiers to search when attempting to find the primary or display +# name of a gene. These qualifiers names are searched in order when looking +# for gene names. +display_name_qualifiers = primary_name synonym systematic_id \ + temporary_systematic_id gene locus_tag label + +# Names of qualifiers to search when attempting to find the systematic name of +# a gene +systematic_name_qualifiers = systematic_id temporary_systematic_id \ + locus_tag gene label + + +# this list is added to the qualifiers from the qualifier_types file +extra_qualifiers = \ + CHROMO_LINK text \ + C_processing "text" \ + C_processing_BigPi "text" \ + C_processing_DGPI "text" \ + COM_NAME "text" \ + FEAT_NAME text \ + GO_component "text" \ + GO_function "text" \ + GO_process "text" \ + GO_slim "text" \ + GO "text" \ + LOCUS "text" \ + PUB_LOCUS text \ + PUB_COMMENT "text" \ + REPEAT_TYPE "text" \ + SNP "text" \ + algorithm "text" \ + anchor "text" \ + annotation_source "text" \ + assembly_id "text" \ + bb_orthologue "text" \ + bound_moiety "text" \ + bpp_orthologue "text" \ + bp_orthologue "text" \ + bicsw_file "text" \ + blast_score text \ + blast_file "text" \ + blastn_file "text" \ + blastp_file "text" \ + blastp+go_file "text" \ + blastp_match "text" \ + blastx_file "text" \ + cds_id "text" \ + chloroplast "text" \ + chromoplast "text" \ + class "text" \ + cleavage "text" \ + cluster "text" \ + color text \ + colour text \ + comment_Cterm "text" \ + comment_Nterm "text" \ + confidence_level "text" \ + coord "text" \ + contig_id "text" \ + created "text" \ + curation "text" \ + curated_ortholog "text" \ + cyanelle "text" \ + domain "text" \ + end_phase text \ + exon_id "text" \ + fasta_file "text" \ + fasta_match "text" \ + fastx_file "text" \ + filename "text" \ + function "text" \ + gene "text" \ + gene_id "text" \ + gff_feature text \ + gff_group text \ + gff_seqname text \ + gff_source text \ + go_from_interpro "text" \ + hp_match "text" \ + hth_file "text" \ + id "text" \ + interaction "text" \ + interpro "text" \ + job "text" \ + label text \ + literature "text" \ + manual none \ + mitochondrion "text" \ + modified "text" \ + mutation "text" \ + obsolete_name "text" \ + obsolete_product "text" \ + origid "text" \ + ortholog "text" \ + paralog "text" \ + pepstats_file "text" \ + percent_id text \ + pfam_match "text" \ + previous_systematic_id "text" \ + primary_name "text" \ + prosite_match "text" \ + psu_db_xref "text" \ + psu_domain "text" \ + reserved_name "text" \ + query_id text \ + score text \ + sequence_source "text" \ + sequence_status "text" \ + sigcleave_file "text" \ + signal "text" \ + similarity "text" \ + smart_file "text" \ + sptr_display "text" \ + start_phase text \ + subject_end text \ + subject_id text \ + subject_start text \ + synonym "text" \ + synteny "text" \ + systematic_id "text" \ + taxon_id "text" \ + tblastn_file "text" \ + tblastx_file "text" \ + tb_orthologue "text" \ + temporary_systematic_id "text" \ + tmhelix "text" \ + transferred_gene "text" \ + transferred_locus_tag "text" \ + transferred_note "text" \ + transferred_primary_name "text" \ + transferred_product "text" \ + transferred_synonym "text" \ + transferred_systematic_id "text" \ + type "text" + +# this is a list of extra qualifiers that are legal but are not displayed in +# popup menus (such as the one in the feature editor window). this hack is +# used by diana.components.QualifierChoice to limit the number of qualifers +# that are displayed in the popup menu. on some VMs if there are too many in +# the popup the bottom ones aren't visible +invisible_qualifiers = \ + CHROMO_LINK \ + C_processing \ + C_processing_BigPi \ + C_processing_DGPI \ + COM_NAME \ + FEAT_NAME \ + LOCUS \ + PUB_LOCUS \ + PUB_COMMENT \ + REPEAT_TYPE \ + SNP \ + bicsw_file \ + blast_file \ + blast_score \ + blastn_file \ + blastp+go_file \ + blastp_file \ + blastx_file \ + cds_id \ + chloroplast \ + chromoplast \ + codon \ + comment_Cterm \ + comment_Nterm \ + created \ + cyanelle \ + end_phase \ + exception \ + exon_id \ + fasta_file \ + fasta_match \ + gene_id \ + gff_feature \ + gff_group \ + gff_seqname \ + gff_source \ + go_from_interpro \ + hp_match \ + hth_file \ + interpro \ + map \ + mitochondrion \ + modified \ + number \ + obsolete_gene_name \ + pepstats_file \ + percent_id \ + pfam_match \ + prosite_match \ + psu_domain \ + reserved_gene_name \ + query_id \ + sigcleave_file \ + score \ + smart_file \ + start_phase \ + tblastn_file \ + tblastx_file \ + temporary_systematic_id \ + transl_table \ + translation \ + type \ + usedin + + +# These pairs consist of a program name and a parameter string. +# For blast and fasta the parameter string is the name of the database to +# search. +feature_protein_programs = \ + fasta %L \ + sigcleave 0 \ + pepstats - \ + blastp swall \ + tblastn embl_other \ + hth - \ + smart - \ + clustalx PROTEIN \ + jalview - + +feature_dna_programs = \ + tblastx embl_other \ + blastn embl_other \ + blastx swall \ + fastx %L \ + clustalx DNA + +application_programs = \ + +# this is the list of keys that should be displayed by default in the edit +# window +common_keys = \ + allele attenuator CDS conflict exon intron LTR misc_feature misc_RNA mRNA \ + mutation polyA_signal polyA_site promoter protein_bind RBS repeat_region \ + repeat_unit rRNA scRNA snRNA source stem_loop STS TATA_signal terminator \ + tRNA unsure variation -10_signal -35_signal CDS_motif gene \ + BLASTN_HIT BLASTCDS 3'UTR 5'UTR diff --git a/etc/pombe.usage b/etc/pombe.usage new file mode 100644 index 000000000..bb7176ed1 --- /dev/null +++ b/etc/pombe.usage @@ -0,0 +1,20 @@ +UUU 32.2( 48423) UCU 30.5( 45913) UAU 21.8( 32829) UGU 8.9( 13371) +UUC 13.0( 19519) UCC 12.1( 18149) UAC 11.8( 17721) UGC 5.6( 8372) +UUA 26.0( 39138) UCA 17.9( 26850) UAA 1.3( 1944) UGA 0.5( 733) +UUG 24.0( 36134) UCG 8.0( 12055) UAG 0.5( 705) UGG 10.9( 16364) + +CUU 25.3( 38015) CCU 21.9( 32964) CAU 16.3( 24577) CGU 16.3( 24495) +CUC 7.3( 10922) CCC 8.4( 12619) CAC 6.4( 9653) CGC 6.2( 9316) +CUA 8.6( 12957) CCA 12.7( 19075) CAA 27.3( 41066) CGA 7.9( 11896) +CUG 6.3( 9503) CCG 4.6( 6910) CAG 10.9( 16457) CGG 3.0( 4487) + +AUU 35.0( 52636) ACU 22.9( 34419) AAU 33.9( 51009) AGU 14.7( 22108) +AUC 12.6( 19000) ACC 10.9( 16378) AAC 17.9( 26895) AGC 9.2( 13905) +AUA 13.1( 19726) ACA 13.9( 20898) AAA 39.3( 59079) AGA 11.1( 16742) +AUG 20.9( 31376) ACG 6.5( 9744) AAG 25.2( 37825) AGG 5.1( 7615) + +GUU 29.3( 44015) GCU 30.2( 45397) GAU 38.1( 57240) GGU 22.0( 33101) +GUC 11.0( 16497) GCC 11.6( 17518) GAC 15.8( 23749) GGC 8.5( 12717) +GUA 12.3( 18451) GCA 15.7( 23649) GAA 44.3( 66550) GGA 15.7( 23623) +GUG 8.3( 12422) GCG 5.3( 8011) GAG 21.3( 31979) GGG 4.3( 6497) + diff --git a/etc/qualifier_types b/etc/qualifier_types new file mode 100644 index 000000000..f860210db --- /dev/null +++ b/etc/qualifier_types @@ -0,0 +1,110 @@ +# Feature qualifiers for EMBL/GenBank feature tables +# +# From: http://www.ebi.ac.uk/~faruque/art/keyqual.txt +# +# valid qualifier types are: +# (::) (text:text,text:text) +# EC "n.n.n.n" +# feature dbname::accno:location +# item single text item +# list one of the listed values +# modbase one of the stored modbase values +# none no value +# number nn +# (other) (text) +# location a valid location range (or feature label) +# real n.n within specified range +# ref [nn] +# text any text, no quotes added, spaces allowed if quoted +# "text" quoted text, double any contained quotes +# "opt" optional quoted text, double any contained quotes +# "list" quoted text, list of accepted values +# +# if not specified, the default is text (so anything is accepted) +# +# Name required Type Value(s) .. +allele no "text" +anticodon yes (::) pos aa +bound_moiety no "text" +cell_line no "text" +cell_type no "text" +chromosome no "opt" +citation no ref +clone no "text" +clone_lib no "text" +codon no (::) seq aa +codon_start yes number 1 3 +cons_splice yes (::) 5'site 3'site +country no "text" +cultivar no "text" +db_xref no "text" +dev_stage no "text" +direction yes list LEFT RIGHT BOTH +ecotype no "text" +EC_number no "text" +environmental_sample no none +estimated_length no "text" +evidence yes list EXPERIMENTAL NOT_EXPERIMENTAL +exception no "text" +focus no none +frequency yes real 0.0 1.0 +function yes "text" +gene no "text" +germline yes none +haplotype no "text" +insertion_seq no "text" +isolation_source no "text" +isolate no "text" +kinetoplast no "opt" +label yes item +lab_host no "text" +locus_tag no "text" +macronuclear no none +map no "text" +mod_base no modbase +mol_type no "text" +note no "text" +number yes number 1 99999999 +operon no "text" +organell no "text" +organism yes "text" +partial yes none +PCR_conditions no "text" +phenotype no "text" +plasmid no "text" +pop_variant no "text" +product no "text" +protein_id no "text" +proviral yes none +pseudo yes none +rearranged yes none +replace no "text" +rpt_family no "text" +rpt_type no list TANDEM INVERTED FLANKING TERMINAL DIRECT \ + DISPERSED OTHER +rpt_unit no location +segment no "text" +sequenced_mol no "list" "cDNA" "cDNA to genomic RNA" \ + "cDNA to mRNA" "cDNA to other RNA" \ + "cDNA to rRNA" "DNA" "mRNA" \ + "RNA" "rRNA" "scRNA" "snRNA" "tRNA" +serotype no "text" +serovar no "text" +sex no "text" +specific_host no "text" +specimen_voucher no "text" +standard_name no "text" +strain no "text" +sub_clone no "text" +sub_species no "text" +sub_strain no "text" +tissue_lib no "text" +tissue_type no "text" +transgenic no "text" +translation no "text" +transl_except no (::) pos aa +transl_table no number 1 11 +transposon no "text" +usedin no feature +variety no "text" +virion no none diff --git a/etc/results_to_netscape b/etc/results_to_netscape new file mode 100755 index 000000000..3de1626a4 --- /dev/null +++ b/etc/results_to_netscape @@ -0,0 +1,214 @@ +#!/bin/sh - + +# This script will send a file to netscape with database IDs linked to SRS. +# To customize this script edit the $DATABASES and $SRS_SERVER variable in the +# perl code below and the NETSCAPE variable at the top of the script. + +# To enable this in Artemis, sanger_options must be set to true in the options +# file. + +NETSCAPE=/usr/bin/X11/real-netscape + +if [ -f "$DIANA_ENVIRONMENT_FILE" ] +then + . $DIANA_ENVIRONMENT_FILE +fi + +if [ $# = 0 ] +then + echo no argument given 1>&2 + exit 1 +fi + +file_arg=$1 + +unique_bit=$$.`hostname` + +# sanger hack: +file_arg=`echo $file_arg | sed 's@^/tmp_mnt/nfs/@/nfs/@' | sed 's@^/tmp_mnt/tmp_nfs/@/nfs/@'` +# fix for pcs3: +file_arg=`echo $file_arg | sed 's@^/yeastpub4/@/nfs/disk222/yeastpub4/@'` + + +if [ -f ./$file_arg ] +then + # the file is in the current directory - we need the full path so netscape + # can find the file + new_file=$PWD/$file_arg.$unique_bit.html +else + new_file=$file_arg.$unique_bit.html +fi + +cat <<EOF > $new_file +<HTML> + <HEAD> + <TITLE> + Results for $file_arg + </TITLE> + </HEAD> + <BODY> +<PRE> +EOF + +perl -e ' +BEGIN { + # change these variable to list the databases to search for the IDs - the + # database names should be separated by spaces + $PROTEIN_DATABASES = "swall"; + $DNA_DATABASES = "embl"; + + # change this to point to the wgetz script of your SRS server + $SRS_SERVER = "www.sanger.ac.uk/srs6bin/cgi-bin/wgetz?-e+"; + + $PROTEIN_DATABASES =~ s/ /%20/g; + $DNA_DATABASES =~ s/ /%20/g; + + %GENEDB_PATTERNS = (tryp => q!Tb\d+\.\d+\.\d+|TRYP_\S+!, + leish => q!LmjF\d+.\d+!); + + $GENEDB_PATTERN = join ("|", values %GENEDB_PATTERNS); + + $BLAST_START_LINE = "Sequences producing High-scoring Segment Pairs|" . + "Sequences producing significant alignments:"; + $FASTA_START_LINE = "The best scores are"; + + # the list of IDs we have seen so far + @ids = (); + + # the list of IDs we have made anchors for so far + @anchored_ids = (); + + $db_type = "unknown"; +} + +sub hyperlink_to_anchor +{ + $id = shift; + qq(<a href="#$id">$id</a>); +} + +sub hyperlink_id +{ + $id = shift; + + if ($db_type eq "dna") { + $r = qq#<a href="http://$SRS_SERVER\[\{$DNA_DATABASES\}-ID:$id*]|[\{$DNA_DATABASES\}-AccNumber:$id*]">$id</a>#; + } else { + for my $org (keys %GENEDB_PATTERNS) { + my $pattern = $GENEDB_PATTERNS{$org}; + + if ($id =~ /$pattern/) { + $r = qq#<a href="http://www.genedb.org/genedb/Search?organism=$org&name=$id">$id</a>#; + return $r + } + } + + $r = qq#<a href="http://$SRS_SERVER\[\{$PROTEIN_DATABASES\}-ID:$id*]|[\{$PROTEIN_DATABASES\}-AccNumber:$id*]">$id</a>#; + } + return $r +} + +$file_name = $ARGV[0]; + +if ($file_name =~ /\.gz$/) { + open IN_FILE, "gzip -d < $file_name |" or die "failed to open $file_name\n"; +} else { + open IN_FILE, "$file_name" or die "failed to open $file_name\n"; +} + +while (<IN_FILE>) { + if ($. == 1) { + if (/^\s*([^\s]+)/) { + if (lc $1 eq "blastn" or lc $1 eq "tblastn" or lc $1 eq "tblastx") { + $db_type = "dna"; + } else { + if (lc $1 eq "fasta" or lc $1 eq "blastp" or lc $1 eq "blastx") { + $db_type = "protein"; + } else { + print "\nWARNING: could not identify file type: $1\n"; + } + } + } else { + print "\nWARNING: could not identify file type\n"; + } + } + + + # ignore header lines + if (1..m/$BLAST_START_LINE|$FASTA_START_LINE/) { + print; + next; + } + + if (@ids && /^\s*$/) { + $summary_finished = 1; + } + + if (/^(?:(?:>?>?(?:[A-Z]+:)?)(\w+)|($GENEDB_PATTERN)) /) { + $id = $1; + + if (!defined $id) { + $id = $2; + } + + if ($summary_finished) { + if ((grep {$_ eq $id} @ids) && (!grep {$_ eq $id} @anchored_ids)) { + # not anchored yet so make it an anchor + if (s/\b$id\b/"<a name=\"$id\">" . (hyperlink_id($id)) . "<\/a>"/e) { + push @anchored_ids, $id; + } + } + } else { + if (!grep {$_ eq $id} @ids) { + push @ids, $id; + } + + s/$id/hyperlink_to_anchor($id)/ei; + + if (!s/ $id/" " . hyperlink_id($id)/ei) { + # if the id occurs once in the line put a link at end of line + s/$/" LINK:" . hyperlink_id($id)/e; + } + } + } + print; +} + +' $file_arg >> $new_file + +cat <<EOF >> $new_file; +</PRE> + </BODY> +</HTML> +EOF + +# delete it at some point +echo "rm -f $new_file > /dev/null 2>&1" | at now + 36 hours + +if $NETSCAPE -remote "openURL($new_file)" +then + exit 0 +else + echo starting new netscape 2>&1 + # netscape isn't running - so start it + ($NETSCAPE &)& + + # now send the URL. we do things this way so that the script doesn't exit + # until netscape has successfully shown the URL + + sleep 1 + + # don't exit the script until the file is successfully displayed or until + # 40 seconds is up + for i in 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 + do + if $NETSCAPE -remote "openURL($new_file)" 2> /dev/null + then + exit 0 + else + sleep 2 + fi + done + + exit 1 +fi diff --git a/etc/run_blastn b/etc/run_blastn new file mode 100755 index 000000000..ef5297bd1 --- /dev/null +++ b/etc/run_blastn @@ -0,0 +1,87 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastn,v 1.1 2004-06-09 10:02:58 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database + echo or: $0 file_of_filenames database + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + EXEC=blastall + + echo "about to start $EXEC with input from $INPUT_FILE and output to" + echo "$OUTPUT_FILE using database $DATABASE" + + + EXTRA_ARGS= + + # add/change the flags to suit your site: + lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastn \ + $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_blastp b/etc/run_blastp new file mode 100755 index 000000000..2ac573c1b --- /dev/null +++ b/etc/run_blastp @@ -0,0 +1,88 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastp,v 1.1 2004-06-09 10:02:59 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database + echo or: $0 file_of_filenames database + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + EXEC=blastall + + echo "about to start $EXEC with input from $INPUT_FILE and output to" + echo "$OUTPUT_FILE using database $DATABASE" + + + EXTRA_ARGS= + + # add/change the flags to suit your site: + lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v \ + blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastp \ + $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_blastx b/etc/run_blastx new file mode 100755 index 000000000..21c88d11b --- /dev/null +++ b/etc/run_blastx @@ -0,0 +1,87 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_blastx,v 1.1 2004-06-09 10:03:00 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database + echo or: $0 file_of_filenames database + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + EXEC=blastall + + echo "about to start $EXEC with input from $INPUT_FILE and output to" + echo "$OUTPUT_FILE using database $DATABASE" + + + EXTRA_ARGS= + + # add/change the flags to suit your site: + lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p blastx \ + $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_clustalx b/etc/run_clustalx new file mode 100755 index 000000000..1e40a7c0e --- /dev/null +++ b/etc/run_clustalx @@ -0,0 +1,41 @@ +#!/bin/sh - + +# this script will run clustalx on a temporary file containing the concatenated +# contents of files listed in a file of filenames + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_clustalx,v 1.1 2004-06-09 10:03:01 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# != 1 ] +then + echo usage: $0 file_of_filenames +fi + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +file_of_filenames=$1 +date=`date +"%y_%m_%d"` +hostname=`hostname` +temp_file_name=/tmp/artemis_temp.$$.$hostname.$date.clustalx_input.fasta + +cat $file_of_filenames | xargs cat > $temp_file_name + +# make sure that the identifiers are unique for clustalx +perl -pne 'if (/^>(\S+)/) { + $name = $1; + if (exists $h{$name}) { + $i = $h{$name}++; + s/^>(\S+)/>$name.$i/; + } else { + $h{$name} = 0; + } +}' $temp_file_name > $temp_file_name.processed + +clustalx $temp_file_name.processed + +exit 0 diff --git a/etc/run_fasta b/etc/run_fasta new file mode 100755 index 000000000..b46d0dd56 --- /dev/null +++ b/etc/run_fasta @@ -0,0 +1,90 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fasta,v 1.1 2004-06-09 10:03:03 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database 1>&2 + echo or: $0 file_of_filenames database 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + + FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS + EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fasta33 + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $DATABASE" 1>&2 + + # add/change the flags to suit your site: + COMMAND="$EXEC -B -S -q -b 100 -H $INPUT_FILE $DATABASE ktup 2" + + echo "command line: $COMMAND" 1>&2 + +# lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v $COMMAND 2>&1 > $OUTPUT_FILE | + bsub -q longblastq -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -I $COMMAND 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_fasta_orig b/etc/run_fasta_orig new file mode 100755 index 000000000..63c87b3e3 --- /dev/null +++ b/etc/run_fasta_orig @@ -0,0 +1,90 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fasta_orig,v 1.1 2004-06-09 10:03:04 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database 1>&2 + echo or: $0 file_of_filenames database 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + + FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS + EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fasta33 + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $DATABASE" 1>&2 + + # add/change the flags to suit your site: + COMMAND="$EXEC -B -S -q -b 40 -H $INPUT_FILE $DATABASE ktup 2" + + echo "command line: $COMMAND" 1>&2 + + lsrun -R 'select[blast && mem > 500] rusage[r1m=1:mem=500]' -v \ + $COMMAND 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_fastx b/etc/run_fastx new file mode 100644 index 000000000..b04a259a9 --- /dev/null +++ b/etc/run_fastx @@ -0,0 +1,89 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_fastx,v 1.1 2004-06-09 10:03:05 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database 1>&2 + echo or: $0 file_of_filenames database 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + + FASTLIBS=/nfs/disk222/yeastpub/bio-soft/fasta/pubseqgbs export FASTLIBS + EXEC=/nfs/disk222/yeastpub/bio-soft/fasta/fastx33_t + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $DATABASE" 1>&2 + + # add/change the flags to suit your site: + COMMAND="$EXEC -B -S -q -b 40 -H $INPUT_FILE $DATABASE ktup 2" + + echo "command line: $COMMAND" 1>&2 + + $COMMAND 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_hth b/etc/run_hth new file mode 100755 index 000000000..a61aeca54 --- /dev/null +++ b/etc/run_hth @@ -0,0 +1,148 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_hth,v 1.1 2004-06-09 10:03:06 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + PARAMETERS=$3 export PARAMETERS +else + if [ $# = 2 ] + then + PARAMETERS=$2 export PARAMETERS + else + echo usage: $0 -onefile input_file output_file parameters 1>&2 + echo or: $0 file_of_filenames parameters 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_PARAMETERS=`echo "echo $PARAMETERS" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + PARAMETERS=$3 + + + ### change these lines: + EXEC=helixturnhelix + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $PARAMETERS" 1>&2 + echo "command line: $EXEC $PARAMETERS $INPUT_FILE" 1>&2 + + $EXEC $INPUT_FILE $OUTPUT_FILE $PARAMETERS 2> hth_errors.new + + # add/change the flags to suit your site: + $EXEC $INPUT_FILE -outfile $OUTPUT_FILE $PARAMETERS 2>&1 | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_PARAMETERS + done + +else + run_one_prog $1 $2 $EXPANDED_PARAMETERS +fi + +if [ x$ONEFILE = x ] +then + PEPFILES=`cat $1` +else + PEPFILES=$1 +fi + +if [ -e hth/hth.tab ] +then + mv -f hth/hth.tab hth/hth.tab.old +fi + +for i in $PEPFILES +do +# write a tab file containing a feature for each hth +perl -e ' +open PEPFILE, "$ARGV[0]" or die "$0: cannot open $ARGV[0]\n"; + +my $first_line = <PEPFILE>; + +close PEPFILE; + +if ($first_line !~ m/^>(.*?), (.*) (\d+):(\d+)\s+(\S+)/) { + die "first line of $ARGV[0] is badly formatted\n"; +} + +my ($gene_name, $description, $pep_first_base, + $pep_last_base, $forward_or_back) = ($1, $2, $3, $4, $5); + +open HTHFILE, "$ARGV[1]" or die "$0: cannot open $ARGV[1]\n"; + +my $score; +my $first_match_base; + +while (<HTHFILE>) { + if (m/^Score (\d+) .* in .* at residue (\d+)/) { + $score = $1; + $first_match_base = $2; + } + + if (m/^\s+Sequence:\s+(\S+)/ && + defined ($score) && defined ($pep_first_base)) { + if ($forward_or_back eq "forward") { + my $start_base = $pep_first_base + ($first_match_base - 1) * 3; + my $end_base = $start_base + (length $1) * 3 - 1; + print <<EOF; +FT CDS_motif $start_base..$end_base +FT /note="Helix-turn-helix from $gene_name score $score" +FT /label=hth +EOF + } else { + my $end_base = $pep_last_base - ($first_match_base - 1) * 3; + my $start_base = $end_base - ((length $1) * 3 - 1); + print <<EOF; +FT CDS_motif complement($start_base..$end_base) +FT /note="Helix-turn-helix from $gene_name score $score" +FT /label=hth +EOF + } + } +} +' $i $i.out >> hth/hth.tab + +done + +exit 0 diff --git a/etc/run_jalview b/etc/run_jalview new file mode 100755 index 000000000..bf214db58 --- /dev/null +++ b/etc/run_jalview @@ -0,0 +1,51 @@ +#!/bin/sh - + +# This script needs one argument - a file of file names. + +PERL_PROG=' + +use strict; + +if (@ARGV < 1) +{ + die "$0 needs one argument - a file of sequence file names\n"; +} + +my $file = $ARGV[0]; + +chomp $file; + +if (-e $file) +{ + my $msf_file = "$file.fasta_msf"; + + my $seqnum = 1; + open(LIST_FILE,$file); + while(my $line = <LIST_FILE>) + { + chomp($line); + + # + # run descseq to ensure unique names + # + my $emboss_command_line = "descseq -append -name _$seqnum $line $line.new -auto"; + + open EMBOSS, "|$emboss_command_line" or + die "cannot open pipe to descseq: $!\n"; + close EMBOSS; + + unlink("$line"); + rename("$line.new","$line"); + $seqnum++; + } + + my $emboss_command_line = "emma \"\@$file\" -filter -stdout -osf msf -dendoutfile /dev/null -outseq $msf_file"; + + open EMBOSS, "|$emboss_command_line" or + die "cannot open pipe to emma: $!\n"; + close EMBOSS; + system "jalview", "$msf_file"; +} +' + +perl -w -e "$PERL_PROG" "$@" diff --git a/etc/run_jalview.orig b/etc/run_jalview.orig new file mode 100755 index 000000000..03e6e537b --- /dev/null +++ b/etc/run_jalview.orig @@ -0,0 +1,167 @@ +#!/bin/sh - + +# This script needs one argument - a file of file names. +# Each name should refer to a file that contains a EMBL format feature. +# The feature must have a /fasta_file= qualifier which is used to read the +# FASTA search results for the feature and to find the protein sequence of the +# feature. The sequence and the sequence of the FASTA hits will be passed to +# jalview. + +PERL_PROG=' + +use strict; + +if (@ARGV != 1) { + die "$0 needs one argument - a file of feature file names\n"; +} + + +sub process_fasta +{ + my $feature_file = shift; + my $fasta_results_file = shift; + + my $sequence_file; + + if ($fasta_results_file =~ /(.*).out/) { + $sequence_file = $1; + } else { + die "cannot understand $fasta_results_file\n"; + } + + if (! -e $sequence_file) { + die "cannot find $sequence_file\n"; + } + + my $fasta_seq_for_alignment = ""; + + open SEQ_FILE, $sequence_file or die "cannot open $sequence_file: $!\n"; + + while (<SEQ_FILE>) { + $fasta_seq_for_alignment .= $_; + } + + close SEQ_FILE; + + if (-e $fasta_results_file) { + open FASTA_OUTPUT, $fasta_results_file + or die "cannot open $fasta_results_file: $!\n"; + } else { + my $gzip_fasta_results_file = $fasta_results_file . ".gz"; + if (-e $gzip_fasta_results_file) { + open FASTA_OUTPUT, "gzip -d < $gzip_fasta_results_file |" + or die "cannot open $gzip_fasta_results_file: $!\n"; + } else { + die "cannot find $fasta_results_file or $gzip_fasta_results_file\n"; + } + } + + + my $top_re = "^The best scores are:"; + + my $seen_top = 0; + my $seen_bottom = 0; + + my @protein_ids = (); + + while (<FASTA_OUTPUT>) { + if (/$top_re/) { + $seen_top = 1; + next; + } + + if ($seen_top && /^\s*$/) { + $seen_bottom = 1; + next; + } + + if ($seen_top && !$seen_bottom) { + if (/^(\S+)/) { + if (@protein_ids < 20) { + push @protein_ids, "$1" + } else { + last; + } + } else { + warn "cannot understand this line:\n$_\n"; + } + } + } + + my %hash = (); + + @hash{@protein_ids} = (1) x @protein_ids; + + @protein_ids = sort keys %hash; + + my $protein_db = "swall"; + + # look for each of the IDs from the FASTA output in each of the DBs + + for my $id (@protein_ids) { + my $fetch = "getz -sf fasta -f seq [swall-id:$id]"; + + my $temp_seq = ""; + + open FETCH, "$fetch |" or + die "cannot open pipe to $fetch: $!\n"; + + while (<FETCH>) { + $temp_seq .= $_; + } + + close FETCH; + + if ($? == 0) { + $fasta_seq_for_alignment .= $temp_seq; + } else { + print STDERR "$id was not found in $protein_db\n"; + } + } + + my $msf_file = "$feature_file.fasta_msf"; + + my $emboss_prog = "emma"; + + my $emboss_command_line = "$emboss_prog -filter -stdout -osf msf -dendoutfile /dev/null > $msf_file"; + + open EMBOSS, "|$emboss_command_line" or + die "cannot open pipe to $emboss_prog: $!\n"; + + print EMBOSS $fasta_seq_for_alignment; + + close EMBOSS; + + my $jalview_prog = "jalview"; + + print STDERR "\nstarting $jalview_prog:\n"; + + system "$jalview_prog", "$msf_file"; +} + + +my $file; + +while (defined ($file = <>)) { + chomp $file; + + if (-e $file) { + open IN_FILE, "$file\n" or die "cannot open $file\n"; + + my $line; + + while (defined ($line = <IN_FILE>)) { + if ($line =~ m!/fasta_file="(.*)"!) { + my $fasta_results_file = $1; + + process_fasta $file, $fasta_results_file; + + last; + } + } + + close IN_FILE; + } +}' + +perl -w -e "$PERL_PROG" "$@" diff --git a/etc/run_pepstats b/etc/run_pepstats new file mode 100755 index 000000000..22239de3a --- /dev/null +++ b/etc/run_pepstats @@ -0,0 +1,77 @@ +#!/bin/sh - + +# this script will run pepstats on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_pepstats,v 1.1 2004-06-09 10:03:10 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + PARAMETERS=$3 export PARAMETERS +else + if [ $# = 2 ] + then + PARAMETERS=$2 export PARAMETERS + else + echo usage: $0 -onefile input_file output_file parameters 1>&2 + echo or: $0 file_of_filenames parameters 1>&2 + exit 1 + fi +fi + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + + ### change these lines: + EXEC=pepstats + + COMMAND_LINE="$EXEC -filter $INPUT_FILE" + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using parameters: $PARAMETERS" 1>&2 + echo "command line: $COMMAND_LINE" 1>&2 + + # add/change the flags to suit your site: + (head -1 $INPUT_FILE | sed 's/^>//'; echo; + $COMMAND_LINE) 2>&1 > $OUTPUT_FILE | tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out + done + +else + run_one_prog $1 $2 +fi + +exit 0 diff --git a/etc/run_sigcleave b/etc/run_sigcleave new file mode 100755 index 000000000..a8a073367 --- /dev/null +++ b/etc/run_sigcleave @@ -0,0 +1,78 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_sigcleave,v 1.1 2004-06-09 10:03:11 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + MINWEIGHT=$3 +else + if [ $# = 2 ] + then + MINWEIGHT=$2 + else + echo usage: $0 -onefile input_file output_file minimum_weight 1>&2 + echo or: $0 file_of_filenames minimum_weight 1>&2 + exit 1 + fi +fi + +PARAMETERS="-minweight $MINWEIGHT" + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + PARAMETERS="$3 $4 $5 $6 $7 $8 $9" + + ### change these lines: + EXEC=sigcleave + + COMMAND_LINE="$EXEC $INPUT_FILE -outfile $OUTPUT_FILE $PARAMETERS" + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using parameters: $PARAMETERS" 1>&2 + echo "command line: $COMMAND_LINE" 1>&2 + + # add/change the flags to suit your site: + $COMMAND_LINE 2>&1 | tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $PARAMETERS + done + +else + run_one_prog $1 $2 $PARAMETERS +fi + +exit 0 diff --git a/etc/run_smart b/etc/run_smart new file mode 100755 index 000000000..cc9ffb592 --- /dev/null +++ b/etc/run_smart @@ -0,0 +1,95 @@ +#!/bin/sh - + +# this script will run SMART (http://smart.embl-heidelberg.de/) for an +# sequence input file or on each file in a file of filenames. it uses +# lynx to access send a query to the SMART web site and then writes +# the output to a file in the same way as run_fasta and run_blastp. +# see: +# http://www.sanger.ac.uk/Software/Artemis/stable/manual/runmenu.html#RUNMENU-CONFIGURATION +# for more details. + +# you will need the "GET" command from the perl LWP module to use this script + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_smart,v 1.1 2004-06-09 10:03:12 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 3 -a x$1 = x-onefile -o $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t +else + if [ $# != 2 -a $# = != 1 ] + then + echo usage: $0 -onefile input_file output_file 1>&2 + echo or: $0 file_of_filenames 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_PARAMETERS=`echo "echo $PARAMETERS" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + PARAMETERS=$3 + + # remove the rubbish from the FASTA header and change the sequence + # into URL form + SEQUENCE=`perl -pne 'chomp; s/^>.*/>sequence/; s/ /\%20/g; $_ .= "%0D"' $INPUT_FILE` + + SEQUENCE=`echo $SEQUENCE | sed 's/%0D$//'` + + URL='http://smart.embl-heidelberg.de/smart/show_motifs.pl?INCLUDE_SIGNALP=INCLUDE_SIGNALP&DO_PROSPERO=DO_PROSPERO&DO_PFAM=DO_PFAM&SEQUENCE='"$SEQUENCE" + + ### change these lines: + EXEC=lynx + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE" 1>&2 + + COMMAND="$EXEC -force_html -dump $URL" + + echo "command line: $COMMAND" 1>&2 + + (echo "read from $URL"; echo) > $OUTPUT_FILE + + $COMMAND 2>&1 >> $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_PARAMETERS + done + +else + run_one_prog $1 $2 $EXPANDED_PARAMETERS +fi + +exit 0 diff --git a/etc/run_tblastn b/etc/run_tblastn new file mode 100755 index 000000000..321853d7a --- /dev/null +++ b/etc/run_tblastn @@ -0,0 +1,88 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_tblastn,v 1.1 2004-06-09 10:03:13 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database 1>&2 + echo or: $0 file_of_filenames database 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + EXEC=blastall + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $DATABASE" 1>&2 + echo "command line: $EXEC $DATABASE $INPUT_FILE" 1>&2 + + + EXTRA_ARGS= + + # add/change the flags to suit your site: + lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p tblastn \ + $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 diff --git a/etc/run_tblastx b/etc/run_tblastx new file mode 100755 index 000000000..92fd500f0 --- /dev/null +++ b/etc/run_tblastx @@ -0,0 +1,87 @@ +#!/bin/sh - + +# this script will run a search program on a sequence input file or on each +# file in a file of filenames + +# to customise this script see the function called run_one_prog below + + +RCS_HEADER="$Header: //tmp/pathsoft/artemis/etc/run_tblastx,v 1.1 2004-06-09 10:03:14 tjc Exp $" + +PROG=`echo $RCS_HEADER | sed 's/.*run_\(.*\),v.*/\1/'` + + +if [ $# = 4 -a x$1 = x-onefile ] +then + shift + ONEFILE=t + DATABASE=$3 export DATABASE +else + if [ $# = 2 ] + then + DATABASE=$2 export DATABASE + else + echo usage: $0 -onefile input_file output_file database 1>&2 + echo or: $0 file_of_filenames database 1>&2 + exit 1 + fi +fi + + +# expand any ~ or environment variables +EXPANDED_DATABASE=`echo "echo $DATABASE" | /bin/csh -f` + + +### change this function to suit your site: + +run_one_prog () { + INPUT_FILE=$1 + OUTPUT_FILE=$2 + DATABASE=$3 + + + ### change these lines: + EXEC=blastall + + echo "about to start $EXEC with input from $INPUT_FILE and output to" 1>&2 + echo "$OUTPUT_FILE using database $DATABASE" 1>&2 + + + EXTRA_ARGS= + + # add/change the flags to suit your site: + lsrun -v blastwrap.pl $EXEC -d $DATABASE -i $INPUT_FILE -p tblastx \ + $EXTRA_ARGS 2>&1 > $OUTPUT_FILE | + tee ${PROG}_errors.new 1>&2 + + #### end of changes + + + # Artemis can read compressed files + gzip -9 $OUTPUT_FILE & + + if [ -s ${PROG}_errors.new ] + then + ( echo ERROR running $PROG: ; echo; + echo =================================================== + cat ${PROG}_errors.new ) >> $OUTPUT_FILE + cat ${PROG}_errors.new >> ${PROG}_errors + fi +} + +(echo "#!/bin/sh -"; echo "kill $$") > $PROG.kill + +chmod a+x $PROG.kill + +if [ x$ONEFILE = x ] +then + for i in `cat $1` + do + run_one_prog $i $i.out $EXPANDED_DATABASE + done + +else + run_one_prog $1 $2 $EXPANDED_DATABASE +fi + +exit 0 -- GitLab