LOCUS AFCE01000038 5958 bp DNA linear BCT 26-MAY-2011 DEFINITION Caldalkalibacillus thermarum TA2.A1 ctg132, whole genome shotgun sequence. ACCESSION AFCE01000038 AFCE01000000 VERSION AFCE01000038.1 DBLINK BioProject: PRJNA63105 BioSample: SAMN02471911 KEYWORDS WGS. SOURCE Caldalkalibacillus thermarum TA2.A1 ORGANISM Caldalkalibacillus thermarum TA2.A1 Bacteria; Firmicutes; Bacilli; Bacillales; Bacillaceae; Caldalkalibacillus. REFERENCE 1 (bases 1 to 5958) AUTHORS Kalamorz,F., Keis,S., McMillan,D.G., Olsson,K., Stanton,J.A., Stockwell,P., Black,M.A., Klingeman,D.M., Land,M.L., Han,C.S., Martin,S.L., Becher,S.A., Peddie,C.J., Morgan,H.W., Matthies,D., Preiss,L., Meier,T., Brown,S.D. and Cook,G.M. TITLE Draft Genome Sequence of the Thermoalkaliphilic Caldalkalibacillus thermarum Strain TA2.A1 JOURNAL J. Bacteriol. 193 (16), 4290-4291 (2011) PUBMED 21685297 REFERENCE 2 (bases 1 to 5958) AUTHORS Kalamorz,F., Keis,S., McMillan,D.G.G., Stanton,J.-A., Stockwell,P., Black,M.A., Brown,S.D., Klingeman,D.M., Land,M.L., Han,C.S., Martin,S.L., Becher,S.A., Morgan,H.W. and Cook,G.M. TITLE Direct Submission JOURNAL Submitted (26-MAY-2011) Department of Microbiology and Immunology, University of Otago, 720 Cumberland Street, Dunedin, Otago 9016, New Zealand COMMENT Source DNA and bacteria available from Professor Greg Cook, Department of Microbiology and Immunology, University of Otago, PO Box 56, Dunedin 9054, New Zealand. ##Genome-Assembly-Data-START## Assembly Method :: Newbler v. 2.3; Velvet v. 1.0.13; Phrap v. 101208 Genome Coverage :: 18x 454 GS FLX; 216x Illumina Sequencing Technology :: 454 GS FLX; Illumina ##Genome-Assembly-Data-END## FEATURES Location/Qualifiers source 1..5958 /organism="Caldalkalibacillus thermarum TA2.A1" /mol_type="genomic DNA" /strain="TA2.A1" /db_xref="taxon:986075" gene complement(52..234) /locus_tag="CathTA2_0283" CDS complement(52..234) /locus_tag="CathTA2_0283" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="EGL84153.1" /db_xref="GI:334181630" /translation="MDFFIDLAILGVMIIGMTAFLAVIVQAIVRPFVSKKGEVSVIRN LEIKKGWKKVGGKQQS" sig_peptide complement(151..234) /locus_tag="CathTA2_0283" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.683) with cleavage site probability 0.546 at residue 28" gene complement(414..1223) /locus_tag="CathTA2_0284" CDS complement(414..1223) /locus_tag="CathTA2_0284" /inference="similar to AA sequence:KEGG:Aflv_1606" /note="KEGG: afl:Aflv_1606 Zn-dependent hydrolase" /codon_start=1 /transl_table=11 /product="Zn-dependent hydrolase" /protein_id="EGL84154.1" /db_xref="GI:334181631" /translation="MLKLYQHKDLIQGQLFLKHFSLSVSFYLIDGLLIDTGAPVYKQT LKNYFKGQKIEQVVLTHHHEDHSGCAGWLSRAKQVPVYMHPETKRILQAPPSIPMYRK LVWGQMEAVEGQEIGDRLETEHFTFKVIHTPGHCQDHISLLESNRGILFSGDLFVSTV IKYSLRDESIKQMLDSINTLLTYDFEEVYCAHAGRVENGYEAFRQKKAYLEELIEAVL HYYKQGLETHEIKEKLFPKPDWNHYLTMGEFSSYNVVKHIIEEFGSTLKVS" gene complement(1396..1617) /locus_tag="CathTA2_0285" CDS complement(1396..1617) /locus_tag="CathTA2_0285" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="EGL84155.1" /db_xref="GI:334181632" /translation="MELYYWSPEGEIDEKVIREKMLQAYEDIHHYQYEEYFDRAEPDP EKLIQYTPEASAHPGNQAAHEADPGQSQV" gene 1972..2178 /locus_tag="CathTA2_0286" CDS 1972..2178 /locus_tag="CathTA2_0286" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="EGL84156.1" /db_xref="GI:334181633" /translation="MIGIGAFLLWKSVDLGEAYANHWLRKSGGHADTDTYHIILSEAI RMYRSAGAILFAIGVWFLRKEAMR" gene complement(2216..3610) /locus_tag="CathTA2_0287" CDS complement(2216..3610) /locus_tag="CathTA2_0287" /inference="protein motif:PFAM:PF00392" /note="KEGG: gwc:GWCH70_1952 GntR family transcriptional regulator; PFAM: HTH transcriptional regulator, GntR; Aminotransferase, class I/II; SMART: HTH transcriptional regulator, GntR" /codon_start=1 /transl_table=11 /product="transcriptional regulator, GntR family with aminotransferase domain containing protein" /protein_id="EGL84157.1" /db_xref="GI:334181634" /db_xref="GO:0003700" /db_xref="GO:0030170" /db_xref="InterPro:IPR000524" /db_xref="InterPro:IPR004839" /translation="MELQPILDPTNGTPLYMQLYTYIKEEITNGHLQKGSKLPSIRVL SQHLGISKNTVETAYQQLLAEGYIESKPRVGFVVQELEEPLQPFPFQPDVPVEAPKSK PIRYNFRYGHIDLAHFPMKTWRKCLLEALDSEQSELMWYGERKGDIELRREIQRYLYY ARGIRCSAGQIIIGSGTPQLIGVLCQLFDCRHDEVALENPCYNVVRTVFQNHHFSIVP VELEEDGLNIDQLQATSAKVVYVTPSHQLPLGMVLPIGKRQKLLKWAQQSNGFIIEDD YDSEFRYGSKPIPALKALDTEDRVVYIGTFSKVFTPAIRTSYMVLPQHLLERFHERCS NYHQTVATVVQKALTRFMREGHFERHVRRMRTIYAKKRQALIEAICEYFGDQATIIGD KAGLHLLVKIKGKSAAELVQKAEQAGILVYSAAKYWFGNNGTPPSYLLLGFGGMNEAD IRTGIRELKRVWEI" gene 3716..4264 /locus_tag="CathTA2_0288" CDS 3716..4264 /locus_tag="CathTA2_0288" /inference="protein motif:PFAM:PF01243" /note="PFAM: Pyridoxamine 5'-phosphate oxidase-like, FMN-binding domain; KEGG: gwc:GWCH70_1951 pyridoxamine 5'-phosphate oxidase-related FMN-binding" /codon_start=1 /transl_table=11 /product="pyridoxamine 5'-phosphate oxidase-related FMN-binding" /protein_id="EGL84158.1" /db_xref="GI:334181635" /db_xref="GO:0010181" /db_xref="InterPro:IPR011576" /translation="MRRDMLECKDEQKINRFLQEALTGFLGLADGGDPYVVPLNFVWW NGCVYVHGAEEGRKIDIIRRNPRVCFTVSEHIGTMVHPVPAKTSTAYMSVMIFGTAEI VSDLKEATQALDQLLGKYVPGYFDRPLSEKHVSSYRSSAGSATVVIKIIPDLITAKEK PLEKERKFYKGRTVRDDAGRIF" gene 4367..4795 /locus_tag="CathTA2_0289" CDS 4367..4795 /locus_tag="CathTA2_0289" /inference="protein motif:PFAM:PF09339" /note="KEGG: gmc:GY4MC1_1582 transcriptional regulator, IclR family; PFAM: Transcriptional regulator IclR, N-terminal; SMART: Transcriptional regulator IclR, N-terminal" /codon_start=1 /transl_table=11 /product="transcriptional regulator, IclR family" /protein_id="EGL84159.1" /db_xref="GI:334181636" /db_xref="GO:0003677" /db_xref="InterPro:IPR005471" /translation="MNKTVIKTMEMLKLFIDRERLTLQEMVELLQMPKTSVYRMAQSL VELGFLQKTNDYYQLGLAFLSFGMLVAERLDLRRIALPIMKRLKEETKEAVNLVIRDG DEAIYNEKVDTSEPVRVYTKVGQRAPLYAGACPIAIKLRI" gene 4865..5050 /locus_tag="CathTA2_0290" CDS 4865..5050 /locus_tag="CathTA2_0290" /inference="similar to AA sequence:KEGG:GWCH70_1418" /note="KEGG: gwc:GWCH70_1418 transposase IS4 family protein" /codon_start=1 /transl_table=11 /product="transposase IS4 family protein" /protein_id="EGL84160.1" /db_xref="GI:334181637" /translation="MAKKMKAWIKTIRQLFSSEELTRLARKVGFIQRQRSLTAEAFLT LCAWGDGSLAGQVQIIV" gene complement(5238..>5958) /locus_tag="CathTA2_0291" CDS complement(5238..>5958) /locus_tag="CathTA2_0291" /inference="protein motif:PFAM:PF00872" /note="PFAM: Transposase, mutator type; KEGG: gmc:GY4MC1_2978 transposase mutator type" /codon_start=2 /transl_table=11 /product="transposase mutator type" /protein_id="EGL84161.1" /db_xref="GI:334181638" /db_xref="GO:0003677" /db_xref="GO:0004803" /db_xref="InterPro:IPR001207" /translation="DGRVRSRAVLIATGVNEEGYREILGLQIGNSESESSWSEFFGWL KDRGLRGVDLIISDQHRGLVQAIEKHFQGATWQRCQTHFIRNILDAAPKYMQDALLEE IRGILHAPNKQTARLLLEQVLAKWEEKAPKAMQILEEGFEDATAVLDYPDRYRRRLRT TNGVERLNEEIRRRERVIRIFPNRESVYRLVGAVLIEIDEKWMSGRKYLDMSEYWRWR KTKEQGIRSVNQETPAIKRVG" BASE COUNT 1499 a 1339 c 1449 g 1671 t ORIGIN 1 gtggtcagaa ccggttttgt acataataaa gccaacaggt taaataaatc atcaagattg 61 ctgtttgccc ccaacctttt tccagccttt tttaatctct aagttacgga tgacagatac 121 ttcacctttt ttgctgacga atggcctgac aatggcctga acgatgacgg ctaaaaaagc 181 ggtcatgcca ataatcatta cgcctaaaat cgccaggtca atgaaaaaat ccatcctact 241 caccccttat attgaaattt taccccacag gctgtcaatt gaaaagagcc ctggacagaa 301 aacgcccaaa acgtgataat tcaataaaat aaatacatta atcatgaaaa cagagagaga 361 ggaccatgag caccgttgac cttcatcctt cagccgtgct gattgtcttg ggcttaactt 421 accttgagcg tggaaccgaa ttcctcaata atatgcttga caacgttgta tgatgaaaac 481 tcacccatcg tcaaataatg gttccagtct ggtttgggga agagtttttc cttgatttca 541 tgtgtttcca agccttgttt gtaatagtgg agcactgctt caatcagttc ctccagatag 601 gctttcttct gccggaatgc ctcgtaaccg ttttcgaccc gtccggcatg ggcgcagtac 661 acctcttcaa aatcgtaggt taacagggta ttgatggaat ccagcatctg tttgatcgac 721 tcatcgcgca agctgtactt gatcactgtg gagacgaaca ggtcaccgct gaataaaatg 781 ccccggttgg actccagcaa gctgatgtga tcctggcagt gacctggtgt atgaatcact 841 ttaaaggtaa agtgctctgt ttcgagtctg tcgccaattt cctgcccctc cacggcctcc 901 atttgtcccc aaaccagctt gcggtacatg gggatggaag gaggggcttg taaaattcgc 961 ttggtttcag ggtgcatgta gaccgggact tgtttggccc gtgaaagcca tcctgcacag 1021 ccggaatggt cttcgtggtg atgggttaac accacttgtt cgattttttg ccctttgaaa 1081 tagtttttta atgtctgttt atatactggt gcacctgtat cgatcagtaa accatcaatc 1141 aagtaaaaag aaaccgaaag ggagaaatgc ttcaggaata gctgaccctg aatcaggtct 1201 ttatgttgat aaagttttaa catggtgaat ctcctctgtc cagtgttgtt ctgacatcaa 1261 cggagtaaac gttgtgaaca ctaaacttat tctgaatgaa tagtcattca ttataaatat 1321 agcataaaca gggcaggatg tcattccaaa agttaacagc accagcgcaa tgttgcttaa 1381 aactgagaga gttgcttaaa cctgagactg accaggatct gcctcatgag ctgcttgatt 1441 gccggggtgt gcggaagctt cgggcgtgta ctgaattaat ttttctggat ccggctcagc 1501 acggtcaaag tattcttcgt attggtagtg atggatatct tcataggcct gaagcatctt 1561 ttcacggatg actttttcat ctatttcccc ttcaggtgac caataataca gctccatgcg 1621 gtttaactca ggggacgttt cccagggtat gcgtcccgtt tatcggaaag cccgactatt 1681 tcgagtaatt cattgactct tttttcaatt tcgccttttg gcttttttgc tgtgctgaca 1741 ggaatgattg ccgcgtttct catgcagcat cattctgcgc aagaagccat tagcaacgcc 1801 gtctgggttc atggaaaagc cgccgatatg cttgtagaac gcggccattc gcaatgggac 1861 gtacttgctg gcgatttgat tgaagcaatt ccagcggtgc tttcgtatgt gcaggaaaaa 1921 caataggggg gatatggatt gaaaaattgg aaatggtggc tggacattgc aatgattgga 1981 atcggcgctt ttttgctttg gaaaagcgtg gaccttggtg aagcatacgc caatcattgg 2041 cttcgtaaaa gcgggggaca tgcagacacg gatacttatc atattatctt atccgaagcg 2101 attcgcatgt atcgttcggc aggtgcgatt ttattcgcca tcggggtatg gtttctgcgt 2161 aaagaagcga tgcgctagaa tatagaagcg catcgttttt ctttttggga gtagttcaaa 2221 tctcccatac ccgttttagt tcgcgaattc cggtacggat gtccgcctcg ttcattcctc 2281 caaagcctag caaaagataa gaaggaggcg ttccgttgtt cccaaaccaa tatttcgctg 2341 cggaatagac gagaatgccc gcttgttctg ctttttgcac cagttcggcg gcgctcttgc 2401 cttttatttt tacaagaaga tgaagccccg ctttgtcgcc gatgatcgtt gcttgatcac 2461 cgaagtattc acaaatcgct tcgataagcg cctgccgctt ttttgcgtag atggtgcgca 2521 tgcggcggac atggcgttca aaatggcctt cacgcataaa tcgggtgagc gctttttgga 2581 cgaccgtagc gacggtctga tggtaattgg agcagcgttc atgaaaccgc tctagcaaat 2641 gttgcggcag caccatataa cttgtgcgga tggcaggggt gaacactttt gaaaacgtgc 2701 cgatataaac gacgcggtct tctgtatcga gcgcttttaa cgcagggatc ggtttgcttc 2761 cgtagcggaa ttcgctgtca taatcgtctt cgataataaa gccgttagac tgttgcgccc 2821 attttaggag cttttgccgt ttgccgatcg gcagcaccat cccaagcggc aattgatggg 2881 aaggggtgac ataaacgact tttgcgcttg ttgcttgcag ctggtcaatg ttcagtccgt 2941 cttcttccag ctcgaccgga acgatggaaa aatggtggtt ttgaaacacg gtgcgaacga 3001 cattataaca aggattttct aaagcgacct catcgtgcct gcagtcgaac agctggcata 3061 agacgccaat cagttgtggc gtgccagagc caataatgat ttgcccagcc gaacagcgaa 3121 tgccgcgtgc ataatacaag tagcgttgga tttcgcggcg caattcgata tctccttttc 3181 gttcgccata ccacattaat tcgctttgtt cggaatccag cgcttcaagg agacattttc 3241 gccatgtttt catcggaaaa tgggcaaggt caatatgacc gtagcgaaag ttgtagcgaa 3301 tcggcttgct tttcggagcc tccacgggga catccggttg gaaaggaaac ggttggagag 3361 gctcttccag ttcttgaaca acgaatccta cgcgcggctt gctttcgata tatccttcgg 3421 caagaagctg ctggtatgcg gtttcgacgg tatttttgct gatgcctagg tgttgggaaa 3481 gcacgcgaat cgatgggagc ttgcttcctt tttggagatg gccgtttgtg atttcctctt 3541 ttatgtacgt atacagctgc atgtaaagcg gtgtgccgtt tgttggatcg agaatgggct 3601 gcaattccat tatgtttttc ctcctctgac ccttcttttt tatttaattc tgtccctgtt 3661 cataaggtca gtttttttct atgattccat tatacactag gaagggggaa aatagatgag 3721 aagggatatg ttggaatgca aagatgaaca aaaaatcaac cggtttttgc aggaagcgtt 3781 gaccggattt ttaggtttgg cagacggtgg tgatccatat gtcgtaccgc ttaatttcgt 3841 atggtggaac ggctgtgtct atgtgcatgg agcggaagaa gggagaaaaa tcgatataat 3901 ccgtcgcaat ccgcgcgttt gttttaccgt tagtgaacat atcgggacaa tggtacatcc 3961 cgttccagca aaaacgagca ccgcttatat gagtgtgatg atatttggaa cagcggagat 4021 cgtttctgat ctaaaggagg cgacacaagc gctcgaccag ttgcttggca aatatgtgcc 4081 gggctatttt gaccgaccgc tttccgagaa gcatgtatca tcataccgct catcggcagg 4141 aagcgcgact gttgtcatca aaatcattcc tgaccttatc acagcgaaag aaaaaccgtt 4201 agagaaagag cgaaagtttt ataaaggaag aaccgtgcgg gacgatgccg gcaggatttt 4261 ttgactgaaa aataagatag aaaattttat gtatttttac tataatgaat ataaaaattc 4321 attttgcgga atataagttt caatattcgg aacaagaggg agaatgatga ataaaacagt 4381 cattaaaacg atggaaatgt taaagttgtt catcgaccgt gaacggctta cattgcagga 4441 aatggtcgaa ttattgcaaa tgccaaagac gtcggtgtat cggatggcgc aatcattagt 4501 ggaacttggt tttttacaaa aaactaacga ttattatcag ctcggtttag catttttgtc 4561 gtttggcatg ctcgttgccg agcggctgga tctccggcga atcgcgcttc cgattatgaa 4621 gcggctgaaa gaagagacga aggaagcggt caatttagtc attcgcgacg gcgatgaagc 4681 gatttataat gaaaaggtcg atacatcgga accggtgcgc gtgtatacaa aagtaggaca 4741 gcgtgctccg ttatacgcgg gggcgtgccc catagccatc aagttaagaa tttgatcttt 4801 tttcagcgcc aaaaacatgg tatcctttct aacgaaaatc atcgttggaa aggattgttt 4861 tttgatggca aaaaagatga aggcatggat aaaaacgatt cgtcaactct tctcctctga 4921 agaactgacc cgtctggcac ggaaagtcgg attcattcag cggcagcgtt cattaacagc 4981 ggaagccttt ctgacgctat gtgcttgggg agacggatcg ctcgccggtc aagtccaaat 5041 tattgtgtaa attccccttt gatagacaac atggacctga gactggacgt atagtaggta 5101 agtccggcaa gtctccctgc cggtcgcctt cccggaccaa tgatcatgtt gtcaaggaac 5161 aggtgtgtca aggagctttc gcggcatatc ctcgcttcgc tccggtattc cacgttctcc 5221 ttgacacagc gaaggggtta tcccactctc ttgatcgccg gagtctcctg attcaccgat 5281 cggattcctt gctctttcgt tttccgccac cgccaatatt cggacatatc caagtattta 5341 cgtcccgaca tccatttttc gtcgatttcg atcagcacgg cgccaacgag gcgatacacc 5401 gattcccggt tcggaaagat gcggatgacc cgttctctgc ggcgaatttc ctcgttcagc 5461 cgttccactc cgttggtcgt gcgcagacgc cgccggtaac ggtccggata gtccaatacg 5521 gccgtggcgt cttcaaatcc ctcttcaagg atttgcatgg cttttggtgc tttttcttcc 5581 catttggcca gcacttgttc caataacagt cgggccgttt gcttgtttgg ggcatgaaga 5641 atcccgcgaa tctcctcaag caaggcatcc tgcatatact ttggtgcggc atcgaggata 5701 ttgcgaataa aatgtgtctg gcatcgctgc catgtagcgc cttggaaatg cttttcaata 5761 gcttgcacaa gcccgcggtg ctgatccgag atgatcaagt ccactccccg gagtcctcgg 5821 tctttcagcc atccgaagaa ctcgctccag ctggactccg attcactgtt tccgatttgc 5881 aggccaagaa tttcccggta tccttcctca ttcactcccg tggcgatcaa aacggctctg 5941 gaacgtaccc gtccatct //