LOCUS X90754 4680 bp DNA linear BCT 04-MAY-2005 DEFINITION E.coli csgG, csgF, csgE, csgD, csgB, csgA, and orfC genes. ACCESSION X90754 VERSION X90754.1 KEYWORDS csgA gene; csgB gene; csgD gene; csgE gene; csgF gene; csgG gene; orfC gene. SOURCE Escherichia coli ORGANISM Escherichia coli Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales; Enterobacteriaceae; Escherichia. REFERENCE 1 AUTHORS Hammar M., Arnqvist A., Bian Z., Olsen A., Normark S. TITLE Expression of two csg operons is required for production of fibronectin- and congo red-binding curli polymers in Escherichia coli K-12 JOURNAL Mol. Microbiol. 18(4), 661-670(1995). PUBMED 8817489 REFERENCE 2 (bases 1 to 4680) AUTHORS Hammar M. JOURNAL Submitted (11-AUG-1995) to the INSDC. M. Hammar, Karolinska Institutet, Microbiology and Tumorbiology Center, Box 280, S-171 77 Stockholm, SWEDEN FEATURES Location/Qualifiers source 1..4680 /organism="Escherichia coli" /map="23.15 minutes" /strain="K12" /mol_type="genomic DNA" /db_xref="taxon:562" misc_feature 1..3140 /note="strain MC4100" mobile_element <1..>4680 /mobile_element_type="insertion sequence:IS2 (partial)" CDS complement(133..966) /transl_table=11 /gene="csgG" /product="assembly /transport component in curli production" /db_xref="GOA:P0AEA2" /db_xref="InterPro:IPR005534" /db_xref="PDB:4UV2" /db_xref="PDB:4UV3" /db_xref="UniProtKB/Swiss-Prot:P0AEA2" /protein_id="CAA62277.1" /translation="MQRLFLLVAVMLLSGCLTAPPKEAARPTLMPRAQSYKDLTHLPA PTGKIFVSVYNIQDETGQFKPYPASNFSTAVPQSATAMLVTALKDSRWFIPLERQGLQ NLLNERKIIRAAQENGTVAINNRIPLQSLTAANIMVEGSIIGYESNVKSGGVGARYFG IGADTQYQLDQIAVNLRVVNVSTGEILSSVNTSKTILSYEVQAGVFRFIDYQRLLEGE VGYTSNEPVMLCLMSAIETGVIFLINDGIDRGLWDLQNKAERQNDILVKYRHMSVPPE S" CDS complement(993..1409) /transl_table=11 /gene="csgF" /product="assembly /transport component in curli production" /db_xref="GOA:P0AE98" /db_xref="InterPro:IPR018893" /db_xref="PDB:5M1U" /db_xref="UniProtKB/Swiss-Prot:P0AE98" /protein_id="CAA62278.1" /translation="MRVKHAVVLLMLISPLSWAGTMTFQFRNPNFGGNPNNGAFLLNS AQAQNSYKDPSYNDDFGIETPSALDNFTQAIQSQILGGLLSNINTGKPGRMVTNDYIV DIANRDGQLQLNVTDRKTGQTSTIQVSGLQNNSTDF" CDS complement(1434..1823) /transl_table=11 /gene="csgE" /product="assembly /transport component in curli production" /db_xref="GOA:P0AE95" /db_xref="InterPro:IPR018900" /db_xref="PDB:2NA4" /db_xref="UniProtKB/Swiss-Prot:P0AE95" /protein_id="CAA62279.1" /translation="MKRYLRWIVAAEFLFAAGNLHAVEVEVPGLLTDHTVSSIGHDFY RAFSDKWESDYTGNLTINERPSARWGSWITITVNQDVIFQTFLFPLKRDFEKTVVFAL IQTEEALNRRQINQALLSTGDLAHDEF" CDS complement(1828..2478) /transl_table=11 /gene="csgD" /product="putative regulatory protein" /note="necessary for transcription of the csgBA operon" /db_xref="GOA:P52106" /db_xref="InterPro:IPR000792" /db_xref="InterPro:IPR016032" /db_xref="InterPro:IPR036388" /db_xref="UniProtKB/Swiss-Prot:P52106" /protein_id="CAA62280.1" /translation="MFNEVHSIHGHTLLLITKSSLQATALLQHLKQSLAITGKLHNIQ RSLDDISSGSIILLDMMEADKKLIHYWQDTLSRKNNNIKILLLNTPEDYPYRDIENWP HINGVFYSMEDQERVVNGLQGVLRGECYFTQKLASYLITHSGNYRYNSTESALLTHRE KEILNKLRIGASNNEIARSLFISENTVKTHLYNLFKKIAVKNRTQAVSWANDNLRR" misc_feature complement(2626) /note="transcriptional start site for csgDEFG operon" misc_feature 3140 /note="transcriptional start site for csgBA operon" misc_feature 3141..4680 /note="strain W3110" CDS 3233..3688 /transl_table=11 /gene="csgB" /product="nucleation component of curlin monomers" /db_xref="GOA:P0ABK7" /db_xref="InterPro:IPR009742" /db_xref="UniProtKB/Swiss-Prot:P0ABK7" /protein_id="CAA62281.1" /translation="MKNKLLFMMLTILGAPGIAAAAGYDLANSEYNFAVNELSKSSFN QAAIIGQAGTNNSAQLRQGGSKLLAVVAQEGSSNRAKIDQTGDYNLAYIDQAGSANDA SISQGAYGNTAMIIQKGSGNKANITQYGTQKTAIVVQRQSQMAIRVTQR" sig_peptide 3729..3788 /gene="csgA" CDS 3729..4184 /transl_table=11 /gene="csgA" /product="curlin/CsgA protein" /note="major subunit" /db_xref="GOA:P28307" /db_xref="InterPro:IPR009742" /db_xref="PDB:6G8C" /db_xref="PDB:6G8D" /db_xref="PDB:6G8E" /db_xref="PDB:6G9G" /db_xref="UniProtKB/Swiss-Prot:P28307" /protein_id="CAA62282.1" /translation="MKLLKVAAIAAIVFSGSALAGVVPQYGGGGNHGGGGNNSGPNSE LNIYQYGGGNSALALQTDARNSDLTITQHGGGNGADVGQGSDDSSIDLTQRGFGNSAT LDQWNGKNSEMTVKQFGGGNGAAVDQTASNSSVNVTQVGFGNNATAHQY" CDS 4243..4575 /transl_table=11 /gene="orfC" /product="putative curli production protein" /db_xref="GOA:P52107" /db_xref="InterPro:IPR014491" /db_xref="UniProtKB/Swiss-Prot:P52107" /protein_id="CAA62283.1" /translation="MNTLLLLAALSSQITFNTTQQGDVYTIIPEVTLTQSCLCRVQIL SLREGSSGQSQTKQEKTLSLPANQPIALTKLSLNISPDDRVKIVVTVSDGQSLHLSQQ WPPSSEKS" BASE COUNT 1335 a 986 c 1047 g 1312 t ORIGIN 1 ggcctgtggc tggcggcgcg tagtgcaaag acggcgcacc gtgagcagga aatcaaaaat 61 aaagcgtgag gggcactcac gctttcgctt aaacagtaaa atgccggatg ataattccgg 121 cttttttatc tgtcaggatt ccggtggaac cgacatatgg cggtatttca ccagaatgtc 181 attctgccgt tctgctttat tttgcaaatc ccacagacca cggtcgatac catcattaat 241 caggaaaatg acccctgttt cgatagccga catcaggcac agcataacag gttcgttcga 301 ggtgtaaccc acttcccctt caagcaagcg ctggtagtca ataaagcgga aaaccccggc 361 ctgaacttca taggaaagta tcgtcttact ggtgttcacc gaagaaagga tctcgccggt 421 actcacattg acgacgcgca ggttcacggc aatctgatcg agctggtatt gcgtgtcggc 481 accgatgcca aaatatcttg ccccaacccc gccagatttg acgttgcttt cataaccgat 541 aatcgaacct tcaaccatga tatttgccgc cgttaaagat tgcagcggga ttcggttatt 601 aatggcaacc gtgccgtttt cttgtgccgc acgaataatc ttgcgctcgt taagcaggtt 661 ttgtaagccc tggcgctcca gcggtataaa ccagcgagaa tctttcagtg ccgtgaccag 721 cattgccgtg gcgctttgcg gaacagcagt ggagaagtta cttgccgggt agggtttaaa 781 ttgcccggtt tcgtcctgaa tgttgtatac cgaaacaaag attttacccg tcggcgctgg 841 cagatgggtc aaatctttgt agctctgagc acgaggcatt aatgtcggtc tggcggcttc 901 tttaggcggg gcggttaagc atccgctcag taacatgacg gcaaccaaaa gaaataagcg 961 ctgcatgatt attttcctta tgaagctggg gcttaaaaat cggttgagtt attttgtaaa 1021 cccgaaacct ggatggtcga ggtttgtccg gttttacgat ctgtcacgtt caactgcaat 1081 tgaccatcgc ggttggcaat atcgacaata taatcgttgg tcaccatgcg gcccggttta 1141 ccggtattaa tattcgacag tagcccacct aaaatttgtg actggatggc ctgagtaaag 1201 ttatctaacg ctgagggtgt ttcaatacca aagtcatcgt tatagctcgg atctttataa 1261 gagttttggg cctgagcgct atttaataaa aaagcgccat tatttgggtt accaccaaag 1321 tttggattac ggaactggaa agtcatggtt ccagcccaac ttaatggcga aataagcatg 1381 agtagaacta ctgcatgttt gacacgcatt gcagcctccg aacaattttt tatttagaat 1441 tcatcatgcg ccaaatcgcc cgtacttaat aacgcctgat ttatctggcg acgatttagt 1501 gcttcttcag tttgaatcag tgcaaagacg acagttttct cgaagtctct tttcaacgga 1561 aataaaaaag tctggaaaat aacgtcctga ttgaccgtta tagtgatcca gcttccccat 1621 cgtgcactgg gcctttcatt aatcgttaag ttacccgtat agtcactttc ccatttatca 1681 ctaaaggctc ggtaaaaatc atggccaata gatgaaacag tatggtcagt tagcaatccc 1741 gggacttcta cctcaacggc gtgaagattc cctgcggcga acagaaattc tgccgccaca 1801 atccagcgta aataacgttt catggcttta tcgcctgagg ttatcgtttg cccaggaaac 1861 cgcttgtgtc cggtttttta cggctatctt cttgaaaaga ttataaagat gcgttttaac 1921 cgtattttcg ctgatgaaca acgaacgagc gatctcgtta ttagacgcgc cgatacgcag 1981 cttattcagg atctcttttt cccgatgagt aaggagggct gattccgtgc tgttataacg 2041 atagttacct gaatgcgtaa tcaggtagct ggcaagcttt tgcgtaaagt agcattcgcc 2101 gcgcaggacg ccttgcaacc cattgacaac acgttcttga tcctccatgg aataaaaaac 2161 gccgttgata tgaggccagt tttcaatgtc gcggtacggg taatcttcag gcgtatttag 2221 caacaatatt ttgatattgt tgtttttcct gctcaaagta tcctgccaat aatggataag 2281 ctttttatcc gcttccatca tatccagaag aataatagag cctgaagaga tatcgtccag 2341 agaacgttga atattatgta attttcctgt aattgccagc gattgtttaa ggtgctgcaa 2401 gagagctgtc gcctgcaaag aagatttagt gatcaacaat aatgtatgac catgaatact 2461 atggacttca ttaaacatga tgaaaccccg ctttttttat tgatcgcaca cctgacagct 2521 gcctctaaaa tagaagcacc agaagtactg acagatgttg cactgctgtg tgtagtaata 2581 aatcagccct aaatgggtaa aatataaaac taatggatta catctgattt caatctagcc 2641 attacaaatc ttaaatcaag tgttaaacat gtaactaaat gtaactcgtt atattaaaat 2701 gttaacctta aggttttatt aagtttagaa atgatagaaa agttgtacat ttggttttta 2761 ttgcacaatt ttaaaaaatc atacaaatgg tgataactta ctaataatgc atataaaaaa 2821 tatttcggtg tagtcctttc gtcatgtaaa acgttcttgt tttttctcca cacctccgtg 2881 gacaattttt tactgcaaaa agacgaggtt tgtcacggct tgtgcgcaag acatatcgca 2941 gcaatcagcg acgggcaaga agaatgactg tctggtgctt tttgatagcg gaaaacggag 3001 atttaaaaga aaacaaaata tttttttgcg tagataacag cgtatttacg tgggttttaa 3061 tactttggta tgaactaaaa aagaaaaata caacgcgcgg gtgagttatt aaaaatattt 3121 ccgcagacat actttccatc gtaacgcagc gttaacaaaa tacaggttgc gttaacaacc 3181 aagttgaaat gatttaattt cttaaatgta cgaccaggtc cagggtgaca acatgaaaaa 3241 caaattgtta tttatgatgt taacaatact gggtgcgcct gggattgcag ccgcagcagg 3301 ttatgattta gctaattcag aatataactt cgcggtaaat gaattgagta agtcttcatt 3361 taatcaggca gccataattg gtcaagctgg gactaataat agtgctcagt tacggcaggg 3421 aggctcaaaa cttttggcgg ttgttgcgca agaaggtagt agcaaccggg caaagattga 3481 ccagacagga gattataacc ttgcatatat tgatcaggcg ggcagtgcca acgatgccag 3541 tatttcgcaa ggtgcttatg gtaatactgc gatgattatc cagaaaggtt ctggtaataa 3601 agcaaatatt acacagtatg gtactcaaaa aacggcaatt gtagtgcaga gacagtcgca 3661 aatggctatt cgcgtgacac aacgttaatt tccattcgac ttttaaatca atccgatggg 3721 ggttttacat gaaactttta aaagtagcag caattgcagc aatcgtattc tccggtagcg 3781 ctctggcagg tgttgttcct cagtacggcg gcggcggtaa ccacggtggt ggcggtaata 3841 atagcggccc aaattctgag ctgaacattt accagtacgg tggcggtaac tctgcacttg 3901 ctctgcaaac tgatgcccgt aactctgact tgactattac ccagcatggc ggcggtaatg 3961 gtgcagatgt tggtcagggc tcagatgaca gctcaatcga tctgacccaa cgtggcttcg 4021 gtaacagcgc tactcttgat cagtggaacg gcaaaaattc tgaaatgacg gttaaacagt 4081 tcggtggtgg caacggtgct gcagttgacc agactgcatc taactcctcc gtcaacgtga 4141 ctcaggttgg ctttggtaac aacgcgaccg ctcatcagta ctaatacatc atttgtatta 4201 cagaaacagg gcgcaagccc tgtttttttt cgggagaaga atatgaatac gttattactc 4261 cttgcggcac tttccagtca gataaccttt aatacgaccc agcaagggga tgtgtatacc 4321 attattcctg aagtcactct tactcaatct tgtctgtgca gagtacaaat attgtccctg 4381 cgcgaaggca gttcagggca aagtcagacg aagcaagaaa agaccctttc attgcctgct 4441 aatcaaccca ttgctttgac gaagttgagt ttaaatattt ccccggacga tcgggtgaaa 4501 atagttgtta ctgtttctga tggacagtca cttcatttat cacaacaatg gccgccctct 4561 tcagaaaagt cttaatttgt tgaaatatcg agcataagat gaatctggag agaatggtct 4621 gctgcgaatc agccaacctg aaagtatgga taacacaacc cttggatttg cccctatatt //