Escherichia coli CFT073_ complete genome - 1..5231428 299 newly added protein-coding (reannotated) (additional file 2) Location Strand Length PID Gene Synonym Code Product 11870..11935 + 21 * - c0001r - Predicted protein 12038..12133 + 31 * - c0002r - Predicted protein 16186..16338 - 50 * - c0003r - Toxic membrane protein_ hokC 29538..29729 + 63 * - c0004r - Hypothetical protein 29982..30452 + 156 * - c0005r - Non-specific ribonucleoside 45846..46280 + 144 * - c0006r - Homologue to protein FixB 46346..46786 + 146 * - c0007r - Homologue to protein FixB 81729..81860 + 43 * - c0008r - Putative uncharacterized protein 127216..128997 + 593 * - c0009r - Uropathogenic specific S-type colicin 129401..129688 + 95 * - c0010r - Putative colicin 129691..129984 + 97 * - c0011r - Putative colicin immunity protein 131965..132090 + 41 * - c0012r - Transposase for insertion sequence 136042..136671 + 209 * - c0013r - Probable pyruvate dehydrogenase 136658..137935 + 425 * - c0014r - Pyruvate dehydrogenase 203554..203907 + 117 * - c0015r - Predicted protein 203960..204055 + 31 * - c0016r - Hypothetical protein 204195..204752 + 185 * - c0017r - Putative ATP-binding component 238894..239013 + 39 * - c0018r - Putative uncharacterized protein 239023..239250 - 75 * - c0019r - Putative uncharacterized protein 239479..239673 - 64 * - c0020r - Cell wall-associated hydrolase 253442..253609 - 55 * - c0021r - Putative uncharacterized protein 255064..255288 - 74 * - c0022r - L0008-like protein 255428..255946 + 172 * - c0023r - Putative uncharacterized protein 255849..256166 + 105 * - c0024r - Transposase protein 256087..256683 + 198 * - c0025r - Putative protein 256700..256930 + 76 * - c0026r - Hypothetical transposase 270674..270919 - 81 * - c0027r - Phage integrase family protein 271866..272603 + 245 26246197 - c0292 - - hypothetical protein 292043..292366 + 107 * - c0028r - Putative uncharacterized protein 300426..300542 + 38 * - c0029r - Putative protein 300576..300641 + 21 * - c0030r - 
Hypothetical protein 305442..305696 + 84 * - c0031r - Hypothetical protein 310860..312131 + 423 * - c0032r - CdiB protein 312198..312632 + 144 * - c0033r - CdiA protein 322222..322740 + 172 * - c0034r - Putative uncharacterized protein 322816..323052 + 78 * - c0035r - Putative protein 323036..323194 + 52 * - c0036r - Putative protein 325690..325962 - 90 * - c0037r - Homologue to pilu protein_ papB 331584..331709 - 41 * - c0038r - Predicted integrase protein 335703..335993 + 96 * - c0039r - Putative protein 348478..348687 + 69 * - c0040r - Putative receptor 376998..377138 + 46 * - c0041r - Homologue to Iso-IS1-insB protein 378980..379309 - 109 * - c0042r - Putative ferredoxin 408902..409114 - 70 * - c0043r - Putative uncharacterized protein 428818..430314 + 498 * - c0044r - Putative protein_ homologous to YahG 430382..430630 + 82 * - c0045r - Putative uncharacterized protein 435157..435201 + 14 * - c0046r - Hypothetical protein 452265..452504 - 79 * - c0047r - Hypothetical protein 582977..583057 + 26 * - c0048r - Putative protein 592543..592800 + 85 * - c0049r - Predicted protein 593126..593323 + 65 * - c0050r - Predicted protein 625280..625372 - 30 * - c0051r - Hypothetical protein 627155..627463 - 102 * - c0052r - Putative prophage integrase protein_ IntD 627483..627782 - 99 * - c0053r - Putative integrase 681713..681823 - 36 * - c0054r - Hok/Gef family protein 691079..691375 - 98 * - c0055r - Citrate lyase acyl carrier protein_ CitD 778988..779098 - 36 * - c0056r - Hypothetical protein 796866..796979 + 37 * - c0057r - Hypothetical protein 834297..834971 + 224 * - c0058r - Biotin synthesis protein B 875244..875294 + 16 * - c0059r - Hypothetical protein 909004..909273 - 89 * - c0060r - Putative uncharacterized protein 912524..912676 - 50 * - c0061r - Putative uncharacterized protein 912701..912757 - 18 * - c0062r - Hypothetical protein 914647..914760 + 37 * - c0063r - Hypothetical protein 914770..914925 + 51 * - c0064r - Hypothetical protein 916419..916565 + 48 * - 
c0065r - Hypothetical protein 916956..917057 + 33 * - c0066r - Hypothetical protein 917672..917860 + 62 * - c0067r - Putative uncharacterized protein 937247..937315 + 22 * - c0068r - Hypothetical protein 942966..943067 + 33 * - c0069r - Hypothetical protein 974475..976484 + 669 * - c0070r - Macrolide-specific ABC-type protein 1002231..1003541 - 436 * - c0071r - Putative protein 1003381..1004514 - 377 * - c0072r - Putative protein 1019325..1019591 + 88 * - c0073r - Putative protein 1019452..1020312 + 286 * - c0074r - Putative protein 1059490..1059657 + 55 * - c0075r - Ribosomal modulation factor 1084234..1084326 + 30 * - c0076r - Hypothetical protein 1098806..1098973 + 55 * - c0077r - Hypothetical protein 1100027..1100332 + 101 * - c0078r - Hypothetical protein 1101750..1101923 + 57 * - c0079r - Hypothetical protein 1132609..1132743 + 44 * - c0080r - Putative uncharacterized protein 1136321..1136371 + 16 * - c0081r - Hypothetical protein 1139601..1139885 - 94 * - c0082r - Putative protein 1139653..1139919 - 88 * - c0083r - Tagatose-biphosphate aldolase II 1140813..1141064 + 83 * - c0084r - Putative protein 1141282..1141383 + 33 * - c0085r - Hypothetical protein 1141446..1141883 - 145 * - c0086r - Putative protein 1141965..1142066 - 33 * - c0087r - Hypothetical protein 1142066..1142329 - 87 * - c0088r - Putative protein 1142354..1142572 - 72 * - c0089r - Putative protein 1164731..1165249 + 172 * - c0090r - Putative protein 1166568..1166987 - 139 * - c0091r - Putative protein 1167112..1167756 - 214 * - c0092r - Putative protein 1176363..1176527 + 54 * - c0093r - Protein MchX 1176596..1176805 + 69 * - c0094r - Microcin immunity protein_ MchI 1182901..1183122 + 73 * - c0095r - Microcin immunity protein_ McmI 1183119..1183397 + 92 * - c0096r - McmA protein 1212671..1212796 - 41 * - c0097r - Putative protein 1223287..1223520 - 77 * - c0098r - Putative uncharacterized protein 1234499..1235998 + 499 * - c0099r - R6-like transposase protein 1235995..1236750 + 251 * - c0100r - 
Insertion sequence ATP-binding protein 1270306..1270671 + 121 * - c0101r - Putative virulence factor 1270789..1271232 + 147 * - c0102r - Putative virulence factor 1290866..1291039 + 57 * - c0103r - 50S ribosomal factor L32 1294169..1294906 + 245 * - c0104r - 3-oxoacyl-acyl carrier protein 1314745..1315629 - 294 * - c0105r - Transcription-repair couple protein 1334231..1334512 + 93 * - c0106r - Putative protein 1338301..1338456 + 51 * - c0107r - Hypothetical protein 1371676..1371774 + 32 * - c0108r - Hypothetical protein 1379525..1379713 + 62 * - c0109r - Putative DNA binding protein 1384959..1385207 + 82 * - c0110r - Putative transcriptional activator_ Per homologue 1395192..1395452 - 86 * - c0111r - Hypothetical protein 1399577..1399702 + 41 * - c0112r - Hypothetical protein 1399872..1400051 - 59 * - c0113r - Hypothetical protein 1405665..1405886 - 73 * - c0114r - Putative C4-type zinc finger DNA binding protein 1406277..1406468 - 63 * - c0115r - Hypothetical protein 1412931..1413086 - 51 * - c0116r - Hypothetical protein 1416788..1416913 + 41 * - c0117r - Hypothetical protein 1418123..1418299 + 58 * - c0118r - Hypothetical protein 1422607..1422789 + 60 * - c0119r - Hypothetical protein 1434048..1434275 + 75 * - c0120r - Putative protein 1434272..1434622 + 116 * - c0121r - Ig domain protein 1438027..1438356 + 109 * - c0122r - Minor tail protein 1455858..1456130 + 90 * - c0123r - Putative uncharacterized protein 1456610..1456786 + 58 * - c0124r - Putative uncharacterized protein 1458725..1458904 + 59 * - c0125r - Hypothetical protein 1459208..1459570 + 120 * - c0126r - Hypothetical protein 1461494..1461634 + 46 * - c0127r - Hypothetical protein 1532199..1532366 + 55 * - c0128r - Hypothetical protein 1532212..1532499 + 95 * - c0129r - Predicted protein 1532234..1532323 - 29 * - c0130r - Hypothetical protein 1539399..1539500 - 33 * - c0131r - Hypothetical protein 1544529..1544690 - 53 * - c0132r - Hypothetical protein 1562031..1563389 - 452 * - c0133r - Tryptophan 
biosynthesis protein 1609322..1609426 - 34 * - c0134r - Hypothetical protein 1632491..1632763 - 90 * - c0135r - Hypothetical protein 1632764..1633219 - 151 * - c0136r - Putative lysine carboxypeptide 1664321..1665229 + 302 * - c0137r - EntS/YbdA MFS transporter 1665588..1670360 + 1590 * - c0138r - Putative autotransporter protein 1705714..1705851 + 45 * - c0139r - Hypothetical protein 1709322..1709408 + 28 * - c0140r - Hypothetical protein 1709622..1710872 - 416 * - c0141r - Outer membrane TonB-dependent receptor 1710862..1711725 - 287 * - c0142r - Outer membrane receptor 1725418..1725504 + 28 * - c0143r - Putative protein 1727515..1727730 + 71 * - c0144r - Putative uncharacterized protein 1740228..1740815 + 195 * - c0145r - Formate dehydrogenase 1750171..1751349 - 392 * - c0146r - Putative enzyme 1750209..1750325 - 38 * - c0147r - Hypothetical protein 1779279..1779401 + 40 * - c0148r - Hypothetical protein 1785630..1787090 - 486 * - c0149r - Altronate oxidoreductase 1792671..1792790 + 39 * - c0150r - Hypothetical protein 1806257..1806331 - 24 * - c0151r - Hypothetical protein 1865074..1865199 + 41 * - c0152r - β-lactam resistance protein 1889782..1889844 + 20 * - c0153r - Hypothetical protein 1902540..1902650 - 36 * - c0154r - Putative protein 1951524..1953581 - 685 * - c0155r - Phenylalanyl-tRNA synthetase 1953448..1953912 - 154 * - c0156r - Putative protein 1955770..1955967 - 65 * - c0157r - 50S ribosomal protein L35 1959061..1959300 + 79 * - c0158r - Putative uncharacterized protein 1960261..1960368 + 35 * - c0159r - Predicted protein 2082558..2083154 + 198 * - c0160r - Phosphoribosylglycinamide formyltransferase 2 2083173..2083736 + 187 * - c0161r - Putative protein 2120211..2120321 - 36 * - c0162r - Hypothetical protein 2164409..2164450 + 13 * - c0163r - Hypothetical protein 2207421..2207480 + 19 * - c0164r - Putative exported protein 2215292..2215510 - 72 * - c0165r - Putative DNA binding protein 2314311..2314523 + 70 * - c0166r - Putative transcriptional 
regulator 2328409..2329605 + 398 * - c0167r - Glycosyl transferase family protein 2331125..2331247 - 40 * - c0168r - Putative protein 2331582..2331692 + 36 * - c0169r - Putative uncharacterized protein 2331672..2331779 - 35 * - c0170r - Hypothetical protein 2336026..2336163 - 45 * - c0171r - Hypothetical protein 2336202..2336288 - 28 * - c0172r - Hypothetical protein 2347097..2347141 + 14 * - c0173r - Hypothetical protein 2349098..2349277 + 59 * - c0174r - Putative transposase 2357898..2358332 + 144 * - c0175r - Homologous to GTP-binding protein 2368079..2368435 + 118 * - c0176r - Hypothetical protein 2449308..2449568 + 86 * - c0177r - Hypothetical protein 2495548..2495667 + 39 * - c0178r - Hypothetical protein 2507364..2507471 + 35 * - c0179r - Homologous to putative inner membrane protein 2547930..2548520 - 196 * - c0180r - Putative protein 2548517..2548870 - 117 * - c0181r - Conserved protein 2570846..2571073 + 75 * - c0182r - Putative protein 2571057..2571143 + 28 * - c0183r - Hypothetical protein 2577661..2577864 - 67 * - c0184r - Hypothetical outer membrane protein 2708536..2708700 - 54 * - c0185r - ABC transporter component 2709112..2709318 - 68 * - c0186r - Putative protein 2720742..2721467 - 241 * - c0187r - Putative transport protein 2721472..2721918 - 148 * - c0188r - Putative protein 2886254..2886445 + 63 * - c0189r - Putative uncharacterized protein 2989363..2989557 + 64 * - c0190r - Cell wall-associated hydrogenase 2989787..2990014 + 75 * - c0191r - Putative uncharacterized protein 2990024..2990143 - 39 * - c0192r - Hypothetical protein 3046888..3047082 + 64 * - c0193r - Protein ylcI homologue 3047333..3047539 - 68 * - c0194r - Uncharacterized protein ybcW 3048181..3048411 - 76 * - c0195r - Uncharacterized protein ynfN 3058011..3058349 - 112 * - c0196r - Putative protein 3061005..3061040 + 11 * - c0197r - Hypothetical protein 3101847..3103580 - 577 * - c0198r - Alanyl-tRNA synthetase 3103723..3104478 - 251 * - c0199r - Putative protein 3114946..3115896 
+ 316 * - c0200r - Anaerobic nitric oxide reductase 3115901..3116386 + 161 * - c0201r - Conservative protein 3160953..3161105 - 50 * - c0202r - Hypothetical protein 3167987..3168322 + 111 * - c0203r - Glycerol-3-phosphate response protein 3168309..3168563 + 84 * - c0204r - Hypothetical protein 3194046..3194204 - 52 * - c0205r - Hypothetical protein 3212335..3212487 + 50 * - c0206r - Hypothetical protein 3212760..3213752 + 330 * - c0207r - L-fuculokinase 3369752..3369922 - 56 * - c0208r - Hypothetical protein 3382130..3382345 + 71 * - c0209r - Putative protein 3409614..3409967 + 117 * - c0210r - Phage-like element 3412924..3413223 + 99 * - c0211r - Putative protein 3437738..3438052 - 104 * - c0212r - Possible P fimbrial regulator protein papB 3450922..3450987 + 21 * - c0213r - Hypothetical protein 3451905..3452165 - 86 * - c0214r - Insertion sequence protein 3452185..3452226 + 13 * - c0215r - Hypothetical protein 3452229..3452321 - 30 * - c0216r - Hypothetical protein 3452604..3452813 + 69 * - c0217r - Putative uncharacterized protein 3452998..3453309 + 103 * - c0218r - Putative uncharacterized protein 3471865..3472089 + 74 * - c0219r - Hypothetical protein 3472281..3472439 + 52 * - c0220r - Hypothetical protein 3498968..3499069 - 33 * - c0221r - Hypothetical protein 3531004..3531597 - 197 * - c0222r - Hypothetical type II secretion system component 3531570..3532172 - 200 * - c0223r - Hypothetical type II secretion system component 3538895..3540118 - 407 * - c0224r - GlcF protein 3540129..3541181 - 350 * - c0225r - GlcE protein 3600287..3600619 - 110 * - c0226r - Putative uncharacterized protein 3691020..3691553 + 177 * - c0227r - Putative glutathione S-transferase 3691424..3692008 + 194 * - c0228r - Putative transferase 3696054..3696446 - 130 * - c0229r - Predicted transporter 3696275..3697387 - 370 * - c0230r - Putative transport system 3758632..3758958 - 108 * - c0231r - Putative protein 3758948..3760576 - 542 * - c0232r - ATP-dependent metallopeptidase HflB 
3766628..3766939 - 103 * - c0233r - 50S ribosomal protein L21 3828066..3828230 + 54 * - c0234r - Hypothetical protein 3855625..3855819 + 64 * - c0235r - Cell wall-associated hydrogenase protein 3856048..3856290 + 80 * - c0236r - Putative uncharacterized protein 3856287..3856406 - 39 * - c0237r - Hypothetical protein 3873994..3874110 - 38 * - c0238r - 50S ribosomal subunit protein L36 3903151..3903318 + 55 * - c0239r - Hypothetical protein 3903352..3904938 + 528 * - c0240r - Putative uncharacterized protein 4020420..4020722 + 100 * - c0241r - Hypothetical acetyltransferase 4020735..4020908 + 57 * - c0242r - Hypothetical protein 4083199..4083396 + 65 * - c0243r - Putative protein 4083336..4083506 + 56 * - c0244r - Hypothetical protein 4139185..4139292 - 35 * - c0245r - Hypothetical protein 4159486..4159698 - 70 * - c0246r - Putative membrane permeability altering protein HokA 4216169..4216354 + 61 * - c0247r - Putative protein 4283366..4283440 - 24 * - c0248r - Hypothetical protein 4283780..4284055 - 91 * - c0249r - IS element 4291696..4292046 + 116 * - c0250r - transposase 4293074..4293121 - 15 * - c0251r - Transposase IS3/IS9 family protein 4294097..4294258 - 53 * - c0252r - Hypothetical protein 4301574..4302509 - 311 * - c0253r - Putative uncharacterized protein 4332035..4332148 - 37 * - c0254r - Hypothetical protein 4373586..4374734 - 382 * - c0255r - Bifunctional 2-oxo-3-deoxygalactonate_6-phosphate aldolase/galactonate dehydratase_ dgoD 4374756..4375349 - 197 * - c0256r - Putative protein 4380278..4380658 + 126 * - c0257r - Putative uncharacterized protein 4381415..4381915 + 166 * - c0258r - Putative uncharacterized protein 4384062..4384772 - 236 * - c0259r - Hypothetical chromosomal protein 4384741..4385466 - 241 * - c0260r - Hypothetical chromosomal protein 4386553..4386810 + 85 * - c0261r - UPF0161 protein yidD 4446589..4446831 - 80 * - c0262r - Putative protein 4447060..4447254 - 64 * - c0263r - Cell wall-associated hydrogenase protein 4482875..4483018 - 47 * - 
c0264r - Hypothetical protein 4494050..4494145 + 31 * - c0265r - Hypothetical protein 4521197..4521490 - 97 * - c0266r - Putative uncharacterized protein 4535533..4535628 + 31 * - c0267r - Hypothetical protein 4564910..4565029 + 39 * - c0268r - Hypothetical protein 4565026..4565268 - 80 * - c0269r - Putative protein 4565497..4565691 - 64 * - c0270r - Cell wall-associated hydrogenase protein 4572457..4573236 + 259 * - c0271r - Putative protein 4573149..4575242 + 697 * - c0272r - Conservative protein 4608747..4609334 - 195 * - c0273r - Formate dehydrogenase-O_ major subunit 4646707..4646919 + 70 * - c0274r - 50S ribosomal protein L31 4702788..4702907 + 39 * - c0275r - Hypothetical protein 4702917..4703144 - 75 * - c0276r - Putative uncharacterized protein 4703373..4703567 - 64 * - c0277r - Cell wall-associated hydrogenase protein 4742961..4743080 + 39 * - c0278r - Hypothetical protein 4743077..4743319 - 80 * - c0279r - Putative uncharacterized protein 4743548..4743742 - 64 * - c0280r - Cell wall-associated dehydrogenase protein 4822057..4822113 - 18 * - c0281r - Putative protein 4822307..4822417 - 36 * - c0282r - Hypothetical protein 4858106..4858525 - 139 * - c0283r - Formate dehydrogenase-H_ fdhF 4874565..4875122 - 185 * - c0284r - ATP-binding protein_ phnN 4901810..4902154 - 114 * - c0285r - Putative uncharacterized protein 4902072..4902452 - 126 * - c0286r - Putative uncharacterized protein 4909481..4909777 + 98 * - c0287r - Predicted protein_ homologous to YdjK 4932104..4932217 - 37 * - c0288r - Hypothetical protein 4940353..4940478 + 41 * - c0289r - Hypothetical protein 4948974..4949288 - 104 * - c0290r - P fimbrial regulator papB 4952308..4952481 + 57 * - c0291r - Putative uncharacterized protein 4966824..4966949 - 41 * - c0292r - Putative protein 5021097..5021354 + 85 * - c0293r - Putative protein 5033588..5033902 + 104 * - c0294r - Primosomal replication protein_ priB 5063873..5064055 - 60 * - c0295r - Predicted protein 5116725..5116814 + 29 * - c0296r - 
Hypothetical protein 5154853..5155197 + 114 * - c0297r - Probable RNA2 phosphotransferase 5155083..5155406 + 107 * - c0298r - Hypothetical protein