Imperial College London


Faculty of Natural Sciences, Department of Life Sciences

Director, Centre for Bioinformatics



+44 (0)20 7594 5212 m.sternberg Website




306, Sir Ernst Chain Building, South Kensington Campus






BibTeX format

@comment{
  Journal article record for the paper identified by the DOI below.
  Author names use the unambiguous von-Last, First form with spaced initials.
  NOTE(review): the surname Jarrelle may be a misspelling of Jarrell; confirm against the DOI record.
  NOTE(review): year is kept as given by the source export; confirm the print year for volume 425.
}
@article{sternberg2012gene,
  author  = {Sternberg, M. J. E. and Tamaddoni-Nezhad, A. and Lesk, V. I. and Kay, E. and Hitchen, P. G. and Cootes, A. and van Alphen, L. B. and Lamoureux, M. P. and Jarrelle, H. C. and Rawlings, C. J. and Soo, E. C. and Szymanski, C. M. and Dell, A. and Wren, B. W. and Muggleton, S. H.},
  title   = {Gene Function Hypotheses for the {Campylobacter} jejuni Glycome Generated by a Logic-Based Approach},
  journal = {Journal of Molecular Biology},
  volume  = {425},
  pages   = {186--197},
  year    = {2012},
  doi     = {10.1016/j.jmb.2012.10.014},
  issn    = {1089-8638},
}

RIS format (EndNote, RefMan)

AB - Increasingly, experimental data on biological systems are obtained from several sources and computational approaches are required to integrate this information and derive models for the function of the system. Here, we demonstrate the power of a logic-based machine learning approach to propose hypotheses for gene function integrating information from two diverse experimental approaches. Specifically, we use inductive logic programming that automatically proposes hypotheses explaining the empirical data with respect to logically encoded background knowledge. We study the capsular polysaccharide biosynthetic pathway of the major human gastrointestinal pathogen Campylobacter jejuni. We consider several key steps in the formation of capsular polysaccharide consisting of 15 genes of which 8 have assigned function, and we explore the extent to which functions can be hypothesised for the remaining 7. Two sources of experimental data provide the information for learning—the results of knockout experiments on the genes involved in capsule formation and the absence/presence of capsule genes in a multitude of strains of different serotypes. The machine learning uses the pathway structure as background knowledge. We propose assignments of specific genes to five previously unassigned reaction steps. For four of these steps, there was an unambiguous optimal assignment of gene to reaction, and to the fifth, there were three candidate genes. Several of these assignments were consistent with additional experimental results. We therefore show that the logic-based methodology provides a robust strategy to integrate results from different experimental approaches and propose hypotheses for the behaviour of a biological system.
AU - Sternberg,MJE
AU - Tamaddoni-Nezhad,A
AU - Lesk,VI
AU - Kay,E
AU - Hitchen,PG
AU - Cootes,A
AU - van Alphen,LB
AU - Lamoureux,MP
AU - Jarrelle,HC
AU - Rawlings,CJ
AU - Soo,EC
AU - Szymanski,CM
AU - Dell,A
AU - Wren,BW
AU - Muggleton,SH
DO - 10.1016/j.jmb.2012.10.014
EP - 197
PY - 2012///
SN - 1089-8638
SP - 186
TI - Gene Function Hypotheses for the Campylobacter jejuni Glycome Generated by a Logic-Based Approach
T2 - Journal of Molecular Biology
UR -
UR -
VL - 425
ER -