Citation

BibTex format

@article{Peach:2021:10.1016/j.patter.2021.100227,
author = {Peach, RL and Arnaudon, A and Schmidt, JA and Palasciano, HA and Bernier, NR and Jelfs, KE and Yaliraki, SN and Barahona, M},
doi = {10.1016/j.patter.2021.100227},
journal = {Patterns},
pages = {100227--100227},
title = {HCGA: Highly comparative graph analysis for network phenotyping},
url = {http://dx.doi.org/10.1016/j.patter.2021.100227},
volume = {2},
year = {2021}
}

RIS format (EndNote, RefMan)

TY  - JOUR
AB - <jats:title>A<jats:sc>bstract</jats:sc></jats:title><jats:p>Networks are widely used as mathematical models of complex systems across many scientific disciplines, not only in biology and medicine but also in the social sciences, physics, computing and engineering. Decades of work have produced a vast corpus of research characterising the topological, combinatorial, statistical and spectral properties of graphs. Each graph property can be thought of as a feature that captures important (and some times overlapping) characteristics of a network. In the analysis of real-world graphs, it is crucial to integrate systematically a large number of diverse graph features in order to characterise and classify networks, as well as to aid network-based scientific discovery. In this paper, we introduce HCGA, a framework for highly comparative analysis of graph data sets that computes several thousands of graph features from any given network. HCGA also offers a suite of statistical learning and data analysis tools for automated identification and selection of important and interpretable features underpinning the characterisation of graph data sets. We show that HCGA outperforms other methodologies on supervised classification tasks on benchmark data sets whilst retaining the interpretability of network features. We also illustrate how HCGA can be used for network-based discovery through two examples where data is naturally represented as graphs: the clustering of a data set of images of neuronal morphologies, and a regression problem to predict charge transfer in organic semiconductors based on their structure. HCGA is an open platform that can be expanded to include further graph properties and statistical learning tools to allow researchers to leverage the wide breadth of graph-theoretical research to quantitatively analyse and draw insights from network data.</jats:p>
AU - Peach,RL
AU - Arnaudon,A
AU - Schmidt,JA
AU - Palasciano,HA
AU - Bernier,NR
AU - Jelfs,KE
AU - Yaliraki,SN
AU - Barahona,M
DO - 10.1016/j.patter.2021.100227
EP - 100227
PY - 2021///
SN - 2666-3899
SP - 100227
TI - HCGA: Highly comparative graph analysis for network phenotyping
T2 - Patterns
UR - http://dx.doi.org/10.1016/j.patter.2021.100227
UR - http://hdl.handle.net/10044/1/88479
VL - 2
ER -