% Conference paper on subgraph census / g-tries from the NetSci-X 2016 proceedings.
% The citation key is kept as-is so existing citations still resolve.
% NOTE(review): address is taken from the copyright line in the note field; confirm against the book.
@inproceedings{e80a36f7706e4c1ea5b8fb0f3e5644ad,
  author    = {Paredes, Pedro and Ribeiro, Pedro},
  title     = {Large scale graph representations for subgraph census},
  booktitle = {Advances in Network Science -- 12th International Conference and School, {NetSci-X} 2016, Proceedings},
  editor    = {Brandes, Ulrik and Pedreschi, Dino and Wierzbicki, Adam and Schweitzer, Frank},
  series    = {Lecture Notes in Computer Science},
  pages     = {186--194},
  publisher = {Springer},
  address   = {Berlin, Heidelberg},
  year      = {2016},
  isbn      = {9783319283609},
  doi       = {10.1007/978-3-319-28361-6_16},
  language  = {English (US)},
  keywords  = {Complex networks, G-tries, Large scale graphs, Motifs},
  abstract  = {A Subgraph Census (determining the frequency of smaller subgraphs in a network) is an important computational task at the heart of several graph mining algorithms. Here we focus on the g-tries, an efficient state-of-the art data structure. Its algorithm makes extensive use of the graph primitive that checks if a certain edge exists. The original implementation used adjacency matrices in order to make this operation as fast as possible, as is the case with most past approaches. This representation is very expensive in memory usage, limiting the applicability. In this paper we study a number of possible approaches that scale linearly with the number of edges. We make an extensive empirical study of these alternatives in order to find an efficient hybrid approach that combines the best representations. We achieve a performance that is less than 50% slower than the adjacency matrix on average (almost 3 times more efficient than a naive binary search implementation), while being memory efficient and tunable for different memory restrictions.},
  note      = {Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2016.; 12th International Conference and School on Advances in Network Science, NetSci-X 2016 ; Conference date: 11-01-2016 Through 13-01-2016},
}