% Conference paper in the ECIR 2019 proceedings (Lecture Notes in Computer Science).
% The event name/dates and the publisher copyright notice are stored in dedicated
% fields (eventtitle, eventdate, copyright) instead of note, so that styles do not
% print them verbatim in the bibliography. Names use the "Last, First" form.
% TODO(review): the LNCS volume number is not recorded in this entry; add a
% volume field once confirmed against the publisher's page for the DOI below.
@inproceedings{ba1faeda6a1245c48065d464f20afee2,
  author     = {Mackenzie, Joel and Mallia, Antonio and Petri, Matthias and Culpepper, J. Shane and Suel, Torsten},
  title      = {Compressing Inverted Indexes with Recursive Graph Bisection: {A} Reproducibility Study},
  booktitle  = {Advances in Information Retrieval -- 41st European Conference on {IR} Research, {ECIR} 2019, Proceedings},
  editor     = {Hiemstra, Djoerd and Hauff, Claudia and Fuhr, Norbert and Azzopardi, Leif and Stein, Benno and Mayr, Philipp},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer},
  year       = {2019},
  pages      = {339--352},
  doi        = {10.1007/978-3-030-15712-8_22},
  isbn       = {9783030157111},
  eventtitle = {41st European Conference on Information Retrieval, {ECIR} 2019},
  eventdate  = {2019-04-14/2019-04-18},
  language   = {english},
  langid     = {american},
  copyright  = {Springer Nature Switzerland AG 2019},
  keywords   = {Compression, Efficiency, Reordering, Reproducibility},
  abstract   = {Document reordering is an important but often overlooked preprocessing stage in index construction. Reordering document identifiers in graphs and inverted indexes has been shown to reduce storage costs and improve processing efficiency in the resulting indexes. However, surprisingly few document reordering algorithms are publicly available despite their importance. A new reordering algorithm derived from recursive graph bisection was recently proposed by Dhulipala et al., and shown to be highly effective and efficient when compared against other state-of-the-art reordering strategies. In this work, we present a reproducibility study of this new algorithm. We describe the implementation challenges encountered, and explore the performance characteristics of our clean-room reimplementation. We show that we are able to successfully reproduce the core results of the original paper, and show that the algorithm generalizes to other collections and indexing frameworks. Furthermore, we make our implementation publicly available to help promote further research in this space.},
}