@inproceedings{b5a5ff05cb504bd39d69db298b8928f6,
title = "Correcting for Granularity Bias in Modularity-Based Community Detection Methods",
abstract = "Maximizing modularity is currently the most widely-used community detection method in applications. Modularity comes with a parameter that indirectly controls the granularity of the resulting clustering. Moreover, one can choose this parameter in such a way that modularity maximization becomes equivalent to maximizing the likelihood of a stochastic block model. Thus, this method is statistically justified, while at the same time, it is known to have a bias towards fine-grained clusterings. In this work, we introduce a heuristic to correct for this bias. This heuristic is based on prior work where modularity is described in geometric terms. This has led to a broad generalization of modularity-based community detection methods, and the heuristic presented in this paper applies to each of them. We justify the heuristic by describing a relation between several distances that we observe to hold in many instances. We prove that, assuming the validity of this relation, our heuristic leads to a clustering of the same granularity as the ground-truth clustering. We compare our heuristic to likelihood-based community detection methods on several synthetic graphs and show that our method indeed results in clusterings with granularity closer to the granularity of the ground-truth clustering. Moreover, our heuristic often outperforms likelihood maximization in terms of similarity to the ground-truth clustering.",
keywords = "Clustering, Community detection, Likelihood maximization, Modularity",
author = "Martijn G{\"o}sgens and {van der Hofstad}, Remco and Nelly Litvak",
year = "2023",
month = may,
day = "16",
doi = "10.1007/978-3-031-32296-9_1",
language = "English",
isbn = "978-3-031-32295-2",
series = "Lecture Notes in Computer Science (LNCS)",
publisher = "Springer",
pages = "1--18",
editor = "Megan Dewar and Pawe{\l} Pra{\l}at and Przemys{\l}aw Szufel and Fran{\c c}ois Th{\'e}berge and Ma{\l}gorzata Wrzosek",
booktitle = "Algorithms and Models for the Web Graph",
address = "Germany",
note = "18th International Workshop on Algorithms and Models for the Web Graph, WAW 2023 ; Conference date: 23-05-2023 Through 26-05-2023",
}