@inproceedings{0da405abb17c4e518a8b1ce7109a10df,
title = "SiGMa: Simple greedy matching for aligning large knowledge bases",
abstract = "The Internet has enabled the creation of a growing number of large-scale knowledge bases in a variety of domains containing complementary information. Tools for automatically aligning these knowledge bases would make it possible to unify many sources of structured knowledge and answer complex queries. However, the efficient alignment of large- scale knowledge bases still poses a considerable challenge. Here, we present Simple Greedy Matching (SiGMa), a simple algorithm for aligning knowledge bases with millions of entities and facts. SiGMa is an iterative propagation algorithm that leverages both the structural information from the relationship graph and flexible similarity measures between entity properties in a greedy local search, which makes it scalable. Despite its greedy nature, our experiments indicate that SiGMa can efficiently match some of the world's largest knowledge bases with high accuracy. We provide additional experiments on benchmark datasets which demonstrate that SiGMa can outperform state-of-The-Art approaches both in accuracy and efficiency.",
keywords = "Alignment, Entity, Greedy algorithm, Knowledge base, Large-scale, Relationship",
author = "Simon Lacoste-Julien and Konstantina Palla and Alex Davies and Gjergji Kasneci and Thore Graepel and Zoubin Ghahramani",
note = "Publisher Copyright: Copyright {\textcopyright} 2013 ACM.; 19th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2013 ; Conference date: 11-08-2013 Through 14-08-2013",
year = "2013",
month = aug,
day = "11",
doi = "10.1145/2487575.2487592",
language = "English",
series = "Proceedings of the ACM SIGKDD International Conference on Knowledge Discovery and Data Mining",
publisher = "Association for Computing Machinery",
pages = "572--580",
editor = "Rajesh Parekh and Jingrui He and Inderjit, {Dhillon S.} and Paul Bradley and Yehuda Koren and Rayid Ghani and Senator, {Ted E.} and Grossman, {Robert L.} and Ramasamy Uthurusamy",
booktitle = "KDD 2013 - 19th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining",
}