% Conference paper in the CSIE 2011 proceedings (Communications in Computer and
% Information Science series). The exported record put "PART 1" in both `number`
% and `edition`; it names the proceedings part, so it is kept in `booktitle`.
% NOTE(review): the series volume number is not in the exported record
% (presumably CCIS vol. 152 -- confirm against the publisher page, then add `volume`).
@inproceedings{12b2630176154e0ba02b80793cd7ad2e,
  author    = {Li, Yakun and Wang, Hongzhi and Gao, Hong},
  title     = {Efficient entity resolution based on sequence rules},
  booktitle = {Advanced Research on Computer Science and Information Engineering - International Conference, {CSIE} 2011, Proceedings, Part 1},
  series    = {Communications in Computer and Information Science},
  pages     = {381--388},
  year      = {2011},
  doi       = {10.1007/978-3-642-21402-8_61},
  isbn      = {9783642214011},
  language  = {English},
  keywords  = {Bloom Filter, Entity resolution, Record matching},
  abstract  = {Entity resolution (ER) is to find the data objects referring to the same real-world entity. When ER is performed on relations, the crucial operator is record matching, which is to judge whether two tuples referring to the same real-world entity. Record matching is a longstanding issue. However, with massive and complex data in applications, current methods cannot satisfy the requirements. A Sequence-rule-based record matching (SeReMatching) is presented with the consideration of both the values of the attributes and their importance in record matching. And with the help of the Bloom Filter we changed, the algorithm greatly increases the checking speed and makes the complexity of entity resolution almost O(n). And extensive experiments are performed to evaluate our methods.},
  note      = {International Conference on Advanced Research on Computer Science and Information Engineering, CSIE 2011 ; Conference date: 21-05-2011 Through 22-05-2011},
}