% SimDB demonstration paper, SIGMOD 2010 (Silva, Aly, Aref, Larson).
% The citation key is kept as exported so existing cite commands still resolve.
% NOTE(review): month/day below give 23 July 2010 while the note field gives
% conference dates of 6-11 June 2010; presumably the former is the export's
% publication date. Confirm before relying on month/day in a rendered style.
@inproceedings{b77cf63cb2b74fd183ebb8fd8855f78e,
  author    = {Silva, Yasin N. and Aly, Ahmed M. and Aref, Walid G. and Larson, Per-{\AA}ke},
  title     = {{SimDB}: A similarity-aware database system},
  booktitle = {Proceedings of the 2010 International Conference on Management of Data, {SIGMOD} '10},
  series    = {Proceedings of the ACM SIGMOD International Conference on Management of Data},
  publisher = {Association for Computing Machinery},
  pages     = {1243--1246},
  year      = {2010},
  month     = jul,
  day       = {23},
  doi       = {10.1145/1807167.1807330},
  isbn      = {9781450300322},
  language  = {English (US)},
  keywords  = {similarity group-by, similarity join, similarity-aware query processing and optimization},
  abstract  = {The identification and processing of similarities in the data play a key role in multiple application scenarios. Several types of similarity-aware operations have been studied in the literature. However, in most of the previous work, similarity-aware operations are studied in isolation from other regular or similarity-aware operations. Furthermore, most of the previous research in the area considers a standalone implementation, i.e., without any integration with a database system. In this demonstration we present SimDB, a similarity-aware database management system. SimDB supports multiple similarity-aware operations as first-class database operators. We describe the architectural changes to implement the similarity-aware operators. In particular, we present the way conventional operators' implementation machinery is extended to support similarity-aware operators. We also show how these operators interact with other similarity-aware and regular operators. In particular, we show the effectiveness of multiple equivalence rules that can be used to extend cost-based query optimization to the case of similarity-aware operations.},
  note      = {2010 International Conference on Management of Data, SIGMOD '10 ; Conference date: 06-06-2010 Through 11-06-2010},
}