{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,7,24]],"date-time":"2024-07-24T07:19:29Z","timestamp":1721805569903},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2012,11,8]],"date-time":"2012-11-08T00:00:00Z","timestamp":1352332800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["The VLDB Journal"],"published-print":{"date-parts":[[2013,6]]},"DOI":"10.1007\/s00778-012-0296-4","type":"journal-article","created":{"date-parts":[[2012,11,7]],"date-time":"2012-11-07T03:44:50Z","timestamp":1352259890000},"page":"395-420","source":"Crossref","is-referenced-by-count":28,"title":["Similarity queries: their conceptual evaluation, transformations, and processing"],"prefix":"10.1007","volume":"22","author":[{"given":"Yasin N.","family":"Silva","sequence":"first","affiliation":[]},{"given":"Walid G.","family":"Aref","sequence":"additional","affiliation":[]},{"given":"Per-Ake","family":"Larson","sequence":"additional","affiliation":[]},{"given":"Spencer S.","family":"Pearson","sequence":"additional","affiliation":[]},{"given":"Mohamed H.","family":"Ali","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,11,8]]},"reference":[{"key":"296_CR1","unstructured":"Silva, Y.N., Aref, W.G, Ali, M.H.: Similarity group-by. In: Proceedings of the 2009 IEEE International Conference on Data, Engineering, 2009"},{"key":"296_CR2","unstructured":"Silva, Y.N., Aref, W.G., Ali, M.H.: The similarity join database operator. In: Proceedings of the 2010 IEEE International Conference on Data, Engineering, 2010"},{"key":"296_CR3","unstructured":"Silva, Y.N., Arshad, M.U., Aref, W.G.: Exploiting similarity-aware grouping in decision support systems. In: Proceedings of the 12th International Conference on Extending Database Technology: Advances in Database Technology, 2009"},{"key":"296_CR4","unstructured":"Silva, Y.N., Aly, A.M., Aref, W.G., Larson, P.-A.: Simdb: a similarity-aware database system. In: Proceedings of the 2010 International Conference on Management of data, 2010"},{"key":"296_CR5","unstructured":"Guha, S., Rastogi, R., Shim, K.: Cure: an efficient clustering algorithm for large databases. In: Proceedings of the 1998 ACM SIGMOD International Conference on Management of data, 1998"},{"key":"296_CR6","unstructured":"Zhang, T., Ramakrishnan, R., Livny, M.: Birch: an efficient data clustering method for very large databases. In: Proceedings of the 1996 ACM SIGMOD International Conference on Management of data, 1996"},{"key":"296_CR7","unstructured":"Zhang, C., Huang, Y.: Cluster by: a new sql extension for spatial data aggregation. In: Proceedings of the 15th Annual ACM International Symposium on Advances in Geographic, Information Systems, 2007"},{"key":"296_CR8","unstructured":"Li, C., Wang, M., Lim, L., Wang, H., Chang, K.C.-C.: Supporting ranking and clustering as generalized order-by and group-by. In: Proceedings of the 2007 ACM SIGMOD International Conference on Management of data, 2007"},{"key":"296_CR9","unstructured":"Schallehn, E., Sattler, K.-u., Saake, G.: Extensible grouping and aggregation for data reconciliation. In: In Proceedings of 4th International Workshop on Engineering Federated, Information Systems, EFIS01, 2001"},{"key":"296_CR10","doi-asserted-by":"crossref","first-page":"361","DOI":"10.1016\/j.datak.2003.08.004","volume":"48","author":"E Schallehn","year":"2004","unstructured":"Schallehn, E., Sattler, K.-U., Saake, G.: Efficient similarity-based operations for data integration. Data Knowl. Eng. 48, 361\u2013387 (2004)","journal-title":"Data Knowl. Eng."},{"key":"296_CR11","first-page":"7:1","volume":"33","author":"EH Jacox","year":"2008","unstructured":"Jacox, E.H., Samet, H.: Metric space similarity joins. ACM Trans. Datab. Syst. 33, 7:1\u20137:38 (2008)","journal-title":"ACM Trans. Datab. Syst."},{"key":"296_CR12","unstructured":"Hjaltason, G.R., Samet, H.: Incremental distance join algorithms for spatial databases. In: Proceedings of the 1998 ACM SIGMOD International Conference on Management of data, 1998"},{"key":"296_CR13","doi-asserted-by":"crossref","first-page":"728","DOI":"10.1007\/s10115-003-0122-9","volume":"6","author":"C B\u00f6hm","year":"2004","unstructured":"B\u00f6hm, C., Krebs, F.: The k-nearest neighbour join: turbo charging the kdd process. Knowl. Inf. Syst. 6, 728\u2013749 (2004)","journal-title":"Knowl. Inf. Syst."},{"key":"296_CR14","unstructured":"Chaudhuri, S., Ganti, V., Kaushik, R.: A primitive operator for similarity joins in data cleaning. In: Proceedings of the 22nd International Conference on Data, Engineering, 2006"},{"key":"296_CR15","unstructured":"Gravano, L., Ipeirotis, P.G., Jagadish, H.V., Koudas, N., Muthukrishnan, S., Srivastava, D.: Approximate string joins in a database (almost) for free. In: Proceedings of the 27th International Conference on Very Large Data, Bases, 2001"},{"key":"296_CR16","unstructured":"Hadjieleftheriou, M., Chandel, A., Koudas, N., Srivastava, D.: Fast indexes and algorithms for set similarity selection queries. In: Proceedings of the 2008 IEEE 24th International Conference on Data, Engineering, 2008"},{"key":"296_CR17","unstructured":"Yang, X., Wang, B., Li, C.: Cost-based variable-length-gram selection for string collections to support approximate queries efficiently. In: Proceedings of the 2008 ACM SIGMOD International Conference on Management of data, 2008"},{"key":"296_CR18","unstructured":"Wichterich, M., Assent, I., Kranen, P., Seidl, T.: Efficient emd-based similarity search in multimedia databases via flexible dimensionality reduction. In: Proceedings of the 2008 ACM SIGMOD International Conference on Management of data, 2008"},{"key":"296_CR19","unstructured":"Adali, S., Bonatti, P., Sapino, M.L., Subrahmanian, V.S.: A multi-similarity algebra. In: Proceedings of the 1998 ACM SIGMOD International Conference on Management of Data, 1998"},{"key":"296_CR20","unstructured":"Ferreira, M.R.P., Traina, C., Jr., Traina, A.J.M.: An efficient framework for similarity query optimization. In: Proceedings of the 15th Annual ACM International Symposium on Advances in Geographic, Information Systems, 2007"},{"key":"296_CR21","doi-asserted-by":"crossref","unstructured":"Traina, C. Jr., Traina, A.J.M., Vieira, M.R., Arantes, A.S., Faloutsos, C.: Efficient processing of complex similarity queries in rdbms through query rewriting, In: Proceedings of the 15th ACM International Conference on Information and, Knowledge Management, 2006","DOI":"10.1145\/1183614.1183620"},{"key":"296_CR22","unstructured":"Barioni, M.C.N., Razente, H., Traina, A., Traina, C. Jr.: Siren: a similarity retrieval engine for complex data. In: Proceedings of the 32nd International Conference on Very Large Data Bases, 2006"},{"key":"296_CR23","unstructured":"Baioco, G.B., Traina, A.J.M., Traina, C. Jr.: Mamcost: Global and local estimates leading to robust cost estimation of similarity queries. In: Proceedings of the 19th International Conference on Scientific and Statistical Database Management, 2007"},{"key":"296_CR24","unstructured":"TPC-H version 2.14.3. [Online]. Available: http:\/\/www.tpc.org\/tpch\/"},{"key":"296_CR25","unstructured":"Silva, Y.N., Aref, W.G., Larson, P.-A., Pearson, S.S., Ali, M.H.: Similarity queries\u2014transformation rules and proofs. Arizona State University, Tech. Rep., 2012. [Online]. Available: http:\/\/www.public.asu.edu\/~ynsilva\/tr\/SQTRep.pdf"},{"key":"296_CR26","unstructured":"Chaudhuri, S., Shim, K.: Including group-by in query optimization. In: Proceedings of the 20th International Conference on Very Large Data, Bases, 1994"},{"key":"296_CR27","unstructured":"Yan, W.P., Larson, P.-A.: Eager aggregation and lazy aggregation. In: Proceedings of the 21th International Conference on Very Large Data, Bases, 1995"},{"issue":"3","key":"296_CR28","first-page":"19","volume":"18","author":"G Graefe","year":"1995","unstructured":"Graefe, G.: The cascades framework for query optimization. IEEE Data Eng. Bull. 18(3), 19\u201329 (1995)","journal-title":"IEEE Data Eng. Bull."},{"key":"296_CR29","doi-asserted-by":"crossref","unstructured":"Graefe, G., McKenna, W.J.: The volcano optimizer generator: Extensibility and efficient search. In: Proceedings of the Ninth International Conference on Data Engineering, pp. 209\u2013218. IEEE Computer Society, Washington, DC (1993)","DOI":"10.1109\/ICDE.1993.344061"},{"key":"296_CR30","doi-asserted-by":"crossref","unstructured":"Ciaccia, P., Patella, M., Zezula, P.: A cost model for similarity queries in metric spaces. In Proceedings of the Seventeenth ACM SIGACT-SIGMOD-SIGART Symposium on Principles of Database Systems, pp. 59\u201368. ACM, New York, NY (1998)","DOI":"10.1145\/275487.275495"},{"key":"296_CR31","doi-asserted-by":"crossref","first-page":"338","DOI":"10.14778\/1978665.1978666","volume":"4","author":"H Lee","year":"2011","unstructured":"Lee, H., Ng, R.T., Shim, K.: Similarity join size estimation using locality sensitive hashing. Proc. VLDB Endow. 4, 338\u2013349 (2011)","journal-title":"Proc. VLDB Endow."}],"container-title":["The VLDB Journal"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-012-0296-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00778-012-0296-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-012-0296-4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,7,5]],"date-time":"2019-07-05T05:47:08Z","timestamp":1562305628000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00778-012-0296-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,11,8]]},"references-count":31,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2013,6]]}},"alternative-id":["296"],"URL":"https:\/\/doi.org\/10.1007\/s00778-012-0296-4","relation":{},"ISSN":["1066-8888","0949-877X"],"issn-type":[{"value":"1066-8888","type":"print"},{"value":"0949-877X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,11,8]]}}}