{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T22:55:06Z","timestamp":1730328906234,"version":"3.28.0"},"publisher-location":"New York, NY, USA","reference-count":32,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2001,5]]},"DOI":"10.1145\/375663.375671","type":"proceedings-article","created":{"date-parts":[[2003,11,25]],"date-time":"2003-11-25T19:25:53Z","timestamp":1069788353000},"page":"67-78","update-policy":"http:\/\/dx.doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":56,"title":["Probe, count, and classify"],"prefix":"10.1145","author":[{"given":"Panagiotis G.","family":"Ipeirotis","sequence":"first","affiliation":[{"name":"Computer Science Dept., Columbia University"}]},{"given":"Luis","family":"Gravano","sequence":"additional","affiliation":[{"name":"Computer Science Dept., Columbia University"}]},{"given":"Mehran","family":"Sahami","sequence":"additional","affiliation":[{"name":"E.piphany, Inc."}]}],"member":"320","published-online":{"date-parts":[[2001,5]]},"reference":[{"key":"e_1_3_2_1_1_2","doi-asserted-by":"publisher","DOI":"10.1145\/183422.183423"},{"key":"e_1_3_2_1_2_2","doi-asserted-by":"publisher","DOI":"10.1145\/304182.304224"},{"key":"e_1_3_2_1_3_2","doi-asserted-by":"publisher","DOI":"10.1108\/eb049925"},{"key":"e_1_3_2_1_4_2","first-page":"709","volume-title":"Proceedings of AAAI'96","volume":"1","author":"Cohen W. W.","year":"1996","unstructured":"W. W. Cohen . Learning trees and rules with set-valued features . In Proceedings of AAAI'96 , IAAI'96, volume 1 , pages 709 - 716 . AAAI, 1996 . W. W. Cohen. Learning trees and rules with set-valued features. In Proceedings of AAAI'96, IAAI'96, volume 1, pages 709-716. AAAI, 1996."},{"key":"e_1_3_2_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/336597.336628"},{"key":"e_1_3_2_1_6_2","unstructured":"The Deep Web: Surfacing Hidden Value. Accessible at http:\/\/www.completeplanet.com\/Tutorials\/DeepWeb\/index.asp. The Deep Web: Surfacing Hidden Value. Accessible at http:\/\/www.completeplanet.com\/Tutorials\/DeepWeb\/index.asp."},{"key":"e_1_3_2_1_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/288627.288651"},{"issue":"9","key":"e_1_3_2_1_8_2","first-page":"637","article-title":"Profusion*: Intelligent fusion from multiple, distributed search engines","volume":"2","author":"Gauch S.","year":"1996","unstructured":"S. Gauch , G. Wang , and M. Gomez . Profusion*: Intelligent fusion from multiple, distributed search engines . The Journal of Universal Computer Science , 2 ( 9 ): 637 - 649 , Sept. 1996 . S. Gauch, G. Wang, and M. Gomez. Profusion*: Intelligent fusion from multiple, distributed search engines. The Journal of Universal Computer Science, 2(9):637-649, Sept. 1996.","journal-title":"The Journal of Universal Computer Science"},{"key":"e_1_3_2_1_9_2","doi-asserted-by":"publisher","DOI":"10.1145\/320248.320252"},{"key":"e_1_3_2_1_10_2","first-page":"2000","article-title":"Estimation of English and non-English language use on the WWW","author":"Grefenstette G.","year":"2000","unstructured":"G. Grefenstette and J. Nioche . Estimation of English and non-English language use on the WWW . In RIAO 2000 , 2000 . G. Grefenstette and J. Nioche. Estimation of English and non-English language use on the WWW. In RIAO 2000, 2000.","journal-title":"RIAO"},{"key":"e_1_3_2_1_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/297117.297123"},{"key":"e_1_3_2_1_12_2","volume-title":"Proceedings of the ACM SIGMOD Workshop on the Web and Databases (WebDB2000)","author":"Ipeirotis P. G.","year":"2000","unstructured":"P. G. Ipeirotis , L. Gravano , and M. Sahami . Automatic classification of text databases through query probing . In Proceedings of the ACM SIGMOD Workshop on the Web and Databases (WebDB2000) , May 2000 . P. G. Ipeirotis, L. Gravano, and M. Sahami. Automatic classification of text databases through query probing. In Proceedings of the ACM SIGMOD Workshop on the Web and Databases (WebDB2000), May 2000."},{"key":"e_1_3_2_1_13_2","doi-asserted-by":"publisher","DOI":"10.5555\/645326.649721"},{"key":"e_1_3_2_1_14_2","doi-asserted-by":"publisher","DOI":"10.1016\/0024-3795(71)90016-4"},{"key":"e_1_3_2_1_15_2","first-page":"284","volume-title":"Proceedings of the Thirteenth International Conference (ICML '96)","author":"Koller D.","year":"1996","unstructured":"D. Koller and M. Sahami . Toward optimal feature selection. In Machine Learning , Proceedings of the Thirteenth International Conference (ICML '96) , pages 284 - 292 , 1996 . D. Koller and M. Sahami. Toward optimal feature selection. In Machine Learning, Proceedings of the Thirteenth International Conference (ICML '96), pages 284-292, 1996."},{"key":"e_1_3_2_1_16_2","doi-asserted-by":"publisher","DOI":"10.5555\/645526.657130"},{"key":"e_1_3_2_1_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/243199.243277"},{"key":"e_1_3_2_1_18_2","volume-title":"Learning for Text Categorization: Papers from the 1998 AAAI Workshop","author":"McCallum A.","year":"1998","unstructured":"A. McCallum and K. Nigam . A comparison of event models for naive bayes text classification . In Learning for Text Categorization: Papers from the 1998 AAAI Workshop , 1998 . A. McCallum and K. Nigam. A comparison of event models for naive bayes text classification. In Learning for Text Categorization: Papers from the 1998 AAAI Workshop, 1998."},{"key":"e_1_3_2_1_19_2","volume-title":"VLDB'98","author":"Meng W.","year":"1998","unstructured":"W. Meng , K.-L. Liu , C. T. Yu , X. Wang , Y. Chang , and N. Rishe . Determining text databases to search in the Internet . In VLDB'98 , Proceedings of 24th International Conference on Very Large Data Bases, pages 14-25 , 1998 . W. Meng, K.-L. Liu, C. T. Yu, X. Wang, Y. Chang, and N. Rishe. Determining text databases to search in the Internet. In VLDB'98, Proceedings of 24th International Conference on Very Large Data Bases, pages 14-25, 1998."},{"key":"e_1_3_2_1_20_2","first-page":"22","volume-title":"Proceedings of the Fourth IFCIS International Conference on Cooperative Information Systems","author":"Meng W.","year":"1999","unstructured":"W. Meng , C. T. Yu , and K.-L. Liu . Detection of heterogeneities in a multiple text database environment . In Proceedings of the Fourth IFCIS International Conference on Cooperative Information Systems , pages 22 - 33 , 1999 . W. Meng, C. T. Yu, and K.-L. Liu. Detection of heterogeneities in a multiple text database environment. In Proceedings of the Fourth IFCIS International Conference on Cooperative Information Systems, pages 22-33, 1999."},{"key":"e_1_3_2_1_21_2","volume-title":"Machine Learning","author":"Mitchell T.","year":"1997","unstructured":"T. Mitchell . Machine Learning . McGraw Hill , 1997 . T. Mitchell. Machine Learning. McGraw Hill, 1997."},{"key":"e_1_3_2_1_22_2","doi-asserted-by":"publisher","DOI":"10.1023\/A:1008672508721"},{"key":"e_1_3_2_1_23_2","first-page":"313","volume-title":"The SMART Information Retrieval System","author":"Rocchio J. J.","year":"1971","unstructured":"J. J. Rocchio . Relevance feedback in information retrieval . In G. Salton, editor, The SMART Information Retrieval System , pages 313 - 323 . Prentice Hall , Englewood Cliffs, NJ , 1971 . J. J. Rocchio. Relevance feedback in information retrieval. In G. Salton, editor, The SMART Information Retrieval System, pages 313-323. Prentice Hall, Englewood Cliffs, NJ, 1971."},{"key":"e_1_3_2_1_24_2","doi-asserted-by":"publisher","DOI":"10.1016\/0306-4573(88)90021-0"},{"key":"e_1_3_2_1_25_2","first-page":"381","volume-title":"Readings in Information Retrieval","author":"Salton G.","year":"1997","unstructured":"G. Salton and M. J. McGill . The SMART and SIRE experimental retrieval systems . In K. S. Jones and P. Willett, editors, Readings in Information Retrieval , pages 381 - 399 . Morgan Kaufmann , 1997 . G. Salton and M. J. McGill. The SMART and SIRE experimental retrieval systems. In K. S. Jones and P. Willett, editors, Readings in Information Retrieval, pages 381-399. Morgan Kaufmann, 1997."},{"key":"e_1_3_2_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/215206.215365"},{"key":"e_1_3_2_1_27_2","doi-asserted-by":"publisher","DOI":"10.5555\/347319.346329"},{"key":"e_1_3_2_1_28_2","volume-title":"Information Retrieval","author":"van Rijsbergen K.","year":"1979","unstructured":"K. van Rijsbergen . Information Retrieval ( 2 nd edition). Butterworths , London , 1979 . K. van Rijsbergen. Information Retrieval (2nd edition). Butterworths, London, 1979.","edition":"2"},{"key":"e_1_3_2_1_29_2","doi-asserted-by":"publisher","DOI":"10.5555\/882511.885375"},{"key":"e_1_3_2_1_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/290941.290974"},{"key":"e_1_3_2_1_31_2","doi-asserted-by":"publisher","DOI":"10.1145\/312624.312647"},{"key":"e_1_3_2_1_32_2","volume-title":"Addison-Wesley","author":"Zipf G. K.","year":"1949","unstructured":"G. K. Zipf . Human Behavior and the Principle of Least Effort . Addison-Wesley , 1949 . G. K. Zipf. Human Behavior and the Principle of Least Effort. Addison-Wesley, 1949."}],"event":{"name":"SIGMOD\/PODS01: ACM SIGMOD International Conference on Management of Data","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"],"location":"Santa Barbara California USA","acronym":"SIGMOD\/PODS01"},"container-title":["Proceedings of the 2001 ACM SIGMOD international conference on Management of data"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/375663.375671","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,4]],"date-time":"2023-09-04T13:11:53Z","timestamp":1693833113000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/375663.375671"}},"subtitle":["categorizing hidden web databases"],"short-title":[],"issued":{"date-parts":[[2001,5]]},"references-count":32,"alternative-id":["10.1145\/375663.375671","10.1145\/375663"],"URL":"https:\/\/doi.org\/10.1145\/375663.375671","relation":{"is-identical-to":[{"id-type":"doi","id":"10.1145\/376284.375671","asserted-by":"object"}]},"subject":[],"published":{"date-parts":[[2001,5]]},"assertion":[{"value":"2001-05-01","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}