{"id":"https://openalex.org/W1908963334","doi":"https://doi.org/10.1109/pdis.1994.331726","title":"Precision and recall of GlOSS estimators for database discovery","display_name":"Precision and recall of GlOSS estimators for database discovery","publication_year":2002,"publication_date":"2002-12-17","ids":{"openalex":"https://openalex.org/W1908963334","doi":"https://doi.org/10.1109/pdis.1994.331726","mag":"1908963334"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pdis.1994.331726","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://www.cs.cmu.edu/~tomasic/doc/1994/GravanoGarciaTomasicPDIS1994.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080063580","display_name":"Luis Gravano","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"L. Gravano","raw_affiliation_strings":["[Dept. of Comput. Sci., Stanford Univ., CA, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Comput. Sci., Stanford Univ., CA, USA]","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055883336","display_name":"H\u00e9ctor Garc\u00eda-Molina","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"H. Garcia-Molina","raw_affiliation_strings":["[Dept. of Comput. Sci., Stanford Univ., CA, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Comput. Sci., Stanford Univ., CA, USA]","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027233041","display_name":"Anthony Tomasic","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. Tomasic","raw_affiliation_strings":["[Dept. of Comput. Sci., Stanford Univ., CA, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Comput. Sci., Stanford Univ., CA, USA]","institution_ids":["https://openalex.org/I97018004"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.12,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":40,"citation_normalized_percentile":{"value":0.881869,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":91},"biblio":{"volume":"5","issue":null,"first_page":"103","last_page":"106"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gloss","display_name":"Gloss (optics)","score":0.6041033}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.82546103},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.69744146},{"id":"https://openalex.org/C54239708","wikidata":"https://www.wikidata.org/wiki/Q1329910","display_name":"View","level":3,"score":0.6420021},{"id":"https://openalex.org/C143025027","wikidata":"https://www.wikidata.org/wiki/Q900581","display_name":"Gloss (optics)","level":3,"score":0.6041033},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5526927},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.4929514},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.4556085},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.4457152},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.41296244},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.35187528},{"id":"https://openalex.org/C148840519","wikidata":"https://www.wikidata.org/wiki/Q1049878","display_name":"Database design","level":2,"score":0.26333773},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C2781448156","wikidata":"https://www.wikidata.org/wiki/Q1570182","display_name":"Coating","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pdis.1994.331726","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.48.2241","pdf_url":"http://www.cs.cmu.edu/~tomasic/doc/1994/GravanoGarciaTomasicPDIS1994.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.48.2241","pdf_url":"http://www.cs.cmu.edu/~tomasic/doc/1994/GravanoGarciaTomasicPDIS1994.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":4,"referenced_works":["https://openalex.org/W2073788020","https://openalex.org/W2123922130","https://openalex.org/W2152645051","https://openalex.org/W2325227998"],"related_works":["https://openalex.org/W4381740310","https://openalex.org/W3197639690","https://openalex.org/W3125756434","https://openalex.org/W2970853428","https://openalex.org/W2572349046","https://openalex.org/W2186703450","https://openalex.org/W2113390685","https://openalex.org/W2096359267","https://openalex.org/W2026738364","https://openalex.org/W1981131819"],"abstract_inverted_index":{"Online":[0],"information":[1,21,112,117,158,193,221,230],"vendors":[2],"and":[3,29,154],"the":[4,39,66,71,86,92,106,135,152,165,190,223,226],"Internet":[5],"together":[6],"offer":[7],"thousands":[8],"of":[9,80,99,137,157,208,220,225],"text":[10],"databases":[11,55,82,101,138,198],"from":[12,189],"which":[13,36],"a":[14,19,26,31,48,78,97,127,143,148,179,217],"user":[15],"may":[16],"choose":[17],"for":[18,28,105,113,129,142,164,178,205],"given":[20,144],"need.":[22],"This":[23,116],"paper":[24],"presents":[25],"framework":[27,149,173],"analyses":[30],"solution":[32,44],"to":[33,46,56,70,76,83,232,235,242],"this":[34,229],"problem,":[35],"we":[37,146],"call":[38],"text-database":[40,166],"discovery":[41,167],"problem.":[42,168],"Our":[43],"is":[45,68,88],"build":[47],"service":[49],"that":[50,139],"can":[51],"suggest":[52],"potentially":[53],"good":[54],"search.":[57,84],"A":[58],"user's":[59,107],"query":[60,67,87,187],"goes":[61],"through":[62,200],"two":[63],"steps:":[64],"first,":[65],"presented":[69],"GlOSS":[72,95,140,209,215],"server":[73],"(Glossary-Of-Servers":[74],"Server)":[75],"select":[77],"set":[79,136],"promising":[81],"Secondly,":[85],"actually":[89,125],"evaluated":[90],"in":[91,122],"chosen":[93],"databases.":[94],"gives":[96],"hint":[98],"what":[100],"might":[102],"be":[103,233],"useful":[104,238],"query,":[108,145],"based":[109,150],"on":[110,151,240],"word-frequency":[111],"each":[114,123,130],"database.":[115],"indicates":[118],"how":[119],"many":[120],"documents":[121],"database":[124],"contain":[126],"keyword,":[128],"field":[131],"designator.":[132],"To":[133],"evaluate":[134],"returns":[141],"present":[147],"precision":[153],"recall":[155],"metrics":[156,163],"retrieval":[159,194],"theory.":[160],"We":[161,169,182],"define":[162],"further":[170],"extend":[171],"our":[172],"by":[174],"offering":[175],"different":[176,206],"definitions":[177],"\"relevant":[180],"database\".":[181],"have":[183],"performed":[184],"experiments":[185],"using":[186],"traces":[188],"FOLIO":[191],"library":[192],"system,":[195],"involving":[196],"six":[197],"available":[199,227],"FOLIO.":[201],"The":[202],"results":[203],"obtained":[204],"variants":[207],"are":[210],"very":[211,237],"promising.":[212],"Even":[213],"though":[214],"keeps":[216],"small":[218],"amount":[219],"about":[222],"contents":[224],"databases,":[228],"proved":[231],"sufficient":[234],"produce":[236],"hints":[239],"where":[241],"search.<":[243],">":[246]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1908963334","counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2}],"updated_date":"2024-12-13T01:57:59.219037","created_date":"2016-06-24"}