{"id":"https://openalex.org/W2113448659","doi":"https://doi.org/10.1109/ideas.2001.938087","title":"Reducing inconsistency in integrating data from different sources","display_name":"Reducing inconsistency in integrating data from different sources","publication_year":2002,"publication_date":"2002-11-13","ids":{"openalex":"https://openalex.org/W2113448659","doi":"https://doi.org/10.1109/ideas.2001.938087","mag":"2113448659"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ideas.2001.938087","pdf_url":null,"source":{"id":"https://openalex.org/S4210202518","display_name":"Proceedings - International Database Engineering and Applications Symposium","issn_l":"1098-8068","issn":["1098-8068"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088265373","display_name":"Sergio Luj\u00e1n\u2010Mora","orcid":"https://orcid.org/0000-0001-5000-864X"},"institutions":[{"id":"https://openalex.org/I130194489","display_name":"University of Alicante","ror":"https://ror.org/05t8bcz72","country_code":"ES","type":"funder","lineage":["https://openalex.org/I130194489"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"S. Lujan-Mora","raw_affiliation_strings":["Dept. de Lenguajes y Sistemas Inf., Alicante Univ., Spain"],"affiliations":[{"raw_affiliation_string":"Dept. de Lenguajes y Sistemas Inf., Alicante Univ., Spain","institution_ids":["https://openalex.org/I130194489"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030733421","display_name":"Manuel Palomar","orcid":"https://orcid.org/0000-0002-1441-7865"},"institutions":[{"id":"https://openalex.org/I130194489","display_name":"University of Alicante","ror":"https://ror.org/05t8bcz72","country_code":"ES","type":"funder","lineage":["https://openalex.org/I130194489"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"M. Palomar","raw_affiliation_strings":["Departamento de Lenguajes y Sistemas Inform\u00e1ticos Universidad de Alicante Alicante Spain"],"affiliations":[{"raw_affiliation_string":"Departamento de Lenguajes y Sistemas Inform\u00e1ticos Universidad de Alicante Alicante Spain","institution_ids":["https://openalex.org/I130194489"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.412,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":23,"citation_normalized_percentile":{"value":0.896302,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":86,"max":87},"biblio":{"volume":"23","issue":null,"first_page":"209","last_page":"218"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9835,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9811,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6499263}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ideas.2001.938087","pdf_url":null,"source":{"id":"https://openalex.org/S4210202518","display_name":"Proceedings - International Database Engineering and Applications Symposium","issn_l":"1098-8068","issn":["1098-8068"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4,"display_name":"Quality education","id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":19,"referenced_works":["https://openalex.org/W12422471","https://openalex.org/W1569123402","https://openalex.org/W1574837942","https://openalex.org/W1597110170","https://openalex.org/W1610496399","https://openalex.org/W1612155886","https://openalex.org/W1647671624","https://openalex.org/W1667176087","https://openalex.org/W168092880","https://openalex.org/W1995443722","https://openalex.org/W2020191321","https://openalex.org/W2024770506","https://openalex.org/W2044030465","https://openalex.org/W2150698190","https://openalex.org/W2155493185","https://openalex.org/W25398253","https://openalex.org/W2913066018","https://openalex.org/W4256583922","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W2748952813","https://openalex.org/W2530322880","https://openalex.org/W2478288626","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"One":[0],"of":[1,16,76,110],"the":[2,13,17,23,62,95,138],"main":[3],"problems":[4],"in":[5,20,53,89,119],"integrating":[6],"databases":[7],"into":[8],"a":[9,34,67,85],"common":[10,86],"repository":[11],"is":[12,123],"possible":[14],"inconsistency":[15,51],"values":[18,63,80],"stored":[19],"them,":[21],"i.e.,":[22],"very":[24],"same":[25,68],"term":[26,69],"may":[27,116],"have":[28],"different":[29,101],"values,":[30],"due":[31],"to":[32,66,84,127],"misspelling,":[33],"permuted":[35],"word":[36],"order,":[37],"spelling":[38],"variants":[39],"and":[40,56,107],"so":[41],"on.":[42],"The":[43,78,112],"authors":[44],"present":[45],"an":[46],"automatic":[47],"method":[48,113],"for":[49,94,104,135],"reducing":[50],"found":[52],"existing":[54],"databases,":[55],"thus,":[57],"improving":[58],"data":[59],"quality.":[60],"All":[61],"that":[64],"refer":[65],"are":[70],"clustered":[71,79],"by":[72],"measuring":[73],"their":[74],"degree":[75],"similarity.":[77],"can":[81],"be":[82,92],"assigned":[83],"value":[87],"that,":[88],"principle,":[90],"could":[91],"substituted":[93],"original":[96],"values.":[97],"We":[98],"evaluate":[99],"four":[100],"similarity":[102],"measures":[103],"clustering":[105],"with":[106],"without":[108],"expansion":[109],"abbreviations.":[111],"we":[114,131],"propose":[115],"work":[117],"well":[118],"practice":[120],"but":[121],"it":[122],"time-consuming.":[124],"In":[125],"order":[126],"reduce":[128],"this":[129],"problem,":[130],"remove":[132],"stop":[133],"words":[134],"speeding":[136],"up":[137],"clustering.":[139]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2113448659","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2012,"cited_by_count":2}],"updated_date":"2025-03-22T02:24:08.464292","created_date":"2016-06-24"}