{"id":"https://openalex.org/W2740530567","doi":"https://doi.org/10.18653/v1/w17-2312","title":"Representation of complex terms in a vector space structured by an ontology for a normalization task","display_name":"Representation of complex terms in a vector space structured by an ontology for a normalization task","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2740530567","doi":"https://doi.org/10.18653/v1/w17-2312","mag":"2740530567"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-2312","pdf_url":"https://www.aclweb.org/anthology/W17-2312.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"preprint","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.aclweb.org/anthology/W17-2312.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006669344","display_name":"Arnaud Ferr\u00e9","orcid":"https://orcid.org/0000-0001-9115-8222"},"institutions":[{"id":"https://openalex.org/I4210159481","display_name":"Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement","ror":"https://ror.org/05qdnns64","country_code":"FR","type":"facility","lineage":["https://openalex.org/I4210088668","https://openalex.org/I4210099460","https://openalex.org/I4210159481"]},{"id":"https://openalex.org/I4210115485","display_name":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","ror":"https://ror.org/01raq4x89","country_code":"FR","type":"facility","lineage":["https://openalex.org/I102197404","https://openalex.org/I1294671590","https://openalex.org/I4210115485","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Arnaud Ferr\u00e9","raw_affiliation_strings":["Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement [Jouy-En-Josas]"],"affiliations":[{"raw_affiliation_string":"Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement [Jouy-En-Josas]","institution_ids":["https://openalex.org/I4210159481"]},{"raw_affiliation_string":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","institution_ids":["https://openalex.org/I4210115485"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090195478","display_name":"Pierre Zweigenbaum","orcid":"https://orcid.org/0000-0001-8410-4808"},"institutions":[{"id":"https://openalex.org/I4210115485","display_name":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","ror":"https://ror.org/01raq4x89","country_code":"FR","type":"facility","lineage":["https://openalex.org/I102197404","https://openalex.org/I1294671590","https://openalex.org/I4210115485","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pierre Zweigenbaum","raw_affiliation_strings":["Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur"],"affiliations":[{"raw_affiliation_string":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","institution_ids":["https://openalex.org/I4210115485"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063577222","display_name":"Claire N\u00e9dellec","orcid":"https://orcid.org/0000-0002-0577-0595"},"institutions":[{"id":"https://openalex.org/I4210159481","display_name":"Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement","ror":"https://ror.org/05qdnns64","country_code":"FR","type":"facility","lineage":["https://openalex.org/I4210088668","https://openalex.org/I4210099460","https://openalex.org/I4210159481"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Claire N\u00e9dellec","raw_affiliation_strings":["Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement [Jouy-En-Josas]"],"affiliations":[{"raw_affiliation_string":"Math\u00e9matiques et Informatique Appliqu\u00e9es du G\u00e9nome \u00e0 l'Environnement [Jouy-En-Josas]","institution_ids":["https://openalex.org/I4210159481"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":10,"citation_normalized_percentile":{"value":0.666822,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":85,"max":86},"biblio":{"volume":null,"issue":null,"first_page":"99","last_page":"106"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9987,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization","score":0.7670448},{"id":"https://openalex.org/keywords/distributional-semantics","display_name":"Distributional semantics","score":0.56271607},{"id":"https://openalex.org/keywords/ontology-engineering","display_name":"Ontology engineering","score":0.46632746},{"id":"https://openalex.org/keywords/vector-space-model","display_name":"Vector space model","score":0.41925454},{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.41716343}],"concepts":[{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7670448},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.69981587},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.6788864},{"id":"https://openalex.org/C13336665","wikidata":"https://www.wikidata.org/wiki/Q125977","display_name":"Vector space","level":2,"score":0.6122069},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.56271607},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.55348265},{"id":"https://openalex.org/C2778820784","wikidata":"https://www.wikidata.org/wiki/Q1027508","display_name":"Ontology engineering","level":4,"score":0.46632746},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4635275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46055946},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.45461804},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.43712318},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4334882},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.41925454},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.41716343},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3223537},{"id":"https://openalex.org/C22550185","wikidata":"https://www.wikidata.org/wiki/Q7095047","display_name":"Ontology-based data integration","level":3,"score":0.31989068},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.26518878},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21789223},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.1683009},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-2312","pdf_url":"https://www.aclweb.org/anthology/W17-2312.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://hal.archives-ouvertes.fr/hal-01582292","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://hal.science/hal-01582292","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-2312","pdf_url":"https://www.aclweb.org/anthology/W17-2312.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":18,"referenced_works":["https://openalex.org/W1553529581","https://openalex.org/W1614298861","https://openalex.org/W1914733988","https://openalex.org/W2000747570","https://openalex.org/W2010027150","https://openalex.org/W2039612385","https://openalex.org/W2128049108","https://openalex.org/W2129038679","https://openalex.org/W2182314358","https://openalex.org/W2509401464","https://openalex.org/W2510327534","https://openalex.org/W2518463060","https://openalex.org/W2625658851","https://openalex.org/W2626480150","https://openalex.org/W2882319491","https://openalex.org/W2918995630","https://openalex.org/W2950577311","https://openalex.org/W3097437297"],"related_works":["https://openalex.org/W4251889114","https://openalex.org/W3161401723","https://openalex.org/W2741017126","https://openalex.org/W2349139068","https://openalex.org/W2096728994","https://openalex.org/W2078533744","https://openalex.org/W2013634681","https://openalex.org/W1974406477","https://openalex.org/W1604150642","https://openalex.org/W1540114765"],"abstract_inverted_index":{"We":[0,107],"propose":[1],"in":[2,28,60,144],"this":[3,158,171],"paper":[4],"a":[5,16,29,41,78,84,116,138],"semi-supervised":[6],"method":[7,20,38,159],"for":[8,49,115,170],"labeling":[9],"terms":[10,27,94,131],"of":[11,15,25,51,68,93,97,112,123,130,140,157,164,167,173],"texts":[12],"with":[13],"concepts":[14,98,122],"domain":[17],"ontology.":[18,35,70],"The":[19,36,155],"generates":[21,46],"continuous":[22],"vector":[23,62,148],"representations":[24,114],"complex":[26],"semantic":[30,127],"space":[31,63,149],"structured":[32],"by":[33,76,119],"the":[34,52,61,66,69,89,110,121,141,147,165,168],"proposed":[37],"relies":[39],"on":[40],"distributional":[42],"semantics":[43],"approach,":[44],"which":[45],"initial":[47],"vectors":[48,57,92,96],"each":[50],"extracted":[53],"terms.":[54,106],"Then":[55],"these":[56,113],"are":[58],"embedded":[59],"constructed":[64],"from":[65],"structure":[67],"This":[71],"embedding":[72],"is":[73,132,160],"carried":[74],"out":[75],"training":[77],"linear":[79],"model.":[80],"Finally,":[81],"we":[82],"apply":[83],"distance":[85],"calculation":[86],"to":[87,101,105,136,162],"determine":[88],"proximity":[90],"between":[91],"and":[95,99],"thus":[100],"assign":[102],"ontology":[103,125],"labels":[104],"have":[108],"evaluated":[109],"quality":[111],"normalization":[117],"task":[118,172],"using":[120],"an":[124,133],"as":[126],"labels.":[128],"Normalization":[129],"important":[134],"step":[135],"extract":[137],"part":[139],"information":[142],"containing":[143],"texts,":[145],"but":[146],"generated":[150],"might":[151],"find":[152],"other":[153],"applications.":[154],"performance":[156],"comparable":[161],"that":[163],"state":[166],"art":[169],"standardization,":[174],"opening":[175],"up":[176],"encouraging":[177],"prospects.":[178]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2740530567","counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":2}],"updated_date":"2025-03-16T19:51:51.935444","created_date":"2017-08-08"}