{"id":"https://openalex.org/W2739874095","doi":"https://doi.org/10.18653/v1/p17-1017","title":"Creating Training Corpora for NLG Micro-Planners","display_name":"Creating Training Corpora for NLG Micro-Planners","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2739874095","doi":"https://doi.org/10.18653/v1/p17-1017","mag":"2739874095"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p17-1017","pdf_url":"https://www.aclweb.org/anthology/P17-1017.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.aclweb.org/anthology/P17-1017.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087459652","display_name":"Claire Gardent","orcid":"https://orcid.org/0000-0002-3805-6662"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Claire Gardent","raw_affiliation_strings":["CNRS, LORIA, UMR 7503 Vandoeuvre-l\u00e8s-Nancy, F-54500, France"],"affiliations":[{"raw_affiliation_string":"CNRS, LORIA, UMR 7503 Vandoeuvre-l\u00e8s-Nancy, F-54500, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210121838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090458146","display_name":"Anastasia Shimorina","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Anastasia Shimorina","raw_affiliation_strings":["CNRS, LORIA, UMR 7503 Vandoeuvre-l\u00e8s-Nancy, F-54500, France"],"affiliations":[{"raw_affiliation_string":"CNRS, LORIA, UMR 7503 Vandoeuvre-l\u00e8s-Nancy, F-54500, France","institution_ids":["https://openalex.org/I4210121838","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081801388","display_name":"Shashi Narayan","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Shashi Narayan","raw_affiliation_strings":["School of Informatics, University of Edinburgh 10 Crichton Street, Edinburgh, EH8 9AB, UK"],"affiliations":[{"raw_affiliation_string":"School of Informatics, University of Edinburgh 10 Crichton Street, Edinburgh, EH8 9AB, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005336295","display_name":"Laura Perez-Beltrachini","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Laura Perez-Beltrachini","raw_affiliation_strings":["School of Informatics, University of Edinburgh 10 Crichton Street, Edinburgh, EH8 9AB, UK"],"affiliations":[{"raw_affiliation_string":"School of Informatics, University of Edinburgh 10 Crichton Street, Edinburgh, EH8 9AB, UK","institution_ids":["https://openalex.org/I98677209"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.76,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":343,"citation_normalized_percentile":{"value":0.999893,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6505796},{"id":"https://openalex.org/keywords/realisation","display_name":"Realisation","score":0.47245172},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44014588}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.861238},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6505796},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.61373043},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6009376},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5707031},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.53819925},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5302617},{"id":"https://openalex.org/C2779462738","wikidata":"https://www.wikidata.org/wiki/Q17146409","display_name":"Realisation","level":2,"score":0.47245172},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.45924523},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44014588},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35465527},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34945232},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p17-1017","pdf_url":"https://www.aclweb.org/anthology/P17-1017.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/508a2f5e-fa53-4d5a-bf07-1b219aeef5f3","pdf_url":"https://www.research.ed.ac.uk/files/36215547/acl_2017.pdf","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.pure.ed.ac.uk/ws/files/36215547/acl_2017.pdf","pdf_url":"https://www.pure.ed.ac.uk/ws/files/36215547/acl_2017.pdf","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":true,"landing_page_url":"http://aclweb.org/anthology/P17-1017","pdf_url":"https://aclanthology.org/P17-1017.pdf","source":{"id":"https://openalex.org/S4306400320","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p17-1017","pdf_url":"https://www.aclweb.org/anthology/P17-1017.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.54,"id":"https://metadata.un.org/sdg/11"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":20,"referenced_works":["https://openalex.org/W1631260214","https://openalex.org/W1869752048","https://openalex.org/W1948566616","https://openalex.org/W1976538119","https://openalex.org/W2101105183","https://openalex.org/W2116716943","https://openalex.org/W2123442489","https://openalex.org/W2125417976","https://openalex.org/W2154764394","https://openalex.org/W2201007611","https://openalex.org/W2251958415","https://openalex.org/W2291723583","https://openalex.org/W2566725737","https://openalex.org/W2573463306","https://openalex.org/W2578330760","https://openalex.org/W2949465329","https://openalex.org/W2963069010","https://openalex.org/W2963091658","https://openalex.org/W4239857022","https://openalex.org/W881173"],"related_works":["https://openalex.org/W3016281454","https://openalex.org/W2961288924","https://openalex.org/W2810895613","https://openalex.org/W2789329261","https://openalex.org/W2567712142","https://openalex.org/W2538215832","https://openalex.org/W2187980447","https://openalex.org/W2075250579","https://openalex.org/W2050807172","https://openalex.org/W1725894279"],"abstract_inverted_index":{"In":[0],"this":[1,43,54,177,190],"paper,":[2],"we":[3,179],"present":[4],"a":[5,39,46,133,182],"novel":[6,134],"framework":[7,44,55,82,131,191],"for":[8,49,136],"semi-automatically":[9],"creating":[10,137],"linguistically":[11],"challenging":[12,47,138],"micro-planning":[13,159],"data-to-text":[14],"corpora":[15],"from":[16,33,141],"existing":[17],"Knowledge":[18],"Bases.":[19],"Because":[20],"our":[21,81,128],"method":[22,135],"pairs":[23,187],"data":[24,85,139],"of":[25,53,118,123,151,184,195],"varying":[26],"size":[27],"and":[28,68,75,86,120,168],"shape":[29],"with":[30,91],"texts":[31],"ranging":[32],"simple":[34],"clauses":[35],"to":[36,62,73,83,174],"short":[37],"texts,":[38],"dataset":[40,90,103,183],"created":[41,188],"using":[42,189],"provides":[45],"benchmark":[48],"microplanning.":[50],"Another":[51],"feature":[52],"is":[56,104,112],"that":[57,98],"it":[58,111],"can":[59,69,145],"be":[60,71,146],"applied":[61],"any":[63],"large":[64],"scale":[65],"knowledge":[66],"base":[67],"therefore":[70],"used":[72],"train":[74],"learn":[76],"KB":[77],"verbalisers.":[78],"We":[79,96,125],"apply":[80],"DBpedia":[84],"compare":[87],"the":[88,153,193,196],"resulting":[89],"Wen":[92,100],"et":[93,101],"al.":[94],"2016\u2019s.":[95],"show":[97],"while":[99],"al.\u2019s":[102],"more":[105],"than":[106,109],"twice":[107],"larger":[108],"ours,":[110],"less":[113],"diverse":[114],"both":[115],"in":[116,121,158,192],"terms":[117,122],"input":[119],"text.":[124],"thus":[126],"propose":[127],"corpus":[129],"generation":[130,167],"as":[132],"sets":[140],"which":[142,148],"NLG":[143],"models":[144],"learned":[147],"are":[149],"capable":[150],"handling":[152],"complex":[154],"interactions":[155],"occurring":[156],"during":[157],"between":[160],"lexicalisation,":[161],"aggregation,":[162],"surface":[163],"realisation,":[164],"referring":[165],"expression":[166],"sentence":[169],"segmentation.":[170],"To":[171],"encourage":[172],"researchers":[173],"take":[175],"up":[176],"challenge,":[178],"made":[180],"available":[181],"21,855":[185],"data/text":[186],"context":[194],"WebNLG":[197],"shared":[198],"task.":[199]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2739874095","counts_by_year":[{"year":2024,"cited_by_count":29},{"year":2023,"cited_by_count":77},{"year":2022,"cited_by_count":47},{"year":2021,"cited_by_count":71},{"year":2020,"cited_by_count":53},{"year":2019,"cited_by_count":31},{"year":2018,"cited_by_count":28},{"year":2017,"cited_by_count":6}],"updated_date":"2025-01-15T19:05:41.590740","created_date":"2017-08-08"}