{"id":"https://openalex.org/W4378506719","doi":"https://doi.org/10.48550/arxiv.2305.13773","title":"Enhanced Fine-grained Motion Diffusion for Text-driven Human Motion Synthesis","display_name":"Enhanced Fine-grained Motion Diffusion for Text-driven Human Motion Synthesis","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4378506719","doi":"https://doi.org/10.48550/arxiv.2305.13773"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13773","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2305.13773","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100391490","display_name":"Dong Wei","orcid":"https://orcid.org/0000-0002-6342-4658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Dong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100642895","display_name":"Xiaoning Sun","orcid":"https://orcid.org/0000-0001-8302-8604"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Xiaoning","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110740604","display_name":"Huaijiang Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Huaijiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100781448","display_name":"Bin Li","orcid":"https://orcid.org/0000-0001-5122-5515"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102709127","display_name":"Shengxiang Hu","orcid":"https://orcid.org/0009-0001-9988-404X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Shengxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101414940","display_name":"Weiqing Li","orcid":"https://orcid.org/0000-0002-1929-3654"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Weiqing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5061472917","display_name":"Jianfeng Lu","orcid":"https://orcid.org/0000-0001-6255-5165"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Jianfeng","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.851999,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":67,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9615,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9862,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/smoothness","display_name":"Smoothness","score":0.4193486},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion Capture","score":0.41406614}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8356395},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.651231},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5848476},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5476254},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49856615},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.43957797},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.43044358},{"id":"https://openalex.org/C102634674","wikidata":"https://www.wikidata.org/wiki/Q868473","display_name":"Smoothness","level":2,"score":0.4193486},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.41406614},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36634952},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13773","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.13773","pdf_url":"http://arxiv.org/pdf/2305.13773","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.13773","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13773","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.74,"id":"https://metadata.un.org/sdg/8"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4312814274","https://openalex.org/W4285370786","https://openalex.org/W3207760230","https://openalex.org/W2536018345","https://openalex.org/W2358353312","https://openalex.org/W2353836703","https://openalex.org/W2296488620","https://openalex.org/W17155033","https://openalex.org/W1590307681","https://openalex.org/W1496222301"],"abstract_inverted_index":{"The":[0],"emergence":[1],"of":[2,144,203],"text-driven":[3,75],"motion":[4,26,76],"synthesis":[5,77],"technique":[6],"provides":[7],"animators":[8,60],"with":[9,61,78,84,95],"great":[10],"potential":[11],"to":[12,36,105,211],"create":[13],"efficiently.":[14],"However,":[15],"in":[16,161,201],"most":[17],"cases,":[18],"textual":[19],"expressions":[20],"only":[21,96,156,197],"contain":[22],"general":[23],"and":[24,32,86,101,126,134,146],"qualitative":[25],"descriptions,":[27,58],"while":[28],"lack":[29],"fine":[30],"depiction":[31,103],"sufficient":[33],"intensity,":[34],"leading":[35],"the":[37,56,135,141,166,181],"synthesized":[38],"motions":[39],"that":[40,114,193],"either":[41],"(a)":[42],"semantically":[43],"compliant":[44],"but":[45,206],"uncontrollable":[46],"over":[47],"specific":[48],"pose":[49],"details,":[50],"or":[51],"(b)":[52],"even":[53],"deviates":[54],"from":[55],"provided":[57],"bringing":[59],"undesired":[62],"cases.":[63],"In":[64],"this":[65],"paper,":[66],"we":[67,149,171],"propose":[68],"DiffKFC,":[69],"a":[70,173],"conditional":[71,120],"diffusion":[72,112,121],"model":[73,122,195],"for":[74,99],"KeyFrames":[79],"Collaborated,":[80],"enabling":[81],"realistic":[82],"generation":[83],"collaborative":[85],"efficient":[87],"dual-level":[88],"control:":[89],"coarse":[90],"guidance":[91,217],"at":[92,188],"semantic":[93,204],"level,":[94],"few":[97],"keyframes":[98,133],"direct":[100],"fine-grained":[102,216],"down":[104],"body":[106],"posture":[107],"level.":[108],"Unlike":[109],"existing":[110],"inference-editing":[111],"models":[113],"incorporate":[115],"conditions":[116],"without":[117,218],"training,":[118],"our":[119,194],"is":[123,209],"explicitly":[124],"trained":[125],"can":[127],"fully":[128],"exploit":[129],"correlations":[130],"among":[131],"texts,":[132],"diffused":[136],"target":[137],"frames.":[138],"To":[139],"preserve":[140],"control":[142],"capability":[143],"discrete":[145],"sparse":[147],"keyframes,":[148],"customize":[150],"dilated":[151,167],"mask":[152],"attention":[153],"modules":[154],"where":[155],"partial":[157],"valid":[158],"tokens":[159],"participate":[160],"local-to-global":[162],"attention,":[163],"indicated":[164],"by":[165],"keyframe":[168,186],"mask.":[169],"Additionally,":[170],"develop":[172],"simple":[174],"yet":[175],"effective":[176],"smoothness":[177],"prior,":[178],"which":[179],"steers":[180],"generated":[182],"frames":[183],"towards":[184],"seamless":[185],"transitions":[187],"inference.":[189],"Extensive":[190],"experiments":[191],"show":[192],"not":[196],"achieves":[198],"state-of-the-art":[199],"performance":[200],"terms":[202],"fidelity,":[205],"more":[207],"importantly,":[208],"able":[210],"satisfy":[212],"animator":[213],"requirements":[214],"through":[215],"tedious":[219],"labor.":[220]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4378506719","counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-01-04T16:37:57.859209","created_date":"2023-05-27"}