{"id":"https://openalex.org/W4385849212","doi":"https://doi.org/10.48550/arxiv.2308.07092","title":"Masked Motion Predictors are Strong 3D Action Representation Learners","display_name":"Masked Motion Predictors are Strong 3D Action Representation Learners","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4385849212","doi":"https://doi.org/10.48550/arxiv.2308.07092"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.07092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2308.07092","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088650924","display_name":"Yunyao Mao","orcid":"https://orcid.org/0000-0002-9427-9086"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Yunyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081269555","display_name":"Jiajun Deng","orcid":"https://orcid.org/0000-0002-6834-0322"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deng, Jiajun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046805800","display_name":"Wengang Zhou","orcid":"https://orcid.org/0000-0003-1690-9836"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Wengang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041649403","display_name":"Fang Yao","orcid":"https://orcid.org/0000-0002-8562-6373"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Yao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087818121","display_name":"Wanli Ouyang","orcid":"https://orcid.org/0000-0002-9163-2761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ouyang, Wanli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Houqiang","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":66},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9513,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature Learning","score":0.62515455},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4178474}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7466993},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.62515455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59355426},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5053101},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4721097},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.46770212},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.44237018},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4178474},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32198778},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.12496951},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0836682},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.07092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2308.07092","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.07092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.51}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2494338568","https://openalex.org/W2349023125","https://openalex.org/W2282510344","https://openalex.org/W2183994405","https://openalex.org/W2163502240","https://openalex.org/W2122678784","https://openalex.org/W1976807322","https://openalex.org/W1875646599","https://openalex.org/W1495042958","https://openalex.org/W139987158"],"abstract_inverted_index":{"In":[0,36],"3D":[1,72],"human":[2,55,107],"action":[3,73],"recognition,":[4],"limited":[5],"supervised":[6],"data":[7],"makes":[8],"it":[9],"challenging":[10],"to":[11,49,63,140],"fully":[12],"tap":[13],"into":[14],"the":[15,45,64,78,87,93,100,105,110,115,121,134,155,161,164],"modeling":[16,60],"potential":[17],"of":[18,43,66,104,114,163,178],"powerful":[19],"networks":[20],"such":[21],"as":[22,91,126],"transformers.":[23],"As":[24],"a":[25],"result,":[26],"researchers":[27],"have":[28],"been":[29],"actively":[30],"investigating":[31],"effective":[32,68],"self-supervised":[33],"pre-training":[34,158],"strategies.":[35],"this":[37],"work,":[38],"we":[39,76],"show":[40,153],"that":[41,132,154],"instead":[42],"following":[44],"prevalent":[46],"pretext":[47],"task":[48],"perform":[50],"masked":[51,94,106],"self-component":[52],"reconstruction":[53],"in":[54,118],"joints,":[56],"explicit":[57],"contextual":[58],"motion":[59,103,122],"is":[61,181],"key":[62],"success":[65],"learning":[67],"feature":[69],"representation":[70],"for":[71],"recognition.":[74],"Formally,":[75],"propose":[77],"Masked":[79],"Motion":[80],"Prediction":[81],"(MAMP)":[82],"framework.":[83],"To":[84],"be":[85],"specific,":[86],"proposed":[88,156],"MAMP":[89,157,180],"takes":[90],"input":[92],"spatio-temporal":[95],"skeleton":[96,116],"sequence":[97],"and":[98,150,173],"predicts":[99],"corresponding":[101],"temporal":[102,112,143],"joints.":[108],"Considering":[109],"high":[111],"redundancy":[113],"sequence,":[117],"our":[119,179],"MAMP,":[120],"information":[123],"also":[124],"acts":[125],"an":[127],"empirical":[128],"semantic":[129],"richness":[130],"prior":[131],"guide":[133],"masking":[135],"process,":[136],"promoting":[137],"better":[138],"attention":[139],"semantically":[141],"rich":[142],"regions.":[144],"Extensive":[145],"experiments":[146],"on":[147],"NTU-60,":[148],"NTU-120,":[149],"PKU-MMD":[151],"datasets":[152],"substantially":[159],"improves":[160],"performance":[162],"adopted":[165],"vanilla":[166],"transformer,":[167],"achieving":[168],"state-of-the-art":[169],"results":[170],"without":[171],"bells":[172],"whistles.":[174],"The":[175],"source":[176],"code":[177],"available":[182],"at":[183],"https://github.com/maoyunyao/MAMP.":[184]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4385849212","counts_by_year":[],"updated_date":"2025-02-20T23:37:47.071206","created_date":"2023-08-16"}