{"id":"https://openalex.org/W4312506452","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892087","title":"Spatial Parsing and Dynamic Temporal Pooling networks for Human-Object Interaction detection","display_name":"Spatial Parsing and Dynamic Temporal Pooling networks for Human-Object Interaction detection","publication_year":2022,"publication_date":"2022-07-18","ids":{"openalex":"https://openalex.org/W4312506452","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892087"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892087","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2206.03061","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100732450","display_name":"Hongsheng Li","orcid":"https://orcid.org/0000-0002-2664-7975"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongsheng Li","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028794275","display_name":"Guangming Zhu","orcid":"https://orcid.org/0000-0003-3214-4095"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangming Zhu","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103881061","display_name":"Wu Zhen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu Zhen","raw_affiliation_strings":["Beijing Roborock Technology Co.,Ltd."],"affiliations":[{"raw_affiliation_string":"Beijing Roborock Technology Co.,Ltd.","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000205091","display_name":"Lan Ni","orcid":null},"institutions":[{"id":"https://openalex.org/I113940042","display_name":"Shanghai University","ror":"https://ror.org/006teas31","country_code":"CN","type":"education","lineage":["https://openalex.org/I113940042"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lan Ni","raw_affiliation_strings":["Shanghai University"],"affiliations":[{"raw_affiliation_string":"Shanghai University","institution_ids":["https://openalex.org/I113940042"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103197309","display_name":"Peiyi Shen","orcid":"https://orcid.org/0000-0002-3527-7232"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peiyi Shen","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100425294","display_name":"Liang Zhang","orcid":"https://orcid.org/0000-0003-4331-5830"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Zhang","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100387083","display_name":"Ning Wang","orcid":"https://orcid.org/0000-0001-6877-4211"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ning Wang","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101763303","display_name":"Cong Hua","orcid":"https://orcid.org/0009-0005-6846-7330"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Hua","raw_affiliation_strings":["School of Computer Science and Technology, Xidian University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Xidian University, China","institution_ids":["https://openalex.org/I149594827"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.205,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.359733,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":70,"max":76},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.7093352},{"id":"https://openalex.org/keywords/human-interaction","display_name":"Human interaction","score":0.42083132}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.85408235},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.7093352},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6629646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.637126},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6043006},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.53478384},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.46973002},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43000782},{"id":"https://openalex.org/C2987082051","wikidata":"https://www.wikidata.org/wiki/Q223642","display_name":"Human interaction","level":2,"score":0.42083132},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.42022896},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3863643},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3775604},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.25194037},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.22102344},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892087","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.03061","pdf_url":"http://arxiv.org/pdf/2206.03061","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.03061","pdf_url":"http://arxiv.org/pdf/2206.03061","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"62072358,62073252"},{"funder":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China","award_id":"2020YFF0304900"}],"datasets":[],"versions":[],"referenced_works_count":36,"referenced_works":["https://openalex.org/W1551928752","https://openalex.org/W2131984901","https://openalex.org/W2146055337","https://openalex.org/W2309415944","https://openalex.org/W2412782625","https://openalex.org/W2470394683","https://openalex.org/W2579549467","https://openalex.org/W2581887665","https://openalex.org/W2598104261","https://openalex.org/W2606202972","https://openalex.org/W2618862450","https://openalex.org/W2625366777","https://openalex.org/W2806331055","https://openalex.org/W2809890486","https://openalex.org/W2888096830","https://openalex.org/W2888814092","https://openalex.org/W2962779575","https://openalex.org/W2963165299","https://openalex.org/W2963227409","https://openalex.org/W2963346996","https://openalex.org/W2963441581","https://openalex.org/W2963681621","https://openalex.org/W2963876278","https://openalex.org/W2964225075","https://openalex.org/W2964321699","https://openalex.org/W2981774933","https://openalex.org/W2982441354","https://openalex.org/W3034257141","https://openalex.org/W3092336341","https://openalex.org/W3096057444","https://openalex.org/W3164894587","https://openalex.org/W4288322145","https://openalex.org/W4297733535","https://openalex.org/W4301141993","https://openalex.org/W4385245566","https://openalex.org/W639708223"],"related_works":["https://openalex.org/W4390975304","https://openalex.org/W4287804464","https://openalex.org/W3211292372","https://openalex.org/W3103989898","https://openalex.org/W3022252430","https://openalex.org/W3015684221","https://openalex.org/W2953234277","https://openalex.org/W2900413183","https://openalex.org/W2626256601","https://openalex.org/W147410782"],"abstract_inverted_index":{"The":[0],"key":[1],"of":[2,57,66,71,91,161],"Human-Object":[3,18],"Interaction(HOI)":[4,19],"recognition":[5],"is":[6,27,60],"to":[7,44,157,180],"infer":[8],"the":[9,16,68,72,75,79,85,92,99,110,131,159,162,166,170],"relationship":[10],"between":[11,133],"human":[12,118],"and":[13,49,88,102,119,135,142,152,164,184,195],"objects.":[14],"Recently,":[15],"image's":[17],"detection":[20,35],"has":[21],"made":[22],"significant":[23],"progress.":[24],"However,":[25],"there":[26],"still":[28],"room":[29],"for":[30],"improvement":[31],"in":[32,77],"video":[33,47,112,163],"HOI":[34],"performance.":[36],"Existing":[37],"one-stage":[38],"methods":[39],"use":[40],"well-designed":[41],"end-to-end":[42],"networks":[43],"detect":[45],"a":[46,114,150],"segment":[48],"directly":[50],"predict":[51],"an":[52],"interaction.":[53],"A":[54],"side":[55],"effect":[56],"these":[58],"approaches":[59],"that":[61,174],"we":[62,148,188],"have":[63],"no":[64],"way":[65],"knowing":[67],"human-object":[69,182],"pair":[70],"interaction":[73,80,145],"or":[74],"keyframes":[76,160],"which":[78,108],"took":[81],"place.":[82],"It":[83],"makes":[84],"model":[86],"learning":[87],"further":[89],"optimization":[90],"network":[93,129],"more":[94,178],"complex.":[95],"This":[96],"paper":[97],"introduces":[98],"Spatial":[100],"Parsing":[101],"Dynamic":[103,154],"Temporal":[104,155],"Pooling":[105],"(SPDTP)":[106],"network,":[107],"takes":[109],"entire":[111],"as":[113,122],"spatio-temporal":[115],"graph":[116],"with":[117],"object":[120],"nodes":[121],"input.":[123],"Unlike":[124],"existing":[125],"methods,":[126],"our":[127],"proposed":[128],"predicts":[130],"difference":[132],"interactive":[134],"non-interactive":[136],"pairs":[137,183],"through":[138],"explicit":[139],"spatial":[140],"parsing,":[141],"then":[143],"performs":[144],"recognition.":[146],"Moreover,":[147],"propose":[149],"learnable":[151],"differentiable":[153],"Module(DTM)":[156],"emphasize":[158],"suppress":[165],"redundant":[167],"frame.":[168],"Furthermore,":[169],"experimental":[171],"results":[172],"show":[173],"SPDTP":[175],"can":[176],"pay":[177],"attention":[179],"active":[181],"valid":[185],"keyframes.":[186],"Overall,":[187],"achieve":[189],"state-of-the-art":[190],"performance":[191],"on":[192],"CAD-120":[193],"dataset":[194],"Something-":[196],"Else":[197],"dataset.":[198]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4312506452","counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2025-01-04T23:23:23.247725","created_date":"2023-01-05"}