{"id":"https://openalex.org/W4283318419","doi":"https://doi.org/10.48550/arxiv.2206.10095","title":"Pyramid Region-based Slot Attention Network for Temporal Action Proposal Generation","display_name":"Pyramid Region-based Slot Attention Network for Temporal Action Proposal Generation","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4283318419","doi":"https://doi.org/10.48550/arxiv.2206.10095"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.10095","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2206.10095","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083428910","display_name":"Shuai Cheng Li","orcid":"https://orcid.org/0000-0001-6246-6349"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shuaicheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100401285","display_name":"Feng Zhang","orcid":"https://orcid.org/0000-0002-7995-918X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Feng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100626035","display_name":"Rui-Wei Zhao","orcid":"https://orcid.org/0000-0002-8498-5761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Rui-Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100680618","display_name":"Rui Feng","orcid":"https://orcid.org/0000-0002-8956-558X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Rui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009217816","display_name":"Kun\u2010Lin Yang","orcid":"https://orcid.org/0000-0002-7958-9334"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Kunlin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102971183","display_name":"Lingbo Liu","orcid":"https://orcid.org/0000-0001-8179-6685"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Lingbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100721400","display_name":"Jun Hou","orcid":"https://orcid.org/0000-0002-2978-8749"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hou, Jun","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.820962,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":75,"max":79},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.993,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.9697544},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.7613348},{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.56825906},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5217801},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.49217477},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.48999825}],"concepts":[{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.9697544},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79597676},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.7613348},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6482361},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6009573},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.56825906},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5364889},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5217801},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.49217477},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.48999825},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4681656},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.44600007},{"id":"https://openalex.org/C124913957","wikidata":"https://www.wikidata.org/wiki/Q1232548","display_name":"Zoom","level":3,"score":0.4351644},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2465803},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.22749698},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07403356},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C78762247","wikidata":"https://www.wikidata.org/wiki/Q1273174","display_name":"Petroleum engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C15336307","wikidata":"https://www.wikidata.org/wiki/Q1766051","display_name":"Lens (geology)","level":2,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.10095","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.10095","pdf_url":"http://arxiv.org/pdf/2206.10095","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2206.10095","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.10095","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4318980730","https://openalex.org/W4289376745","https://openalex.org/W3201315194","https://openalex.org/W3036724449","https://openalex.org/W2985134635","https://openalex.org/W2950904665","https://openalex.org/W2798329462","https://openalex.org/W2023083803","https://openalex.org/W1607713096","https://openalex.org/W1511521437"],"abstract_inverted_index":{"It":[0],"has":[1],"been":[2],"found":[3],"that":[4],"temporal":[5,14,35,48,185],"action":[6,15,239],"proposal":[7,191,225],"generation,":[8],"which":[9],"aims":[10],"to":[11,45,83,177,222,236],"discover":[12],"the":[13,18,21,27,47,90,98,107,116,125,132,153,215,218,229],"instances":[16],"within":[17],"range":[19],"of":[20,88,109],"start":[22],"and":[23,36,50,65,105,142,186,202,227],"end":[24],"frames":[25],"in":[26,101],"untrimmed":[28],"videos,":[29],"can":[30],"largely":[31],"benefit":[32],"from":[33,61,217,234],"proper":[34],"semantic":[37,52,187],"context":[38,49,156,188],"exploitation.":[39],"The":[40],"latest":[41],"efforts":[42],"were":[43],"dedicated":[44],"considering":[46],"similarity-based":[51],"contexts":[53],"through":[54],"self-attention":[55],"modules.":[56],"However,":[57],"they":[58],"still":[59],"suffer":[60],"cluttered":[62],"background":[63],"information":[64],"limited":[66],"contextual":[67],"feature":[68],"learning.":[69],"In":[70,211],"this":[71],"paper,":[72],"we":[73,166,213],"propose":[74],"a":[75,110,158,168,179],"novel":[76,169],"Pyramid":[77,170],"Region-based":[78,171],"Slot":[79,172],"Attention":[80,173],"(PRSlot)":[81],"module":[82,95,130],"address":[84],"these":[85],"issues.":[86],"Instead":[87],"using":[89],"similarity":[91],"computation,":[92],"our":[93],"PRSlot":[94,129,164],"directly":[96],"learns":[97],"local":[99,111,154],"relations":[100],"an":[102],"encoder-decoder":[103],"manner":[104],"generates":[106,144],"representation":[108,182],"region":[112,139],"enhanced":[113],"based":[114],"on":[115,163,197,241],"attention":[117],"over":[118],"input":[119,126],"features":[120],"called":[121],"\\textit{slot}.":[122],"Specifically,":[123],"upon":[124],"snippet-level":[127],"features,":[128],"takes":[131],"target":[133],"snippet":[134,155],"as":[135,140],"\\textit{query},":[136],"its":[137],"surrounding":[138],"\\textit{key}":[141],"then":[143],"slot":[145,150],"representations":[146],"for":[147,189,224,238],"each":[148],"\\textit{query-key}":[149],"by":[151],"aggregating":[152],"with":[157,183],"parallel":[159],"pyramid":[160],"strategy.":[161],"Based":[162],"modules,":[165],"present":[167],"Network":[174],"termed":[175],"PRSA-Net":[176,206],"learn":[178],"unified":[180],"visual":[181],"rich":[184],"better":[190],"generation.":[192],"Extensive":[193],"experiments":[194],"are":[195],"conducted":[196],"two":[198],"widely":[199],"adopted":[200],"THUMOS14":[201],"ActivityNet-1.3":[203],"benchmarks.":[204],"Our":[205],"outperforms":[207],"other":[208],"state-of-the-art":[209],"methods.":[210],"particular,":[212],"improve":[214],"AR@100":[216],"previous":[219],"best":[220],"50.67%":[221],"56.12%":[223],"generation":[226],"raise":[228],"mAP":[230],"under":[231],"0.5":[232],"tIoU":[233],"51.9\\%":[235],"58.7\\%":[237],"detection":[240],"THUMOS14.":[242],"\\textit{Code":[243],"is":[244],"available":[245],"at}":[246],"\\url{https://github.com/handhand123/PRSA-Net}":[247]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4283318419","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-04-21T13:29:39.669727","created_date":"2022-06-24"}