{"id":"https://openalex.org/W4396817127","doi":"https://doi.org/10.48550/arxiv.2405.05130","title":"Multi-scale Bottleneck Transformer for Weakly Supervised Multimodal\n Violence Detection","display_name":"Multi-scale Bottleneck Transformer for Weakly Supervised Multimodal\n Violence Detection","publication_year":2024,"publication_date":"2024-05-08","ids":{"openalex":"https://openalex.org/W4396817127","doi":"https://doi.org/10.48550/arxiv.2405.05130"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.05130","pdf_url":"https://arxiv.org/pdf/2405.05130","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.05130","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101560169","display_name":"Shengyang Sun","orcid":"https://orcid.org/0000-0003-3286-0585"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Shengyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5061298101","display_name":"Xiaojin Gong","orcid":"https://orcid.org/0000-0001-9955-3569"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gong, Xiaojin","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9891,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9891,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9731,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.70005804},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.49104476},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46454573},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.43738884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4063912},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20370135},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.18151766},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.13175282},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.12415829},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.12140417},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.062633336}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.05130","pdf_url":"https://arxiv.org/pdf/2405.05130","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.05130","pdf_url":"https://arxiv.org/pdf/2405.05130","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4382618745","https://openalex.org/W2885125400","https://openalex.org/W2748952813","https://openalex.org/W2595172197","https://openalex.org/W2127970246","https://openalex.org/W2084856301","https://openalex.org/W1989889224","https://openalex.org/W1973775000","https://openalex.org/W1001352512"],"abstract_inverted_index":{"Weakly":[0],"supervised":[1,59],"multimodal":[2,34],"violence":[3,9,35],"detection":[4,10,36],"aims":[5],"to":[6,86,103,117],"learn":[7],"a":[8,56,70,80,98,112],"model":[11],"by":[12],"leveraging":[13],"multiple":[14],"modalities":[15,95],"such":[16],"as":[17,47],"RGB,":[18],"optical":[19],"flow,":[20],"and":[21,42,90,96],"audio,":[22],"while":[23],"only":[24],"video-level":[25],"annotations":[26],"are":[27,45],"available.":[28],"In":[29,51],"the":[30,125,131],"pursuit":[31],"of":[32,83,94],"effective":[33],"(MVD),":[37],"information":[38,89],"redundancy,":[39],"modality":[40,43],"imbalance,":[41],"asynchrony":[44],"identified":[46],"three":[48],"key":[49],"challenges.":[50,66],"this":[52],"work,":[53],"we":[54,68,110],"propose":[55,111],"new":[57],"weakly":[58],"MVD":[60],"method":[61,133],"that":[62,78,130],"explicitly":[63],"addresses":[64],"these":[65],"Specifically,":[67],"introduce":[69],"multi-scale":[71],"bottleneck":[72,84,99],"transformer":[73],"(MSBT)":[74],"based":[75],"fusion":[76],"module":[77],"employs":[79],"reduced":[81],"number":[82],"tokens":[85],"gradually":[87],"condense":[88],"fuse":[91],"each":[92],"pair":[93],"utilizes":[97],"token-based":[100],"weighting":[101],"scheme":[102],"highlight":[104],"more":[105],"important":[106],"fused":[107,121],"features.":[108,122],"Furthermore,":[109],"temporal":[113],"consistency":[114],"contrast":[115],"loss":[116],"semantically":[118],"align":[119],"pairwise":[120],"Experiments":[123],"on":[124],"largest-scale":[126],"XD-Violence":[127],"dataset":[128],"demonstrate":[129],"proposed":[132],"achieves":[134],"state-of-the-art":[135],"performance.":[136],"Code":[137],"is":[138],"available":[139],"at":[140],"https://github.com/shengyangsun/MSBT.":[141]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4396817127","counts_by_year":[],"updated_date":"2025-01-08T23:46:06.333815","created_date":"2024-05-11"}