{"id":"https://openalex.org/W1550352777","doi":"https://doi.org/10.1109/chinasip.2015.7230448","title":"Audio recapture detection using deep learning","display_name":"Audio recapture detection using deep learning","publication_year":2015,"publication_date":"2015-07-01","ids":{"openalex":"https://openalex.org/W1550352777","doi":"https://doi.org/10.1109/chinasip.2015.7230448","mag":"1550352777"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinasip.2015.7230448","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111636829","display_name":"Da Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I1302611135","display_name":"Ministry of Public Security of the People's Republic of China","ror":"https://ror.org/00bt9we26","country_code":"CN","type":"government","lineage":["https://openalex.org/I1302611135"]},{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Da Luo","raw_affiliation_strings":["College of Information Engineering, Shenzhen University, Shenzhen, P.R. China","Shenzhen Key Laboratory of Media Security, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Media Security, Shenzhen, China","institution_ids":["https://openalex.org/I1302611135"]},{"raw_affiliation_string":"College of Information Engineering, Shenzhen University, Shenzhen, P.R. China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054806754","display_name":"Haojun Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I1302611135","display_name":"Ministry of Public Security of the People's Republic of China","ror":"https://ror.org/00bt9we26","country_code":"CN","type":"government","lineage":["https://openalex.org/I1302611135"]},{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haojun Wu","raw_affiliation_strings":["School of Information Science and Technology, Sun Yat-Sen University, Guangzhou, P.R. China","Shenzhen Key Laboratory of Media Security, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory of Media Security, Shenzhen, China","institution_ids":["https://openalex.org/I1302611135"]},{"raw_affiliation_string":"School of Information Science and Technology, Sun Yat-Sen University, Guangzhou, P.R. China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047964483","display_name":"Jiwu Huang","orcid":"https://orcid.org/0000-0002-7625-5689"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I1302611135","display_name":"Ministry of Public Security of the People's Republic of China","ror":"https://ror.org/00bt9we26","country_code":"CN","type":"government","lineage":["https://openalex.org/I1302611135"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiwu Huang","raw_affiliation_strings":["College of Information Engineering, Shenzhen University, Shenzhen, P.R. China","Shenzhen Key Laboratory of Media Security, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Information Engineering, Shenzhen University, Shenzhen, P.R. China","institution_ids":["https://openalex.org/I180726961"]},{"raw_affiliation_string":"Shenzhen Key Laboratory of Media Security, Shenzhen, China","institution_ids":["https://openalex.org/I1302611135"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.505,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":14,"citation_normalized_percentile":{"value":0.827035,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":88,"max":89},"biblio":{"volume":null,"issue":null,"first_page":"478","last_page":"482"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12357","display_name":"Digital Image Forgery Detection and Identification","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12357","display_name":"Digital Image Forgery Detection and Identification","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Audio Signal Classification and Analysis","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech Enhancement Techniques","score":0.9852,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.64811933},{"id":"https://openalex.org/keywords/audio-event-detection","display_name":"Audio Event Detection","score":0.630911},{"id":"https://openalex.org/keywords/resampling-detection","display_name":"Resampling Detection","score":0.590991},{"id":"https://openalex.org/keywords/environmental-sound-recognition","display_name":"Environmental Sound Recognition","score":0.58206},{"id":"https://openalex.org/keywords/splicing-detection","display_name":"Splicing Detection","score":0.556062},{"id":"https://openalex.org/keywords/audio-visual-speech-recognition","display_name":"Audio-Visual Speech Recognition","score":0.553329},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.46900818}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7740774},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.64811933},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.63707316},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.6133555},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6023919},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.53525764},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.49999285},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.46900818},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.43178985},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4263869},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.41685066},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.2642977},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.236368},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.09318629},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinasip.2015.7230448","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.68}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":22,"referenced_works":["https://openalex.org/W1485656768","https://openalex.org/W1490120479","https://openalex.org/W1613249581","https://openalex.org/W1904365287","https://openalex.org/W1904969684","https://openalex.org/W2002433241","https://openalex.org/W2010616303","https://openalex.org/W2016419400","https://openalex.org/W2025768430","https://openalex.org/W2040515751","https://openalex.org/W2056177844","https://openalex.org/W2069423658","https://openalex.org/W2072128103","https://openalex.org/W2077084699","https://openalex.org/W2094810510","https://openalex.org/W2114376863","https://openalex.org/W2123299109","https://openalex.org/W2124537004","https://openalex.org/W2150341604","https://openalex.org/W2187281534","https://openalex.org/W330298975","https://openalex.org/W4231109964"],"related_works":["https://openalex.org/W4315836293","https://openalex.org/W4243888788","https://openalex.org/W4231351862","https://openalex.org/W4212794605","https://openalex.org/W3004352674","https://openalex.org/W2970176078","https://openalex.org/W2769884427","https://openalex.org/W2354332708","https://openalex.org/W2289868279","https://openalex.org/W1975359510"],"abstract_inverted_index":{"Since":[0],"the":[1,43,77,80],"audio":[2,9,19,45,71,106],"recapture":[3],"can":[4,93,102],"be":[5,94],"used":[6,75],"to":[7,14,41],"assist":[8],"splicing,":[10],"it":[11],"is":[12,21,73],"important":[13],"identify":[15],"whether":[16],"a":[17],"suspected":[18],"recording":[20],"recaptured":[22,44,105],"or":[23],"not.":[24],"However,":[25],"few":[26],"works":[27],"on":[28,47],"such":[29],"detection":[30],"have":[31],"been":[32],"reported.":[33],"In":[34],"this":[35],"paper,":[36],"we":[37,51],"propose":[38],"an":[39],"method":[40,62,101],"detect":[42],"based":[46],"deep":[48,54,81],"learning":[49,55],"and":[50,63,107],"investigate":[52],"two":[53],"techniques,":[56],"i.e.,":[57],"neural":[58,82],"network":[59],"with":[60],"dropout":[61],"stack":[64],"auto-encoders":[65],"(SAE).":[66],"The":[67,84],"waveform":[68],"samples":[69],"of":[70],"frame":[72],"directly":[74],"as":[76],"input":[78],"for":[79],"network.":[83],"experimental":[85],"results":[86],"show":[87],"that":[88,98],"error":[89],"rate":[90],"around":[91],"7.5%":[92],"achieved,":[95],"which":[96],"indicates":[97],"our":[99],"proposed":[100],"successfully":[103],"discriminate":[104],"original":[108],"audio.":[109]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1550352777","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2024-11-24T02:34:01.312005","created_date":"2016-06-24"}