{"id":"https://openalex.org/W4300158295","doi":"https://doi.org/10.48550/arxiv.2208.04094","title":"Towards Semantic Communications: Deep Learning-Based Image Semantic Coding","display_name":"Towards Semantic Communications: Deep Learning-Based Image Semantic Coding","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4300158295","doi":"https://doi.org/10.48550/arxiv.2208.04094"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2208.04094","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2208.04094","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101896273","display_name":"Danlan Huang","orcid":"https://orcid.org/0000-0002-1198-7643"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Danlan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050402661","display_name":"Feifei Gao","orcid":"https://orcid.org/0000-0001-8896-352X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Feifei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087298250","display_name":"Xiaoming Tao","orcid":"https://orcid.org/0000-0002-2406-0695"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao, Xiaoming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064353941","display_name":"Qiyuan Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Qiyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100873531","display_name":"Jianhua Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Jianhua","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.820962,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":69,"max":75},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9503,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9394,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantic-compression","display_name":"Semantic compression","score":0.7338164}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.80256486},{"id":"https://openalex.org/C202708506","wikidata":"https://www.wikidata.org/wiki/Q7449050","display_name":"Semantic compression","level":5,"score":0.7338164},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59299326},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5860942},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.52343535},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.49924588},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4469784},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3246474},{"id":"https://openalex.org/C6881194","wikidata":"https://www.wikidata.org/wiki/Q7449091","display_name":"Semantic technology","level":4,"score":0.22351393},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.083699584},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2208.04094","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2208.04094","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2208.04094","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","score":0.63,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W858433989","https://openalex.org/W3134365128","https://openalex.org/W3016822073","https://openalex.org/W2541135911","https://openalex.org/W2365969513","https://openalex.org/W2362519509","https://openalex.org/W2359259132","https://openalex.org/W2250607250","https://openalex.org/W2103835134","https://openalex.org/W1965623300"],"abstract_inverted_index":{"Semantic":[0],"communications":[1,55],"has":[2],"received":[3],"growing":[4],"interest":[5],"since":[6],"it":[7],"can":[8],"remarkably":[9],"reduce":[10],"the":[11,26,43,46,53,89,97,105,121,128,151,167,184,207],"amount":[12],"of":[13,45,92,225],"data":[14,58,94,178],"to":[15,41,114,132,229],"be":[16],"transmitted":[17],"without":[18],"missing":[19],"critical":[20],"information.":[21],"Most":[22],"existing":[23],"works":[24],"explore":[25],"semantic":[27,54,76,90,112,116,133,144,160,190,219],"encoding":[28,157],"and":[29,33,66,101,108,135,172,196,213,218,222,232],"transmission":[30],"for":[31,56],"text":[32],"apply":[34],"techniques":[35],"in":[36,64,153],"Natural":[37],"Language":[38],"Processing":[39],"(NLP)":[40],"interpret":[42],"meaning":[44],"text.":[47],"In":[48],"this":[49],"paper,":[50],"we":[51,87,119,139,182],"conceive":[52],"image":[57,93,122,236],"that":[59,80,95,125,192,206],"is":[60,150,170,179,210],"much":[61],"more":[62],"richer":[63],"semantics":[65],"bandwidth":[67],"sensitive.":[68],"We":[69],"propose":[70,109,120,183],"an":[71,200],"reinforcement":[72],"learning":[73],"based":[74,189],"adaptive":[75,163],"coding":[77],"(RL-ASC)":[78],"approach":[79],"encodes":[81],"images":[82],"beyond":[83],"pixel":[84,130],"level.":[85,165],"Firstly,":[86],"define":[88],"concept":[91,161],"includes":[96],"category,":[98],"spatial":[99],"arrangement,":[100],"visual":[102],"feature":[103],"as":[104],"representation":[106],"unit,":[107],"a":[110,141,158],"convolutional":[111],"encoder":[113],"extract":[115],"concepts.":[117],"Secondly,":[118],"reconstruction":[123],"criterion":[124],"evolves":[126],"from":[127],"traditional":[129],"similarity":[131,134],"perceptual":[136],"performance.":[137],"Thirdly,":[138],"design":[140],"novel":[142],"RL-based":[143],"bit":[145,226],"allocation":[146],"model,":[147],"whose":[148],"reward":[149],"increase":[152],"rate-semantic-perceptual":[154],"performance":[155],"after":[156],"certain":[159],"with":[162],"quantization":[164],"Thus,":[166],"task-related":[168],"information":[169],"preserved":[171],"reconstructed":[173],"properly":[174],"while":[175],"less":[176],"important":[177],"discarded.":[180],"Finally,":[181],"Generative":[185],"Adversarial":[186],"Nets":[187],"(GANs)":[188],"decoder":[191],"fuses":[193],"both":[194],"locally":[195],"globally":[197],"features":[198],"via":[199],"attention":[201],"module.":[202],"Experimental":[203],"results":[204],"demonstrate":[205],"proposed":[208],"RL-ASC":[209],"noise":[211],"robust":[212],"could":[214],"reconstruct":[215],"visually":[216],"pleasant":[217],"consistent":[220],"image,":[221],"saves":[223],"times":[224],"cost":[227],"compared":[228],"standard":[230],"codecs":[231],"other":[233],"deep":[234],"learning-based":[235],"codecs.":[237]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4300158295","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-04-23T19:07:25.799930","created_date":"2022-10-03"}