{"id":"https://openalex.org/W4376652989","doi":"https://doi.org/10.48550/arxiv.2305.07783","title":"ROI-based Deep Image Compression with Swin Transformers","display_name":"ROI-based Deep Image Compression with Swin Transformers","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4376652989","doi":"https://doi.org/10.48550/arxiv.2305.07783"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.07783","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2305.07783","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100649277","display_name":"Binglin Li","orcid":"https://orcid.org/0000-0003-2798-1710"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Binglin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108166775","display_name":"Jie Liang","orcid":"https://orcid.org/0000-0003-3003-4343"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045288861","display_name":"Haisheng Fu","orcid":"https://orcid.org/0000-0001-8709-5927"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Haisheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5046233912","display_name":"Jingning Han","orcid":"https://orcid.org/0000-0001-7168-2254"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Jingning","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":65},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9978,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9978,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9952,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/region-of-interest","display_name":"Region of interest","score":0.81918705}],"concepts":[{"id":"https://openalex.org/C19609008","wikidata":"https://www.wikidata.org/wiki/Q2138203","display_name":"Region of interest","level":2,"score":0.81918705},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.77515167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.75980616},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.66627204},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5707725},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.4533004},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3347723},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.30512038},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.24044633}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.07783","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.07783","pdf_url":"http://arxiv.org/pdf/2305.07783","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.07783","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.07783","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4389858081","https://openalex.org/W4385583601","https://openalex.org/W4379231730","https://openalex.org/W4298131179","https://openalex.org/W2799953226","https://openalex.org/W2766331907","https://openalex.org/W2765471884","https://openalex.org/W2501551404","https://openalex.org/W2326552140","https://openalex.org/W2113201962"],"abstract_inverted_index":{"Encoding":[0],"the":[1,10,43,56,65,71,75,81,128],"Region":[2],"Of":[3],"Interest":[4],"(ROI)":[5],"with":[6,35,115],"better":[7],"quality":[8],"than":[9,100],"background":[11],"has":[12,119],"many":[13],"applications":[14],"including":[15],"video":[16,19],"conferencing":[17],"systems,":[18],"surveillance":[20],"and":[21,77,103,123],"object-oriented":[22],"vision":[23],"tasks.":[24],"In":[25],"this":[26],"paper,":[27],"we":[28,68],"propose":[29],"a":[30],"ROI-based":[31],"image":[32],"compression":[33],"framework":[34],"Swin":[36],"transformers":[37],"as":[38],"main":[39],"building":[40],"blocks":[41],"for":[42,88,107],"autoencoder":[44],"network.":[45],"The":[46],"binary":[47],"ROI":[48,66,76,98],"mask":[49],"is":[50],"integrated":[51],"into":[52],"different":[53,89],"layers":[54],"of":[55,74],"network":[57],"to":[58],"provide":[59],"spatial":[60],"information":[61],"guidance.":[62],"Based":[63],"on":[64,112,127],"mask,":[67],"can":[69],"control":[70],"relative":[72],"importance":[73],"non-ROI":[78],"by":[79],"modifying":[80],"corresponding":[82],"Lagrange":[83],"multiplier":[84],"$":[85,87],"\\lambda":[86],"regions.":[90],"Experimental":[91],"results":[92],"show":[93],"our":[94],"model":[95],"achieves":[96],"higher":[97],"PSNR":[99,106],"other":[101],"methods":[102],"modest":[104],"average":[105],"human":[108],"evaluation.":[109],"When":[110],"tested":[111],"models":[113],"pre-trained":[114],"original":[116],"images,":[117],"it":[118],"superior":[120],"object":[121],"detection":[122],"instance":[124],"segmentation":[125],"performance":[126],"COCO":[129],"validation":[130],"dataset.":[131]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4376652989","counts_by_year":[],"updated_date":"2025-04-14T09:48:57.480455","created_date":"2023-05-17"}