{"id":"https://openalex.org/W4221150810","doi":"https://doi.org/10.48550/arxiv.2203.10247","title":"HIPA: Hierarchical Patch Transformer for Single Image Super Resolution","display_name":"HIPA: Hierarchical Patch Transformer for Single Image Super Resolution","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4221150810","doi":"https://doi.org/10.48550/arxiv.2203.10247"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.10247","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":null,"is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"journal-article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2203.10247","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111582622","display_name":"Qing Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Qing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108429353","display_name":"Yiming Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Yiming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100753458","display_name":"Jinxing Li","orcid":"https://orcid.org/0000-0001-5156-0305"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jinxing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100308848","display_name":"Jun Lv","orcid":"https://orcid.org/0000-0003-4328-0420"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081300658","display_name":"Yee\u2010Hong Yang","orcid":"https://orcid.org/0000-0002-7194-3327"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yee-Hong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103150943","display_name":"Feng Wu","orcid":"https://orcid.org/0000-0001-7266-5579"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Feng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100325058","display_name":"David Zhang","orcid":"https://orcid.org/0000-0002-5027-5286"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, David","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":59},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9918,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.4404582}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7535701},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6278596},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5121064},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.45267582},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.4404582},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34848666},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.08889535},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.10247","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.10247","pdf_url":"http://arxiv.org/pdf/2203.10247","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2203.10247","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.10247","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":null,"is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":["https://openalex.org/W4378804909"],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3116076068","https://openalex.org/W2951359407","https://openalex.org/W2775347418","https://openalex.org/W2772917594","https://openalex.org/W2755342338","https://openalex.org/W2229312674","https://openalex.org/W2166024367","https://openalex.org/W2079911747","https://openalex.org/W2058170566","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Transformer-based":[0],"architectures":[1],"start":[2,82],"to":[3,92,148,165,173,187],"emerge":[4],"in":[5,77],"single":[6],"image":[7,60,76,118],"super":[8],"resolution":[9,59],"(SISR)":[10],"and":[11,89,130,215],"have":[12],"achieved":[13],"promising":[14],"performance.":[15],"Most":[16],"existing":[17],"Vision":[18],"Transformers":[19],"divide":[20],"images":[21],"into":[22],"the":[23,57,93,150,170,189,204,208],"same":[24],"number":[25],"of":[26,43,207],"patches":[27,39],"with":[28,40,83,85,127],"a":[29,50,62,69,97,122,131,138,181],"fixed":[30],"size,":[31],"which":[32,154,168],"may":[33],"not":[34,101],"be":[35,157],"optimal":[36],"for":[37,116,125,134,144],"restoring":[38],"different":[41,117,163,166,194],"levels":[42],"texture":[44],"richness.":[45],"This":[46],"paper":[47],"presents":[48],"HIPA,":[49],"novel":[51],"Transformer":[52,145],"architecture":[53],"that":[54,72],"progressively":[55],"recovers":[56],"high":[58],"using":[61,121],"hierarchical":[63,98],"patch":[64,87,99,124,133],"partition.":[65],"Specifically,":[66],"we":[67,81,178],"build":[68],"cascaded":[70],"model":[71],"processes":[73],"an":[74],"input":[75],"multiple":[78,108],"stages,":[79],"where":[80],"tokens":[84,155],"small":[86],"sizes":[88],"gradually":[90],"merge":[91],"full":[94],"resolution.":[95],"Such":[96],"mechanism":[100],"only":[102],"explicitly":[103],"enables":[104],"feature":[105],"aggregation":[106],"at":[107],"resolutions":[109],"but":[110],"also":[111,179],"adaptively":[112],"learns":[113],"patch-aware":[114],"features":[115],"regions,":[119],"e.g.,":[120],"smaller":[123],"areas":[126],"fine":[128],"details":[129],"larger":[132],"textureless":[135],"regions.":[136],"Meanwhile,":[137],"new":[139,182],"attention-based":[140],"position":[141],"encoding":[142],"scheme":[143],"is":[146,169],"proposed":[147,209],"let":[149],"network":[151],"focus":[152],"on":[153,199],"should":[156],"paid":[158],"more":[159],"attention":[160,185],"by":[161],"assigning":[162],"weights":[164],"tokens,":[167],"first":[171],"time":[172],"our":[174],"best":[175],"knowledge.":[176],"Furthermore,":[177],"propose":[180],"multi-reception":[183],"field":[184,192],"module":[186],"enlarge":[188],"convolution":[190],"reception":[191],"from":[193],"branches.":[195],"The":[196],"experimental":[197],"results":[198],"several":[200],"public":[201],"datasets":[202],"demonstrate":[203],"superior":[205],"performance":[206],"HIPA":[210],"over":[211],"previous":[212],"methods":[213],"quantitatively":[214],"qualitatively.":[216]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4221150810","counts_by_year":[],"updated_date":"2025-03-19T08:21:39.271144","created_date":"2022-04-03"}