{"id":"https://openalex.org/W4401306479","doi":"https://doi.org/10.48550/arxiv.2407.21284","title":"Robust Box Prompt based SAM for Medical Image Segmentation","display_name":"Robust Box Prompt based SAM for Medical Image Segmentation","publication_year":2024,"publication_date":"2024-07-30","ids":{"openalex":"https://openalex.org/W4401306479","doi":"https://doi.org/10.48550/arxiv.2407.21284"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.21284","pdf_url":"http://arxiv.org/pdf/2407.21284","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2407.21284","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101740599","display_name":"Yuhao Huang","orcid":"https://orcid.org/0000-0002-0126-1857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Yuhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017262410","display_name":"Xin Yang","orcid":"https://orcid.org/0000-0003-4653-6524"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100784571","display_name":"Han Zhou","orcid":"https://orcid.org/0000-0003-3778-4075"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Han","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103221780","display_name":"Yan Cao","orcid":"https://orcid.org/0000-0001-5510-9773"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088178652","display_name":"Haoran Dou","orcid":"https://orcid.org/0000-0001-8628-5489"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dou, Haoran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022631295","display_name":"Fajin Dong","orcid":"https://orcid.org/0000-0002-4558-4885"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Fajin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5065374358","display_name":"Dong Ni","orcid":"https://orcid.org/0000-0002-9146-6003"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ni, Dong","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9813,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9813,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9755,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9089,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5648258},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5512081},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5217308},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.51978743},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.51197135},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.50139475}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.21284","pdf_url":"http://arxiv.org/pdf/2407.21284","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.21284","pdf_url":"http://arxiv.org/pdf/2407.21284","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3116076068","https://openalex.org/W2951359407","https://openalex.org/W2775347418","https://openalex.org/W2772917594","https://openalex.org/W2755342338","https://openalex.org/W2229312674","https://openalex.org/W2166024367","https://openalex.org/W2079911747","https://openalex.org/W2058170566","https://openalex.org/W1969923398"],"abstract_inverted_index":{"The":[0],"Segment":[1],"Anything":[2],"Model":[3],"(SAM)":[4],"can":[5,132,145],"achieve":[6],"satisfactory":[7],"segmentation":[8,47,113,155],"performance":[9,48],"under":[10,49],"high-quality":[11,84],"box":[12,23,80],"prompts.":[13],"However,":[14],"SAM's":[15,46],"robustness":[16,142],"is":[17,56],"compromised":[18],"by":[19],"the":[20,68,73,78,111,123,127,134,141,152,166],"decline":[21],"in":[22,28],"quality,":[24],"limiting":[25],"its":[26],"practicality":[27],"clinical":[29],"reality.":[30],"In":[31],"this":[32],"study,":[33],"we":[34,59,98,116],"propose":[35,60],"a":[36,61,83,100,118],"novel":[37],"Robust":[38],"Box":[39],"prompt":[40,62,81,95,101],"based":[41],"SAM":[42,144],"(\\textbf{RoBox-SAM})":[43],"to":[44,65,75,104,109,121],"ensure":[45],"prompts":[50,108],"with":[51],"different":[52],"qualities.":[53],"Our":[54],"contribution":[55],"three-fold.":[57],"First,":[58],"refinement":[63],"module":[64,103],"implicitly":[66],"perceive":[67],"potential":[69],"targets,":[70],"and":[71,137,162],"output":[72],"offsets":[74],"directly":[76],"transform":[77],"low-quality":[79],"into":[82],"one.":[85],"We":[86],"then":[87],"provide":[88],"an":[89],"online":[90],"iterative":[91],"strategy":[92],"for":[93],"further":[94,147],"refinement.":[96],"Second,":[97],"introduce":[99],"enhancement":[102],"automatically":[105],"generate":[106],"point":[107],"assist":[110],"box-promptable":[112],"effectively.":[114],"Last,":[115],"build":[117],"self-information":[119],"extractor":[120],"encode":[122],"prior":[124],"information":[125],"from":[126],"input":[128],"image.":[129],"These":[130],"features":[131],"optimize":[133],"image":[135],"embeddings":[136],"attention":[138],"calculation,":[139],"thus,":[140],"of":[143,168],"be":[146],"enhanced.":[148],"Extensive":[149],"experiments":[150],"on":[151],"large":[153],"medical":[154],"dataset":[156],"including":[157],"99,299":[158],"images,":[159],"5":[160],"modalities,":[161],"25":[163],"organs/targets":[164],"validated":[165],"efficacy":[167],"our":[169],"proposed":[170],"RoBox-SAM.":[171]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4401306479","counts_by_year":[],"updated_date":"2024-12-15T13:53:13.795679","created_date":"2024-08-04"}