{"id":"https://openalex.org/W4283830263","doi":"https://doi.org/10.48550/arxiv.2207.01220","title":"BusiNet -- a Light and Fast Text Detection Network for Business Documents","display_name":"BusiNet -- a Light and Fast Text Detection Network for Business Documents","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4283830263","doi":"https://doi.org/10.48550/arxiv.2207.01220"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2207.01220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2207.01220","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020146315","display_name":"Oshri Naparstek","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naparstek, Oshri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005382374","display_name":"Ophir Azulai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Azulai, Ophir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015846077","display_name":"Daniel Rotman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rotman, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047695006","display_name":"Yevgeny Burshtein","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Burshtein, Yevgeny","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024778597","display_name":"Peter Staar","orcid":"https://orcid.org/0000-0002-8088-0823"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Staar, Peter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5047102702","display_name":"Udi Barzelay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barzelay, Udi","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":60},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9894,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9893,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.71485144},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.6431448}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8292488},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.71485144},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.6431448},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.54219365},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.49538386},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.47994664},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4589968},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40059158},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.341251},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.25342897},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.16325942},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2207.01220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.01220","pdf_url":"http://arxiv.org/pdf/2207.01220","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2207.01220","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2207.01220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.83,"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4361862506","https://openalex.org/W4321854979","https://openalex.org/W4312214821","https://openalex.org/W3037018281","https://openalex.org/W2972592048","https://openalex.org/W2944823289","https://openalex.org/W2497626292","https://openalex.org/W2390344072","https://openalex.org/W2358319515","https://openalex.org/W2003209439"],"abstract_inverted_index":{"For":[0],"digitizing":[1],"or":[2,29],"indexing":[3],"physical":[4],"documents,":[5,18],"Optical":[6],"Character":[7],"Recognition":[8],"(OCR),":[9],"the":[10,46,139],"process":[11],"of":[12,48,63,144],"extracting":[13],"textual":[14],"information":[15,71],"from":[16],"scanned":[17,107],"is":[19,26,103,119],"a":[20,24,55,80,113],"vital":[21],"technology.":[22],"When":[23],"document":[25,108],"visually":[27],"damaged":[28],"contains":[30],"non-textual":[31],"elements,":[32],"existing":[33],"technologies":[34],"can":[35,43],"yield":[36],"poor":[37],"results,":[38],"as":[39,73],"erroneous":[40],"detection":[41,56],"results":[42],"greatly":[44],"affect":[45],"quality":[47],"OCR.":[49,84],"In":[50],"this":[51],"paper":[52],"we":[53],"present":[54],"network":[57],"dubbed":[58],"BusiNet":[59,85,102],"aimed":[60],"at":[61],"OCR":[62],"business":[64],"documents.":[65],"Business":[66],"documents":[67],"often":[68],"include":[69],"sensitive":[70],"and":[72,91,110,141],"such":[74],"they":[75],"cannot":[76],"be":[77,89],"uploaded":[78],"to":[79,88,105,122],"cloud":[81],"service":[82],"for":[83],"was":[86],"designed":[87],"fast":[90],"light":[92],"so":[93],"it":[94],"could":[95],"run":[96],"locally":[97],"preventing":[98],"privacy":[99],"issues.":[100],"Furthermore,":[101],"built":[104],"handle":[106],"corruption":[109],"noise":[111,124],"using":[112],"specialized":[114],"synthetic":[115],"dataset.":[116],"The":[117],"model":[118],"made":[120],"robust":[121],"unseen":[123],"by":[125],"employing":[126],"adversarial":[127],"training":[128],"strategies.":[129],"We":[130],"perform":[131],"an":[132],"evaluation":[133],"on":[134],"publicly":[135],"available":[136],"datasets":[137],"demonstrating":[138],"usefulness":[140],"broad":[142],"applicability":[143],"our":[145],"model.":[146]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4283830263","counts_by_year":[],"updated_date":"2024-12-09T20:26:23.128561","created_date":"2022-07-07"}