{"id":"https://openalex.org/W2095366181","doi":"https://doi.org/10.1117/12.662918","title":"<title>Complex document information processing: prototype, test collection, and evaluation</title>","display_name":"<title>Complex document information processing: prototype, test collection, and evaluation</title>","publication_year":2006,"publication_date":"2006-01-15","ids":{"openalex":"https://openalex.org/W2095366181","doi":"https://doi.org/10.1117/12.662918","mag":"2095366181"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.662918","pdf_url":null,"source":{"id":"https://openalex.org/S183492911","display_name":"Proceedings of SPIE, the International Society for Optical Engineering/Proceedings of SPIE","issn_l":"0277-786X","issn":["0277-786X","1996-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315543","host_organization_name":"SPIE","host_organization_lineage":["https://openalex.org/P4310315543"],"host_organization_lineage_names":["SPIE"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023698748","display_name":"Gady Agam","orcid":null},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"G. Agam","raw_affiliation_strings":["Illinois Institute of Technology, United#N# States"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, United#N# States","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013934685","display_name":"Shlomo Argamon","orcid":"https://orcid.org/0000-0001-8699-324X"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. Argamon","raw_affiliation_strings":["Illinois Institute of Technology, United#N# States"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, United#N# States","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062591304","display_name":"Ophir Frieder","orcid":"https://orcid.org/0000-0001-5076-8171"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"O. Frieder","raw_affiliation_strings":["Illinois Institute of Technology, United#N# States"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, United#N# States","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109992497","display_name":"D. Grossman","orcid":null},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"D. Grossman","raw_affiliation_strings":["Illinois Institute of Technology, United#N# States"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, United#N# States","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020081385","display_name":"David Lewis","orcid":"https://orcid.org/0000-0002-3503-4644"},"institutions":[{"id":"https://openalex.org/I4210148173","display_name":"Morgan, Lewis & Bockius (United States)","ror":"https://ror.org/04c0z3e83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210148173"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"D. Lewis","raw_affiliation_strings":["David D. Lewis Consulting (United States)"],"affiliations":[{"raw_affiliation_string":"David D. Lewis Consulting (United States)","institution_ids":["https://openalex.org/I4210148173"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.277,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":19,"citation_normalized_percentile":{"value":0.876005,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":86,"max":87},"biblio":{"volume":"6067","issue":null,"first_page":"60670N","last_page":"11"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9932,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.687331},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance","score":0.42113096}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8816732},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.762812},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.75073606},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.7477727},{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.687331},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.48167905},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.42113096},{"id":"https://openalex.org/C68699486","wikidata":"https://www.wikidata.org/wiki/Q265904","display_name":"Document Structure Description","level":3,"score":0.41576335},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.41487038},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.39778283},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.22072738},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16408068},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.11608344},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.662918","pdf_url":null,"source":{"id":"https://openalex.org/S183492911","display_name":"Proceedings of SPIE, the International Society for Optical Engineering/Proceedings of SPIE","issn_l":"0277-786X","issn":["0277-786X","1996-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315543","host_organization_name":"SPIE","host_organization_lineage":["https://openalex.org/P4310315543"],"host_organization_lineage_names":["SPIE"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.41}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3166464480","https://openalex.org/W3118925046","https://openalex.org/W2561540377","https://openalex.org/W2507888814","https://openalex.org/W2388180914","https://openalex.org/W2381764175","https://openalex.org/W2374694510","https://openalex.org/W2360066868","https://openalex.org/W2027154813","https://openalex.org/W1694630026"],"abstract_inverted_index":{"Analysis":[0],"of":[1,4,53,70,83,90,125,128,154,156,163,168],"large":[2,76],"collections":[3],"complex":[5,106,139],"documents":[6,16,18,31,85],"is":[7,79],"an":[8],"increasingly":[9],"important":[10],"need":[11],"for":[12,74,149,177],"numerous":[13],"applications.":[14],"Complex":[15],"are":[17,26,132],"that":[19],"typically":[20],"start":[21],"out":[22],"on":[23,160],"paper":[24],"and":[25,36,59,64,108,158,165],"then":[27,109],"electronically":[28],"scanned.":[29],"These":[30],"have":[32,47],"rich":[33,102],"internal":[34],"structure":[35],"might":[37],"only":[38],"be":[39],"available":[40],"in":[41,93],"image":[42],"form.":[43],"Additionally,":[44],"they":[45],"may":[46],"been":[48],"produced":[49],"by":[50,57],"a":[51,75,105,122,135,152,161],"combination":[52],"printing":[54],"technologies":[55],"(or":[56],"handwriting);":[58],"include":[60,146],"diagrams,":[61],"graphics,":[62],"tables":[63],"other":[65],"non-textual":[66],"elements.":[67],"The":[68,143],"state":[69],"the":[71,115,126],"art":[72],"today":[73],"document":[77,107,140],"collection":[78,144],"essentially":[80],"text":[81,118],"search":[82],"OCR'd":[84],"with":[86,117],"no":[87],"meaningful":[88],"use":[89],"data":[91],"found":[92],"images,":[94],"signatures,":[95],"logos,":[96],"etc.":[97],"Our":[98],"prototype":[99],"automatically":[100],"generates":[101],"metadata":[103,116],"about":[104],"applies":[110],"query":[111],"tools":[112],"to":[113],"integrate":[114],"search.":[119],"To":[120],"ensure":[121],"thorough":[123],"evaluation":[124],"effectiveness":[127],"our":[129],"prototype,":[130],"we":[131],"also":[133],"developing":[134],"roughly":[136],"42,000,000":[137],"page":[138],"test":[141],"collection.":[142],"will":[145],"relevance":[147],"judgments":[148],"queries":[150,175],"at":[151],"variety":[153,162],"levels":[155],"detail":[157],"depending":[159],"content":[164],"structural":[166],"characteristics":[167],"documents,":[169],"as":[170,172],"well":[171],"\"known":[173],"item\"":[174],"looking":[176],"particular":[178],"documents.":[179]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2095366181","counts_by_year":[{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":2}],"updated_date":"2024-12-15T19:40:46.741696","created_date":"2016-06-24"}