{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T16:36:36Z","timestamp":1732034196372},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,5,28]],"date-time":"2012-05-28T00:00:00Z","timestamp":1338163200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Source Code Biol Med"],"published-print":{"date-parts":[[2012,12]]},"DOI":"10.1186\/1751-0473-7-7","type":"journal-article","created":{"date-parts":[[2012,6,1]],"date-time":"2012-06-01T08:31:05Z","timestamp":1338539465000},"source":"Crossref","is-referenced-by-count":73,"title":["Layout-aware text extraction from full-text PDF of scientific articles"],"prefix":"10.1186","volume":"7","author":[{"given":"Cartic","family":"Ramakrishnan","sequence":"first","affiliation":[]},{"given":"Abhishek","family":"Patnia","sequence":"additional","affiliation":[]},{"given":"Eduard","family":"Hovy","sequence":"additional","affiliation":[]},{"given":"Gully APC","family":"Burns","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,5,28]]},"reference":[{"issue":"2","key":"72_CR1","doi-asserted-by":"publisher","first-page":"e65","DOI":"10.1371\/journal.pbio.0030065","volume":"3","author":"D Rebholz-Schuhmann","year":"2005","unstructured":"Rebholz-Schuhmann D, Kirsch H, et al: Facts from text\u2013is text mining ready to deliver?. PLoS Biol. 2005, 3 (2): e65-10.1371\/journal.pbio.0030065.","journal-title":"PLoS Biol"},{"issue":"Suppl 2","key":"72_CR2","doi-asserted-by":"publisher","first-page":"S7","DOI":"10.1186\/gb-2008-9-s2-s7","volume":"9","author":"RB Altman","year":"2008","unstructured":"Altman RB, Bergman CM, et al: Text mining for biology\u2013the way forward: opinions from leading scientists. Genome Biol. 2008, 9 (Suppl 2): S7-10.1186\/gb-2008-9-s2-s7.","journal-title":"Genome Biol"},{"key":"72_CR3","first-page":"104","volume-title":"Biomedical named entity recognition using conditional random fields and rich feature sets.Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and its Applications","author":"B Settles","year":"2004","unstructured":"Settles B: Biomedical named entity recognition using conditional random fields and rich feature sets.Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and its Applications. 2004, Association for Computational Linguistics, Geneva, 104-107."},{"key":"72_CR4","first-page":"430","volume-title":"Proceedings of the 42nd Annual Meeting on Association for Computational Linguistics","author":"B Rosario","year":"2004","unstructured":"Rosario B, Hearst MA: Classifying semantic relations in bioscience texts. Proceedings of the 42nd Annual Meeting on Association for Computational Linguistics. 2004, Association for Computational Linguistics, Barcelona, 430."},{"issue":"Suppl 8","key":"72_CR5","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/1471-2105-12-S8-S3","volume":"12","author":"M Krallinger","year":"2011","unstructured":"Krallinger M, Vazquez M, et al: The Protein-Protein Interaction tasks of BioCreative III: classification\/ranking of articles and linking bio-ontology concepts to full text. BMC Bioinformatics. 2011, 12 (Suppl 8): S3-10.1186\/1471-2105-12-S8-S3.","journal-title":"BMC Bioinformatics"},{"key":"72_CR6","first-page":"4","volume":"11","author":"HW Chun","year":"2006","unstructured":"Chun HW, Tsuruoka Y, Kim JD, Shiba R, Nagata N, Hishiki T, Tsujii J: Extraction of gene-disease relations from Medline using domain dictionaries and machine learning. Pac Symp Biocomput. 2006, 11: 4-15.","journal-title":"Pac Symp Biocomput"},{"key":"72_CR7","doi-asserted-by":"publisher","first-page":"492","DOI":"10.1186\/1471-2105-11-492","volume":"11","author":"KB Cohen","year":"2010","unstructured":"Cohen KB, Johnson HL, et al: The structural and content aspects of abstracts versus bodies of full text journal articles are different. BMC Bioinformatics. 2010, 11: 492-10.1186\/1471-2105-11-492.","journal-title":"BMC Bioinformatics"},{"key":"72_CR8","first-page":"556","volume":"567","author":"B Alex","year":"2008","unstructured":"Alex B, Grover C, et al: Assisted curation: does text mining really help?. Pac Symp Biocomput. 2008, 567: 556-567.","journal-title":"Pac Symp Biocomput"},{"key":"72_CR9","doi-asserted-by":"publisher","first-page":"398","DOI":"10.1109\/WIIAT.2008.295","volume-title":"Proceedings of the 2008 IEEE\/WIC\/ACM International Conference on Web Intelligence and Intelligent Agent Technology - Volume 01","author":"C Ramakrishnan","year":"2008","unstructured":"Ramakrishnan C, Mendes PN, et al: Joint Extraction of Compound Entities and Relationships from Biomedical Literature. Proceedings of the 2008 IEEE\/WIC\/ACM International Conference on Web Intelligence and Intelligent Agent Technology - Volume 01. 2008, IEEE Computer Society, Sydney, 398-401."},{"key":"72_CR10","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1007\/978-3-540-87696-0_15","volume-title":"Proceedings of the 16th international conference on Knowledge Engineering: Practice and Patterns","author":"C Ramakrishnan","year":"2008","unstructured":"Ramakrishnan C, Mendes PN, et al: Unsupervised Discovery of Compound Entities for Relationship Extraction. Proceedings of the 16th international conference on Knowledge Engineering: Practice and Patterns. 2008, Springer-Verlag, Acitrezza, 146-155."},{"issue":"Suppl 10","key":"72_CR11","doi-asserted-by":"publisher","first-page":"S19","DOI":"10.1186\/1471-2105-12-S10-S19","volume":"12","author":"S Roy","year":"2011","unstructured":"Roy S, Heinrich K, et al: Latent Semantic Indexing of PubMed abstracts for identification of transcription factor candidates from microarray derived gene sets. BMC Bioinformatics. 2011, 12 (Suppl 10): S19-10.1186\/1471-2105-12-S10-S19.","journal-title":"BMC Bioinformatics"},{"key":"72_CR12","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1186\/1747-5333-1-4","volume":"1","author":"AM Cohen","year":"2006","unstructured":"Cohen AM, Hersh WR: The TREC 2004 genomics track categorization task: classifying full text biomedical documents. J Biomed Discov Collab. 2006, 1: 4-10.1186\/1747-5333-1-4.","journal-title":"J Biomed Discov Collab"},{"issue":"10","key":"72_CR13","doi-asserted-by":"publisher","first-page":"e142","DOI":"10.1371\/journal.pcbi.0020142","volume":"2","author":"P Bourne","year":"2006","unstructured":"Bourne P, McEntyre J: Biocurators: contributors to the world of science. PLoS Comput Biol. 2006, 2 (10): e142-10.1371\/journal.pcbi.0020142.","journal-title":"PLoS Comput Biol"},{"issue":"Suppl 2","key":"72_CR14","doi-asserted-by":"publisher","first-page":"S1","DOI":"10.1186\/gb-2008-9-s2-s1","volume":"9","author":"M Krallinger","year":"2008","unstructured":"Krallinger M, Morgan A, et al: Evaluation of text-mining systems for biology: overview of the Second BioCreative community challenge. Genome Biol. 2008, 9 (Suppl 2): S1-10.1186\/gb-2008-9-s2-s1. Epub 2008 Sep 1","journal-title":"Genome Biol"},{"issue":"Suppl 2","key":"72_CR15","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/gb-2008-9-s2-s3","volume":"9","author":"AA Morgan","year":"2008","unstructured":"Morgan AA, Lu Z, et al: Overview of BioCreative II gene normalization. Genome Biol. 2008, 9 (Suppl 2): S3-10.1186\/gb-2008-9-s2-s3.","journal-title":"Genome Biol"},{"key":"72_CR16","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1093\/database\/bap019","volume":"2009","author":"KG Dowell","year":"2009","unstructured":"Dowell KG, McAndrews-Hill MS, et al: Integrating text mining into the MGI biocuration workflow. Database. 2009, 2009: 11.","journal-title":"Database"},{"issue":"1","key":"72_CR17","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/0004-3702(82)90020-0","volume":"19","author":"CL Forgy","year":"1982","unstructured":"Forgy CL: Rete: a fast algorithm for the many pattern\/many object pattern match problem. Artif Intell. 1982, 19 (1): 17-37. 10.1016\/0004-3702(82)90020-0.","journal-title":"Artif Intell"},{"issue":"3","key":"72_CR18","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1016\/0022-2836(70)90057-4","volume":"48","author":"SB Needleman","year":"1970","unstructured":"Needleman SB, Wunsch CD: A general method applicable to the search for similarities in the amino acid sequence of two proteins. J Mol Biol. 1970, 48 (3): 443-453. 10.1016\/0022-2836(70)90057-4.","journal-title":"J Mol Biol"},{"key":"72_CR19","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1109\/ICDAR.1995.601965","volume-title":"Proceedings of the Third International Conference on Document Analysis and Recognition (Volume 2) - Volume 2","author":"A Dengel","year":"1995","unstructured":"Dengel A, Dubiel F: Clustering and classification of document structure-a machine learning approach. Proceedings of the Third International Conference on Document Analysis and Recognition (Volume 2) - Volume 2. 1995, IEEE Computer Society, Washington, 587."},{"key":"72_CR20","doi-asserted-by":"publisher","first-page":"466","DOI":"10.1109\/ICDAR.1995.599037","volume-title":"the Proceedings of the Third International Conference on Document Analysis and Recognition","author":"F Esposito","year":"1995","unstructured":"Esposito F, Malerba D, et al: A Knowledge-Based Approach to the Layout Analysis. the Proceedings of the Third International Conference on Document Analysis and Recognition. 1995, Society Press, Montreal, 466-471."},{"key":"72_CR21","volume-title":"Automatic Discovery of Logical Document Structure. Technical Report","author":"Kristen Summers","year":"1998","unstructured":"Summers Kristen: Automatic Discovery of Logical Document Structure. Technical Report. 1998, Cornell University, Ithaca"},{"issue":"4","key":"72_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.4018\/jdls.2010100101","volume":"1","author":"M-T Luong","year":"2011","unstructured":"Luong M-T, Nguyen TD, Kan M-Y: Logical structure recovery in scholarly articles with rich document features. International Journal of Digital Library Systems (IJDLS). 2011, 1 (4): 1-23.","journal-title":"International Journal of Digital Library Systems (IJDLS)"},{"key":"72_CR23","first-page":"282","volume-title":"Proceedings of the Eighteenth International Conference on Machine Learning","author":"JD Lafferty","year":"2001","unstructured":"Lafferty JD, McCallum A, et al: Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Sequence Data. Proceedings of the Eighteenth International Conference on Machine Learning. 2001, Morgan Kaufmann Publishers Inc, San Francisco, 282-289."},{"issue":"18","key":"72_CR24","doi-asserted-by":"publisher","first-page":"i568","DOI":"10.1093\/bioinformatics\/btq383","volume":"26","author":"TK Attwood","year":"2010","unstructured":"Attwood TK, Kell DB, et al: Utopia documents: linking scholarly literature with research data. Bioinformatics. 2010, 26 (18): i568-i574. 10.1093\/bioinformatics\/btq383.","journal-title":"Bioinformatics"},{"key":"72_CR25","doi-asserted-by":"publisher","first-page":"362","DOI":"10.1186\/1471-2105-12-362","volume":"12","author":"B Vroling","year":"2011","unstructured":"Vroling B, Thorne D, et al: Integrating GPCR-specific information with full text articles. BMC Bioinformatics. 2011, 12: 362-10.1186\/1471-2105-12-362.","journal-title":"BMC Bioinformatics"},{"key":"72_CR26","doi-asserted-by":"crossref","first-page":"1311","DOI":"10.1145\/1458082.1458255","volume-title":"Proceeding of the 17th ACM conference on Information and knowledge management","author":"Y Liu","year":"2008","unstructured":"Liu Y, Mitra P, et al: Identifying table boundaries in digital documents via sparse line detection. Proceeding of the 17th ACM conference on Information and knowledge management. 2008, ACM, Napa Valley, 1311-1320."},{"key":"72_CR27","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1109\/BIBE.2001.974420","volume-title":"Proceedings of the 2nd IEEE International Symposium on Bioinformatics and Bioengineering","author":"RF Murphy","year":"2001","unstructured":"Murphy RF, Velliste M, et al: Searching Online Journals for Fluorescence Microscope Images Depicting Protein Subcellular Location Patterns. Proceedings of the 2nd IEEE International Symposium on Bioinformatics and Bioengineering. 2001, IEEE Computer Society, Washington, 119."},{"key":"72_CR28","volume-title":"Proceedings of the Sixth International Language Resources and Evaluation (LREC'08)","author":"C Lee Giles","year":"2008","unstructured":"Lee Giles C, Councill I, Kan M-Y: ParsCit: an Open-source CRF Reference String Parsing Package. Proceedings of the Sixth International Language Resources and Evaluation (LREC'08). 2008, European Language Resources Association (ELRA), Marrakech"},{"key":"72_CR29","volume-title":"Paper at Workshop Beyond the PDF","author":"P Ciccarese","year":"2011","unstructured":"Ciccarese P, Attwood T, et al: A Round-Trip to the Annotation Store: Open, Transferable Semantic Annotation of Biomedical Publications. Paper at Workshop Beyond the PDF. 2011"},{"issue":"Suppl 2","key":"72_CR30","doi-asserted-by":"publisher","first-page":"S4","DOI":"10.1186\/2041-1480-2-S2-S4","volume":"2","author":"P Ciccarese","year":"2011","unstructured":"Ciccarese P, Ocana M, Garcia Castro LJ, Das S, Clark T: An open annotation ontology for science on web 3.0. J Biomed Semantics. 2011 May 17, 2 (Suppl 2): S4-10.1186\/2041-1480-2-S2-S4.","journal-title":"J Biomed Semantics"}],"container-title":["Source Code for Biology and Medicine"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1751-0473-7-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1751-0473-7-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1751-0473-7-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,16]],"date-time":"2022-01-16T15:24:29Z","timestamp":1642346669000},"score":1,"resource":{"primary":{"URL":"https:\/\/scfbm.biomedcentral.com\/articles\/10.1186\/1751-0473-7-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,5,28]]},"references-count":30,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,12]]}},"alternative-id":["72"],"URL":"https:\/\/doi.org\/10.1186\/1751-0473-7-7","relation":{},"ISSN":["1751-0473"],"issn-type":[{"value":"1751-0473","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,5,28]]},"article-number":"7"}}