{"id":"https://openalex.org/W4404388980","doi":"https://doi.org/10.48550/arxiv.2411.05026","title":"Deep Learning and Machine Learning -- Natural Language Processing: From\n Theory to Application","display_name":"Deep Learning and Machine Learning -- Natural Language Processing: From\n Theory to Application","publication_year":2024,"publication_date":"2024-10-30","ids":{"openalex":"https://openalex.org/W4404388980","doi":"https://doi.org/10.48550/arxiv.2411.05026"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.05026","pdf_url":"http://arxiv.org/pdf/2411.05026","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2411.05026","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101430780","display_name":"Keyu Chen","orcid":"https://orcid.org/0000-0003-0808-2533"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Keyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062469562","display_name":"Fei Cheng","orcid":"https://orcid.org/0000-0003-4808-8470"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fei, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108304756","display_name":"Ziqian Bi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bi, Ziqian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100682738","display_name":"Junyu Liu","orcid":"https://orcid.org/0000-0002-4293-1247"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Junyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074724383","display_name":"Benji Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Benji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100378899","display_name":"Sen Zhang","orcid":"https://orcid.org/0000-0003-1409-5795"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Sen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091365447","display_name":"Xiaoyong Pan","orcid":"https://orcid.org/0000-0001-5010-464X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Xuanhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101432897","display_name":"Jiawei Xu","orcid":"https://orcid.org/0000-0002-2732-086X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jiawei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047629664","display_name":"Jinlang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jinlang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020602843","display_name":"Caitlyn Heqi Yin","orcid":"https://orcid.org/0009-0006-5037-8716"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Caitlyn Heqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100625408","display_name":"Yichao Zhang","orcid":"https://orcid.org/0000-0002-9931-4733"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yichao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112984429","display_name":"Peiyong Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Pohsun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111363143","display_name":"Yizhu Wen","orcid":"https://orcid.org/0009-0008-0479-4991"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Yizhu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100656834","display_name":"Tianyang Wang","orcid":"https://orcid.org/0000-0003-3184-0566"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Tianyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104361565","display_name":"Ming Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Ming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023639734","display_name":"Jin\u2010Tao Ren","orcid":"https://orcid.org/0000-0001-8017-9546"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Jintao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001865341","display_name":"Qian Niu","orcid":"https://orcid.org/0000-0001-7139-384X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niu, Qian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102807454","display_name":"Silin Chen","orcid":"https://orcid.org/0000-0003-4073-3375"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Silin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002433369","display_name":"Wilson C. Hsieh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hsieh, Weiche","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035357574","display_name":"Lingzhi Yan","orcid":"https://orcid.org/0000-0002-1530-7940"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Lawrence K. Q.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114664487","display_name":"Chia Xin Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Chia Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101786912","display_name":"Xu Han","orcid":"https://orcid.org/0000-0003-0068-0117"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Han","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034788095","display_name":"H. Eric Tseng","orcid":"https://orcid.org/0000-0001-9544-4226"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tseng, Hong-Ming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006004614","display_name":"Xinyuan Song","orcid":"https://orcid.org/0000-0002-4877-3200"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Xinyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100343852","display_name":"Ming Liu","orcid":"https://orcid.org/0000-0001-6239-1180"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ming","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.0517,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.0517,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.58747447},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.54645735},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.53243655},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5196946},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46686745},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.15695328},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.07865599}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.05026","pdf_url":"http://arxiv.org/pdf/2411.05026","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.05026","pdf_url":"http://arxiv.org/pdf/2411.05026","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4360585206","https://openalex.org/W4323565446","https://openalex.org/W4321369474","https://openalex.org/W4285208911","https://openalex.org/W4213079790","https://openalex.org/W3215138031","https://openalex.org/W3082895349","https://openalex.org/W3009238340","https://openalex.org/W2731899572","https://openalex.org/W2248239756"],"abstract_inverted_index":{"With":[0],"a":[1],"focus":[2],"on":[3],"natural":[4],"language":[5,13],"processing":[6,52,97],"(NLP)":[7],"and":[8,25,46,53,64,87,98,110],"the":[9,18,65],"role":[10],"of":[11,20,67,95],"large":[12],"models":[14],"(LLMs),":[15],"we":[16],"explore":[17],"intersection":[19],"machine":[21],"learning,":[22,24],"deep":[23],"artificial":[26,29],"intelligence.":[27],"As":[28],"intelligence":[30],"continues":[31],"to":[32,37,104],"revolutionize":[33],"fields":[34],"from":[35],"healthcare":[36],"finance,":[38],"NLP":[39],"techniques":[40,63],"such":[41,80],"as":[42,81],"tokenization,":[43],"text":[44],"classification,":[45],"entity":[47],"recognition":[48],"are":[49],"essential":[50],"for":[51,72],"understanding":[54],"human":[55],"language.":[56],"This":[57],"paper":[58],"discusses":[59],"advanced":[60],"data":[61,96],"preprocessing":[62],"use":[66],"frameworks":[68],"like":[69],"Hugging":[70],"Face":[71],"implementing":[73],"transformer-based":[74],"models.":[75],"Additionally,":[76],"it":[77],"highlights":[78],"challenges":[79],"handling":[82],"multilingual":[83],"data,":[84],"reducing":[85],"bias,":[86],"ensuring":[88],"model":[89,99],"robustness.":[90],"By":[91],"addressing":[92],"key":[93],"aspects":[94],"fine-tuning,":[100],"this":[101],"work":[102],"aims":[103],"provide":[105],"insights":[106],"into":[107],"deploying":[108],"effective":[109],"ethically":[111],"sound":[112],"AI":[113],"solutions.":[114]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4404388980","counts_by_year":[],"updated_date":"2024-12-07T04:57:04.902710","created_date":"2024-11-15"}