{"id":"https://openalex.org/W4392142888","doi":"https://doi.org/10.1186/s13321-024-00815-2","title":"Prediction of chemical reaction yields with large-scale multi-view pre-training","display_name":"Prediction of chemical reaction yields with large-scale multi-view pre-training","publication_year":2024,"publication_date":"2024-02-25","ids":{"openalex":"https://openalex.org/W4392142888","doi":"https://doi.org/10.1186/s13321-024-00815-2","pmid":"https://pubmed.ncbi.nlm.nih.gov/38403627"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-024-00815-2","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-024-00815-2","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-024-00815-2","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086021328","display_name":"Runhan Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Runhan Shi","raw_affiliation_strings":["Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027377924","display_name":"Gufeng Yu","orcid":"https://orcid.org/0000-0003-0628-8714"},"institutions":[{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gufeng Yu","raw_affiliation_strings":["Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082306289","display_name":"Xiaohong Huo","orcid":"https://orcid.org/0000-0002-7486-099X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaohong Huo","raw_affiliation_strings":["Shanghai Key Laboratory for Molecular Engineering of Chiral Drugs, Frontiers Science Center for Transformative Molecules, School of Chemistry and Chemical Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory for Molecular Engineering of Chiral Drugs, Frontiers Science Center for Transformative Molecules, School of Chemistry and Chemical Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100397381","display_name":"Yang Yang","orcid":"https://orcid.org/0000-0001-5720-773X"},"institutions":[{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Yang","raw_affiliation_strings":["Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, and Key Laboratory of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582,"provenance":"doaj"},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582,"provenance":"doaj"},"fwci":2.645,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":3,"citation_normalized_percentile":{"value":0.999966,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"16","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9956,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9407,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7377407},{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.52940285},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4106215}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.8073071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7716062},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7377407},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7222658},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6995225},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.574923},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.52940285},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.48770198},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43824255},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4106215},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13953874},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.10360879},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-024-00815-2","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-024-00815-2","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC10895839","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38403627","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-024-00815-2","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-024-00815-2","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5,"id":"https://metadata.un.org/sdg/9"}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"61972251"},{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"62272300"}],"datasets":[],"versions":[],"referenced_works_count":40,"referenced_works":["https://openalex.org/W1965555277","https://openalex.org/W1975147762","https://openalex.org/W2034354062","https://openalex.org/W2060586571","https://openalex.org/W2244785476","https://openalex.org/W2775684663","https://openalex.org/W2784918212","https://openalex.org/W2785942661","https://openalex.org/W2787252987","https://openalex.org/W29374554","https://openalex.org/W2949064041","https://openalex.org/W2952524414","https://openalex.org/W2964199361","https://openalex.org/W3021539081","https://openalex.org/W3094905049","https://openalex.org/W3103092523","https://openalex.org/W3118349318","https://openalex.org/W3123901912","https://openalex.org/W3143418323","https://openalex.org/W3165522846","https://openalex.org/W3173107846","https://openalex.org/W3189145548","https://openalex.org/W3201840690","https://openalex.org/W3209951148","https://openalex.org/W3215313681","https://openalex.org/W4206063340","https://openalex.org/W4213077304","https://openalex.org/W4220747243","https://openalex.org/W4220902634","https://openalex.org/W4220918529","https://openalex.org/W4221074165","https://openalex.org/W4226145240","https://openalex.org/W4226345167","https://openalex.org/W4255556435","https://openalex.org/W4295951229","https://openalex.org/W4296686673","https://openalex.org/W4315645746","https://openalex.org/W4319826004","https://openalex.org/W4324122028","https://openalex.org/W4362733319"],"related_works":["https://openalex.org/W972276598","https://openalex.org/W4321353415","https://openalex.org/W4246352526","https://openalex.org/W2745001401","https://openalex.org/W2378211422","https://openalex.org/W2130974462","https://openalex.org/W2121910908","https://openalex.org/W2087343574","https://openalex.org/W2086519370","https://openalex.org/W2028665553"],"abstract_inverted_index":{"Abstract":[0],"Developing":[1],"machine":[2,179],"learning":[3,96,113,128,180,196],"models":[4,24,181],"with":[5,129,198],"high":[6],"generalization":[7,91,159,176],"capability":[8,92,177],"for":[9,182,216],"predicting":[10,73,153,183],"chemical":[11,31,52,77,122,184],"reaction":[12,123,185],"yields":[13],"is":[14,54],"of":[15,22,30,42,51,93,178,223],"significant":[16,150],"interest":[17],"and":[18,76,115,190,193,219],"importance.":[19],"The":[20,210],"efficacy":[21],"such":[23],"depends":[25],"heavily":[26],"on":[27,99,137,207],"the":[28,49,58,90,104,142,170,175,221],"representation":[29],"reactions,":[32],"which":[33,63,110,173],"has":[34,82,148],"commonly":[35],"been":[36,65,83],"learned":[37],"from":[38],"SMILES":[39],"or":[40],"graphs":[41],"molecules":[43],"using":[44],"deep":[45,95],"neural":[46],"networks.":[47],"However,":[48],"progression":[50],"reactions":[53],"inherently":[55],"determined":[56],"by":[57],"molecular":[59,74],"3D":[60,130],"geometric":[61,131,191],"properties,":[62],"have":[64],"recently":[66],"highlighted":[67],"as":[68],"crucial":[69],"features":[70],"in":[71,88,152],"accurately":[72],"properties":[75],"reactions.":[78,164,225],"Additionally,":[79],"large-scale":[80],"pre-training":[81,118,201],"shown":[84],"to":[85,120,161],"be":[86],"essential":[87],"enhancing":[89],"complex":[94],"models.":[97],"Based":[98],"these":[100],"considerations,":[101],"we":[102],"propose":[103],"Reaction":[105],"Multi-View":[106],"Pre-training":[107],"(ReaMVP)":[108],"framework,":[109,172],"leverages":[111],"self-supervised":[112,195],"techniques":[114,197],"a":[116,149,199],"two-stage":[117,200],"strategy":[119],"predict":[121,162],"yields.":[124,186],"By":[125,187],"incorporating":[126],"multi-view":[127],"information,":[132],"ReaMVP":[133,147,171,203],"achieves":[134,204],"state-of-the-art":[135,205],"performance":[136,206],"two":[138],"benchmark":[139,208],"datasets.":[140,209],"Notably,":[141],"experimental":[143],"results":[144],"indicate":[145],"that":[146],"advantage":[151],"out-of-sample":[154,217],"data,":[155],"suggesting":[156],"an":[157],"enhanced":[158],"ability":[160,215],"new":[163,224],"Scientific":[165],"Contribution:":[166],"This":[167],"study":[168],"presents":[169],"improves":[174],"integrating":[188],"sequential":[189],"views":[192],"leveraging":[194],"strategy,":[202],"framework":[211],"demonstrates":[212],"superior":[213],"predictive":[214],"data":[218],"enhances":[220],"prediction":[222]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4392142888","counts_by_year":[{"year":2024,"cited_by_count":3}],"updated_date":"2024-12-11T23:50:04.539495","created_date":"2024-02-26"}