{"id":"https://openalex.org/W4315588170","doi":"https://doi.org/10.48550/arxiv.2301.02665","title":"Discovery of structure-property relations for molecules via hypothesis-driven active learning over the chemical space","display_name":"Discovery of structure-property relations for molecules via hypothesis-driven active learning over the chemical space","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4315588170","doi":"https://doi.org/10.48550/arxiv.2301.02665"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.02665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"journal-article","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://arxiv.org/abs/2301.02665","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013590092","display_name":"Ayana Ghosh","orcid":"https://orcid.org/0000-0002-0432-3689"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"funder","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ayana Ghosh","raw_affiliation_strings":["Computational Sciences and Engineering Division, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA"],"affiliations":[{"raw_affiliation_string":"Computational Sciences and Engineering Division, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048552375","display_name":"Sergei V. Kalinin","orcid":"https://orcid.org/0000-0001-5354-6152"},"institutions":[{"id":"https://openalex.org/I2802706902","display_name":"Knoxville College","ror":"https://ror.org/02bxrp522","country_code":"US","type":"education","lineage":["https://openalex.org/I2802706902"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sergei V. Kalinin","raw_affiliation_strings":["Department of Materials Science and Engineering, University of Knoxville, Knoxville, TN 37996 USA"],"affiliations":[{"raw_affiliation_string":"Department of Materials Science and Engineering, University of Knoxville, Knoxville, TN 37996 USA","institution_ids":["https://openalex.org/I2802706902"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013879711","display_name":"Maxim Ziatdinov","orcid":"https://orcid.org/0000-0003-2570-4592"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"funder","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maxim A. Ziatdinov","raw_affiliation_strings":["Center for Nanophase Materials Sciences, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA","Computational Sciences and Engineering Division, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA"],"affiliations":[{"raw_affiliation_string":"Computational Sciences and Engineering Division, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA","institution_ids":["https://openalex.org/I1289243028"]},{"raw_affiliation_string":"Center for Nanophase Materials Sciences, Oak Ridge National Laboratory, Oak Ridge, TN 37831 USA","institution_ids":["https://openalex.org/I1289243028"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5013590092"],"corresponding_institution_ids":["https://openalex.org/I1289243028"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":66},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9954,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12327","display_name":"Various Chemistry Research Topics","score":0.9706,"subfield":{"id":"https://openalex.org/subfields/1606","display_name":"Physical and Theoretical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chemical-space","display_name":"Chemical space","score":0.74829197}],"concepts":[{"id":"https://openalex.org/C99726746","wikidata":"https://www.wikidata.org/wiki/Q906396","display_name":"Chemical space","level":3,"score":0.74829197},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.62155974},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.562291},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.56182224},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.5603955},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.52236444},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.5208938},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.48193192},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4598819},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.45855707},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.45712134},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.42853978},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.38800007},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.30937773},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.115771174},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.08697471},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.02665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/2204589","pdf_url":null,"source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":["Office of Scientific and Technical Information"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://doi.org/10.1063/5.0157644","pdf_url":"https://pubs.aip.org/aip/aml/article-pdf/doi/10.1063/5.0157644/18179485/046102_1_5.0157644.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2301.02665","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.02665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":["https://openalex.org/W4315588170","https://openalex.org/W4387822637"],"referenced_works_count":91,"referenced_works":["https://openalex.org/W1702387805","https://openalex.org/W1967287635","https://openalex.org/W1975147762","https://openalex.org/W1975875968","https://openalex.org/W1979142801","https://openalex.org/W1996228494","https://openalex.org/W2027482274","https://openalex.org/W2029533715","https://openalex.org/W2036600427","https://openalex.org/W2038102635","https://openalex.org/W2049237203","https://openalex.org/W2058220696","https://openalex.org/W2061144551","https://openalex.org/W2080635178","https://openalex.org/W2085398335","https://openalex.org/W2085890279","https://openalex.org/W2085915663","https://openalex.org/W2096541451","https://openalex.org/W2123306226","https://openalex.org/W2125849100","https://openalex.org/W2127019019","https://openalex.org/W2127553917","https://openalex.org/W2134164499","https://openalex.org/W2177317049","https://openalex.org/W2192203593","https://openalex.org/W2407586185","https://openalex.org/W2478294658","https://openalex.org/W2527189750","https://openalex.org/W2549144853","https://openalex.org/W2553246783","https://openalex.org/W2594183968","https://openalex.org/W2603068161","https://openalex.org/W2610148085","https://openalex.org/W2620687153","https://openalex.org/W2747592475","https://openalex.org/W2774977638","https://openalex.org/W2785813126","https://openalex.org/W2786722833","https://openalex.org/W2792137452","https://openalex.org/W2794574783","https://openalex.org/W2799620402","https://openalex.org/W2801991413","https://openalex.org/W2880842812","https://openalex.org/W2884430236","https://openalex.org/W2891523768","https://openalex.org/W2900455315","https://openalex.org/W2909055772","https://openalex.org/W2923693308","https://openalex.org/W2937307539","https://openalex.org/W2940242941","https://openalex.org/W2949095042","https://openalex.org/W2955986556","https://openalex.org/W2962872055","https://openalex.org/W2967968968","https://openalex.org/W2970235642","https://openalex.org/W2988203096","https://openalex.org/W2996448308","https://openalex.org/W2997479617","https://openalex.org/W3022256936","https://openalex.org/W3035559885","https://openalex.org/W3045928028","https://openalex.org/W3049675384","https://openalex.org/W3093687066","https://openalex.org/W3098179186","https://openalex.org/W3098269892","https://openalex.org/W3098321015","https://openalex.org/W3100751385","https://openalex.org/W3102795188","https://openalex.org/W3104850868","https://openalex.org/W3106310231","https://openalex.org/W3113447514","https://openalex.org/W3119872582","https://openalex.org/W3126732720","https://openalex.org/W3127113723","https://openalex.org/W3156805104","https://openalex.org/W3163177404","https://openalex.org/W3183931249","https://openalex.org/W3194368700","https://openalex.org/W3194515217","https://openalex.org/W3209056694","https://openalex.org/W3212512279","https://openalex.org/W4220831513","https://openalex.org/W4243421346","https://openalex.org/W4254278957","https://openalex.org/W4283574835","https://openalex.org/W4291288469","https://openalex.org/W4294804855","https://openalex.org/W4297796727","https://openalex.org/W4300537282","https://openalex.org/W4306754767","https://openalex.org/W4311001462"],"related_works":["https://openalex.org/W4385760073","https://openalex.org/W4385588199","https://openalex.org/W4320732452","https://openalex.org/W4286980196","https://openalex.org/W4283395020","https://openalex.org/W3199987505","https://openalex.org/W3183930479","https://openalex.org/W2973074952","https://openalex.org/W2594328795","https://openalex.org/W135095951"],"abstract_inverted_index":{"Discovery":[0],"of":[1,20,25,28,66,73,109,174],"the":[2,29,33,43,47,56,59,83,89,92,159],"molecular":[3,175],"candidates":[4],"for":[5,42,82,140,158],"applications":[6],"in":[7,118,135],"drug":[8],"targets,":[9],"biomolecular":[10],"systems,":[11],"catalysts,":[12],"photovoltaics,":[13],"organic":[14],"electronics,":[15],"and":[16,64,75,99,143,176],"batteries,":[17],"necessitates":[18],"development":[19],"machine":[21,136],"learning":[22,45,101,121,137],"algorithms":[23],"capable":[24],"rapid":[26],"exploration":[27],"chemical":[30,48,152],"spaces":[31,49],"targeting":[32],"desired":[34],"functionalities.":[35],"Here":[36],"we":[37,155],"introduce":[38,76],"a":[39,70,103,124,147],"novel":[40],"approach":[41,87],"active":[44,100,120],"over":[46],"based":[50,68],"on":[51,58,69,132,150],"hypothesis":[52],"learning.":[53],"We":[54],"construct":[55],"hypotheses":[57],"possible":[60],"relationships":[61],"between":[62],"structures":[63],"functionalities":[65],"interest":[67],"small":[71],"subset":[72],"data":[74],"them":[77],"as":[78,97,129],"(probabilistic)":[79],"mean":[80],"functions":[81],"Gaussian":[84],"process.":[85],"This":[86],"combines":[88],"elements":[90],"from":[91,171],"symbolic":[93],"regression":[94],"methods":[95],"such":[96],"SISSO":[98],"into":[102],"single":[104],"framework.":[105],"The":[106],"primary":[107],"focus":[108],"constructing":[110],"this":[111],"framework":[112],"is":[113],"to":[114,146,169],"approximate":[115],"physical":[116],"laws":[117],"an":[119],"regime":[122],"toward":[123],"more":[125,167],"robust":[126],"predictive":[127],"performance,":[128],"traditional":[130],"evaluation":[131],"hold-out":[133],"sets":[134],"doesn't":[138],"account":[139],"out-of-distribution":[141],"effects":[142],"may":[144],"lead":[145],"complete":[148],"failure":[149],"unseen":[151],"space.":[153],"Here,":[154],"demonstrate":[156],"it":[157,163],"QM9":[160],"dataset,":[161],"but":[162],"can":[164],"be":[165],"applied":[166],"broadly":[168],"datasets":[170],"both":[172],"domains":[173],"solid-state":[177],"materials":[178],"sciences.":[179]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4315588170","counts_by_year":[],"updated_date":"2025-02-24T14:36:58.916842","created_date":"2023-01-11"}