{"id":"https://openalex.org/W4353115367","doi":"https://doi.org/10.48550/arxiv.2303.11761","title":"Reasonable Scale Machine Learning with Open-Source Metaflow","display_name":"Reasonable Scale Machine Learning with Open-Source Metaflow","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4353115367","doi":"https://doi.org/10.48550/arxiv.2303.11761"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2303.11761","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2303.11761","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008079520","display_name":"Jacopo Tagliabue","orcid":"https://orcid.org/0000-0001-8634-6122"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tagliabue, Jacopo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083703448","display_name":"Hugo Bowne\u2010Anderson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bowne-Anderson, Hugo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000571410","display_name":"Ville Tuulos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tuulos, Ville","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091702405","display_name":"Savin Goyal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goyal, Savin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078525830","display_name":"Romain Cl\u00e9dat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cledat, Romain","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084471463","display_name":"David Van Den Berg","orcid":"https://orcid.org/0000-0002-8797-8217"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Berg, David","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":67},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9885,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9885,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11891","display_name":"Big Data and Business Intelligence","score":0.9809,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.971,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/warrant","display_name":"Warrant","score":0.7211099},{"id":"https://openalex.org/keywords/business-logic","display_name":"Business logic","score":0.50025177}],"concepts":[{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.8001356},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.77832896},{"id":"https://openalex.org/C2776916960","wikidata":"https://www.wikidata.org/wiki/Q637156","display_name":"Warrant","level":2,"score":0.7211099},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.68172055},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6722529},{"id":"https://openalex.org/C204983608","wikidata":"https://www.wikidata.org/wiki/Q2111958","display_name":"Productivity","level":2,"score":0.6631063},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.6233466},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.5868887},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5441528},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5178642},{"id":"https://openalex.org/C146222976","wikidata":"https://www.wikidata.org/wiki/Q1204997","display_name":"Business logic","level":2,"score":0.50025177},{"id":"https://openalex.org/C110354214","wikidata":"https://www.wikidata.org/wiki/Q6314146","display_name":"Engineering management","level":1,"score":0.42696851},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36141363},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.33925104},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.3391914},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.18681431},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15636173},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.13010743},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.11932552},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2303.11761","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2303.11761","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2303.11761","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.47}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3015649151","https://openalex.org/W3014921315","https://openalex.org/W2618713772","https://openalex.org/W2506609850","https://openalex.org/W2496426887","https://openalex.org/W2381584298","https://openalex.org/W2373243504","https://openalex.org/W2363340781","https://openalex.org/W2349156183","https://openalex.org/W2299215294"],"abstract_inverted_index":{"As":[0],"Machine":[1],"Learning":[2],"(ML)":[3],"gains":[4],"adoption":[5],"across":[6],"industries":[7],"and":[8,20,28,49,115,120],"new":[9],"use":[10,121],"cases,":[11],"practitioners":[12,86],"increasingly":[13],"realize":[14],"the":[15,44,57,82,90,96,99,108,127],"challenges":[16,110],"around":[17],"effectively":[18],"developing":[19],"iterating":[21],"on":[22,126],"ML":[23,62,76,93,112],"systems:":[24],"reproducibility,":[25],"debugging,":[26],"scalability,":[27],"documentation":[29],"are":[30],"elusive":[31],"goals":[32],"for":[33,75],"real-world":[34],"pipelines":[35],"outside":[36],"tech-first":[37],"companies.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42],"review":[43],"nature":[45],"of":[46,84,92,98],"ML-oriented":[47],"workloads":[48],"argue":[50],"that":[51],"re-purposing":[52],"existing":[53],"tools":[54],"won't":[55],"solve":[56],"current":[58],"productivity":[59,83],"issues,":[60],"as":[61],"peculiarities":[63],"warrant":[64],"specialized":[65],"development":[66],"tooling.":[67],"We":[68,102],"then":[69],"introduce":[70],"Metaflow,":[71],"an":[72],"open-source":[73],"framework":[74],"projects":[77],"explicitly":[78],"designed":[79],"to":[80],"boost":[81],"data":[85],"by":[87],"abstracting":[88],"away":[89],"execution":[91],"code":[94],"from":[95],"definition":[97],"business":[100],"logic.":[101],"show":[103],"how":[104],"our":[105],"design":[106],"addresses":[107],"main":[109],"in":[111],"operations":[113],"(MLOps),":[114],"document":[116],"through":[117],"examples,":[118],"interviews":[119],"cases":[122],"its":[123],"practical":[124],"impact":[125],"field.":[128]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4353115367","counts_by_year":[],"updated_date":"2025-01-08T21:57:34.486194","created_date":"2023-03-23"}