{"id":"https://openalex.org/W2081819181","doi":"https://doi.org/10.1145/1851476.1851585","title":"File-access patterns of data-intensive workflow applications and their implications to distributed filesystems","display_name":"File-access patterns of data-intensive workflow applications and their implications to distributed filesystems","publication_year":2010,"publication_date":"2010-06-21","ids":{"openalex":"https://openalex.org/W2081819181","doi":"https://doi.org/10.1145/1851476.1851585","mag":"2081819181"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/1851476.1851585","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104018782","display_name":"Takeshi Shibata","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"funder","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takeshi Shibata","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047846580","display_name":"SungJun Choi","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"funder","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"SungJun Choi","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009359355","display_name":"Kenjiro Taura","orcid":"https://orcid.org/0000-0001-5224-382X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"funder","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenjiro Taura","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.615,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":29,"citation_normalized_percentile":{"value":0.925231,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":92},"biblio":{"volume":null,"issue":null,"first_page":"746","last_page":"755"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.44901368}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8729627},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.82814014},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.57837003},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5638182},{"id":"https://openalex.org/C140824633","wikidata":"https://www.wikidata.org/wiki/Q2808660","display_name":"Workflow management system","level":3,"score":0.550508},{"id":"https://openalex.org/C19612761","wikidata":"https://www.wikidata.org/wiki/Q8034836","display_name":"Workflow technology","level":3,"score":0.4726735},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4577758},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.454153},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.44901368},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.41332754},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.37088937},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/1851476.1851585","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":33,"referenced_works":["https://openalex.org/W1530375089","https://openalex.org/W1969369888","https://openalex.org/W1975806783","https://openalex.org/W1986015128","https://openalex.org/W1998082182","https://openalex.org/W1999984505","https://openalex.org/W2006743077","https://openalex.org/W2008206224","https://openalex.org/W2019438923","https://openalex.org/W2094806030","https://openalex.org/W2096709532","https://openalex.org/W2100550451","https://openalex.org/W2100830825","https://openalex.org/W2101681305","https://openalex.org/W2103590782","https://openalex.org/W2104998023","https://openalex.org/W2109033701","https://openalex.org/W2112542464","https://openalex.org/W2113209795","https://openalex.org/W2118436132","https://openalex.org/W2122465391","https://openalex.org/W2123130398","https://openalex.org/W2129666400","https://openalex.org/W2131645490","https://openalex.org/W2148317584","https://openalex.org/W2149294210","https://openalex.org/W2155463028","https://openalex.org/W2157970256","https://openalex.org/W2166100672","https://openalex.org/W2168103533","https://openalex.org/W259012431","https://openalex.org/W4229976825","https://openalex.org/W4389442197"],"related_works":["https://openalex.org/W291310304","https://openalex.org/W2391168633","https://openalex.org/W2385499106","https://openalex.org/W2379425324","https://openalex.org/W2376410910","https://openalex.org/W2375552622","https://openalex.org/W2373541195","https://openalex.org/W2370109655","https://openalex.org/W2365658322","https://openalex.org/W2352344200"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"five":[3],"real-world":[4,110,128],"data":[5,21,65,78],"intensive":[6,24],"workflow":[7,44,111,129],"applications":[8,30,112,130],"in":[9,120],"the":[10,75],"fields":[11],"of":[12,43,77,90,109],"natural":[13],"language":[14],"processing,":[15],"astronomy":[16],"image":[17],"analysis,":[18],"and":[19,33,53,70,137,143],"web":[20],"analysis.":[22],"Data":[23],"workflows":[25],"are":[26,63,104],"increasingly":[27],"becoming":[28],"important":[29],"for":[31],"cluster":[32],"Grid":[34],"environments.":[35],"They":[36],"open":[37],"new":[38],"challenges":[39],"to":[40,59,117,141],"various":[41],"components":[42],"execution":[45],"environments":[46],"including":[47],"job":[48],"dispatchers,":[49],"schedulers,":[50],"file":[51,54,134,144],"systems,":[52],"staging":[55],"tools.":[56],"The":[57],"keys":[58],"achieving":[60],"high":[61],"performance":[62],"efficient":[64],"sharing":[66],"among":[67],"executing":[68],"hosts":[69],"locality-aware":[71],"scheduling":[72,87],"that":[73],"reduces":[74],"amount":[76],"transfer.":[79],"While":[80],"much":[81],"work":[82],"has":[83],"been":[84],"done":[85],"on":[86,101,132],"workflows,":[88],"many":[89],"them":[91],"use":[92],"synthetic":[93],"or":[94],"random":[95],"workload.":[96],"As":[97],"such,":[98],"their":[99,133,139],"impacts":[100],"real":[102],"workloads":[103],"largely":[105],"unknown.":[106],"Understanding":[107],"characteristics":[108],"is":[113],"a":[114],"required":[115],"step":[116],"promote":[118],"research":[119],"this":[121,124],"area.":[122],"To":[123],"end,":[125],"we":[126],"analyse":[127],"focusing":[131],"access":[135],"patterns":[136],"summarize":[138],"implications":[140],"schedulers":[142],"system/staging":[145],"designs.":[146]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2081819181","counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2025-02-24T07:06:33.412217","created_date":"2016-06-24"}