{"id":"https://openalex.org/W4311728209","doi":"https://doi.org/10.48550/arxiv.2212.07921","title":"Scholarly Knowledge Extraction from Published Software Packages","display_name":"Scholarly Knowledge Extraction from Published Software Packages","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4311728209","doi":"https://doi.org/10.48550/arxiv.2212.07921"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.07921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2212.07921","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100740706","display_name":"Muhammad Haris","orcid":"https://orcid.org/0000-0002-8875-9948"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haris, Muhammad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062163326","display_name":"Markus Stocker","orcid":"https://orcid.org/0000-0001-5492-3212"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stocker, Markus","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5071765665","display_name":"S\u00f6ren Auer","orcid":"https://orcid.org/0000-0002-0698-2864"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Auer, S\u00f6ren","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":60},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9628,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-mining","display_name":"Software mining","score":0.44272333},{"id":"https://openalex.org/keywords/python","display_name":"Python","score":0.43825218}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8203948},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.68919325},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5767189},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.5624136},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.48257747},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.45235354},{"id":"https://openalex.org/C103520596","wikidata":"https://www.wikidata.org/wiki/Q7554328","display_name":"Software mining","level":5,"score":0.44272333},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.43825218},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.40762767},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.37807894},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.34711987},{"id":"https://openalex.org/C186846655","wikidata":"https://www.wikidata.org/wiki/Q3398377","display_name":"Software construction","level":4,"score":0.2854194},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.24141583}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.07921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2212.07921","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.07921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.54}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4389470870","https://openalex.org/W4300438041","https://openalex.org/W3023169329","https://openalex.org/W2782165897","https://openalex.org/W2761254753","https://openalex.org/W2188981919","https://openalex.org/W2139703748","https://openalex.org/W2054104202","https://openalex.org/W1582950852","https://openalex.org/W1024825291"],"abstract_inverted_index":{"A":[0],"plethora":[1],"of":[2,22,41,54,153],"scientific":[3],"software":[4,15,49,86,115,119],"packages":[5,16,50,87],"are":[6,17],"published":[7,23,48,122,166],"in":[8,62,121,149,167,180],"repositories,":[9],"e.g.,":[10],"Zenodo":[11],"and":[12,57,96,126],"figshare.":[13],"These":[14],"crucial":[18],"for":[19,38,118],"the":[20,90,97,103,108,113,128,138,146,150,158,168,174,181],"reproducibility":[21],"research.":[24],"As":[25],"an":[26,36],"additional":[27],"route":[28],"to":[29,106,134,156,161],"scholarly":[30,45,162,169,178],"knowledge":[31,46,179],"graph":[32],"construction,":[33],"we":[34,75,101,124,144,172],"propose":[35],"approach":[37,68],"automated":[39],"extraction":[40],"machine":[42,176],"actionable":[43,177],"(structured)":[44],"from":[47,85],"by":[51,88],"static":[52],"analysis":[53],"their":[55],"(meta)data":[56],"contents":[58],"(in":[59],"particular":[60],"scripts":[61],"languages":[63],"such":[64],"as":[65,72],"Python).":[66],"The":[67],"can":[69],"be":[70],"summarized":[71],"follows.":[73],"First,":[74],"extract":[76,135],"metadata":[77,105],"information":[78,136,148,160,165],"(software":[79],"description,":[80],"programming":[81],"languages,":[82],"related":[83,154],"references)":[84],"leveraging":[89],"Software":[91],"Metadata":[92],"Extraction":[93],"Framework":[94],"(SOMEF)":[95],"GitHub":[98],"API.":[99],"Second,":[100],"analyze":[102,127],"extracted":[104,147,159,175],"find":[107],"research":[109],"articles":[110,155],"associated":[111],"with":[112],"corresponding":[114],"repository.":[116],"Third,":[117],"contained":[120],"packages,":[123],"create":[125],"Abstract":[129],"Syntax":[130],"Tree":[131],"(AST)":[132],"representation":[133],"about":[137],"procedures":[139],"performed":[140],"on":[141],"data.":[142],"Fourth,":[143],"search":[145],"full":[151],"text":[152],"constrain":[157],"knowledge,":[163],"i.e.":[164],"literature.":[170],"Finally,":[171],"publish":[173],"Open":[182],"Research":[183],"Knowledge":[184],"Graph":[185],"(ORKG).":[186]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4311728209","counts_by_year":[],"updated_date":"2024-12-07T23:56:53.182521","created_date":"2022-12-28"}