{"id":"https://openalex.org/W2343641740","doi":"https://doi.org/10.1109/tbdata.2016.2557348","title":"Kvasir: Scalable Provision of Semantically Relevant Web Content on Big Data Framework","display_name":"Kvasir: Scalable Provision of Semantically Relevant Web Content on Big Data Framework","publication_year":2016,"publication_date":"2016-04-28","ids":{"openalex":"https://openalex.org/W2343641740","doi":"https://doi.org/10.1109/tbdata.2016.2557348","mag":"2343641740"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2016.2557348","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100456490","display_name":"Liang Wang","orcid":"https://orcid.org/0000-0001-9456-0786"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"funder","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Liang Wang","raw_affiliation_strings":["University of Cambridge, Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039205111","display_name":"Sotiris K. Tasoulis","orcid":"https://orcid.org/0000-0001-9536-4090"},"institutions":[{"id":"https://openalex.org/I63098007","display_name":"Liverpool John Moores University","ror":"https://ror.org/04zfme737","country_code":"GB","type":"funder","lineage":["https://openalex.org/I63098007"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sotiris Tasoulis","raw_affiliation_strings":["Liverpool John Moores University, Liverpool, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Liverpool John Moores University, Liverpool, United Kingdom","institution_ids":["https://openalex.org/I63098007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066842476","display_name":"Teemu Roos","orcid":"https://orcid.org/0000-0001-9470-3759"},"institutions":[{"id":"https://openalex.org/I133731052","display_name":"University of Helsinki","ror":"https://ror.org/040af2s02","country_code":"FI","type":"funder","lineage":["https://openalex.org/I133731052"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Teemu Roos","raw_affiliation_strings":["University of Helsinki, Helsinki, Finland"],"affiliations":[{"raw_affiliation_string":"University of Helsinki, Helsinki, Finland","institution_ids":["https://openalex.org/I133731052"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008046951","display_name":"Jussi Kangasharju","orcid":"https://orcid.org/0000-0001-6119-1638"},"institutions":[{"id":"https://openalex.org/I133731052","display_name":"University of Helsinki","ror":"https://ror.org/040af2s02","country_code":"FI","type":"funder","lineage":["https://openalex.org/I133731052"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Jussi Kangasharju","raw_affiliation_strings":["University of Helsinki, Helsinki, Finland"],"affiliations":[{"raw_affiliation_string":"University of Helsinki, Helsinki, Finland","institution_ids":["https://openalex.org/I133731052"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.328,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":24,"citation_normalized_percentile":{"value":0.919234,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":"2","issue":"3","first_page":"219","last_page":"233"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.44118297}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9116788},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6850076},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5647386},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5560476},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5257764},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.4680248},{"id":"https://openalex.org/C167379230","wikidata":"https://www.wikidata.org/wiki/Q1026884","display_name":"Semantic Web Stack","level":3,"score":0.46568623},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4630018},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.44118297},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.43737522},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.23682329},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.20516789},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2016.2557348","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.43,"id":"https://metadata.un.org/sdg/9"}],"grants":[{"funder":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":57,"referenced_works":["https://openalex.org/W143867266","https://openalex.org/W1532325895","https://openalex.org/W1592247788","https://openalex.org/W1627400044","https://openalex.org/W168564468","https://openalex.org/W17346433","https://openalex.org/W1854214752","https://openalex.org/W1880262756","https://openalex.org/W1915050012","https://openalex.org/W1966553486","https://openalex.org/W1978112828","https://openalex.org/W1980110184","https://openalex.org/W1987040325","https://openalex.org/W1997841190","https://openalex.org/W2015676665","https://openalex.org/W2025605741","https://openalex.org/W2028787907","https://openalex.org/W2044195942","https://openalex.org/W2046545050","https://openalex.org/W2054945727","https://openalex.org/W2072773380","https://openalex.org/W2086504823","https://openalex.org/W2090398718","https://openalex.org/W2107107106","https://openalex.org/W2107743791","https://openalex.org/W2110325612","https://openalex.org/W2111565546","https://openalex.org/W2112053513","https://openalex.org/W2115407997","https://openalex.org/W2115854352","https://openalex.org/W2117756735","https://openalex.org/W2118123209","https://openalex.org/W2118519969","https://openalex.org/W2124509324","https://openalex.org/W2131975293","https://openalex.org/W2132314908","https://openalex.org/W2133990480","https://openalex.org/W2138621811","https://openalex.org/W2145065594","https://openalex.org/W2147152072","https://openalex.org/W2154249783","https://openalex.org/W2154851929","https://openalex.org/W2158169729","https://openalex.org/W2165949563","https://openalex.org/W2170605888","https://openalex.org/W2171960770","https://openalex.org/W2189465200","https://openalex.org/W2341865734","https://openalex.org/W2502644482","https://openalex.org/W281665770","https://openalex.org/W2950332743","https://openalex.org/W4213009331","https://openalex.org/W4231510805","https://openalex.org/W4233135949","https://openalex.org/W4239696231","https://openalex.org/W4299379706","https://openalex.org/W4301776409"],"related_works":["https://openalex.org/W4247566972","https://openalex.org/W3211874991","https://openalex.org/W3202731209","https://openalex.org/W2766461310","https://openalex.org/W2366430559","https://openalex.org/W2355823470","https://openalex.org/W2349698472","https://openalex.org/W2171552258","https://openalex.org/W1985801232","https://openalex.org/W1585941060"],"abstract_inverted_index":{"The":[0],"Internet":[1,91],"is":[2],"overloading":[3],"its":[4],"users":[5],"with":[6,124],"excessive":[7],"information":[8,34],"flows,":[9],"so":[10],"that":[11],"effective":[12],"content-based":[13],"filtering":[14],"becomes":[15],"crucial":[16],"in":[17,131],"improving":[18],"user":[19],"experience":[20],"and":[21,59,68,106],"work":[22],"efficiency.":[23],"Latent":[24],"semantic":[25,50,57],"analysis":[26,58],"has":[27],"long":[28],"been":[29],"demonstrated":[30],"as":[31],"a":[32,49,89],"promising":[33],"retrieval":[35],"technique":[36],"to":[37,63,84,102,127],"search":[38],"for":[39],"relevant":[40],"articles":[41],"from":[42],"large":[43],"text":[44],"corpora.":[45],"We":[46,76],"build":[47],"Kvasir,":[48,119],"recommendation":[51],"system,":[52],"on":[53],"top":[54],"of":[55,81,108,110,118],"latent":[56],"other":[60],"state-of-the-art":[61],"technologies":[62],"seamlessly":[64],"integrate":[65],"an":[66],"automated":[67],"proactive":[69],"content":[70],"provision":[71],"service":[72],"into":[73,88],"web":[74],"browsing.":[75],"utilize":[77],"the":[78,97,115,120,128,132],"processing":[79],"power":[80],"Apache":[82],"Spark":[83],"scale":[85],"up":[86],"Kvasir":[87],"practical":[90],"service.":[92],"In":[93],"addition,":[94],"we":[95,113],"improve":[96],"classic":[98],"randomized":[99],"partition":[100],"tree":[101],"support":[103],"efficient":[104],"indexing":[105],"searching":[107],"millions":[109],"documents.":[111],"Herein":[112],"present":[114],"architectural":[116],"design":[117],"core":[121],"algorithms,":[122],"along":[123],"our":[125],"solutions":[126],"technical":[129],"challenges":[130],"actual":[133],"system":[134],"implementation.":[135]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2343641740","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-04-20T07:46:21.961030","created_date":"2016-06-24"}