{"id":"https://openalex.org/W4385484253","doi":"https://doi.org/10.1016/j.jksuci.2023.101687","title":"A semi-supervised hierarchical ensemble clustering framework based on a novel similarity metric and stratified feature sampling","display_name":"A semi-supervised hierarchical ensemble clustering framework based on a novel similarity metric and stratified feature sampling","publication_year":2023,"publication_date":"2023-08-02","ids":{"openalex":"https://openalex.org/W4385484253","doi":"https://doi.org/10.1016/j.jksuci.2023.101687"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.jksuci.2023.101687","pdf_url":null,"source":{"id":"https://openalex.org/S2764955546","display_name":"Journal of King Saud University - Computer and Information Sciences","issn_l":"1319-1578","issn":["1319-1578","2213-1248"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1016/j.jksuci.2023.101687","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007002466","display_name":"Hui Shi","orcid":"https://orcid.org/0000-0003-1524-4553"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hui Shi","raw_affiliation_strings":["Shanwei Innovation Industrial Design and Research Institute, Shanwei 516600, Guangdong, China","Shanwei Institute of Technology, Shanwei 516600, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Shanwei Innovation Industrial Design and Research Institute, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Shanwei Institute of Technology, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053836350","display_name":"Qiang Peng","orcid":"https://orcid.org/0000-0002-0536-2313"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Peng","raw_affiliation_strings":["Shanwei Institute of Technology, Shanwei 516600, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Shanwei Institute of Technology, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014212797","display_name":"Zhiming Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiming Xie","raw_affiliation_strings":["Shanwei Innovation Industrial Design and Research Institute, Shanwei 516600, Guangdong, China","Shanwei Institute of Technology, Shanwei 516600, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Shanwei Innovation Industrial Design and Research Institute, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Shanwei Institute of Technology, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100370523","display_name":"Jian Wang","orcid":"https://orcid.org/0000-0002-9849-7558"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Wang","raw_affiliation_strings":["Shanwei Institute of Technology, Shanwei 516600, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Shanwei Institute of Technology, Shanwei 516600, Guangdong, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5007002466"],"corresponding_institution_ids":["https://openalex.org/I2250955327"],"apc_list":{"value":1350,"currency":"USD","value_usd":1350,"provenance":"doaj"},"apc_paid":{"value":1350,"currency":"USD","value_usd":1350,"provenance":"doaj"},"fwci":0.805,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.999978,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":85,"max":89},"biblio":{"volume":"35","issue":"8","first_page":"101687","last_page":"101687"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Data Clustering Techniques and Algorithms","score":0.9966,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Data Clustering Techniques and Algorithms","score":0.9966,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face Recognition and Dimensionality Reduction Techniques","score":0.9923,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13731","display_name":"Dynamics of Urban Structure through Spatial Network Analysis","score":0.9871,"subfield":{"id":"https://openalex.org/subfields/3322","display_name":"Urban Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semi-supervised-clustering","display_name":"Semi-supervised Clustering","score":0.691457},{"id":"https://openalex.org/keywords/single-linkage-clustering","display_name":"Single-linkage clustering","score":0.6654197},{"id":"https://openalex.org/keywords/consensus-clustering","display_name":"Consensus clustering","score":0.64277697},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.6381335},{"id":"https://openalex.org/keywords/ensemble-methods","display_name":"Ensemble Methods","score":0.591779},{"id":"https://openalex.org/keywords/clustering-algorithms","display_name":"Clustering Algorithms","score":0.565117},{"id":"https://openalex.org/keywords/spectral-clustering","display_name":"Spectral Clustering","score":0.555995},{"id":"https://openalex.org/keywords/density-based-clustering","display_name":"Density-based Clustering","score":0.547612},{"id":"https://openalex.org/keywords/brown-clustering","display_name":"Brown clustering","score":0.48784328},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.45254278},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.42734095}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8447233},{"id":"https://openalex.org/C22648726","wikidata":"https://www.wikidata.org/wiki/Q7523744","display_name":"Single-linkage clustering","level":5,"score":0.6654197},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.6527571},{"id":"https://openalex.org/C186767784","wikidata":"https://www.wikidata.org/wiki/Q5162841","display_name":"Consensus clustering","level":5,"score":0.64277697},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.6381335},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5672951},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5643578},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.5581586},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5564241},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5528429},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.51929873},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.49384242},{"id":"https://openalex.org/C167984511","wikidata":"https://www.wikidata.org/wiki/Q17003931","display_name":"Brown clustering","level":5,"score":0.48784328},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.45254278},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.42734095},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37834314},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.jksuci.2023.101687","pdf_url":null,"source":{"id":"https://openalex.org/S2764955546","display_name":"Journal of King Saud University - Computer and Information Sciences","issn_l":"1319-1578","issn":["1319-1578","2213-1248"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.jksuci.2023.101687","pdf_url":null,"source":{"id":"https://openalex.org/S2764955546","display_name":"Journal of King Saud University - Computer and Information Sciences","issn_l":"1319-1578","issn":["1319-1578","2213-1248"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":35,"referenced_works":["https://openalex.org/W2119611763","https://openalex.org/W2151153628","https://openalex.org/W2306431670","https://openalex.org/W253433213","https://openalex.org/W2587977506","https://openalex.org/W2791980930","https://openalex.org/W2955505172","https://openalex.org/W2971783895","https://openalex.org/W2976222518","https://openalex.org/W3003752967","https://openalex.org/W3012390780","https://openalex.org/W3014328542","https://openalex.org/W3126686163","https://openalex.org/W3172721149","https://openalex.org/W3189070026","https://openalex.org/W3193895443","https://openalex.org/W3207672631","https://openalex.org/W4210286867","https://openalex.org/W4224256651","https://openalex.org/W4281630955","https://openalex.org/W4281886197","https://openalex.org/W4283717319","https://openalex.org/W4284712243","https://openalex.org/W4284960100","https://openalex.org/W4285411788","https://openalex.org/W4289745840","https://openalex.org/W4293203059","https://openalex.org/W4307832574","https://openalex.org/W4309778434","https://openalex.org/W4321109309","https://openalex.org/W4323266540","https://openalex.org/W4361191480","https://openalex.org/W4366752402","https://openalex.org/W4367663227","https://openalex.org/W4376273023"],"related_works":["https://openalex.org/W4241767317","https://openalex.org/W2622412490","https://openalex.org/W2385630304","https://openalex.org/W2384052049","https://openalex.org/W2160785859","https://openalex.org/W2118740473","https://openalex.org/W2101637161","https://openalex.org/W2087424554","https://openalex.org/W2067669858","https://openalex.org/W1957537378"],"abstract_inverted_index":{"Recently,":[0],"both":[1],"ensemble":[2],"clustering":[3,6,16,21,34,74,83,182,198,212],"and":[4,76,97,123,167,184,205],"semi-supervised":[5],"have":[7],"emerged":[8],"as":[9],"important":[10],"paradigms":[11],"of":[12,40,135,164,207],"traditional":[13],"clustering.":[14],"Ensemble":[15,53,114],"seeks":[17],"to":[18,61,101,140,143,210],"integrate":[19],"multiple":[20,180],"results":[22,201],"from":[23],"different":[24,31],"methods":[25,29],"or":[26],"the":[27,48,133,145,162,173,185,196,203],"same":[28],"with":[30,153,169],"parameters.":[32],"Semi-supervised":[33,112],"involves":[35],"using":[36],"a":[37,111,119,154,191],"small":[38],"amount":[39],"class":[41],"membership":[42],"information":[43,134],"in":[44,86],"some":[45],"samples":[46],"for":[47],"learning":[49],"process.":[50],"Meanwhile,":[51],"Semi-Supervised":[52],"Clustering":[54,115],"(SSEC)":[55],"has":[56],"attracted":[57],"increasing":[58],"attention":[59],"due":[60],"its":[62],"high":[63],"performance.":[64],"However,":[65],"most":[66],"SSEC":[67,89],"algorithms":[68],"are":[69,78,176],"configured":[70,189],"based":[71,117,178,194],"on":[72,81,118,179,195],"partitional":[73],"techniques,":[75,183],"there":[77],"few":[79],"attempts":[80],"hierarchical":[82,181],"techniques.":[84],"Even":[85],"existing":[87],"hierarchy-based":[88],"algorithms,":[90],"prior":[91],"knowledge":[92],"is":[93,98,151,188],"not":[94],"sufficiently":[95],"used":[96],"often":[99],"applied":[100],"create":[102],"primary":[103,137,165,174],"partitions.":[104],"To":[105],"address":[106],"these":[107],"problems,":[108],"we":[109,128],"propose":[110],"Hierarchical":[113],"framework":[116],"novel":[120],"Similarity":[121],"metric":[122],"stratified":[124,155],"feature":[125,156],"Sampling,":[126],"which":[127],"call":[129],"SHECSS.":[130],"SHECSS":[131,150,208],"uses":[132],"all":[136],"partitions":[138,166,175],"according":[139],"their":[141],"strength":[142],"calculate":[144],"similarity":[146],"between":[147],"samples.":[148],"Also,":[149],"equipped":[152],"sampling":[157],"mechanism":[158],"that":[159],"can":[160],"improve":[161],"diversity":[163],"deal":[168],"high-dimensional":[170],"data.":[171],"Here,":[172],"created":[177],"target":[186],"partition":[187],"by":[190],"consensus":[192],"function":[193],"clusters":[197],"policy.":[199],"Experimental":[200],"show":[202],"effectiveness":[204],"efficiency":[206],"compared":[209],"representative":[211],"methods.":[213]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4385484253","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2024-11-26T17:14:02.004213","created_date":"2023-08-03"}