{"id":"https://openalex.org/W2031388557","doi":"https://doi.org/10.1109/isit.2012.6283716","title":"On optimal two sample homogeneity tests for finite alphabets","display_name":"On optimal two sample homogeneity tests for finite alphabets","publication_year":2012,"publication_date":"2012-07-01","ids":{"openalex":"https://openalex.org/W2031388557","doi":"https://doi.org/10.1109/isit.2012.6283716","mag":"2031388557"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit.2012.6283716","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://infoscience.epfl.ch/record/181816/files/Unnikrishnan12.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039592314","display_name":"Jayakrishnan Unnikrishnan","orcid":"https://orcid.org/0000-0002-8464-4641"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"funder","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Jayakrishnan Unnikrishnan","raw_affiliation_strings":["Audiovisual Communications Laboratory, School of Computer and Communication Sciences, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland#TAB#"],"affiliations":[{"raw_affiliation_string":"Audiovisual Communications Laboratory, School of Computer and Communication Sciences, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland#TAB#","institution_ids":["https://openalex.org/I5124864"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5039592314"],"corresponding_institution_ids":["https://openalex.org/I5124864"],"apc_list":null,"apc_paid":null,"fwci":1.704,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":11,"citation_normalized_percentile":{"value":0.651839,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":85,"max":86},"biblio":{"volume":null,"issue":null,"first_page":"2027","last_page":"2031"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9967,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9948,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/statistic","display_name":"Statistic","score":0.4682746},{"id":"https://openalex.org/keywords/chi-square-test","display_name":"Chi-square test","score":0.46503943},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.45943612}],"concepts":[{"id":"https://openalex.org/C142259097","wikidata":"https://www.wikidata.org/wiki/Q5891314","display_name":"Homogeneity (statistics)","level":2,"score":0.73887134},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.62016726},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.56577677},{"id":"https://openalex.org/C87007009","wikidata":"https://www.wikidata.org/wiki/Q210832","display_name":"Statistical hypothesis testing","level":2,"score":0.5652833},{"id":"https://openalex.org/C29447264","wikidata":"https://www.wikidata.org/wiki/Q5423649","display_name":"F-test of equality of variances","level":4,"score":0.56336904},{"id":"https://openalex.org/C191988596","wikidata":"https://www.wikidata.org/wiki/Q628374","display_name":"Null hypothesis","level":2,"score":0.53784275},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.4682746},{"id":"https://openalex.org/C32809988","wikidata":"https://www.wikidata.org/wiki/Q1071004","display_name":"Chi-square test","level":2,"score":0.46503943},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.45943612},{"id":"https://openalex.org/C169857963","wikidata":"https://www.wikidata.org/wiki/Q1461038","display_name":"Test statistic","level":3,"score":0.45021114},{"id":"https://openalex.org/C120639","wikidata":"https://www.wikidata.org/wiki/Q7068958","display_name":"Null distribution","level":4,"score":0.44810808},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.39749983},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3519392},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.34334278},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.32425147},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit.2012.6283716","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/181816","pdf_url":"https://infoscience.epfl.ch/record/181816/files/Unnikrishnan12.pdf","source":{"id":"https://openalex.org/S4306400488","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.352.4500","pdf_url":null,"source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/181816","pdf_url":"https://infoscience.epfl.ch/record/181816/files/Unnikrishnan12.pdf","source":{"id":"https://openalex.org/S4306400488","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.69,"display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":14,"referenced_works":["https://openalex.org/W1582019318","https://openalex.org/W2033387638","https://openalex.org/W2045638068","https://openalex.org/W2051258594","https://openalex.org/W2055309977","https://openalex.org/W2070139658","https://openalex.org/W2103641619","https://openalex.org/W2109407383","https://openalex.org/W2796936280","https://openalex.org/W2797043077","https://openalex.org/W2802739963","https://openalex.org/W3027327446","https://openalex.org/W4233941567","https://openalex.org/W4293404332"],"related_works":["https://openalex.org/W4400844461","https://openalex.org/W4312206274","https://openalex.org/W4200217769","https://openalex.org/W3208315888","https://openalex.org/W3106637505","https://openalex.org/W3000603176","https://openalex.org/W2154254690","https://openalex.org/W2062512628","https://openalex.org/W2032513700","https://openalex.org/W1982620251"],"abstract_inverted_index":{"Suppose":[0],"we":[1,120],"are":[2,15,39,89,106,112,197],"given":[3],"two":[4,55,132],"independent":[5],"strings":[6,25],"of":[7,64,75,149,157],"data":[8],"from":[9,28],"a":[10,50,146],"known":[11,81],"finite":[12,181],"alphabet.":[13],"We":[14,130,143,201],"interested":[16],"in":[17,92,98,115,162,192,220],"testing":[18],"the":[19,24,29,34,44,54,67,70,76,99,124,158,164,217],"null":[20,72],"hypothesis":[21,73],"that":[22,33,69,88,173,203],"both":[23,163],"were":[26],"drawn":[27],"same":[30],"distribution,":[31],"assuming":[32],"samples":[35],"within":[36],"each":[37],"string":[38],"mutually":[40],"independent.":[41],"Among":[42],"statisticians,":[43],"most":[45],"popular":[46],"solution":[47],"for":[48,170,180],"such":[49,103,110,204],"homogeneity":[51,205],"test":[52,78,151,159,219],"is":[53,80],"sample":[56],"chi-square":[57,218],"test,":[58],"primarily":[59],"due":[60],"to":[61,84,122,190],"its":[62],"ease":[63],"implementation":[65],"and":[66,82,109,128,140,152],"fact":[68],"limiting":[71,155],"distribution":[74],"associated":[77],"statistic":[79],"easy":[83,189],"compute.":[85],"Although":[86],"tests":[87,111,135,188,206],"asymptotically":[90],"optimal":[91,134],"error":[93],"probability":[94],"have":[95],"been":[96],"proposed":[97,136],"information":[100],"theory":[101,127],"literature,":[102],"optimality":[104,209],"results":[105,167],"not":[107],"well-known":[108],"rarely":[113],"used":[114,161],"practice.":[116,129,193,221],"In":[117],"this":[118],"paper":[119],"seek":[121],"bridge":[123],"gap":[125],"between":[126],"study":[131],"different":[133],"by":[137],"Shayevitz":[138],"[1]":[139],"Gutman":[141],"[2].":[142],"first":[144],"obtain":[145,154],"simplified":[147],"structure":[148],"Shayevitz's":[150],"then":[153],"distributions":[156],"statistics":[160],"tests.":[165],"These":[166],"provide":[168],"guidelines":[169],"choosing":[171],"thresholds":[172],"guarantee":[174],"an":[175],"approximate":[176],"false":[177],"alarm":[178],"constraint":[179],"length":[182],"observation":[183],"sequences,":[184],"thus":[185],"making":[186],"these":[187],"use":[191],"The":[194],"approximation":[195],"accuracies":[196],"demonstrated":[198],"using":[199],"simulations.":[200],"argue":[202],"with":[207],"provable":[208],"properties":[210],"could":[211],"potentially":[212],"be":[213],"better":[214],"choices":[215],"than":[216]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2031388557","counts_by_year":[{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":3}],"updated_date":"2025-03-17T17:56:11.551978","created_date":"2016-06-24"}