{"id":"https://openalex.org/W4377864448","doi":"https://doi.org/10.48550/arxiv.2305.12518","title":"VAKTA-SETU: A Speech-to-Speech Machine Translation Service in Select Indic Languages","display_name":"VAKTA-SETU: A Speech-to-Speech Machine Translation Service in Select Indic Languages","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4377864448","doi":"https://doi.org/10.48550/arxiv.2305.12518"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.12518","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2305.12518","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056201614","display_name":"Shivam Mhaskar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mhaskar, Shivam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108520931","display_name":"Vineet Bhat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhat, Vineet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064312570","display_name":"Akshay Batheja","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Batheja, Akshay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014560775","display_name":"Sourabh Deoghare","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deoghare, Sourabh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104152364","display_name":"Paramveer Choudhary","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choudhary, Paramveer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5065100828","display_name":"Pushpak Bhattacharyya","orcid":"https://orcid.org/0000-0001-5319-5508"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhattacharyya, Pushpak","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.712479,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":82,"max":86},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9881,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/marathi","display_name":"Marathi","score":0.5979571},{"id":"https://openalex.org/keywords/language-translation","display_name":"Language translation","score":0.4991398},{"id":"https://openalex.org/keywords/speech-translation","display_name":"Speech translation","score":0.44760767}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7513981},{"id":"https://openalex.org/C519982507","wikidata":"https://www.wikidata.org/wiki/Q1568","display_name":"Hindi","level":2,"score":0.74747807},{"id":"https://openalex.org/C2776844415","wikidata":"https://www.wikidata.org/wiki/Q1571","display_name":"Marathi","level":2,"score":0.5979571},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59716815},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5918472},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5571889},{"id":"https://openalex.org/C2986862884","wikidata":"https://www.wikidata.org/wiki/Q7553","display_name":"Language translation","level":3,"score":0.4991398},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.47998902},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.45441824},{"id":"https://openalex.org/C2780366754","wikidata":"https://www.wikidata.org/wiki/Q7494857","display_name":"Speech translation","level":3,"score":0.44760767},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.42683923},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.41376907},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.35466594},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.15247217},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.13461971},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0749284},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C136264566","wikidata":"https://www.wikidata.org/wiki/Q159810","display_name":"Economy","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.12518","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.12518","pdf_url":"http://arxiv.org/pdf/2305.12518","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.12518","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.12518","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.7,"display_name":"Quality education","id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W637185019","https://openalex.org/W4386103000","https://openalex.org/W4321480256","https://openalex.org/W4309803833","https://openalex.org/W3119657211","https://openalex.org/W2913221509","https://openalex.org/W2789013119","https://openalex.org/W2784413230","https://openalex.org/W2607310639","https://openalex.org/W2336638260"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,74,96],"present":[4],"our":[5,140,213],"deployment-ready":[6],"Speech-to-Speech":[7],"Machine":[8,33,78],"Translation":[9,34,79],"(SSMT)":[10],"system":[11,23,59,141],"for":[12,113,122],"English-Hindi,":[13],"English-Marathi,":[14],"and":[15,36,49,52,90,126,129,197,200,215],"Hindi-Marathi":[16],"language":[17],"pairs.":[18],"We":[19,41,203],"develop":[20,97],"the":[21,43,47,53,57,67,71,115,119,124,130,148,160,173,178,187,206],"SSMT":[22,58,125,214],"by":[24],"cascading":[25],"Automatic":[26],"Speech":[27],"Recognition":[28],"(ASR),":[29],"Disfluency":[30],"Correction":[31],"(DC),":[32],"(MT),":[35],"Text-to-Speech":[37],"Synthesis":[38],"(TTS)":[39],"models.":[40],"discuss":[42],"challenges":[44],"faced":[45],"during":[46],"research":[48],"development":[50],"stage":[51],"scalable":[54],"deployment":[55],"of":[56,70,139,145,150,163,172,175,180,189],"as":[60,183],"a":[61,76,98,109,169],"publicly":[62,136],"accessible":[63],"web":[64],"service.":[65],"On":[66],"MT":[68],"part":[69],"pipeline":[72],"too,":[73],"create":[75],"Text-to-Text":[77],"(TTMT)":[80],"service":[81],"in":[82,147,220],"all":[83],"six":[84],"translation":[85,188],"directions":[86],"involving":[87],"English,":[88],"Hindi,":[89],"Marathi.":[91],"To":[92],"mitigate":[93],"data":[94,120],"scarcity,":[95],"LaBSE-based":[99],"corpus":[100,112],"filtering":[101],"tool":[102],"to":[103],"select":[104],"high-quality":[105],"parallel":[106],"sentences":[107],"from":[108,209],"noisy":[110],"pseudo-parallel":[111],"training":[114,123],"TTMT":[116,127,216],"system.":[117],"All":[118],"used":[121],"systems":[128,217],"best":[131],"models":[132],"are":[133,142],"being":[134],"made":[135],"available.":[137],"Users":[138],"(a)":[143],"Govt.":[144],"India":[146],"context":[149],"its":[151],"new":[152],"education":[153],"policy":[154],"(NEP),":[155],"(b)":[156],"tourists":[157],"who":[158,194],"criss-cross":[159],"multilingual":[161],"landscape":[162],"India,":[164],"(c)":[165],"Indian":[166],"Judiciary":[167],"where":[168],"leading":[170],"cause":[171],"pendency":[174],"cases":[176],"(to":[177],"order":[179],"10":[181],"million":[182],"on":[184],"date)":[185],"is":[186],"case":[190],"papers,":[191],"(d)":[192],"farmers":[193],"need":[195],"weather":[196],"price":[198],"information":[199],"so":[201],"on.":[202],"also":[204],"share":[205],"feedback":[207],"received":[208],"various":[210],"stakeholders":[211],"when":[212],"were":[218],"demonstrated":[219],"large":[221],"public":[222],"events.":[223]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4377864448","counts_by_year":[{"year":2024,"cited_by_count":3}],"updated_date":"2025-03-23T16:28:07.859168","created_date":"2023-05-24"}