{"id":"https://openalex.org/W4379538797","doi":"https://doi.org/10.48550/arxiv.2306.02105","title":"Advancing African-Accented Speech Recognition: Epistemic Uncertainty-Driven Data Selection for Generalizable ASR Models","display_name":"Advancing African-Accented Speech Recognition: Epistemic Uncertainty-Driven Data Selection for Generalizable ASR Models","publication_year":2023,"publication_date":"2023-06-03","ids":{"openalex":"https://openalex.org/W4379538797","doi":"https://doi.org/10.48550/arxiv.2306.02105"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.02105","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.02105","pdf_url":"https://arxiv.org/pdf/2306.02105","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.02105","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058219704","display_name":"Bonaventure F. P. Dossou","orcid":"https://orcid.org/0000-0002-0519-1761"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dossou, Bonaventure F. P.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5058219704"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.69774329662323},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.674177885055542},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6479442119598389},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6460272073745728},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6102538704872131},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5861479043960571},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.538421094417572},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5071804523468018},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4989748001098633},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.49876832962036133},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.48911362886428833},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.47633248567581177},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.45822346210479736},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4393080472946167},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4167991876602173},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09624534845352173},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.09366217255592346},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.08050587773323059}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.69774329662323},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.674177885055542},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6479442119598389},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6460272073745728},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6102538704872131},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5861479043960571},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.538421094417572},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5071804523468018},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4989748001098633},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.49876832962036133},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48911362886428833},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.47633248567581177},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.45822346210479736},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4393080472946167},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4167991876602173},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09624534845352173},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09366217255592346},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08050587773323059},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C505870484","wikidata":"https://www.wikidata.org/wiki/Q180538","display_name":"Fishery","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.02105","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.02105","pdf_url":"https://arxiv.org/pdf/2306.02105","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.02105","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.02105","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.02105","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.02105","pdf_url":"https://arxiv.org/pdf/2306.02105","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.75,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4379538797.pdf","grobid_xml":"https://content.openalex.org/works/W4379538797.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2130553454","https://openalex.org/W3022007134","https://openalex.org/W4317548404","https://openalex.org/W2087783760","https://openalex.org/W3104108945","https://openalex.org/W2033364610","https://openalex.org/W3163689946","https://openalex.org/W2797776314","https://openalex.org/W2153927146","https://openalex.org/W2091066410"],"abstract_inverted_index":{"Accents":[0],"play":[1],"a":[2,41,68,111,142],"pivotal":[3],"role":[4],"in":[5,28,176],"shaping":[6],"human":[7,55,88],"communication,":[8],"enhancing":[9,106],"our":[10,124,138],"ability":[11],"to":[12,40,50,77,103,115,119,141],"convey":[13],"and":[14,19,52,62,87,96,130],"comprehend":[15],"messages":[16],"with":[17],"clarity":[18],"cultural":[20],"nuance.":[21],"While":[22],"there":[23],"has":[24,36],"been":[25,37],"significant":[26],"progress":[27],"Automatic":[29],"Speech":[30],"Recognition":[31],"(ASR),":[32],"African-accented":[33],"English":[34],"ASR":[35,174],"understudied":[38],"due":[39],"lack":[42],"of":[43,179],"training":[44,107],"datasets,":[45,129],"which":[46],"are":[47],"often":[48],"expensive":[49],"create":[51],"demand":[53],"colossal":[54],"labor.":[56,89],"Combining":[57],"several":[58,127],"active":[59],"learning":[60],"paradigms":[61],"the":[63,79,84,177,185],"core-set":[64],"approach,":[65],"we":[66],"propose":[67],"new":[69,112],"multi-rounds":[70],"adaptation":[71,118],"process":[72],"that":[73,137],"uses":[74],"epistemic":[75],"uncertainty":[76],"automate":[78],"annotation":[80,95],"process,":[81],"significantly":[82],"reducing":[83],"associated":[85],"costs":[86],"This":[90],"novel":[91],"method":[92],"streamlines":[93],"data":[94,99,154],"strategically":[97],"selects":[98],"samples":[100],"contributing":[101],"most":[102],"model":[104,117],"uncertainty,":[105],"efficiency.":[108],"We":[109,122,183],"define":[110],"U-WER":[113],"metric":[114],"track":[116],"hard":[120],"accents.":[121],"evaluate":[123],"approach":[125,139,159],"across":[126],"domains,":[128],"high-performing":[131],"speech":[132],"models.":[133],"Our":[134,158],"results":[135],"show":[136],"leads":[140],"27\\%":[143],"WER":[144],"relative":[145],"average":[146,151],"improvement":[147],"while":[148],"requiring":[149],"on":[150],"45\\%":[152],"less":[153],"than":[155],"established":[156],"baselines.":[157],"also":[160],"improves":[161],"out-of-distribution":[162],"generalization":[163],"for":[164,171],"very":[165],"low-resource":[166],"accents,":[167],"demonstrating":[168],"its":[169],"viability":[170],"building":[172],"generalizable":[173],"models":[175],"context":[178],"accented":[180],"African":[181],"ASR.":[182],"open-source":[184],"code":[186],"here:":[187],"https://github.com/bonaventuredossou/active_learning_african_asr.":[188]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2023-06-07T00:00:00"}
