{"id":"https://openalex.org/W4390493540","doi":"https://doi.org/10.1109/snams60348.2023.10375468","title":"Breaking Barriers: Can Multilingual Foundation Models Bridge the Gap in Cross-Language Speech Emotion Recognition?","display_name":"Breaking Barriers: Can Multilingual Foundation Models Bridge the Gap in Cross-Language Speech Emotion Recognition?","publication_year":2023,"publication_date":"2023-11-21","ids":{"openalex":"https://openalex.org/W4390493540","doi":"https://doi.org/10.1109/snams60348.2023.10375468"},"language":"en","primary_location":{"id":"doi:10.1109/snams60348.2023.10375468","is_oa":false,"landing_page_url":"https://doi.org/10.1109/snams60348.2023.10375468","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077782202","display_name":"Moazzam Shoukat","orcid":"https://orcid.org/0009-0005-6497-2823"},"institutions":[{"id":"https://openalex.org/I2800666866","display_name":"Government of Pakistan","ror":"https://ror.org/00pnp4y96","country_code":"PK","type":"government","lineage":["https://openalex.org/I2800666866"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Moazzam Shoukat","raw_affiliation_strings":["EmulationAI,Pakistan","EmulationAI, Pakistan"],"affiliations":[{"raw_affiliation_string":"EmulationAI,Pakistan","institution_ids":["https://openalex.org/I2800666866"]},{"raw_affiliation_string":"EmulationAI, Pakistan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086703267","display_name":"Muhammad Usama","orcid":"https://orcid.org/0000-0001-5015-8605"},"institutions":[{"id":"https://openalex.org/I201384688","display_name":"National University of Computer and Emerging Sciences","ror":"https://ror.org/003eyb898","country_code":"PK","type":"education","lineage":["https://openalex.org/I201384688"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Usama","raw_affiliation_strings":["National University of Computer &#x0026; Emerging Sciences,Faisalabad,Pakistan"],"affiliations":[{"raw_affiliation_string":"National University of Computer &#x0026; Emerging Sciences,Faisalabad,Pakistan","institution_ids":["https://openalex.org/I201384688"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066120242","display_name":"Hafiz Shehbaz Ali","orcid":null},"institutions":[{"id":"https://openalex.org/I2800666866","display_name":"Government of Pakistan","ror":"https://ror.org/00pnp4y96","country_code":"PK","type":"government","lineage":["https://openalex.org/I2800666866"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Hafiz Shehbaz Ali","raw_affiliation_strings":["EmulationAI,Pakistan","EmulationAI, Pakistan"],"affiliations":[{"raw_affiliation_string":"EmulationAI,Pakistan","institution_ids":["https://openalex.org/I2800666866"]},{"raw_affiliation_string":"EmulationAI, Pakistan","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047197696","display_name":"Siddique Latif","orcid":"https://orcid.org/0000-0001-5662-4777"},"institutions":[{"id":"https://openalex.org/I160993911","display_name":"Queensland University of Technology","ror":"https://ror.org/03pnv4752","country_code":"AU","type":"education","lineage":["https://openalex.org/I160993911"]},{"id":"https://openalex.org/I185523456","display_name":"University of Southern Queensland","ror":"https://ror.org/04sjbnx57","country_code":"AU","type":"education","lineage":["https://openalex.org/I185523456"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Siddique Latif","raw_affiliation_strings":["University of Southern Queensland (UniSQ) Queensland University of Technology (QUT),Australia","University of Southern Queensland (UniSQ) Queensland University of Technology (QUT), Australia"],"affiliations":[{"raw_affiliation_string":"University of Southern Queensland (UniSQ) Queensland University of Technology (QUT),Australia","institution_ids":["https://openalex.org/I160993911","https://openalex.org/I185523456"]},{"raw_affiliation_string":"University of Southern Queensland (UniSQ) Queensland University of Technology (QUT), Australia","institution_ids":["https://openalex.org/I185523456","https://openalex.org/I160993911"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5077782202"],"corresponding_institution_ids":["https://openalex.org/I2800666866"],"apc_list":null,"apc_paid":null,"fwci":0.262,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.62786337,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8132662177085876},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.711675763130188},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.6778717041015625},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6217241287231445},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5221574306488037},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5212507843971252},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4962802529335022},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3251107335090637}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8132662177085876},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.711675763130188},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.6778717041015625},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6217241287231445},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5221574306488037},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5212507843971252},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4962802529335022},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3251107335090637},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/snams60348.2023.10375468","is_oa":false,"landing_page_url":"https://doi.org/10.1109/snams60348.2023.10375468","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8399999737739563,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W175750906","https://openalex.org/W2074788634","https://openalex.org/W2146334809","https://openalex.org/W2465534249","https://openalex.org/W2762715843","https://openalex.org/W2771976988","https://openalex.org/W2904938641","https://openalex.org/W2905903577","https://openalex.org/W2924116307","https://openalex.org/W2936372954","https://openalex.org/W2962770129","https://openalex.org/W2963686995","https://openalex.org/W2964010806","https://openalex.org/W2969889150","https://openalex.org/W2972640480","https://openalex.org/W2995813704","https://openalex.org/W3004319605","https://openalex.org/W3036601975","https://openalex.org/W3038105747","https://openalex.org/W3043910663","https://openalex.org/W3095334805","https://openalex.org/W3095666234","https://openalex.org/W3096109555","https://openalex.org/W3097341095","https://openalex.org/W3098571047","https://openalex.org/W3133702157","https://openalex.org/W3152893301","https://openalex.org/W3168867926","https://openalex.org/W3179560930","https://openalex.org/W3198429080","https://openalex.org/W3198791972","https://openalex.org/W3199964822","https://openalex.org/W4214825215","https://openalex.org/W4220725970","https://openalex.org/W4221089191","https://openalex.org/W4221122497","https://openalex.org/W4224917001","https://openalex.org/W4225635674","https://openalex.org/W4232282348","https://openalex.org/W4285393783","https://openalex.org/W4286640379","https://openalex.org/W4288391270","https://openalex.org/W4288408927","https://openalex.org/W4292779060","https://openalex.org/W4293661603","https://openalex.org/W4297841899","https://openalex.org/W4309134503","https://openalex.org/W4312327819","https://openalex.org/W4317380951","https://openalex.org/W4323569712","https://openalex.org/W4353114117","https://openalex.org/W4361994820","https://openalex.org/W4378105483","https://openalex.org/W4384268405","https://openalex.org/W4386185396","https://openalex.org/W4390874621","https://openalex.org/W4404658388","https://openalex.org/W6617505242","https://openalex.org/W6719667659","https://openalex.org/W6744702808","https://openalex.org/W6755541679","https://openalex.org/W6760937267","https://openalex.org/W6778883912","https://openalex.org/W6779919476","https://openalex.org/W6780218876","https://openalex.org/W6796581206","https://openalex.org/W6846726371","https://openalex.org/W6847363464","https://openalex.org/W6850462617","https://openalex.org/W6850957775","https://openalex.org/W6852909395","https://openalex.org/W6853389878","https://openalex.org/W6854299349","https://openalex.org/W6856168926","https://openalex.org/W6945962177"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2381393187","https://openalex.org/W2121910908"],"abstract_inverted_index":{"Speech":[0],"emotion":[1,96,116],"recognition":[2],"(SER)":[3],"faces":[4],"challenges":[5],"in":[6,12,79,111],"cross-language":[7,80,89],"scenarios":[8],"due":[9],"to":[10,44,75],"differences":[11],"linguistic":[13,166],"and":[14,73,125,146],"cultural":[15],"expression":[16],"of":[17,67],"emotions":[18],"across":[19,168],"languages.":[20],"Recently,":[21],"large":[22],"multilingual":[23,58],"foundation":[24,68,103,157],"models":[25,69,136,158],"pre-trained":[26],"on":[27,33,87,149],"massive":[28],"corpora":[29],"have":[30],"achieved":[31],"performance":[32,86,148],"natural":[34],"language":[35],"understanding":[36],"tasks":[37],"by":[38],"learning":[39,114],"cross-lingual":[40,112,133],"representations.":[41],"Their":[42],"ability":[43],"understand":[45],"relationships":[46],"between":[47],"languages":[48,94,169],"without":[49],"direct":[50],"translation":[51],"opens":[52],"up":[53],"possibilities":[54],"for":[55,95,115,131,164,170],"more":[56],"applicable":[57],"models.":[59],"In":[60],"this":[61],"paper,":[62],"we":[63,83],"evaluate":[64],"the":[65,77,102],"capabilities":[66],"(Wav2Vec2,":[70],"XLSR,":[71],"Whisper":[72],"MMS)":[74],"bridge":[76],"gap":[78],"SER.":[81,171],"Specifically,":[82],"analyse":[84],"their":[85,109],"benchmark":[88],"SER":[90],"datasets":[91],"involving":[92],"four":[93],"classification.":[97],"Our":[98,152],"experiments":[99],"show":[100],"that":[101,155],"model":[104],"outperforms":[105],"CNN-LSTM":[106],"baselines,":[107],"establishing":[108],"superiority":[110],"transfer":[113],"recognition.":[117],"However,":[118],"self-supervised":[119],"pre-training":[120,161],"plays":[121],"a":[122],"key":[123],"role,":[124],"inductive":[126],"biases":[127],"alone":[128],"are":[129],"insufficient":[130],"high":[132],"generalisability.":[134],"Foundation":[135],"also":[137],"demonstrate":[138],"gains":[139],"over":[140],"baselines":[141],"with":[142],"limited":[143],"target":[144],"data":[145],"better":[147],"noisy":[150],"data.":[151],"findings":[153],"indicate":[154],"while":[156],"hold":[159],"promise,":[160],"remains":[162],"vital":[163],"handling":[165],"variations":[167]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
