{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T00:47:56Z","timestamp":1774658876131,"version":"3.50.1"},"reference-count":211,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/linproxy.fan.workers.dev:443\/https\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Open J. Commun. Soc."],"published-print":{"date-parts":[[2025]]},"DOI":"10.1109\/ojcoms.2025.3554537","type":"journal-article","created":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T03:05:20Z","timestamp":1743044720000},"page":"2510-2538","source":"Crossref","is-referenced-by-count":19,"title":["Survey of Multimodal Federated Learning: Exploring Data Integration, Challenges, and Future Directions"],"prefix":"10.1109","volume":"6","author":[{"ORCID":"https:\/\/linproxy.fan.workers.dev:443\/https\/orcid.org\/0009-0002-3492-0318","authenticated-orcid":false,"given":"Mumin","family":"Adam","sequence":"first","affiliation":[{"name":"Department of Computer Engineering, King Fahd University of Petroleum and Minerals, Dhahran, Saudi Arabia"}]},{"ORCID":"https:\/\/linproxy.fan.workers.dev:443\/https\/orcid.org\/0000-0002-6886-6500","authenticated-orcid":false,"given":"Abdullatif","family":"Albaseer","sequence":"additional","affiliation":[{"name":"Division of Information and Computing Technology, College of Science and Engineering, Hamad Bin Khalifa University, Doha, Qatar"}]},{"ORCID":"https:\/\/linproxy.fan.workers.dev:443\/https\/orcid.org\/0000-0002-1507-5713","authenticated-orcid":false,"given":"Uthman","family":"Baroudi","sequence":"additional","affiliation":[{"name":"Department of Computer Engineering, King Fahd University of Petroleum and Minerals, Dhahran, Saudi Arabia"}]},{"ORCID":"https:\/\/linproxy.fan.workers.dev:443\/https\/orcid.org\/0000-0002-3261-7588","authenticated-orcid":false,"given":"Mohamed","family":"Abdallah","sequence":"additional","affiliation":[{"name":"Division of Information and Computing Technology, College of Science and Engineering, Hamad Bin Khalifa University, Doha, Qatar"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00965"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3447993.3483276"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3384419.3430776"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s12193-021-00382-y"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3390\/s21062212"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2798607"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2017.2738401"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2916887"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/1978942.1978945"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1561\/0600000105"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2020.06.013"},{"key":"ref12","first-page":"1273","article-title":"Communication-efficient learning of deep networks from decentralized data","volume-title":"Proc. Artif. Intell. Stat.","author":"McMahan"},{"key":"ref13","article-title":"Differentially private federated learning: A client level perspective","author":"Geyer","year":"2017","journal-title":"arXiv:1712.07557"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00982"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3382709"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2022.01.063"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2021.3100805"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2020.2975749"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TNSM.2023.3270168"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2024.3506214"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2020.10.007"},{"key":"ref22","first-page":"19","article-title":"Oort: Efficient federated learning via guided participant selection","volume-title":"Proc. 15th USENIX Symp. Oper. Syst. Design Implement.","author":"Lai"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2020.3036952"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3495243.3517017"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3214234"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3299573"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01271"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3570361.3592517"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/NaNA63151.2024.00030"},{"key":"ref30","article-title":"Communication-efficient multimodal federated learning: Joint modality and client selection","author":"Yuan","year":"2024","journal-title":"arXiv:2401.16685"},{"key":"ref31","article-title":"A survey of resource-efficient LLM and multimodal foundation models","author":"Xu","year":"2024","journal-title":"arXiv:2401.08092"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3570361.3592505"},{"key":"ref33","first-page":"456","article-title":"Reducing communication overhead in federated learning for pre-trained language models using parameter-efficient finetuning","volume-title":"Proc. Conf. Lifelong Learn. Agents","author":"Malaviya"},{"key":"ref34","article-title":"Multimodal federated learning via contrastive representation ensemble","author":"Yu","year":"2023","journal-title":"arXiv:2302.08888"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i10.29007"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2024.107017"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3131614"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/s11633-022-1398-0"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.3390\/s23156986"},{"key":"ref40","article-title":"Multimodal federated learning in healthcare: A review","author":"Thrasher","year":"2023","journal-title":"arXiv:2310.09650"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2024.102576"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/s00530-024-01422-9"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2017.2735539"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2017.2683200"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.3390\/s22197433"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2696365"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.12691\/acis-3-1-3"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcmg.2019.06.009"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.3390\/s23020828"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.ajpc.2022.100379"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.3390\/electronics12071558"},{"key":"ref52","article-title":"Cross-domain federated learning in medical imaging","author":"Parekh","year":"2021","journal-title":"arXiv:2112.10001"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599825"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-020-0495-6"},{"key":"ref55","article-title":"Federated learning: Strategies for improving communication efficiency","author":"Kone\u010dn\u00fd","year":"2016","journal-title":"arXiv:1610.05492"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/VTC2024-Fall63153.2024.10757873"},{"key":"ref57","article-title":"Personalized federated learning: A meta-learning approach","author":"Fallah","year":"2020","journal-title":"arXiv:2002.07948"},{"key":"ref58","article-title":"FedBN: Federated learning on non-IID features via local batch normalization","author":"Li","year":"2021","journal-title":"arXiv:2102.07623"},{"key":"ref59","first-page":"11058","article-title":"Multi-level branched regularization for federated learning","volume-title":"Proc. Int. Conf. Mach. Lear.","author":"Kim"},{"key":"ref60","article-title":"Overcoming forgetting in federated learning on non-IID data","author":"Shoham","year":"2019","journal-title":"arXiv:1910.07796"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"key":"ref62","first-page":"5132","article-title":"SCAFFOLD: Stochastic controlled averaging for federated learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Karimireddy"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01057"},{"key":"ref64","article-title":"Device heterogeneity in federated learning: A superquantile approach","author":"Laguel","year":"2020","journal-title":"arXiv:2002.11223"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01565"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01173"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2024.3427349"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/IPCCC51483.2021.9679416"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00985"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1016\/j.jnca.2018.05.003"},{"key":"ref71","article-title":"Federated learning with personalization layers","author":"Arivazhagan","year":"2019","journal-title":"arXiv:1912.00818"},{"key":"ref72","article-title":"Federated user representation learning","author":"Bui","year":"2019","journal-title":"arXiv:1909.12535"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/SRDS51746.2020.00017"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/IOTM.001.2300054"},{"key":"ref75","first-page":"1","article-title":"Federated multi-task learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"30","author":"Smith"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM46510.2021.9685938"},{"issue":"10","key":"ref77","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3663364","article-title":"Foundations & trends in multimodal machine learning: Principles, challenges, and open questions","volume":"56","author":"Liang","year":"2024","journal-title":"ACM Comput. Surv."},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1016\/j.ymeth.2022.03.005"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4419-1428-6_239"},{"key":"ref80","article-title":"UNIMO: Towards unified-modal understanding and generation via cross-modal contrastive learning","author":"Li","year":"2020","journal-title":"arXiv:2012.15409"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1038\/s41746-022-00712-8"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3243854"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1045"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/VTC2024-Spring62846.2024.10683376"},{"key":"ref86","article-title":"FedCLIP: Fast generalization and personalization for clip in federated learning","author":"Lu","year":"2023","journal-title":"arXiv:2302.13485"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1145\/3510033"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72633-0_13"},{"key":"ref89","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018","journal-title":"arXiv:1810.04805"},{"key":"ref90","article-title":"BART: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension","author":"Lewis","year":"2019","journal-title":"arXiv:1910.13461"},{"key":"ref91","volume-title":"Improving language understanding by generative pre-training","author":"Radford","year":"2018"},{"key":"ref92","article-title":"Longformer: The long-document transformer","author":"Beltagy","year":"2020","journal-title":"arXiv:2004.05150"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1285"},{"key":"ref94","first-page":"5753","article-title":"XLNet: Generalized autoregressive pretraining for language understanding","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"32","author":"Yang"},{"key":"ref95","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref96","first-page":"10347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Touvron"},{"key":"ref97","article-title":"Toward transformer-based object detection","author":"Beal","year":"2020","journal-title":"arXiv:2012.09958"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00950"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"ref101","article-title":"BEiT: BERT pre-training of image transformers","author":"Bao","year":"2021","journal-title":"arXiv:2106.08254"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2105.07581"},{"key":"ref103","first-page":"12116","article-title":"Do vision transformers see like convolutional neural networks?","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"34","author":"Raghu"},{"key":"ref104","article-title":"How to understand masked autoencoders","author":"Cao","year":"2022","journal-title":"arXiv:2202.03670"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00460"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2023.3269062"},{"key":"ref107","article-title":"On the importance and applicability of pre-training for federated learning","author":"Chen","year":"2022","journal-title":"arXiv:2206.11488"},{"key":"ref108","article-title":"Where to begin? On the impact of pre-training and initialization in federated learning","author":"Nguyen","year":"2022","journal-title":"arXiv:2206.15387"},{"key":"ref109","article-title":"Conquering the communication constraints to enable large pre-trained models in federated learning","author":"Sun","year":"2022","journal-title":"arXiv:2210.01708"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00756"},{"key":"ref111","first-page":"1","article-title":"ViLBERT: Pretraining task-agnostic visiolinguistic representations for vision-and-language tasks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"32","author":"Lu"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1514"},{"key":"ref113","article-title":"VisualBERT: A simple and performant baseline for vision and language","author":"Li","year":"2019","journal-title":"arXiv:1908.03557"},{"key":"ref114","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Radford"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19818-2_42"},{"key":"ref116","first-page":"4904","article-title":"Scaling up visual and vision-language representation learning with noisy text supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Jia"},{"key":"ref117","article-title":"CoCa: Contrastive captioners are image-text foundation models","author":"Yu","year":"2022","journal-title":"arXiv:2205.01917"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3275156"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2022.3197815"},{"key":"ref120","article-title":"Resource-efficient federated multimodal learning via layer-wise and progressive training","author":"Tun","year":"2024","journal-title":"arXiv:2407.15426"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1145\/3666025.3699360"},{"key":"ref122","article-title":"FIARSE: Model-heterogeneous federated learning via importance-aware submodel extraction","author":"Wu","year":"2024","journal-title":"arXiv:2407.19389"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2944481"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/TCE.2024.3352432"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3186960"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3508030"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1109\/ICCWAMTIP53232.2021.9674116"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2023.101890"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1145\/3581791.3596844"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.1109\/IoTDI54339.2022.00011"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1145\/3657291"},{"key":"ref132","article-title":"FedMEKT: Distillation-based embedding knowledge transfer for multimodal federated learning","author":"Le","year":"2023","journal-title":"arXiv:2307.13214"},{"key":"ref133","article-title":"Think locally, act globally: Federated learning with local and global representations","author":"Liang","year":"2020","journal-title":"arXiv:2001.01523"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3367412"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i2.27909"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1109\/ICC51166.2024.10622194"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2023.3340994"},{"key":"ref138","doi-asserted-by":"publisher","DOI":"10.1016\/j.compmedimag.2024.102342"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.1145\/3404835.3462989"},{"key":"ref140","doi-asserted-by":"publisher","DOI":"10.1109\/OJCS.2022.3206407"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2023.3339522"},{"key":"ref142","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuroimage.2011.09.069"},{"key":"ref143","article-title":"Multimodal fusion on low-quality data: A comprehensive survey","author":"Zhang","year":"2024","journal-title":"arXiv:2404.18947"},{"key":"ref144","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuroimage.2014.01.033"},{"key":"ref145","article-title":"UNIXGEN: A unified vision-language model for multi-view chest X-ray generation and report generation","volume-title":"arXiv:2302.12172","author":"Lee","year":"2023"},{"key":"ref146","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3037734"},{"key":"ref147","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2022.04.019"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219963"},{"key":"ref149","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403182"},{"key":"ref150","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.2019.1632079"},{"key":"ref151","doi-asserted-by":"publisher","DOI":"10.1145\/3543848"},{"key":"ref152","doi-asserted-by":"publisher","DOI":"10.3390\/s19091988"},{"key":"ref153","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3286935"},{"key":"ref154","doi-asserted-by":"publisher","DOI":"10.1007\/11608288_66"},{"key":"ref155","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-013-1391-2"},{"key":"ref156","first-page":"2764","article-title":"WSABIE: Scaling up to large vocabulary image annotation","volume-title":"Proc. 22nd Int. Joint Conf. Artif. Intell.","author":"Weston"},{"key":"ref157","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i3.20213"},{"key":"ref158","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.159"},{"key":"ref159","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.12.003"},{"key":"ref160","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-53092-0_15"},{"key":"ref161","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.107037"},{"key":"ref162","article-title":"Align as ideal: Cross-modal alignment binding for federated medical vision-language pre-training","author":"Shuai","year":"2024","journal-title":"arXiv:2404.03854v2"},{"key":"ref163","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3340109"},{"key":"ref164","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1656"},{"key":"ref165","article-title":"Unimodal training-multimodal prediction: Cross-modal federated learning with hierarchical aggregation","author":"Zhang","year":"2023","journal-title":"arXiv:2303.15486"},{"key":"ref166","doi-asserted-by":"publisher","DOI":"10.1145\/3534678.3539384"},{"key":"ref167","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-023-04133-4"},{"key":"ref168","doi-asserted-by":"publisher","DOI":"10.1109\/PERCOM50583.2021.9439129"},{"key":"ref169","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.721"},{"key":"ref170","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2024.106353"},{"key":"ref171","article-title":"Multi-modal federated learning for cancer staging over non-IID datasets with unbalanced modalities","author":"Borazjani","year":"2024","journal-title":"arXiv:2401.03609"},{"key":"ref172","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6824"},{"key":"ref173","doi-asserted-by":"publisher","DOI":"10.1145\/3543507.3583518"},{"key":"ref174","doi-asserted-by":"publisher","DOI":"10.1126\/science.adk6139"},{"key":"ref175","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.114054"},{"key":"ref176","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejrad.2021.109583"},{"key":"ref177","doi-asserted-by":"publisher","DOI":"10.1145\/3523150.3523166"},{"key":"ref178","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-97-5131-0_21"},{"key":"ref179","doi-asserted-by":"publisher","DOI":"10.1002\/jmri.21049"},{"key":"ref180","doi-asserted-by":"publisher","DOI":"10.1038\/s43018-022-00388-9"},{"key":"ref181","doi-asserted-by":"publisher","DOI":"10.3389\/fbinf.2023.1131021"},{"key":"ref182","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2020.101795"},{"key":"ref183","doi-asserted-by":"publisher","DOI":"10.1038\/nmeth.2956"},{"key":"ref184","article-title":"Identifying the best machine learning algorithms for brain tumor segmentation, progression assessment, and overall survival prediction in the brats challenge","author":"Bakas","year":"2018","journal-title":"arXiv:1811.02629"},{"key":"ref185","article-title":"MELD: A multimodal multi-party dataset for emotion recognition in conversations","author":"Poria","year":"2018","journal-title":"arXiv:1810.02508"},{"key":"ref186","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2014.2336244"},{"key":"ref187","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.12024"},{"key":"ref188","first-page":"1","article-title":"MultiBench: Multiscale benchmarks for multimodal representation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Liang"},{"key":"ref189","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-008-9076-6"},{"key":"ref190","first-page":"3","article-title":"A public domain dataset for human activity recognition using smartphones","volume-title":"Proc. Esann","volume":"3","author":"Anguita"},{"key":"ref191","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2021.02.024"},{"key":"ref192","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01531-2"},{"key":"ref193","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2916873"},{"key":"ref194","first-page":"5315","article-title":"FLamby: Datasets and benchmarks for cross-silo federated learning in realistic healthcare settings","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"35","author":"du Terrail"},{"key":"ref195","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-022-01899-x"},{"key":"ref196","first-page":"2611","article-title":"The hateful memes challenge: Detecting hate speech in multimodal memes","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Kiela"},{"key":"ref197","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v12i1.14983"},{"key":"ref198","volume-title":"The caltech-ucsd birds-200-2011 dataset","author":"Wah"},{"key":"ref199","doi-asserted-by":"publisher","DOI":"10.1109\/ICVGIP.2008.47"},{"key":"ref200","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10599-4_29"},{"key":"ref201","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3225461"},{"key":"ref202","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2020.3009358"},{"key":"ref203","doi-asserted-by":"publisher","DOI":"10.1117\/12.2618904"},{"key":"ref204","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE51399.2021.00023"},{"key":"ref205","doi-asserted-by":"publisher","DOI":"10.1109\/SP.2019.00065"},{"key":"ref206","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2020.2988575"},{"key":"ref207","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3072238"},{"key":"ref208","article-title":"Nonnegative decomposition of multivariate information","author":"Williams","year":"2010","journal-title":"arXiv:1004.2515"},{"key":"ref209","first-page":"10092","article-title":"Parameterized knowledge transfer for personalized federated learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"34","author":"Zhang"},{"key":"ref210","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10228954"},{"key":"ref211","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.016.2300523"}],"container-title":["IEEE Open Journal of the Communications Society"],"original-title":[],"link":[{"URL":"https:\/\/linproxy.fan.workers.dev:443\/http\/xplorestaging.ieee.org\/ielx8\/8782661\/10829557\/10938626.pdf?arnumber=10938626","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,17]],"date-time":"2025-04-17T17:44:58Z","timestamp":1744911898000},"score":1,"resource":{"primary":{"URL":"https:\/\/linproxy.fan.workers.dev:443\/https\/ieeexplore.ieee.org\/document\/10938626\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":211,"URL":"https:\/\/linproxy.fan.workers.dev:443\/https\/doi.org\/10.1109\/ojcoms.2025.3554537","relation":{},"ISSN":["2644-125X"],"issn-type":[{"value":"2644-125X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]}}}