% Conference paper (ICIP 2024) proposing the R3DM-ViT model; see the abstract field.
% Title is stored in Title Case with {3-D}/{2-D} brace-protected so that
% sentence-casing styles do not lowercase them.
% NOTE(review): address holds a country rather than the publisher's city,
% presumably carried over from the export -- confirm and replace.
@inproceedings{4cfe1a9a73f34f468a74c4e1b2a937ee,
  author    = {Owais, Muhammad and Zubair, Muhammad and Hassan, Taimur and Velayudhan, Divya and Hussain, Irfan and Werghi, Naoufel},
  title     = {Recurrent {3-D} Multi-Level Visual Transformer for Joint Classification of Heterogeneous {2-D} and {3-D} Radiographic Data},
  booktitle = {2024 {IEEE} International Conference on Image Processing, {ICIP} 2024 - Proceedings},
  series    = {Proceedings - International Conference on Image Processing, {ICIP}},
  publisher = {IEEE Computer Society},
  address   = {United States},
  pages     = {3205--3211},
  year      = {2024},
  doi       = {10.1109/ICIP51287.2024.10647131},
  keywords  = {CBMIR, Computer-aided diagnosis, lung infection, Medical image retrieval, R3DM-ViT},
  language  = {British English},
  note      = {Publisher Copyright: {\textcopyright} 2024 IEEE; 31st IEEE International Conference on Image Processing, ICIP 2024; Conference date: 27-10-2024 through 30-10-2024},
  abstract  = {Recent advancements in artificial intelligence algorithms for medical imaging show significant potential in automating the detection of lung infections from chest radiograph scans. However, current approaches often focus solely on either 2-D or 3-D scans, failing to leverage the combined advantages of both modalities. Moreover, conventional slice-based methods place a manual burden on radiologists for slice selection. To overcome these challenges, we propose the Recurrent 3-D Multi-level Vision Transformer (R3DM-ViT) model, capable of handling multimodal data to enhance diagnostic accuracy. Our quantitative evaluations demonstrate that R3DM-ViT surpasses existing methods, achieving an impressive accuracy of 96.67\%, F1-score of 96.88\%, mean average precision of 96.75\%, and mean average recall of 97.02\%. This research signifies a significant stride forward in the automated detection of lung infections through multimodal imaging.},
}