@inproceedings{958072166ec4471381e61a7ec6cb825b,
title = "CancerUniT: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of CT Scans",
abstract = "Human readers or radiologists routinely perform full-body multi-organ multi-disease detection and diagnosis in clinical practice, while most medical AI systems are built to focus on single organs with a narrow list of a few diseases. This might severely limit AI's clinical adoption. A certain number of AI models need to be assembled nontrivially to match the diagnostic process of a human reading a CT scan. In this paper, we construct a Unified Tumor Transformer (CancerUniT) model to jointly detect tumor existence & location and diagnose tumor characteristics for eight major cancers in CT scans. CancerUniT is a query-based Mask Transformer model with the output of multi-tumor prediction. We decouple the object queries into organ queries, tumor detection queries and tumor diagnosis queries, and further establish hierarchical relationships among the three groups. This clinically-inspired architecture effectively assists inter- and intra-organ representation learning of tumors and facilitates the resolution of these complex, anatomically related multi-organ cancer image reading tasks. CancerUniT is trained end-to-end using a curated large-scale CT images of 10,042 patients including eight major types of cancers and occurring non-cancer tumors (all are pathology-confirmed with 3D tumor masks annotated by radiologists). On the test set of 631 patients, CancerUniT has demonstrated strong performance under a set of clinically relevant evaluation metrics, substantially outperforming both multi-disease methods and an assembly of eight single-organ expert models in tumor detection, segmentation, and diagnosis. This moves one step closer towards a universal high performance cancer screening tool.",
author = "Jieneng Chen and Yingda Xia and Jiawen Yao and Ke Yan and Jianpeng Zhang and Le Lu and Fakai Wang and Bo Zhou and Mingyan Qiu and Qihang Yu and Mingze Yuan and Wei Fang and Yuxing Tang and Minfeng Xu and Jian Zhou and Yuqian Zhao and Qifeng Wang and Xianghua Ye and Xiaoli Yin and Yu Shi and Xin Chen and Jingren Zhou and Alan Yuille and Zaiyi Liu and Ling Zhang",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 2023 IEEE/CVF International Conference on Computer Vision, ICCV 2023 ; Conference date: 02-10-2023 Through 06-10-2023",
year = "2023",
doi = "10.1109/ICCV51070.2023.01950",
language = "English (US)",
series = "Proceedings of the IEEE International Conference on Computer Vision",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "21270--21281",
booktitle = "Proceedings - 2023 IEEE/CVF International Conference on Computer Vision, ICCV 2023",
address = "United States",
}