% Conference paper in the MICCAI 2024 proceedings (Lecture Notes in Computer Science).
% Names are stored in "Last, First" form so multi-part given names parse unambiguously;
% the DOI is stored bare (no LaTeX escaping, no resolver prefix).
@inproceedings{b9454ca1a71d46f3a78b85b6050eef18,
  author    = {Chen, Yaxiong and Wei, Minghong and Zheng, Zixuan and Hu, Jingliang and Shi, Yilei and Xiong, Shengwu and Zhu, Xiao Xiang and Mou, Lichao},
  title     = {{CausalCLIPSeg}: Unlocking {CLIP}{\textquoteright}s Potential in Referring Medical Image Segmentation with Causal Intervention},
  booktitle = {Medical Image Computing and Computer Assisted Intervention - MICCAI 2024 - 27th International Conference, Proceedings},
  editor    = {Linguraru, Marius George and Feragen, Aasa and Glocker, Ben and Schnabel, Julia A. and Dou, Qi and Giannarou, Stamatia and Lekadir, Karim},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  pages     = {76--87},
  year      = {2024},
  doi       = {10.1007/978-3-031-72384-1_8},
  isbn      = {9783031723834},
  language  = {English},
  keywords  = {causal intervention, CLIP, cross-modal decoding, referring medical image segmentation},
  abstract  = {Referring medical image segmentation targets delineating lesions indicated by textual descriptions. Aligning visual and textual cues is challenging due to their distinct data properties. Inspired by large-scale pre-trained vision-language models, we propose CausalCLIPSeg, an end-to-end framework for referring medical image segmentation that leverages CLIP. Despite not being trained on medical data, we enforce CLIP{\textquoteright}s rich semantic space onto the medical domain by a tailored cross-modal decoding method to achieve text-to-pixel alignment. Furthermore, to mitigate confounding bias that may cause the model to learn spurious correlations instead of meaningful causal relationships, CausalCLIPSeg introduces a causal intervention module which self-annotates confounders and excavates causal features from inputs for segmentation judgments. We also devise an adversarial min-max game to optimize causal features while penalizing confounding ones. Extensive experiments demonstrate the state-of-the-art performance of our proposed method. Code is available at https://github.com/WUTCM-Lab/CausalCLIPSeg.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.; 27th International Conference on Medical Image Computing and Computer-Assisted Intervention, MICCAI 2024 ; Conference date: 06-10-2024 Through 10-10-2024},
}