@inproceedings{9733dae86017424b8f325af69c4b64b8,
title = "Patcher: Patch Transformers with Mixture of Experts for Precise Medical Image Segmentation",
abstract = "We present a new encoder-decoder Vision Transformer architecture, Patcher, for medical image segmentation. Unlike standard Vision Transformers, it employs Patcher blocks that segment an image into large patches, each of which is further divided into small patches. Transformers are applied to the small patches within a large patch, which constrains the receptive field of each pixel. We intentionally make the large patches overlap to enhance intra-patch communication. The encoder employs a cascade of Patcher blocks with increasing receptive fields to extract features from local to global levels. This design allows Patcher to benefit from both the coarse-to-fine feature extraction common in CNNs and the superior spatial relationship modeling of Transformers. We also propose a new mixture-of-experts (MoE) based decoder, which treats the feature maps from the encoder as experts and selects a suitable set of expert features to predict the label for each pixel. The use of MoE enables better specializations of the expert features and reduces interference between them during inference. Extensive experiments demonstrate that Patcher outperforms state-of-the-art Transformer- and CNN-based approaches significantly on stroke lesion segmentation and polyp segmentation. Code for Patcher is released to facilitate related research. (Code: https://github.com/YanglanOu/patcher.git.).",
author = "Yanglan Ou and Ye Yuan and Xiaolei Huang and Wong, {Stephen T.C.} and John Volpi and Wang, {James Z.} and Kelvin Wong",
note = "Publisher Copyright: {\textcopyright} 2022, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 25th International Conference on Medical Image Computing and Computer-Assisted Intervention, MICCAI 2022 ; Conference date: 18-09-2022 Through 22-09-2022",
year = "2022",
doi = "10.1007/978-3-031-16443-9_46",
language = "English (US)",
isbn = "9783031164422",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "475--484",
editor = "Linwei Wang and Qi Dou and Fletcher, {P. Thomas} and Stefanie Speidel and Shuo Li",
booktitle = "Medical Image Computing and Computer Assisted Intervention – MICCAI 2022 - 25th International Conference, Proceedings",
address = "Germany",
}