% Ye et al., "Synthetic sample selection via reinforcement learning" -- conference paper, MICCAI 2020 proceedings.
% Names are stored as "Last, First" so every style parses and abbreviates them the same way.
% Event title/dates and the copyright line live in their own fields instead of the printed note.
% NOTE(review): address holds a country rather than the publisher's city, and the series
% volume number is absent -- confirm both against the publisher record before relying on them.
@inproceedings{ed99edc68b1846419e70b347d2832d92,
  author     = {Ye, Jiarong and Xue, Yuan and Long, L. Rodney and Antani, Sameer and Xue, Zhiyun and Cheng, Keith C. and Huang, Xiaolei},
  title      = {Synthetic sample selection via reinforcement learning},
  editor     = {Martel, Anne L. and Abolmaesumi, Purang and Stoyanov, Danail and Mateus, Diana and Zuluaga, Maria A. and Zhou, S. Kevin and Racoceanu, Daniel and Joskowicz, Leo},
  booktitle  = {Medical Image Computing and Computer Assisted Intervention -- {MICCAI} 2020 -- 23rd International Conference, Proceedings},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer Science and Business Media Deutschland GmbH},
  address    = {Germany},
  year       = {2020},
  pages      = {53--63},
  doi        = {10.1007/978-3-030-59710-8_6},
  isbn       = {9783030597092},
  language   = {English (US)},
  eventtitle = {23rd International Conference on Medical Image Computing and Computer-Assisted Intervention, {MICCAI} 2020},
  eventdate  = {2020-10-04/2020-10-08},
  copyright  = {{\textcopyright} Springer Nature Switzerland AG 2020},
  abstract   = {Synthesizing realistic medical images provides a feasible solution to the shortage of training data in deep learning based medical image recognition systems. However, the quality control of synthetic images for data augmentation purposes is under-investigated, and some of the generated images are not realistic and may contain misleading features that distort data distribution when mixed with real images. Thus, the effectiveness of those synthetic images in medical image recognition systems cannot be guaranteed when they are being added randomly without quality assurance. In this work, we propose a reinforcement learning (RL) based synthetic sample selection method that learns to choose synthetic images containing reliable and informative features. A transformer based controller is trained via proximal policy optimization (PPO) using the validation classification accuracy as the reward. The selected images are mixed with the original training data for improved training of image recognition systems. To validate our method, we take the pathology image recognition as an example and conduct extensive experiments on two histopathology image datasets. In experiments on a cervical dataset and a lymph node dataset, the image classification performance is improved by 8.1\% and 2.3\%, respectively, when utilizing high-quality synthetic images selected by our RL framework. Our proposed synthetic sample selection method is general and has great potential to boost the performance of various medical image recognition systems given limited annotation.},
}