We present a novel multi-task convolutional neural network called Multi-task SonoEyeNet (M-SEN) that learns to generate clinically relevant visual attention maps using sonographer gaze tracking data on input ultrasound (US) video frames so as to assist standardized abdominal circumference (AC) plane detection. Our architecture consists of a generator and a discriminator, which are trained in an adversarial scheme. The generator learns sonographer attention on a given US video frame to predict the frame label (standardized AC plane/background). The discriminator further fine-tunes the predicted attention map by encouraging it to mimick the ground-truth sonographer attention map. The novel model expands the potential clinical usefulness of a previous model by eliminating the requirement of input gaze tracking data during inference without compromising its plane detection performance (Precision: 96.8, Recall: 96.2, F-1 score: 96.5).
@inproceedings{cai_multi-task_2018,
title = {Multi-task SonoEyeNet: Detection of Fetal Standardized Planes Assisted by Generated Sonographer Attention Maps},
author = {Cai, Yifan and Sharma, Harshita and Chatelain, Pierre and Noble, J. Alison},
booktitle = {Medical Image Computing and Computer Assisted Intervention – MICCAI 2018},
doi = {10.1007/978-3-030-00928-1_98},
editor = {Frangi, Alejandro F. and Schnabel, Julia A. and Davatzikos, Christos and Alberola-López, Carlos and Fichtinger, Gabor},
isbn = {978-3-030-00928-1},
language = {en},
pages = {871--879},
publisher = {Springer International Publishing},
series = {Lecture Notes in Computer Science},
shorttitle = {Multi-task SonoEyeNet},
year = {2018},
address = {Cham}
}