@comment{
  NAM2003061: journal article, European Respiratory Journal, article number 2003061.
  The DOI is the authoritative locator; the url host was kept as exported and
  should be verified against the publisher site before it is relied on.
  NOTE(review): the abstract announces 10 abnormalities but the parenthesised
  list names only nine items, and the second time-to-report pair carries no
  unit. Both are reproduced as exported; confirm against the published abstract.
}
@article{NAM2003061,
  author        = {Nam, Ju Gang and Kim, Minchul and Park, Jongchan and Hwang, Eui Jin and Lee, Jong Hyuk and Hong, Jung Hee and Goo, Jin Mo and Park, Chang Min},
  title         = {Development and validation of a deep learning algorithm detecting 10 common abnormalities on chest radiographs},
  journal       = {European Respiratory Journal},
  year          = {2020},
  elocation-id  = {2003061},
  eid           = {2003061},
  issn          = {0903-1936},
  doi           = {10.1183/13993003.03061-2020},
  url           = {https://www.qdcxjkg.com/content/early/2020/11/05/13993003.03061-2020},
  abstract      = {We aimed to develop a deep learning algorithm to detect 10 common abnormalities on chest radiographs (DLAD-10) and evaluate its impact on diagnostic accuracy, reporting timeliness and workload. DLAD-10 was trained using 108 053 patients using a ResNet34-based neural network with lesion-specific channels for 10 common radiologic abnormalities (pneumothorax, mediastinal widening, pneumonia, nodule/mass, consolidation, linear interstitial opacity, fibrosis, calcification and cardiomegaly). For external validation, DLAD-10{\textquoteright}s performance was compared with three radiologists on a same-day CT-confirmed dataset (normal:abnormal, 53:147) and an open-source dataset (PadChest; normal:abnormal, 339:334). A separate simulated reading test was performed on another dataset from the emergency department adjusted to real-world disease prevalence, including four critical, 52 urgent and 146 non-urgent cases. Six radiologists participated in simulated reading sessions with or without DLAD-10. DLAD-10 demonstrated 0.895{\textendash}1.00 area under the receiver operating characteristic curve (AUROC) in the CT-confirmed dataset and 0.878{\textendash}0.995 AUROC in the PadChest dataset. DLAD-10 correctly classified critical abnormalities (95.0\% [57/60]) better than pooled radiologists (84.4\% [152/180]; p=0.01). In simulated reading tests for emergency department patients, pooled readers detected significantly more critical (70.8\% [17/24] versus 29.2\% [7/24]; p=0.006) and urgent (82.7\% [258/312] versus 78.2\% [244/312]; p=0.04) abnormalities when aided by DLAD-10. DLAD-10 assistance shortened the mean time-to-report critical and urgent radiographs (640.5{\textpm}466.3 versus 3371.0{\textpm}1352.5 s and 1840.3{\textpm}1141.1 versus 2127.1{\textpm}1468.2, respectively; p-values{\textless}0.01) and reduced the mean interpretation time (20.5{\textpm}22.8 versus 23.5{\textpm}23.7 s; p{\textless}0.001). DLAD-10 showed excellent performance, improving radiologists{\textquoteright} performance and shortening the reporting time for critical and urgent cases.},
}