@article{fdi:010086352, title = {{I}nterpreting convolutional neural network decision for earthquake detection with feature map visualization, backward optimization and layer-wise relevance propagation methods}, author = {{M}ajstorovic, {J}. and {G}iffard-{R}oisin, {S}ophie and {P}oli, {P}.}, editor = {}, language = {{ENG}}, abstract = {{I}n the recent years, the seismological community has adopted deep learning ({DL}) models for many diverse tasks such as discrimination and classification of seismic events, identification of {P}- and {S}-phase wave arrivals or earthquake early warning systems. {N}umerous models recently developed are showing high accuracy values, and it has been attested for several tasks that {DL} models perform better than the classical seismological state-of-art models. {H}owever, their performances strongly depend on the {DL} architecture, the training hyperparameters, and the training data sets. {M}oreover, due to their complex nature, we are unable to understand how the model is learning and therefore how it is making a prediction. {T}hus, {DL} models are usually referred to as a 'black-box'. {I}n this study, we propose to apply three complementary techniques to address the interpretability of a convolutional neural network ({CNN}) model for the earthquake detection. {T}he implemented techniques are: feature map visualization, backward optimization and layer-wise relevance propagation. {S}ince our model reaches a good accuracy performance (97%), we can suppose that the {CNN} detector model extracts relevant characteristics from the data, however a question remains: can we identify these characteristics? {T}he proposed techniques help to answer the following questions: {H}ow is an earthquake processed by a {CNN} model? {W}hat is the optimal earthquake signal according to a {CNN}? {W}hich parts of the earthquake signal are more relevant for the model to correctly classify an earthquake sample? {T}he answer to these questions help understand why the model works and where it might fail, and whether the model is designed well for the predefined task. {T}he {CNN} used in this study had been trained for single-station detection, where an input sample is a 25 s three-component waveform. {T}he model outputs a binary target: earthquake (positive) or noise (negative) class. {T}he training database contains a balanced number of samples from both classes. {O}ur results shows that the {CNN} model correctly learned to recognize where is the earthquake within the sample window, even though the position of the earthquake in the window is not explicitly given during the training. {M}oreover, we give insights on how a neural network builds its decision process: while some aspects can be linked to clear physical characteristics, such as the frequency content and the {P} and {S} waves, we also see how different a {DL} detection is compared to a visual expertise or an {STA}/{LTA} detection. {O}n top of improving our model designs, we also think that understanding how such models work, how they perceive an earthquake, can be useful for the comprehension of events that are not fully understood yet such as tremors or low frequency earthquakes.}, keywords = {{N}eural networks ; fuzzy logic ; {N}umerical modelling ; {T}ime-series analysis ; {C}omputational seismology ; {ITALIE} ; {ABRUZZES}}, booktitle = {}, journal = {{G}eophysical {J}ournal {I}nternational}, volume = {232}, numero = {2}, pages = {923--939}, ISSN = {0956-540{X}}, year = {2022}, DOI = {10.1093/gji/ggac369}, URL = {https://www.documentation.ird.fr/hor/fdi:010086352}, }