<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.0 20120330//EN" "JATS-archivearticle1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta />
    <article-meta>
      <title-group>
        <article-title>Reconstruction of Radio Signals from Air-Showers with Autoencoder</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <string-name>Pavel Bezyazeekov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Nikolay Budnev</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Oleg Fedorov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Oleg Gress</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Oleg Grishin</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Andreas Haungs</string-name>
          <xref ref-type="aff" rid="aff3">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Tim Huege</string-name>
          <xref ref-type="aff" rid="aff0">0</xref>
          <xref ref-type="aff" rid="aff3">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Yulia Kazarina</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Matthias Kleifges</string-name>
          <xref ref-type="aff" rid="aff4">4</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Dmitriy Kostunin</string-name>
          <xref ref-type="aff" rid="aff2">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Elena Korosteleva</string-name>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Leonid Kuzmichev</string-name>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Vladimir Lenok</string-name>
          <xref ref-type="aff" rid="aff3">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Nima Lubsandorzhiev</string-name>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Stanislav Malakhov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Tatyana Marshalkina</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Roman Monkhoev</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Eleonora Osipova</string-name>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Alexandr Pakhorukov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Leonid Pankov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Vasiliy Prosin</string-name>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Frank Schroder</string-name>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="aff" rid="aff3">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Dmitriy Shipilov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Alexey Zagorodnikov</string-name>
          <xref ref-type="aff" rid="aff5">5</xref>
        </contrib>
        <aff id="aff0">
          <label>0</label>
          <institution>Astrophysical Institute, Vrije Universiteit Brussel</institution>
          ,
          <addr-line>Pleinlaan 2, Brussels</addr-line>
          ,
          <country country="BE">Belgium</country>
        </aff>
        <aff id="aff1">
          <label>1</label>
          <institution>Bartol Research Inst., Dept. of Phys. and Astron., Univ. of Delaware</institution>
          ,
          <addr-line>Newark</addr-line>
          ,
          <country country="US">USA</country>
        </aff>
        <aff id="aff2">
          <label>2</label>
          <institution>DESY</institution>
          ,
          <addr-line>Zeuthen</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff3">
          <label>3</label>
          <institution>Institut fur Kernphysik, KIT</institution>
          ,
          <addr-line>Karlsruhe</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff4">
          <label>4</label>
          <institution>Institut fur Prozessdatenverarbeitung und Elektronik, KIT</institution>
          ,
          <addr-line>Karlsruhe</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff5">
          <label>5</label>
          <institution>Institute of Applied Physics ISU</institution>
          ,
          <addr-line>Irkutsk</addr-line>
          ,
          <country country="RU">Russia</country>
        </aff>
        <aff id="aff6">
          <label>6</label>
          <institution>Skobeltsyn Institute of Nuclear Physics MSU</institution>
          ,
          <addr-line>Moscow</addr-line>
          ,
          <country country="RU">Russia</country>
        </aff>
      </contrib-group>
      <abstract>
        <p>The Tunka Radio Extension (Tunka-Rex) is a digital antenna array (63 antennas distributed over 1 km2) co-located with the TAIGA observatory in Eastern Siberia. Tunka-Rex measures radio emission of air-showers induced by ultra-high energy cosmic rays in the frequency band of 30-80 MHz. Air-shower signal is a short (tens of nanoseconds) broadband pulse. Using time positions and amplitudes of these pulses, we reconstruct parameters of air showers and primary cosmic rays. The amplitudes of low-energy event (E &lt; 1017 eV) cannot be used for succesful reconstruction due to the domination of background. To lower the energy threshold of the detection and increase the e ciency, we use autoencoder neural network which removes noise from the measured data. This work describes our approach to denoising raw data and further reconstruction of air-shower parameters. We also present results of the low-energy events reconstruction with autoencoder.</p>
      </abstract>
      <kwd-group>
        <kwd>Tunka-Rex • E</kwd>
        <kwd>ciency • Autoencoder • Denoising</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec-1">
      <title>-</title>
      <p>
        Cosmic rays (CR) are accelerated charged particles traveling in the space.
Most of them are protons, minor part is more massive atomic nuclei (up to iron).
The sources of CR are associated with stars at di erent evolution stages. The
Copyright ' 2020 for this paper by its authors. Use permitted under Creative
Commons License Attribution 4.0 International (CC BY 4.0).
ultra-high energy CR (&gt; 1015 eV) carry information about most powerful cosmic
accelerators and studying them is one of important tasks in modern astrophysics.
Due to the low ux of the ultra-high energy CR, it is impossible to measure
them directly (in space or high layers of atmosphere), and they are detected by
sparse ground detectors measuring cascades produced by their interaction with
the atmosphere. These cascades, called air-showers, consist of many secondary
particles, including electrons and positrons, which produce short radio pulses due
to de ection in the Earth's magnetic eld and heterogenity of charge distribution
in shower. These pulses have a broadband spectrum mostly in the MHz domain
and a duration of tens of nanoseconds [
        <xref ref-type="bibr" rid="ref1">1</xref>
        ].
      </p>
      <p>
        Tunka-Rex [
        <xref ref-type="bibr" rid="ref2">2</xref>
        ] is a sparse antenna array located at the TAIGA facility [
        <xref ref-type="bibr" rid="ref3 ref4">3, 4</xref>
        ]
in the Tunka Valley (Eastern Siberia). It consists of 63 antennas measuring radio
emission from air showers in the frequency band of 30-80 MHz. Since Tunka-Rex
is placed in a relatively radio-quiet location, the main background is from the
Galaxy. However, there are plenty of non-stationary background sources, which
may distort the air-shower pulse and complicate the reconstruction of events with
low energies. In this work, we present our progress on the way of reconstruction
of low-energy events by removing RFI from Tunka-Rex signal traces using the
autoencoder (AE) neural network and discuss the performance of this approach.
2
      </p>
    </sec>
    <sec id="sec-2">
      <title>Dataset</title>
      <p>
        Tunka-Rex measures air-shower signals in two perpendicular polarizations and
records it to traces of 1024 samples each with 200 MHz sampling. For the
reconstruction of cosmic-ray air-showers, the two main properties of radio pulses are
used: the amplitude of the signal and its arrival time. Details of this
reconstruction are given in Refs. [
        <xref ref-type="bibr" rid="ref5 ref6">5, 6</xref>
        ].
      </p>
      <p>Before the reconstruction of the signals, we perform several preprocessing
transformations. Spectra of the signals obtained with the Fourier transform are
cut by a digital bandpass to 35-75 MHz and ltered with a median lter, which
removes narrow-band RFI and equalizes the noise using a sliding window of
3 MHz width. Afterwards, the traces are upsampled in order to increase the
timing resolution (factor 16 for this study). Finally, the electric elds along the
two polarization directions in the plane perpendicular to the shower axis are
reconstructed, namely v B (along the Lorentz force, where v is the direction
of the air shower and B the direction of the geomagnetic eld) and v v B
perpendicular to it. Since the main contribution of radio emission occurs in the
v B polarization, we consider only this one for the AE processing.</p>
      <p>
        In this study, we use a dataset of 650 000 samples of the measured background
(2014-2017) recorded by Tunka-Rex and 25 000 CoREAS [
        <xref ref-type="bibr" rid="ref7">7</xref>
        ] simulations. The
air-shower pulse is randomly located within the signal window, summed with
noise and folded with the Tunka-Rex hardware response taking into account the
geometry of the air shower and the detector calibration. As was discussed in
Ref. [
        <xref ref-type="bibr" rid="ref6">6</xref>
        ], the simulated signals reproduce real ones with satisfactory accuracy. As
shown below, the methods developed for simulated pulses can be applied to the
real data without additional tuning.
3
      </p>
    </sec>
    <sec id="sec-3">
      <title>Autoencoder (AE)</title>
      <p>
        AE [
        <xref ref-type="bibr" rid="ref8">8</xref>
        ] is an unsupervised convolutional network used for learning the coded
representation of the data and removing speci c features from it. The structure
of AE can be described as follows:
1. Encoder. This part of AE distinguishes the features of noise contained in
the input data by applying sets of lters. The lters perform the
convolution of characteristic noise-related features with the input data, estimate
its contribution as a result of the convolution, and afterwards send it to the
max-pooling layer. The max-pooling layer performs a discrete downsampling
of the data and sends it to the next convolution layer with the next set of
lters. With each layer of the encoder, the data becomes more abstract and
reduced in size.
2. Coded representation. Central layer of AE has the least size (1024 in this
study) and contains an abstract code of the input data. Due to its small
size, we lost part of the input data. Learning procedure tunes AE for loosing
noise-related data and leaving only cosmic-ray signals.
3. Decoder. After encoding, the noise-related features are removed and the
map of denoised data proceeds to the decoding part of AE, which produces
a reverse reconstruction and returns a data array of the same dimension as
the input. If successful, the resulting output is the denoised trace containing
only the air-shower pulse, as shown in Fig. (1).
3.1
      </p>
      <sec id="sec-3-1">
        <title>Con guration and training</title>
        <p>The input array for our AE consists of 4096 values, which corresponds to a trace
length of 1280 ns and 0.3125 ns sampling in order to contain the signal window
of 200 ns as well as surrounding background. To minimize the loss, we normalize
the input data to the [0:1] range with a baseline level at 0.5.</p>
        <p>
          We have explicitly selected a subsample with low amplitudes and a low SNR
for training to nd out if the threshold may be lowered. We implemented and
trained our AE with Keras [
          <xref ref-type="bibr" rid="ref9">9</xref>
          ] and Tensor ow [
          <xref ref-type="bibr" rid="ref10">10</xref>
          ] in a uDocker container with
GPU support. After estimation of e ciency and accuracy of reconstruction with
various depth (number of convolutional layers) and a number of lters per layer,
we chose a 3-layer encoder with 8 lters per layer. The full pipeline reconstruction
using the data denoised by AE shows precision comparable with the standard
method [
          <xref ref-type="bibr" rid="ref11">11</xref>
          ].
3.2
        </p>
      </sec>
      <sec id="sec-3-2">
        <title>Real data reconstruction</title>
        <p>After a series of tests on the simulated data, we test the performance of AE in
application to the reconstruction of real low-energy events. For this study, we use
0.8
0.6
0.4
)
rya 0.2
itr
b
r(ae 0
d
u
iltpm -0.2
A
-0.4
-0.6
-0.8
expected pulse position</p>
        <p>raw signal
denoised signal
300
400
500
600
700</p>
        <p>
          800
t (ns)
a set of low-energy Tunka-133 [12] events (Fig. (2)) with energies from 1016 to
1017 eV, which is unavailable for reconstruction using the standard Tunka-Rex
method [
          <xref ref-type="bibr" rid="ref5">5</xref>
          ]. The AE threshold was decreased from 0:395=0:500 to 0:200=0:500.
The reconstruction pipeline is as follows:
1. Traces (single polarization) in the event are processed with AE. Peaks of
envelopes of denoised traces are saved as assumed air-shower timestamps.
2. Reconstruction of the shower front and arrival direction using these
timestamps.
3. Cut by applying the cross-check between the reconstruction direction by
AE and by the host experiment Tunka-133: passing only events with the
di erence &lt; 5 . Additional cut for the geomagnetic angle &gt; 60 to select
events with the maximal contribution of the geomagnetic e ect.
4. Shifting the traces inside each event corresponding to the AE timestamps,
summarizing them and normalizing to number of input traces in purpose of
increasing SNR (Fig. (3)).
        </p>
        <p>The result of processing an event with this pipeline is an amplitude S of the
coherent sum at AE timestamps and a mean distance r of input stations. By
this we extrapolate the lateral distribution function:</p>
        <p>S0 =</p>
        <p>S
exp[ 0(r
r0)]
;
(1)
where S0 is an amplitude at the distance r0 from the shower axis, 0 = 227:793
10 5 m 1 is correction factor. This way we calculate the amplitude S180 (180
m to axis) related to the best correlation with air-shower energy. After that we
Tunka-Rex station
Shower core
180°
135°
225°
90°
B field
270°
10 20 30 40 50 60</p>
        <p>0°
45°
315°
reconstruct the energy E using the single antenna method:</p>
        <p>E = S180
;
(2)
where = 868 10 6 EeV m=V. This way we reconstruct the set of low-energy
events. 83 events passed the amplitude threshold and the arrival direction
crosscheck. 13 of them survived after and SNR cuts. In Fig. (4) one can see the
results of this reconstruction.
4</p>
      </sec>
    </sec>
    <sec id="sec-4">
      <title>Discussion and conclusion</title>
      <p>The performance of Tunka-Rex AE has been tested on real data. Reconstruction
shows that we can reconstruct the arrival direction of low-energy events with AE,
but energy precision for now is relatively low ( 26%). We have illustrated the
possibility of reconstruction of low-energy events, and there is still room for
improvement for the e cient application to the Tunka-Rex data processing. We
plan to improve AE by testing di erent loss metrics and network architectures
with bigger dataset. Future work also implies modi cation of the input trace
normalization for saving the information of the absolute signal amplitude in
denoised trace. This will enable us to validate our technique on the Tunka-133
+ Tunka-Rex data and check its performance in application to the data measured
by Tunka-Rex + Tunka-Grande experiments. In addition to the task of lowering
the threshold, we also plan to check application of this technique to removing
air-shower pulses from the raw data ow within the frame of the Tunka-21cm
experiment [13].</p>
      <p>SNR = 18.05</p>
      <p>1800
SNR = 12.26</p>
      <p>1800
SNR = 9.77</p>
      <p>SNR = 31.48</p>
      <p>Signal traces:
1000
1200
1400</p>
      <p>1600
1000
1200
1400</p>
      <p>1600
1200 1400</p>
      <p>Coherent sum:
1000
1600
1800
60
40
20
0
20
40
60
40
20
0
20
40
40
20
0
20
40
40
20
0
20
40
1000
1200
1400
1600
1800</p>
    </sec>
    <sec id="sec-5">
      <title>Acknowledgements</title>
      <p>The work of P.Bezyazeekov on section "Real data reconstruction" is supported
by the Russian Foundation for Basic Research "Mobility" program grant
1932-50147. The work has been supported by Russian Federation for Basic
Research grant 18-32-20220, the Helmholtz grant HRSF-0027, the Russian
Federation Ministry of Science and High Education (project. FZZE-2020-0024), the
Mathematical Center in Akademgorodok under agreement No 075-2019-1675
with the Ministry of Science and Higher Education of the Russian Federation
and Irkutsk State University grant 091-19-213. P.Bezyazeekov thanks the
community of the Institute for Nuclear Research, where this study has been carried
out, and personally G. Rubtsov.
12. V. V. Prosin et al., \Primary CR energy spectrum and mass composition by the
data of Tunka-133 array," EPJ Web Conf., vol. 99, p. 04002, 2015.
13. D. Kostunin et al., \Quest for detection of a cosmological signal from neutral
hydrogen with a digital radio array developed for air-shower measurements," PoS,
vol. ICRC2019, p. 320, 2020.</p>
    </sec>
  </body>
  <back>
    <ref-list>
      <ref id="ref1">
        <mixed-citation>
          1.
          <string-name>
            <given-names>F.G.</given-names>
            <surname>Schro</surname>
          </string-name>
          <article-title>der, \Radio detection of Cosmic-Ray Air Showers</article-title>
          and
          <string-name>
            <surname>High-Energy</surname>
            <given-names>Neutrinos</given-names>
          </string-name>
          ,
          <article-title>"</article-title>
          <source>Prog. Part. Nucl. Phys.</source>
          , vol.
          <volume>93</volume>
          , pp.
          <volume>1</volume>
          {
          <issue>68</issue>
          ,
          <year>2017</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref2">
        <mixed-citation>
          2.
          <string-name>
            <given-names>P. A.</given-names>
            <surname>Bezyazeekov</surname>
          </string-name>
          et al.,
          <article-title>\Measurement of cosmic-ray air showers with the Tunka Radio Extension (Tunka-Rex),"</article-title>
          <string-name>
            <surname>Nucl. Instrum. Meth.</surname>
          </string-name>
          , vol.
          <source>A802</source>
          , pp.
          <volume>89</volume>
          {
          <issue>96</issue>
          ,
          <year>2015</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref3">
        <mixed-citation>
          3.
          <string-name>
            <given-names>N.</given-names>
            <surname>Budnev</surname>
          </string-name>
          et al., \
          <article-title>The TAIGA experiment: From cosmic-ray to gamma-ray astronomy in the Tunka valley," Nucl</article-title>
          . Instrum. Meth., vol.
          <source>A845</source>
          , pp.
          <volume>330</volume>
          {
          <issue>333</issue>
          ,
          <year>2017</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref4">
        <mixed-citation>
          4.
          <string-name>
            <given-names>D.</given-names>
            <surname>Kostunin</surname>
          </string-name>
          et al.,
          <article-title>\Tunka Advanced Instrument for cosmic rays and Gamma Astronomy," in 18th International Baikal Summer School on Physics of Elementary Particles and Astrophysics: Exploring the Universe through multiple messengers (ISAPP-Baikal 2018) Bolshie Koty</article-title>
          , Lake Baikal, Russia,
          <source>July 12-21</source>
          ,
          <year>2018</year>
          ,
          <year>2019</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref5">
        <mixed-citation>
          5.
          <string-name>
            <given-names>P. A.</given-names>
            <surname>Bezyazeekov</surname>
          </string-name>
          et al., \
          <article-title>Radio measurements of the energy and the depth of the shower maximum of cosmic-ray air showers by Tunka-Rex,"</article-title>
          <source>JCAP</source>
          , vol.
          <volume>1601</volume>
          , no.
          <issue>01</issue>
          , p.
          <fpage>052</fpage>
          ,
          <year>2016</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref6">
        <mixed-citation>
          6.
          <string-name>
            <given-names>P. A.</given-names>
            <surname>Bezyazeekov</surname>
          </string-name>
          et al.,
          <article-title>\Reconstruction of cosmic ray air showers with TunkaRex data using template tting of radio pulses,"</article-title>
          <source>Phys. Rev.</source>
          , vol.
          <volume>D97</volume>
          , no.
          <issue>12</issue>
          , p.
          <fpage>122004</fpage>
          ,
          <year>2018</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref7">
        <mixed-citation>
          7.
          <string-name>
            <given-names>T.</given-names>
            <surname>Huege</surname>
          </string-name>
          ,
          <string-name>
            <given-names>M.</given-names>
            <surname>Ludwig</surname>
          </string-name>
          , and
          <string-name>
            <given-names>C.</given-names>
            <surname>James</surname>
          </string-name>
          , \
          <article-title>Simulating radio emission from air showers with CoREAS,"</article-title>
          <source>AIP Conf.Proc.</source>
          , vol.
          <volume>1535</volume>
          , p.
          <fpage>128</fpage>
          ,
          <year>2013</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref8">
        <mixed-citation>
          8.
          <string-name>
            <given-names>Y.</given-names>
            <surname>Bengio</surname>
          </string-name>
          ,
          <string-name>
            <given-names>A.</given-names>
            <surname>Courville</surname>
          </string-name>
          , and
          <string-name>
            <given-names>P.</given-names>
            <surname>Vincent</surname>
          </string-name>
          , \
          <article-title>Representation learning: A review and new perspectives,"</article-title>
          <source>IEEE Trans. Pattern Anal. Mach</source>
          . Intell., vol.
          <volume>35</volume>
          , pp.
          <volume>1798</volume>
          {
          <issue>1828</issue>
          , Aug.
          <year>2013</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref9">
        <mixed-citation>
          9.
          <string-name>
            <given-names>F.</given-names>
            <surname>Chollet</surname>
          </string-name>
          , \
          <fpage>keras</fpage>
          ." https://github.com/fchollet/keras,
          <year>2015</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref10">
        <mixed-citation>
          10.
          <string-name>
            <surname>M. Abadi</surname>
          </string-name>
          et al.,
          <source>\TensorFlow: Large-scale machine learning on heterogeneous systems," 2015</source>
          .
          <article-title>Software available from tensor ow</article-title>
          .
          <source>org.</source>
        </mixed-citation>
      </ref>
      <ref id="ref11">
        <mixed-citation>
          11. P.Bezyazeekov et al. (
          <article-title>Tunka-Rex collab</article-title>
          .), \
          <article-title>Advanced Signal Reconstruction in Tunka-Rex with Matched Filtering and Deep Learning,"</article-title>
          <source>CEUR Workshop Proceedings</source>
          , vol.
          <volume>2406</volume>
          , pp.
          <volume>7</volume>
          {
          <issue>16</issue>
          ,
          <year>2019</year>
          .
        </mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>