Other formats:
BibTeX
LaTeX
RIS
@comment{Record 77186: journal article in the Astrophysical Journal
  Supplement Series. The doi field stores the bare DOI without a resolver
  prefix, and number stores the issue. The pages value is the article
  identifier taken from the 13-1 to 13-12 page range given for this record;
  confirm it against the publisher before relying on it. The fields
  article_location and article_number are non-standard, are kept for the
  exporting system, and are ignored by standard bibliography styles.}
@article{77186,
  author           = {White, Jack and Adámek, Karel and Roy, Jayanta and Dimoudi, Sofia and Ransom, Scott M. and Armour, Wesley},
  title            = {Bits Missing: Finding Exotic Pulsars Using bfloat16 on {NVIDIA} {GPUs}},
  journal          = {Astrophysical Journal Supplement Series},
  volume           = {265},
  number           = {1},
  pages            = {13},
  year             = {2023},
  issn             = {0067-0049},
  doi              = {10.3847/1538-4365/acb351},
  url              = {https://iopscience.iop.org/article/10.3847/1538-4365/acb351},
  keywords         = {detecting ;binary pulsars; radio astronomy data sets},
  language         = {eng},
  article_location = {GB - Spojené království Velké Británie a},
  article_number   = {1},
}
TY  - JOUR
ID  - 77186
AU  - White, Jack
AU  - Adámek, Karel
AU  - Roy, Jayanta
AU  - Dimoudi, Sofia
AU  - Ransom, Scott M.
AU  - Armour, Wesley
PY  - 2023
TI  - Bits Missing: Finding Exotic Pulsars Using bfloat16 on NVIDIA GPUs
JF  - Astrophysical Journal Supplement Series
VL  - 265
IS  - 1
SP  - 13-1
EP  - 13-12
SN  - 0067-0049
DO  - 10.3847/1538-4365/acb351
KW  - detecting ;binary pulsars
KW  - radio astronomy data sets
UR  - https://iopscience.iop.org/article/10.3847/1538-4365/acb351
N2  - The Fourier domain acceleration search (FDAS) is an effective technique for detecting faint binary pulsars in large radio astronomy data sets. This paper quantifies the sensitivity impact of reducing numerical precision in the graphics processing unit (GPU)-accelerated FDAS pipeline of the AstroAccelerate (AA) software package. The prior implementation used IEEE-754 single-precision in the entire binary pulsar detection pipeline, spending a large fraction of the runtime computing GPU-accelerated fast Fourier transforms. AA has been modified to use bfloat16 (and IEEE-754 double-precision to provide a "gold standard" comparison) within the Fourier domain convolution section of the FDAS routine. Approximately 20,000 synthetic pulsar filterbank files representing binary pulsars were generated using SIGPROC with a range of physical parameters. They have been processed using bfloat16, single-precision, and double-precision convolutions. All bfloat16 peaks are within 3% of the predicted signal-to-noise ratio of their corresponding single-precision peaks. Of 14,971 "bright" single-precision fundamental peaks above a power of 44.982 (our experimentally measured highest noise value), 14,602 (97.53%) have a peak in the same acceleration and frequency bin in the bfloat16 output plane, while in the remaining 369 the nearest peak is located in the adjacent acceleration bin. There is no bin drift measured between the single- and double-precision results. The bfloat16 version of FDAS achieves a speedup of approximately 1.6x compared to single-precision. A comparison between AA and the PRESTO software package is presented using observations collected with the GMRT of PSR J1544+4937, a 2.16 ms black widow pulsar in a 2.8 hr compact orbit.
ER  - 
WHITE, Jack, Karel ADÁMEK, Jayanta ROY, Sofia DIMOUDI, Scott M. RANSOM and Wesley ARMOUR. Bits Missing: Finding Exotic Pulsars Using bfloat16 on NVIDIA GPUs. \textit{Astrophysical Journal Supplement Series}. GB - Spojené království Velké Británie a, 2023, vol.~265, No~1, p.~13-1--13-12, 12 pp. ISSN~0067-0049. Available from: https://dx.doi.org/10.3847/1538-4365/acb351.
|