% Conference paper in the PIERS - Fall 2019 proceedings, pp. 1870--1876.
% Acronyms and proper nouns in the title are braced so that sentence-casing
% styles keep their capitals; the proceedings name is stored once, in booktitle.
@inproceedings{ebdd43b2e1294b07845747dd3c413e73,
title = "Efficient parallelization of {MLFMA} for {3D} electromagnetic scattering problems on {Sunway} many-core processor {SW26010}",
abstract = "A many-core implementation of the multilevel fast multipole algorithm (MLFMA) based on the Athread parallel programming model for computing electromagnetic scattering by a 3-D object on the homegrown many-core SW26010 CPU of China is presented. In the proposed many-core implementation of MLFMA, the data access efficiency is improved by using data structures based on the Structure-of-Array (SoA). The adaptive workload distribution strategies are adopted on different MLFMA tree levels to ensure full utilization of computing capability and the scratchpad memory (SPM). A double-buffering scheme is specially designed to make communication overlapped computation. The resulting Athread-based many-core implementation of the MLFMA is capable for solving real-life problems with over four hundred thousand unknowns with a remarkable speed-up. Numerical results show that with the proposed parallel scheme, a total speed-up larger than 7 times can be achieved, compared with the CPU master-core.",
author = "He, W. J. and Yang, M. L. and Wang, W. and Sheng, X. Q.",
note = "Publisher Copyright: {\textcopyright} 2019 IEEE.; 2019 Photonics and Electromagnetics Research Symposium - Fall, PIERS - Fall 2019 ; Conference date: 17-12-2019 Through 20-12-2019",
year = "2019",
month = dec,
doi = "10.1109/PIERS-Fall48861.2019.9021293",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "1870--1876",
booktitle = "2019 Photonics and Electromagnetics Research Symposium - Fall, PIERS - Fall 2019 - Proceedings",
address = "United States",
}