@inproceedings{f49ffead2a66440784629dfd288b859f,
title = "Acceleration of GPU-based ultrasound simulation via data compression",
abstract = "The realistic simulation of ultrasound wave propagation is computationally intensive. The large size of the grid and low degree of reuse of data means that it places a great demand on memory bandwidth. Graphics Processing Units (GPUs) have attracted attention for performing scientific calculations due to their potential for efficiently performing large numbers of floating point computations. However, many applications may be limited by memory bandwidth, especially for data sets whose size is larger than that of the GPU platform. This problem is only partially mitigated by applying the standard technique of breaking the grid into regions and overlapping the computation of one region with the host-device memory transfer of another. In this paper, we implement a memory-bound GPU-based ultrasound simulation and evaluate the use of a technique for improving performance by compressing the data into a fixed-point representation that reduces the time required for inter-host-device transfers. We demonstrate a speedup of 1.5 times on a simulation where the data is broken into regions that must be copied back and forth between the CPU and GPU. We develop a model that can be used to determine the amount of temporal blocking required to achieve near optimal performance, without extensive experimentation. This technique may also be applied to GPU-based scientific simulations in other domains such as computational fluid dynamics and electromagnetic wave simulation.",
keywords = "Data compression, GPGPU, Memory architecture, Nonlinear acoustics, Parallel architectures",
author = "Haigh, {Andrew A.} and McCreath, {Eric C.}",
note = "Publisher Copyright: {\textcopyright} 2014 IEEE.; 28th IEEE International Parallel and Distributed Processing Symposium Workshops, IPDPSW 2014 ; Conference date: 19-05-2014 Through 23-05-2014",
year = "2014",
month = nov,
day = "27",
doi = "10.1109/IPDPSW.2014.140",
language = "English",
series = "Proceedings - IEEE 28th International Parallel and Distributed Processing Symposium Workshops, IPDPSW 2014",
publisher = "IEEE Computer Society",
pages = "1248--1255",
booktitle = "Proceedings - IEEE 28th International Parallel and Distributed Processing Symposium Workshops, IPDPSW 2014",
address = "United States",
}