@inbook{e65dd0bbe54845febd920048e2b9c7ac,
title = "Accelerating large-scale simulation of seismic wave propagation by multi-GPUs and three-dimensional domain decomposition",
abstract = "We adopted the GPU (graphics processing unit) to accelerate the large-scale finite-difference simulation of seismic wave propagation. We describe the main part of our implementation: the memory optimization, the three-dimensional domain decomposition, and overlapping communication and computation. With our GPU program, we achieved a very high single-precision performance of about 61 TFlops by using 1,200 GPUs and 1.5 TB of total memory, and a scalability nearly proportional to the number of GPUs on TSUBAME–2.0, the recently installed GPU supercomputer in Tokyo Institute of Technology, Japan. In a realistic application by using 400 GPUs, only a wall clock time of 2,068 s (including the times for the overhead of snapshot output) was required for a complex structure model with more than 13 billion unit cells and 20,000 time steps. We therefore conclude that GPU computing for large-scale simulation of seismic wave propagation is a promising approach.",
author = "Taro Okamoto and Hiroshi Takenaka and Takeshi Nakamura and Takayuki Aoki",
note = "Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2013.",
year = "2013",
doi = "10.1007/978-3-642-16405-7_24",
language = "English",
series = "Lecture Notes in Earth System Sciences",
publisher = "Springer International Publishing",
number = "9783642164040",
pages = "375--389",
booktitle = "Lecture Notes in Earth System Sciences",
edition = "9783642164040",
}