% Conference paper (Okumura and Arikawa, 2014). The citation key is the
% identifier from the original export and is kept unchanged so existing
% citations continue to resolve.
@inproceedings{ce1d256f3584490e83e91ec543908b44,
  author    = {Okumura, Hiroshi and Arikawa, Taro},
  title     = {A study of {CUDA/MPI} parallel computations for {CADMAS-SURF/3D}},
  booktitle = {Proceedings of the 24th International Ocean and Polar Engineering Conference, {ISOPE} Busan},
  series    = {Proceedings of the International Offshore and Polar Engineering Conference},
  pages     = {420--424},
  year      = {2014},
  publisher = {International Society of Offshore and Polar Engineers},
  isbn      = {9781880653913},
  language  = {English},
  keywords  = {Array data access optimization, CADMAS-SURF/3D, CUDA parallelization, GPU},
  abstract  = {We present a new faster GPU/MPI computation and algorithm for CADMAS-SURF/3D by a CUDA parallelization technique on a GPU accelerator ``Tesla''. In this paper, we examine the CUDA porting tool for GPU computation and suggest a macro code by C preprocessor for CADMAS-SURF/3D originally coded in FORTRAN to be adapted into CUDA C language. Furthermore, we optimize the data access sequence pattern from a profiling result to eliminate the calculation bottleneck. We inspect the legitimacy of the solution by examining the rounding error, and then examine the program tuning a data sequence access pattern optimization.},
  note      = {24th International Ocean and Polar Engineering Conference, {ISOPE} 2014 Busan; Conference date: 15--20 June 2014},
}