This repository has been archived by the owner on Jun 20, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcalc_dt_kernel_cuda.cu
executable file
·107 lines (95 loc) · 4.43 KB
/
calc_dt_kernel_cuda.cu
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
/*Crown Copyright 2012 AWE.
*
* This file is part of CloverLeaf.
*
* CloverLeaf is free software: you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the
* Free Software Foundation, either version 3 of the License, or (at your option)
* any later version.
*
* CloverLeaf is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along with
* CloverLeaf. If not, see http://www.gnu.org/licenses/.
*/
/*
* @brief CUDA timestep kernel
* @author Michael Boulton NVIDIA Corporation
* @details Calculates the minimum timestep on the mesh chunk based on the CFL
* condition, the velocity gradient and the velocity divergence. A safety
* factor is used to ensure numerical stability.
*/
#include "cuda_common.hpp"
#include "kernel_files/calc_dt_kernel.cuknl"
#include "host_reductions_kernel_cuda.hpp"
#include "value_getter.hpp"
/*
 * C-linkage entry point for the timestep calculation.
 *
 * Every argument arrives by pointer. The seven leading doubles are inputs and
 * are dereferenced here so they can be handed over by value; the remaining
 * pointers are forwarded untouched to CloverleafCudaChunk::calc_dt_kernel on
 * the cuda_chunk object, which writes its results through them.
 *
 * NOTE(review): the trailing underscore and all-pointer signature suggest this
 * is called from Fortran - confirm against the caller.
 */
extern "C" void calc_dt_kernel_cuda_
(double* g_small,
 double* g_big,
 double* dtmin,
 double* dtc_safe,
 double* dtu_safe,
 double* dtv_safe,
 double* dtdiv_safe,
 double* dt_min_val,
 int* dtl_control,
 double* xl_pos,
 double* yl_pos,
 int* jldt,
 int* kldt,
 int* small)
{
    // Snapshot the by-pointer scalar inputs before forwarding them by value.
    const double g_small_in    = *g_small;
    const double g_big_in      = *g_big;
    const double dtmin_in      = *dtmin;
    const double dtc_safe_in   = *dtc_safe;
    const double dtu_safe_in   = *dtu_safe;
    const double dtv_safe_in   = *dtv_safe;
    const double dtdiv_safe_in = *dtdiv_safe;

    // Output pointers are passed straight through.
    cuda_chunk.calc_dt_kernel(
        g_small_in, g_big_in, dtmin_in,
        dtc_safe_in, dtu_safe_in, dtv_safe_in, dtdiv_safe_in,
        dt_min_val, dtl_control,
        xl_pos, yl_pos,
        jldt, kldt,
        small);
}
/*
 * Runs the device timestep kernel, reduces its two result buffers to the host
 * and decodes the outcome into the caller's output arguments.
 *
 * Inputs (by value):
 *   g_small, g_big, dtmin, dtc_safe, dtu_safe, dtv_safe, dtdiv_safe
 *     - forwarded unchanged to device_calc_dt_kernel_cuda; dtmin is also the
 *       threshold used for *small.
 *
 * Outputs (by pointer):
 *   dt_min_val  - result of ReduceToHost<double>::min_element on reduce_buf_2
 *   dtl_control - 10.01 * (fractional part of the max-reduced value of
 *                 reduce_buf_1), converted to int
 *   jldt, kldt  - indices decoded from the whole part of that same value:
 *                 whole % x_max and 1 + whole / x_max
 *   xl_pos      - cellx[*jldt] read back from the device
 *   yl_pos      - celly[*kldt] read back from the device
 *   small       - 1 when *dt_min_val < dtmin, otherwise 0
 *
 * When *small is set, a diagnostic dump of the offending cell is written to
 * std::cerr.
 */
void CloverleafCudaChunk::calc_dt_kernel
(double g_small, double g_big, double dtmin,
 double dtc_safe, double dtu_safe, double dtv_safe, double dtdiv_safe,
 double* dt_min_val,
 int* dtl_control,
 double* xl_pos,
 double* yl_pos,
 int* jldt,
 int* kldt,
 int* small)
{
    CUDALAUNCH(device_calc_dt_kernel_cuda, g_small, g_big, dtmin, dtc_safe,
        dtu_safe, dtv_safe, dtdiv_safe, xarea, yarea, celldx, celldy,
        volume, density0, viscosity, soundspeed, xvel0, yvel0,
        reduce_buf_1, reduce_buf_2);

    // Smallest timestep candidate over all blocks goes straight to the caller.
    ReduceToHost<double>::min_element(reduce_buf_2, dt_min_val, num_blocks);

    // Largest control value over all blocks; it packs two pieces of
    // information: a whole part (location) and a fractional part (control code).
    double packed_control;
    ReduceToHost<double>::max_element(reduce_buf_1, &packed_control, num_blocks);

    const double control_fraction = packed_control - static_cast<int>(packed_control);
    *dtl_control = static_cast<int>(10.01 * control_fraction);

    // Strip the fraction; the arithmetic stays in double exactly as before so
    // the truncation behaviour of the k index is unchanged.
    const double location = packed_control - control_fraction;

    const int j_cell = (static_cast<int>(location)) % x_max;
    *jldt = j_cell;
    const int k_cell = static_cast<int>(1 + (location / x_max));
    *kldt = k_cell;

    *xl_pos = Value_Getter<double>::from_device(cellx, j_cell);
    *yl_pos = Value_Getter<double>::from_device(celly, k_cell);

    *small = (*dt_min_val < dtmin) ? 1 : 0;

    // Nothing more to do unless the timestep fell below the minimum.
    if (*small == 0)
    {
        return;
    }

    // Flat indices of the cell and of the three neighbours visited below, in
    // the order (j,k), (j+1,k), (j+1,k+1), (j,k+1).
    // NOTE(review): x_max is assumed to be an int member - confirm.
    // NOTE(review): density0/energy0/pressure/soundspeed are indexed with the
    // same (x_max+5) row stride as xvel0/yvel0 - confirm these arrays really
    // share that layout.
    const int row_stride = x_max + 5;
    const int this_row   = row_stride * k_cell;
    const int next_row   = row_stride * (k_cell + 1);
    const int corner_index[4] =
    {
        j_cell + this_row,
        j_cell + 1 + this_row,
        j_cell + 1 + next_row,
        j_cell + next_row
    };
    const int cell_index = corner_index[0];

    std::cerr << "Timestep information:" << std::endl;
    std::cerr << "j, k : " << j_cell << " " << k_cell << std::endl;

    // Positions are re-read from the device, x first and then y.
    std::cerr << "x, y : ";
    std::cerr << Value_Getter<double>::from_device(cellx, j_cell) << " ";
    std::cerr << Value_Getter<double>::from_device(celly, k_cell) << std::endl;

    std::cerr << "timestep : " << *dt_min_val << std::endl;

    std::cerr << "Cell velocities;" << std::endl;
    for (int corner = 0; corner < 4; ++corner)
    {
        std::cerr << Value_Getter<double>::from_device(xvel0, corner_index[corner]) << "\t";
        std::cerr << Value_Getter<double>::from_device(yvel0, corner_index[corner]) << std::endl;
    }

    std::cerr << "density, energy, pressure, soundspeed " << std::endl;
    std::cerr << Value_Getter<double>::from_device(density0, cell_index) << "\t";
    std::cerr << Value_Getter<double>::from_device(energy0, cell_index) << "\t";
    std::cerr << Value_Getter<double>::from_device(pressure, cell_index) << "\t";
    std::cerr << Value_Getter<double>::from_device(soundspeed, cell_index) << std::endl;
}