@@ -1142,69 +1142,32 @@ contains
1142
1142
if (n == 0 ) return
1143
1143
1144
1144
if (weno_dir == 2 ) then
1145
- #if MFC_cuTENSOR
1146
- if (cu_tensor) then
1147
- if (p == 0 ) then
1148
- block
1149
- use CuTensorEx
1150
-
1151
- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_y]' )
1152
- v_rs_ws_y = reshape (v_rs_ws_x, shape= [n + 1 + 2 * buff_size, m + 2 * buff_size + 1 , p + 1 , sys_size], order= [2 , 1 , 3 , 4 ])
1153
- #:endcall GPU_HOST_DATA
1154
- end block
1155
- else
1156
- block
1157
- use CuTensorEx
1158
-
1159
- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_y]' )
1160
- v_rs_ws_y = reshape (v_rs_ws_x, shape= [n + 1 + 2 * buff_size, m + 2 * buff_size + 1 , p + 1 + 2 * buff_size, sys_size], order= [2 , 1 , 3 , 4 ])
1161
- #:endcall GPU_HOST_DATA
1162
- end block
1163
- end if
1164
- else
1165
- #endif
1166
- $:GPU_PARALLEL_LOOP(collapse= 4 )
1167
- do j = 1 , v_size
1168
- do q = is3_weno%beg, is3_weno%end
1169
- do l = is2_weno%beg, is2_weno%end
1170
- do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1171
- v_rs_ws_y(k, l, q, j) = v_vf(j)%sf(l, k, q)
1172
- end do
1145
+ $:GPU_PARALLEL_LOOP(collapse= 4 )
1146
+ do j = 1 , v_size
1147
+ do q = is3_weno%beg, is3_weno%end
1148
+ do l = is2_weno%beg, is2_weno%end
1149
+ do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1150
+ v_rs_ws_y(k, l, q, j) = v_vf(j)%sf(l, k, q)
1173
1151
end do
1174
1152
end do
1175
1153
end do
1176
- #if MFC_cuTENSOR
1177
- end if
1178
- #endif
1154
+ end do
1179
1155
end if
1180
1156
1181
1157
! Reshaping/Projecting onto Characteristic Fields in z-direction
1182
1158
if (p == 0 ) return
1159
+
1183
1160
if (weno_dir == 3 ) then
1184
- #if MFC_cuTENSOR
1185
- if (cu_tensor) then
1186
- block
1187
- use CuTensorEx
1188
-
1189
- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_z]' )
1190
- v_rs_ws_z = reshape (v_rs_ws_x, shape= [p + 1 + 2 * buff_size, n + 2 * buff_size + 1 , m + 2 * buff_size + 1 , sys_size], order= [3 , 2 , 1 , 4 ])
1191
- #:endcall
1192
- end block
1193
- else
1194
- #endif
1195
- $:GPU_PARALLEL_LOOP(collapse= 4 )
1196
- do j = 1 , v_size
1197
- do q = is3_weno%beg, is3_weno%end
1198
- do l = is2_weno%beg, is2_weno%end
1199
- do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1200
- v_rs_ws_z(k, l, q, j) = v_vf(j)%sf(q, l, k)
1201
- end do
1161
+ $:GPU_PARALLEL_LOOP(collapse= 4 )
1162
+ do j = 1 , v_size
1163
+ do q = is3_weno%beg, is3_weno%end
1164
+ do l = is2_weno%beg, is2_weno%end
1165
+ do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1166
+ v_rs_ws_z(k, l, q, j) = v_vf(j)%sf(q, l, k)
1202
1167
end do
1203
1168
end do
1204
1169
end do
1205
- #if MFC_cuTENSOR
1206
- end if
1207
- #endif
1170
+ end do
1208
1171
end if
1209
1172
1210
1173
end subroutine s_initialize_weno
0 commit comments