@@ -1142,69 +1142,32 @@ contains
11421142 if (n == 0 ) return
11431143
11441144 if (weno_dir == 2 ) then
1145- #if MFC_cuTENSOR
1146- if (cu_tensor) then
1147- if (p == 0 ) then
1148- block
1149- use CuTensorEx
1150-
1151- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_y]' )
1152- v_rs_ws_y = reshape (v_rs_ws_x, shape= [n + 1 + 2 * buff_size, m + 2 * buff_size + 1 , p + 1 , sys_size], order= [2 , 1 , 3 , 4 ])
1153- #:endcall GPU_HOST_DATA
1154- end block
1155- else
1156- block
1157- use CuTensorEx
1158-
1159- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_y]' )
1160- v_rs_ws_y = reshape (v_rs_ws_x, shape= [n + 1 + 2 * buff_size, m + 2 * buff_size + 1 , p + 1 + 2 * buff_size, sys_size], order= [2 , 1 , 3 , 4 ])
1161- #:endcall GPU_HOST_DATA
1162- end block
1163- end if
1164- else
1165- #endif
1166- $:GPU_PARALLEL_LOOP(collapse= 4 )
1167- do j = 1 , v_size
1168- do q = is3_weno%beg, is3_weno%end
1169- do l = is2_weno%beg, is2_weno%end
1170- do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1171- v_rs_ws_y(k, l, q, j) = v_vf(j)%sf(l, k, q)
1172- end do
1145+ $:GPU_PARALLEL_LOOP(collapse= 4 )
1146+ do j = 1 , v_size
1147+ do q = is3_weno%beg, is3_weno%end
1148+ do l = is2_weno%beg, is2_weno%end
1149+ do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1150+ v_rs_ws_y(k, l, q, j) = v_vf(j)%sf(l, k, q)
11731151 end do
11741152 end do
11751153 end do
1176- #if MFC_cuTENSOR
1177- end if
1178- #endif
1154+ end do
11791155 end if
11801156
11811157 ! Reshaping/ Projecting onto Characteristic Fields in z- direction
11821158 if (p == 0 ) return
1159+
11831160 if (weno_dir == 3 ) then
1184- #if MFC_cuTENSOR
1185- if (cu_tensor) then
1186- block
1187- use CuTensorEx
1188-
1189- #:call GPU_HOST_DATA(use_device= ' [v_rs_ws_x, v_rs_ws_z]' )
1190- v_rs_ws_z = reshape (v_rs_ws_x, shape= [p + 1 + 2 * buff_size, n + 2 * buff_size + 1 , m + 2 * buff_size + 1 , sys_size], order= [3 , 2 , 1 , 4 ])
1191- #:endcall
1192- end block
1193- else
1194- #endif
1195- $:GPU_PARALLEL_LOOP(collapse= 4 )
1196- do j = 1 , v_size
1197- do q = is3_weno%beg, is3_weno%end
1198- do l = is2_weno%beg, is2_weno%end
1199- do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1200- v_rs_ws_z(k, l, q, j) = v_vf(j)%sf(q, l, k)
1201- end do
1161+ $:GPU_PARALLEL_LOOP(collapse= 4 )
1162+ do j = 1 , v_size
1163+ do q = is3_weno%beg, is3_weno%end
1164+ do l = is2_weno%beg, is2_weno%end
1165+ do k = is1_weno%beg - weno_polyn, is1_weno%end + weno_polyn
1166+ v_rs_ws_z(k, l, q, j) = v_vf(j)%sf(q, l, k)
12021167 end do
12031168 end do
12041169 end do
1205- #if MFC_cuTENSOR
1206- end if
1207- #endif
1170+ end do
12081171 end if
12091172
12101173 end subroutine s_initialize_weno
0 commit comments