Loading src/trapping/cfrfme.cpp +9 −3 Original line number Original line Diff line number Diff line Loading @@ -403,6 +403,8 @@ void frfme(string data_file, string output_path) { double *vec_vkzm = vkzm[0]; double *vec_vkzm = vkzm[0]; #ifdef USE_TARGET_OFFLOAD #ifdef USE_TARGET_OFFLOAD #pragma omp target teams distribute parallel for simd #pragma omp target teams distribute parallel for simd #else #pragma omp parallel for simd #endif #endif // #pragma omp parallel for // #pragma omp parallel for for (int j80 = jlmf-1; j80 < jlml; j80++) { for (int j80 = jlmf-1; j80 < jlml; j80++) { Loading @@ -417,8 +419,9 @@ void frfme(string data_file, string output_path) { // for (int jx50 = 0; jx50 < nkv; jx50++) { // for (int jx50 = 0; jx50 < nkv; jx50++) { // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target teams distribute parallel for simd // #pragma omp target teams distribute parallel for simd // #else // #pragma omp parallel for simd // #endif // #endif // #pragma omp parallel for for (int jxy50 = 0; jxy50 < nkvs; jxy50++) { for (int jxy50 = 0; jxy50 < nkvs; jxy50++) { // for (int wi = 0; wi < nlmmt; wi++) wk_local[wi] = tt1->wk[wk_index++]; // for (int wi = 0; wi < nlmmt; wi++) wk_local[wi] = tt1->wk[wk_index++]; // w[jx50][jy50] = wk_local[j80]; // w[jx50][jy50] = wk_local[j80]; Loading @@ -438,8 +441,9 @@ void frfme(string data_file, string output_path) { int nvxy = nxv *nyv; int nvxy = nxv *nyv; // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target teams distribute parallel for // #pragma omp target teams distribute parallel for // #endif // #else // #pragma omp parallel for // #pragma omp parallel for // #endif for (int ixyz = 0; ixyz < nvtot; ixyz++) { for (int ixyz = 0; ixyz < nvtot; ixyz++) { int iz75 = ixyz / nvxy; int iz75 = ixyz / nvxy; int iy70 = (ixyz % nvxy) / nxv; int iy70 = (ixyz % nvxy) / nxv; Loading @@ -453,7 +457,9 @@ void frfme(string data_file, string output_path) { // ixyz++; // ixyz++; dcomplex sumy = cc0; dcomplex sumy = cc0; // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target parallel for simd reduction(+:sumy) // #pragma omp target teams distribute parallel for simd reduction(+:sumy) // #else // #pragma omp parallel for simd reduction(+:sumy) // #endif // #endif for (int jy60x55 = 0; jy60x55 < nkvs ; jy60x55++) { for (int jy60x55 = 0; jy60x55 < nkvs ; jy60x55++) { int jy60 = jy60x55 / nkv; int jy60 = jy60x55 / nkv; Loading Loading
src/trapping/cfrfme.cpp +9 −3 Original line number Original line Diff line number Diff line Loading @@ -403,6 +403,8 @@ void frfme(string data_file, string output_path) { double *vec_vkzm = vkzm[0]; double *vec_vkzm = vkzm[0]; #ifdef USE_TARGET_OFFLOAD #ifdef USE_TARGET_OFFLOAD #pragma omp target teams distribute parallel for simd #pragma omp target teams distribute parallel for simd #else #pragma omp parallel for simd #endif #endif // #pragma omp parallel for // #pragma omp parallel for for (int j80 = jlmf-1; j80 < jlml; j80++) { for (int j80 = jlmf-1; j80 < jlml; j80++) { Loading @@ -417,8 +419,9 @@ void frfme(string data_file, string output_path) { // for (int jx50 = 0; jx50 < nkv; jx50++) { // for (int jx50 = 0; jx50 < nkv; jx50++) { // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target teams distribute parallel for simd // #pragma omp target teams distribute parallel for simd // #else // #pragma omp parallel for simd // #endif // #endif // #pragma omp parallel for for (int jxy50 = 0; jxy50 < nkvs; jxy50++) { for (int jxy50 = 0; jxy50 < nkvs; jxy50++) { // for (int wi = 0; wi < nlmmt; wi++) wk_local[wi] = tt1->wk[wk_index++]; // for (int wi = 0; wi < nlmmt; wi++) wk_local[wi] = tt1->wk[wk_index++]; // w[jx50][jy50] = wk_local[j80]; // w[jx50][jy50] = wk_local[j80]; Loading @@ -438,8 +441,9 @@ void frfme(string data_file, string output_path) { int nvxy = nxv *nyv; int nvxy = nxv *nyv; // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target teams distribute parallel for // #pragma omp target teams distribute parallel for // #endif // #else // #pragma omp parallel for // #pragma omp parallel for // #endif for (int ixyz = 0; ixyz < nvtot; ixyz++) { for (int ixyz = 0; ixyz < nvtot; ixyz++) { int iz75 = ixyz / nvxy; int iz75 = ixyz / nvxy; int iy70 = (ixyz % nvxy) / nxv; int iy70 = (ixyz % nvxy) / nxv; Loading @@ -453,7 +457,9 @@ void frfme(string data_file, string output_path) { // ixyz++; // ixyz++; dcomplex sumy = cc0; dcomplex sumy = cc0; // #ifdef USE_TARGET_OFFLOAD // #ifdef USE_TARGET_OFFLOAD // #pragma omp target parallel for simd reduction(+:sumy) // #pragma omp target teams distribute parallel for simd reduction(+:sumy) // #else // #pragma omp parallel for simd reduction(+:sumy) // #endif // #endif for (int jy60x55 = 0; jy60x55 < nkvs ; jy60x55++) { for (int jy60x55 = 0; jy60x55 < nkvs ; jy60x55++) { int jy60 = jy60x55 / nkv; int jy60 = jy60x55 / nkv; Loading