Export PGI_CURR_CUDA_HOME=/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/cuda/11.0 Export NVCOMPILER=/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5 Export PGI=/home/jlow/vidia-gcc-8.4.0/hpc_sdk /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5/compilers/bin/tools/fort1 xcspin.f90 -opt 2 -nostatic -x 19 0x400000 -quad -x 15 2 -x 49 0x400004 -x 51 0x20 -x 57 0x4c -x 58 0x10000 -x 124 0x1000 -x 57 0xfb0000 -x 58 0x78031040 -x 70 0x6c00 -x 47 0x400000 -x 47 0x08 -x 48 4608 -x 49 0x100 -stdinc /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5/compilers/include-gcc49:/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5/compilers/include:/usr/local/include:/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-4.8.5/gcc-8.4.0-n5lbxh6ybxdmqh346yxg3lpkpx3clfzm/lib/gcc/powerpc64le-unknown-linux-gnu/8.4.0/include:/usr/local/include:/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-4.8.5/gcc-8.4.0-n5lbxh6ybxdmqh346yxg3lpkpx3clfzm/include:/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-4.8.5/gcc-8.4.0-n5lbxh6ybxdmqh346yxg3lpkpx3clfzm/lib/gcc/powerpc64le-unknown-linux-gnu/8.4.0/include-fixed:/usr/include:/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-4.8.5/gcc-8.4.0-n5lbxh6ybxdmqh346yxg3lpkpx3clfzm/lib/gcc/powerpc64le-unknown-linux-gnu/8.4.0/include:/usr/include -cmdline '+nvfortran xcspin.f90 -v -Minfo -acc -ta=tesla:cc30,cc35,cc60,cc70,cuda11.0 -Mfree -Mnoupcase -Mbackslash -Mlarge_arrays -fast -Mvect=simd -Mflushz -Mcache_align -ta=tesla:nollvm -I/home/jlow/qd/2.3.22-pgi-2020/include/qd -I/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-8.4.0/fftw-3.3.8-iolztwvg7vdfhufa7scpnp6hmsopn55k/include -c -I/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/include -I/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/lib' -def __STDC_HOSTED__ -idir /home/jlow/qd/2.3.22-pgi-2020/include/qd -idir /soft/packaging/spack-builds/linux-rhel7-power8le/gcc-8.4.0/fftw-3.3.8-iolztwvg7vdfhufa7scpnp6hmsopn55k/include -idir /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/include -idir /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/lib -def __power__ -def __powerpc__ -def __powerpc64__ -def __PPC__ -def __PPC64__ -def __LP64__ -def __LITTLE_ENDIAN__ -def __CHAR_UNSIGNED__ -def _CALL_ELF=2 -def __PGLLVM__ -def __NVCOMPILER_LLVM__ -def __extension__= -def __linux__ -def __linux -def linux -def _ACCEL=201003 -def _OPENACC=201711 -def CUDA_VERSION=11000 -def PGI_TESLA_TARGET -ccff -freeform -vect 48 -x 54 1 -x 68 0x1 -x 49 0x40000000 -x 70 0x40000000 -x 124 1 -x 195 0x8000 -x 186 0x80 -x 186 0x80 -x 163 1 -x 186 0x80000 -x 180 0x400 -cudaver 11000 -x 186 0x80 -x 163 1 -x 186 0x80000 -x 180 0x400 -cudaver 11000 -x 189 0x8000 -y 163 0xc0000000 -accel tesla -accel tesla -freeform -noupcase -x 124 0x40 -x 68 0x1 -x 53 2 -quad -x 119 0x10000000 -stbfile /tmp/nvfortranMd1AYR0Lj3-O.stb -modexport /tmp/nvfortranwd1AckA-aQVB.cmod -modindex /tmp/nvfortrangd1AsAR916Jy.cmdx -output /tmp/nvfortran2d1AIV_6f7DS.ilm 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ 0 inform, 0 warnings, 0 severes, 0 fatal for ggaapprox 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ddsc 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ddsc_ 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_noncol_ 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_vdw_ NVFORTRAN/power Linux 20.5-0: compilation successful /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5/compilers/bin/tools/fort2 /tmp/nvfortran2d1AIV_6f7DS.ilm -fn xcspin.f90 -opt 2 -x 51 0x20 -x 119 0xa10000 -x 122 0x40 -x 123 0x1000 -x 127 4 -x 127 17 -x 119 0x40000000 -x 19 0x400000 -x 120 0x10000000 -x 70 0x8000 -x 122 1 -x 125 0x20000 -x 56 0x40 -vect 56 -y 34 16 -x 34 0x8 -y 19 8 -y 35 0 -x 42 0x30 -x 199 10 -x 39 0x80 -x 34 0x400000 -x 149 1 -x 150 1 -x 120 0x1000 -x 124 0x1400 -y 15 2 -x 57 0x3b0000 -x 58 0x48000000 -x 49 0x100 -astype 0 -x 121 1 -x 183 4 -x 121 0x800 -x 8 0x40000000 -x 70 0x40000000 -x 54 0x10 -x 249 90 -x 68 0x20 -x 8 0x40000000 -x 39 4 -x 68 0x1 -x 49 0x40000000 -x 164 0x800000 -x 124 1 -accel tesla -accel tesla -x 180 0x4000400 -x 121 0xc00 -x 186 0x80 -x 180 0x4000400 -x 121 0xc00 -x 186 0x80 -x 163 0x1 -x 186 0x80000 -cudaver 11000 -x 194 0x40000 -cudaroot /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/cuda/11.0 -x 176 0x100 -cudacap 30 -cudacap 35 -cudacap 60 -cudacap 70 -x 180 0x4000400 -x 121 0xc00 -x 186 0x80 -x 163 0x1 -x 186 0x80000 -cudaver 11000 -x 194 0x40000 -y 189 0x10 -cudaroot /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/cuda/11.0 -x 176 0x100 -cudacap 30 -cudacap 35 -cudacap 60 -cudacap 70 -x 189 0x8000 -y 163 0xc0000000 -y 189 0x4000000 -cudaroot /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/cuda/11.0 -x 0 0x1000000 -x 2 0x100000 -x 0 0x2000000 -x 161 0x2cff7 -x 162 0x2cff7 -noupcase -x 124 0x40 -x 68 0x1 -x 9 1 -x 42 0x14200000 -x 72 0x1 -x 136 0x11 -x 37 0x481000 -x 129 2 -quad -x 119 0x10000000 -x 129 0x40000000 -cmdline '+nvfortran xcspin.f90 -v -Minfo -acc -ta=tesla:cc30,cc35,cc60,cc70,cuda11.0 -Mfree -Mnoupcase -Mbackslash -Mlarge_arrays -fast -Mvect=simd -Mflushz -Mcache_align -ta=tesla:nollvm -I/home/jlow/qd/2.3.22-pgi-2020/include/qd -I/soft/packaging/spack-builds/linux-rhel7-power8le/gcc-8.4.0/fftw-3.3.8-iolztwvg7vdfhufa7scpnp6hmsopn55k/include -c -I/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/include -I/home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/2020/mpi/openmpi-3.1.5/lib' -stbfile /tmp/nvfortranMd1AYR0Lj3-O.stb -asm /tmp/nvfortranMd1AYq8PfCup.ll fexcgs: 65, Generating enter data create(cwgrad(:,:),dwork2(:,:),dwork1(:,:),dvc(:),dwork3(:,:),dworkg(:,:)) 74, Generating enter data create(dwork6(:),dwork5(:),dwork4(:),dwork7(:)) 82, Generating exit data delete(dwork6(:),dwork5(:),dwork4(:),dwork7(:)) 87, Generating exit data delete(cwgrad(:,:),dwork2(:,:),dwork1(:,:),dvc(:),dwork3(:,:),dworkg(:,:)) 95, Generating enter data create(cwgrad(:,:),dwork2(:,:),dwork1(:,:),dvc(:),dwork3(:,:),dworkg(:,:)) 102, Generating exit data delete(cwgrad(:,:),dwork2(:,:),dwork1(:,:),dvc(:),dworkg(:,:),dwork3(:,:)) 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs fexcgs_: 182, FMA (fused multiply-add) instruction(s) generated 184, Generating present(dhtot(:,:),dencor(:),latt_cur,dwork(:,:)) Generating Tesla code 185, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 184, Generating implicit copyin(gridc) [if not already present] 185, Loop not fused: no successor loop Generated vector simd code for the loop 195, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 196, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 195, Generating implicit copyin(gridc) [if not already present] 196, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 203, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 205, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 205, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 217, Generating present(dwork(:,:),dwork1(:,:)) Generating Tesla code 218, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 217, Generating implicit copyin(gridc) [if not already present] 218, Memory copy idiom, loop replaced by call to __c_mcopy8 223, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 224, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 223, Generating implicit copyin(gridc) [if not already present] 224, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 230, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 232, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 232, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 244, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 245, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 244, Generating implicit copyin(gridc) [if not already present] 245, Memory copy idiom, loop replaced by call to __c_mcopy8 251, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 252, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 251, Generating implicit copyin(gridc) [if not already present] 252, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 259, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 261, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 261, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 273, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 274, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 273, Generating implicit copyin(gridc) [if not already present] 274, Memory copy idiom, loop replaced by call to __c_mcopy8 288, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dwork1(:,:),dwork2(:,:),dvc(:),dhtot(:,:),dwork3(:,:)) Generating Tesla code 291, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:exc) 288, Generating implicit copyin(gridc) [if not already present] Generating implicit copy(exc) [if not already present] 291, Loop not vectorized/parallelized: contains call 295, FMA (fused multiply-add) instruction(s) generated 298, FMA (fused multiply-add) instruction(s) generated 301, FMA (fused multiply-add) instruction(s) generated 323, FMA (fused multiply-add) instruction(s) generated 392, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 394, !$acc loop gang, vector(128) collapse(2) ! blockidx%x threadidx%x Generating reduction(+:sif12,sif31,sif33,sif11,sif22,sif23) 395, ! blockidx%x threadidx%x collapsed 392, Generating implicit copyin(gridc) [if not already present] Generating implicit copy(sif12,sif33,sif31,sif11,sif22,sif23) [if not already present] 394, Scalar last value needed after loop for sif11 at line 411 Scalar last value needed after loop for sif22 at line 412 Scalar last value needed after loop for sif33 at line 413 Scalar last value needed after loop for sif12 at line 414 Scalar last value needed after loop for sif31 at line 416 Scalar last value needed after loop for sif23 at line 415 Loop not fused: no successor loop FMA (fused multiply-add) instruction(s) generated 395, Scalar last value needed after loop for sif11 at line 411 427, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 429, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 427, Generating implicit copyin(gridc) [if not already present] 429, Loop not fused: no successor loop Generated vector simd code for the loop FMA (fused multiply-add) instruction(s) generated 446, FMA (fused multiply-add) instruction(s) generated 451, Generating present(dwork1(:,:),dwork(:,:)) Generating Tesla code 452, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 451, Generating implicit copyin(gridc) [if not already present] 452, Memory copy idiom, loop replaced by call to __c_mcopy8 459, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 461, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 461, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 472, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 473, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 472, Generating implicit copyin(gridc) [if not already present] 473, Memory copy idiom, loop replaced by call to __c_mcopy8 480, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 482, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 482, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 493, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 494, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 493, Generating implicit copyin(gridc) [if not already present] 494, Memory copy idiom, loop replaced by call to __c_mcopy8 501, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 503, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 503, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 529, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dhtot(:,:),dwgrad(:,:)) Generating Tesla code 531, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:xcencc,xcenc,cvzero) 529, Generating implicit copy(cvzero,xcencc,xcenc) [if not already present] Generating implicit copyin(gridc) [if not already present] 531, Loop not fused: no successor loop Loop not vectorized: may not be beneficial FMA (fused multiply-add) instruction(s) generated 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ 0 inform, 0 warnings, 0 severes, 0 fatal for ggaapprox 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ddsc fexcgs_ddsc_: 728, FMA (fused multiply-add) instruction(s) generated 730, Loop not fused: function call before adjacent loop Generated vector simd code for the loop 740, Loop not fused: different loop trip count Loop not vectorized: may not be beneficial Loop unrolled 8 times 747, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 759, Memory copy idiom, loop replaced by call to __c_mcopy8 764, Loop not fused: different loop trip count Loop not vectorized: may not be beneficial Loop unrolled 8 times 770, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 782, Memory copy idiom, loop replaced by call to __c_mcopy8 788, Loop not fused: different loop trip count Loop not vectorized: may not be beneficial Loop unrolled 8 times 795, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 807, Memory copy idiom, loop replaced by call to __c_mcopy8 821, Loop not vectorized/parallelized: contains call 825, FMA (fused multiply-add) instruction(s) generated 828, FMA (fused multiply-add) instruction(s) generated 831, FMA (fused multiply-add) instruction(s) generated 858, FMA (fused multiply-add) instruction(s) generated 885, Loop not vectorized/parallelized: contains call 889, FMA (fused multiply-add) instruction(s) generated 892, FMA (fused multiply-add) instruction(s) generated 944, Loop not fused: different loop trip count FMA (fused multiply-add) instruction(s) generated 977, Generated vector simd code for the loop FMA (fused multiply-add) instruction(s) generated 994, FMA (fused multiply-add) instruction(s) generated 999, Memory copy idiom, loop replaced by call to __c_mcopy8 1006, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1017, Memory copy idiom, loop replaced by call to __c_mcopy8 1024, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1035, Memory copy idiom, loop replaced by call to __c_mcopy8 1042, Loop not fused: function call before adjacent loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1068, Loop not fused: function call before adjacent loop Loop not vectorized: may not be beneficial FMA (fused multiply-add) instruction(s) generated 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_ddsc_ fexcgs_noncol_: 1184, FMA (fused multiply-add) instruction(s) generated 1187, Generating present(dhtot(:,:),dencor(:),dwork(:,:),latt_cur) Generating Tesla code 1188, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1187, Generating implicit copyin(gridc) [if not already present] 1188, Loop not fused: no successor loop Generated vector simd code for the loop 1192, Generating present(dhtot(:,:),latt_cur,dwork(:,:)) Generating Tesla code 1193, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1192, Generating implicit copyin(gridc) [if not already present] 1193, Loop not fused: no successor loop Generated vector simd code for the loop 1204, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 1205, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1204, Generating implicit copyin(gridc) [if not already present] 1205, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1211, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 1213, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1213, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1225, Generating present(dwork(:,:),dwork1(:,:)) Generating Tesla code 1226, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1225, Generating implicit copyin(gridc) [if not already present] 1226, Memory copy idiom, loop replaced by call to __c_mcopy8 1231, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 1232, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1231, Generating implicit copyin(gridc) [if not already present] 1232, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1238, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 1240, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1240, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1252, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 1253, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1252, Generating implicit copyin(gridc) [if not already present] 1253, Memory copy idiom, loop replaced by call to __c_mcopy8 1258, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 1259, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1258, Generating implicit copyin(gridc) [if not already present] 1259, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1265, Generating present(cwork(:,:),gridc,latt_cur) Generating Tesla code 1267, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1267, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1279, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 1280, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1279, Generating implicit copyin(gridc) [if not already present] 1280, Memory copy idiom, loop replaced by call to __c_mcopy8 1295, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dwork1(:,:),dwork2(:,:),dvc(:),dhtot(:,:),dwork3(:,:)) Generating Tesla code 1298, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:exc) 1295, Local memory used for nabmag Generating implicit copyin(gridc) [if not already present] Generating implicit copy(exc) [if not already present] 1298, Loop not vectorized/parallelized: contains call 1302, FMA (fused multiply-add) instruction(s) generated 1313, FMA (fused multiply-add) instruction(s) generated 1314, FMA (fused multiply-add) instruction(s) generated 1315, FMA (fused multiply-add) instruction(s) generated 1319, FMA (fused multiply-add) instruction(s) generated 1326, FMA (fused multiply-add) instruction(s) generated 1333, FMA (fused multiply-add) instruction(s) generated 1364, FMA (fused multiply-add) instruction(s) generated 1430, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 1432, !$acc loop gang, vector(128) collapse(2) ! blockidx%x threadidx%x Generating reduction(+:sif12,sif31,sif33,sif11,sif22,sif23) 1433, ! blockidx%x threadidx%x collapsed 1430, Generating implicit copyin(gridc) [if not already present] Generating implicit copy(sif12,sif33,sif31,sif11,sif22,sif23) [if not already present] 1432, Scalar last value needed after loop for sif11 at line 1449 Scalar last value needed after loop for sif22 at line 1450 Scalar last value needed after loop for sif33 at line 1451 Scalar last value needed after loop for sif12 at line 1452 Scalar last value needed after loop for sif31 at line 1454 Scalar last value needed after loop for sif23 at line 1453 Loop not fused: no successor loop Loop not vectorized/parallelized: loop count too small FMA (fused multiply-add) instruction(s) generated 1433, Scalar last value needed after loop for sif11 at line 1449 1465, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 1467, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1465, Generating implicit copyin(gridc) [if not already present] 1467, Loop not fused: no successor loop Generated vector simd code for the loop FMA (fused multiply-add) instruction(s) generated 1484, FMA (fused multiply-add) instruction(s) generated 1489, Generating present(dwork1(:,:),dwork(:,:)) Generating Tesla code 1490, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1489, Generating implicit copyin(gridc) [if not already present] 1490, Memory copy idiom, loop replaced by call to __c_mcopy8 1497, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 1499, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1499, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1510, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 1511, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1510, Generating implicit copyin(gridc) [if not already present] 1511, Memory copy idiom, loop replaced by call to __c_mcopy8 1518, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 1520, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1520, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1531, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 1532, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1531, Generating implicit copyin(gridc) [if not already present] 1532, Memory copy idiom, loop replaced by call to __c_mcopy8 1539, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 1541, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1541, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1567, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dhtot(:,:),dwgrad(:,:)) Generating Tesla code 1570, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:xcencc,xcenc,cvzero) 1567, Generating implicit copy(cvzero,xcencc,xcenc) [if not already present] Generating implicit copyin(gridc) [if not already present] 1570, Loop not fused: no successor loop Loop not vectorized: may not be beneficial FMA (fused multiply-add) instruction(s) generated 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_noncol_ fexcgs_vdw_: 1712, FMA (fused multiply-add) instruction(s) generated 1714, Generating present(dhtot(:,:),dencor(:),latt_cur,dwork(:,:)) Generating Tesla code 1715, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1714, Generating implicit copyin(gridc) [if not already present] 1715, Loop not fused: no successor loop Generated vector simd code for the loop 1725, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 1726, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1725, Generating implicit copyin(gridc) [if not already present] 1726, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1733, Generating present(cwork(:,:),gridc,latt_cur) Generating Tesla code 1735, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1735, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1747, Generating present(dwork(:,:),dwork1(:,:)) Generating Tesla code 1748, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1747, Generating implicit copyin(gridc) [if not already present] 1748, Memory copy idiom, loop replaced by call to __c_mcopy8 1753, Generating present(cwork(:,:),cwgrad(:,:)) Generating Tesla code 1754, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1753, Generating implicit copyin(gridc) [if not already present] 1754, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1760, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 1762, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1762, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1774, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 1775, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1774, Generating implicit copyin(gridc) [if not already present] 1775, Memory copy idiom, loop replaced by call to __c_mcopy8 1781, Generating present(cwgrad(:,:),cwork(:,:)) Generating Tesla code 1782, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1781, Generating implicit copyin(gridc) [if not already present] 1782, Loop not fused: no successor loop Loop not vectorized: may not be beneficial Loop unrolled 8 times 1789, Generating present(cwork(:,:),latt_cur,gridc) Generating Tesla code 1791, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1791, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 1803, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 1804, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1803, Generating implicit copyin(gridc) [if not already present] 1804, Memory copy idiom, loop replaced by call to __c_mcopy8 1818, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dwork1(:,:),dwork2(:,:),dvc(:),dhtot(:,:),dwork3(:,:)) Generating Tesla code 1821, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:exc) 1818, Generating implicit copyin(gridc) [if not already present] Generating implicit copy(exc,dwork7(:)) [if not already present] 1821, Loop not vectorized/parallelized: contains call 1825, FMA (fused multiply-add) instruction(s) generated 1828, FMA (fused multiply-add) instruction(s) generated 1831, FMA (fused multiply-add) instruction(s) generated 1857, FMA (fused multiply-add) instruction(s) generated 1885, Generating present(dhtot(:,:),dencor(:),latt_cur,dwork4(:)) Generating Tesla code 1886, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1885, Generating implicit copyin(gridc) [if not already present] 1886, Loop not fused: no successor loop Generated vector simd code for the loop 1890, Generating present(dwork6(:),dwork5(:)) 1891, Array assignment / Forall at line 1892 fused Loop is parallelizable Generating Tesla code 1891, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1891, Loop not fused: no successor loop Generated vector simd code for the loop 1897, Generating update self(dwork7(:),dwork6(:),dwork5(:),dwork4(:)) 1899, Generating update device(dwork6(:),dwork5(:)) 1902, Generating present(dwork5(:),dwork3(:,:),dwork(:,:),dwork1(:,:),dwork2(:,:)) Generating Tesla code 1903, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1902, Generating implicit copyin(gridc) [if not already present] 1903, Loop not fused: no successor loop Generated vector simd code for the loop FMA (fused multiply-add) instruction(s) generated 1910, Generating present(dworkg(:,:),dwork6(:)) Generating Tesla code 1911, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1910, Generating implicit copyin(gridc) [if not already present] 1911, Loop not fused: no successor loop Generated vector simd code for the loop 1960, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 1962, !$acc loop gang, vector(128) collapse(2) ! blockidx%x threadidx%x Generating reduction(+:sif12,sif31,sif33,sif11,sif22,sif23) 1963, ! blockidx%x threadidx%x collapsed 1960, Generating implicit copyin(gridc) [if not already present] Generating implicit copy(sif12,sif33,sif31,sif11,sif22,sif23) [if not already present] 1962, Scalar last value needed after loop for sif11 at line 1979 Scalar last value needed after loop for sif22 at line 1980 Scalar last value needed after loop for sif33 at line 1981 Scalar last value needed after loop for sif12 at line 1982 Scalar last value needed after loop for sif31 at line 1984 Scalar last value needed after loop for sif23 at line 1983 Loop not fused: no successor loop FMA (fused multiply-add) instruction(s) generated 1963, Scalar last value needed after loop for sif11 at line 1979 1995, Generating present(dwork(:,:),dwork1(:,:),dwork3(:,:),dwork2(:,:),dvc(:)) Generating Tesla code 1997, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 1995, Generating implicit copyin(gridc) [if not already present] 1997, Loop not fused: no successor loop Generated vector simd code for the loop FMA (fused multiply-add) instruction(s) generated 2014, FMA (fused multiply-add) instruction(s) generated 2019, Generating present(dwork1(:,:),dwork(:,:)) Generating Tesla code 2020, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2019, Generating implicit copyin(gridc) [if not already present] 2020, Memory copy idiom, loop replaced by call to __c_mcopy8 2027, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 2029, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2029, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 2040, Generating present(dwork2(:,:),dwork(:,:)) Generating Tesla code 2041, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2040, Generating implicit copyin(gridc) [if not already present] 2041, Memory copy idiom, loop replaced by call to __c_mcopy8 2048, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 2050, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2050, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 2061, Generating present(dwork3(:,:),dwork(:,:)) Generating Tesla code 2062, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2061, Generating implicit copyin(gridc) [if not already present] 2062, Memory copy idiom, loop replaced by call to __c_mcopy8 2069, Generating present(cwork(:,:),cwgrad(:,:),latt_cur,gridc) Generating Tesla code 2071, !$acc loop gang, vector(128) ! blockidx%x threadidx%x 2071, Loop not fused: no successor loop Loop not vectorized: mixed data types Loop not vectorized: may not be beneficial 2097, Generating present(dencor(:),latt_cur,dworkg(:,:),dwork(:,:),dhtot(:,:),dwgrad(:,:)) Generating Tesla code 2099, !$acc loop gang, vector(128) ! blockidx%x threadidx%x Generating reduction(+:xcencc,xcenc,cvzero) 2097, Generating implicit copy(cvzero,xcencc,xcenc) [if not already present] Generating implicit copyin(gridc) [if not already present] 2099, Loop not fused: no successor loop Loop not vectorized: may not be beneficial FMA (fused multiply-add) instruction(s) generated 2133, Loop unrolled 3 times (completely unrolled) 0 inform, 0 warnings, 0 severes, 0 fatal for fexcgs_vdw_ /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/20.5/compilers/bin/tools/nvdd -dcuda /home/jlow/vidia-gcc-8.4.0/hpc_sdk/Linux_ppc64le/cuda/11.0 -reloc /tmp/pgaccNg1A1aMSCcct.gpu -computecap 30 -ptx /tmp/pgaccxg1AfdhZmjLk.ptx -o /tmp/pgaccpg1ATBFZetUv.bin -ftz -cuda11000 /tmp/pgaccNg1A1aMSCcct.gpu(1941): error: no operator "=" matches these operands operand types are: dcmplx2 = double /tmp/pgaccNg1A1aMSCcct.gpu(1943): error: no suitable conversion function from "dcmplx2" to "double" exists /tmp/pgaccNg1A1aMSCcct.gpu(4416): error: no operator "=" matches these operands operand types are: dcmplx2 = double /tmp/pgaccNg1A1aMSCcct.gpu(4418): error: no suitable conversion function from "dcmplx2" to "double" exists /tmp/pgaccNg1A1aMSCcct.gpu(6955): error: no operator "=" matches these operands operand types are: dcmplx2 = double /tmp/pgaccNg1A1aMSCcct.gpu(6957): error: no suitable conversion function from "dcmplx2" to "double" exists 6 errors detected in the compilation of "/tmp/nvdd3h1ALLPKr-Cx.ii". NVFORTRAN-F-0155-Compiler failed to translate accelerator region (see -Minfo messages): Device compiler exited with error status code (xcspin.f90: 2097) NVFORTRAN/power Linux 20.5-0: compilation aborted nvfortran-Fatal-f902 completed with exit code 1 Unlinking /tmp/nvfortran2d1AIV_6f7DS.ilm Unlinking /tmp/nvfortranMd1AYR0Lj3-O.stb Unlinking /tmp/nvfortranwd1AckA-aQVB.cmod Unlinking /tmp/nvfortrangd1AsAR916Jy.cmdx Unlinking /tmp/nvfortran2d1AISggWR0F.s Unlinking /tmp/nvfortranMd1AYq8PfCup.ll