[CP2K-user] [CP2K:19649] Compilation error of ELPA (cp2k-v2023.2)
Chungwen Liang
chungwen.liang at creyonbio.com
Tue Dec 12 04:34:10 UTC 2023
Hi all,
I encountered the following error when compiling the ELPA library. Could you
please point me in the right direction? Thanks so much.
==================== Installing ELPA ====================
wget --quiet https://www.cp2k.org/static/downloads/elpa-2022.11.001.tar.gz
elpa-2022.11.001.tar.gz: OK
Checksum of elpa-2022.11.001.tar.gz Ok
Installing from scratch into
/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/elpa-2022.11.001/cpu
Installing from scratch into
/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/elpa-2022.11.001/nvidia
7974 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:27:
note: in expansion of macro 'CONCAT_8ARGS'
7974 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c: In function
'gpuFree':
../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c:104:11:
warning: implicit declaration of function 'cudaFreeFromC'
[-Wimplicit-function-declaration]
104 | return cudaFreeFromC(a);
| ^~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
6719 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:27:
note: in expansion of macro 'CONCAT_8ARGS'
6719 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c: In function
'gpuMemcpy':
../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c:113:11:
warning: implicit declaration of function 'cudaMemcpyFromC'
[-Wimplicit-function-declaration]
113 | return cudaMemcpyFromC(dest, src, count, dir);
| ^~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
5285 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:27:
note: in expansion of macro 'CONCAT_8ARGS'
5285 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
3681 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:27:
note: in expansion of macro 'CONCAT_8ARGS'
3681 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
1872 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:27:
note: in expansion of macro 'CONCAT_8ARGS'
1872 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
PPFC src/GPU/CUDA/libelpa_openmp_private_la-mod_cuda.lo
In file included from
../src/elpa2/kernels/complex_avx_2hv_double_precision.c:54:
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:9043:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
9043 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:9043:27:
note: in expansion of macro 'CONCAT_8ARGS'
9043 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
7974 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:27:
note: in expansion of macro 'CONCAT_8ARGS'
7974 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
6719 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:27:
note: in expansion of macro 'CONCAT_8ARGS'
6719 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
5285 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:27:
note: in expansion of macro 'CONCAT_8ARGS'
5285 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
3681 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:27:
note: in expansion of macro 'CONCAT_8ARGS'
3681 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:40:
warning: 'always_inline' function might not be inlinable [-Wattributes]
1872 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~~~~~~~~~~~~~
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47:
note: in definition of macro 'CONCAT2_8ARGS'
51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e
## f ## g ## h
| ^
../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:27:
note: in expansion of macro 'CONCAT_8ARGS'
1872 | static __forceinline void
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH)
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq
| ^~~~~~~~~~~~
PPFC src/GPU/OpenMP/libelpa_openmp_private_la-mod_openmp_offload.lo
PPFC src/GPU/ROCm/libelpa_openmp_private_la-mod_hip.lo
PPFC src/helpers/libelpa_openmp_private_la-mod_scalapack_interfaces.lo
PPFC src/ftimings/libelpa_openmp_private_la-ftimings_value.lo
PPFC
src/invert_trm/GPU/CUDA/libelpa_openmp_private_la-mod_invert_trm_cuda.lo
PPFC
src/cholesky/GPU/CUDA/libelpa_openmp_private_la-mod_cholesky_cuda.lo
PPFC src/helpers/libelpa_openmp_private_la-mod_blas_interfaces.lo
PPFC src/elpa2/GPU/libelpa_openmp_private_la-interface_c_gpu_kernel.lo
PPFC src/helpers/libelpa_openmp_private_la-mod_thread_affinity.lo
PPFC
test/shared/libelpatest_openmp_la-mod_tests_scalapack_interfaces.lo
PPFC test/shared/libelpatest_openmp_la-mod_tests_blas_interfaces.lo
PPFC test/shared/GPU/CUDA/libelpatest_openmp_la-test_cuda.lo
PPFC src/ftimings/libelpa_openmp_private_la-ftimings.lo
PPFC src/cholesky/GPU/libelpa_openmp_private_la-mod_cholesky_gpu.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/GPU/CUDA/elpa_index_nvidia_gpu.cu -o
src/GPU/CUDA/elpa_index_nvidia_gpu.o >/dev/null 2>&1
PPFC
src/invert_trm/GPU/libelpa_openmp_private_la-mod_invert_trm_gpu.lo
PPFC src/elpa2/qr/libelpa_openmp_private_la-elpa_qrkernels.lo
PPFC test/shared/libelpatest_openmp_la-test_prepare_matrix.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/GPU/CUDA/elpa_explicit_name_nvidia_gpu.cu -o
src/GPU/CUDA/elpa_explicit_name_nvidia_gpu.o >/dev/null 2>&1
PPFC src/GPU/libelpa_openmp_private_la-mod_vendor_agnostic_layer.lo
PPFC
test/shared/GPU/libelpatest_openmp_la-test_gpu_vendor_agnostic_layer.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c ../src/GPU/CUDA/cuUtils.cu -o
src/GPU/CUDA/cuUtils.o >/dev/null 2>&1
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/cholesky/GPU/CUDA/elpa_cholesky_cuda.cu -o
src/cholesky/GPU/CUDA/elpa_cholesky_cuda.o >/dev/null 2>&1
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_complex.cu -o
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_complex.o >/dev/null 2>&1
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/invert_trm/GPU/CUDA/elpa_invert_trm_cuda.cu -o
src/invert_trm/GPU/CUDA/elpa_invert_trm_cuda.o >/dev/null 2>&1
PPFC src/general/libelpa_openmp_private_la-elpa_utilities.lo
PPFC src/helpers/libelpa_openmp_private_la-matrix_plot.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real.cu -o
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real.o >/dev/null 2>&1
PPFC src/libelpa_openmp_public_la-elpa_api.lo
PPFC
src/general/libelpa_openmp_private_la-mod_elpa_skewsymmetric_blas.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c ../src/GPU/CUDA/cudaFunctions.cu
-o src/GPU/CUDA/cudaFunctions.o >/dev/null 2>&1
PPFC src/libelpa_openmp_private_la-elpa_abstract_impl.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../test/shared/GPU/CUDA/test_cudaFunctions.cu -o
test/shared/GPU/CUDA/test_cudaFunctions.o >/dev/null 2>&1
PPFC src/GPU/libelpa_openmp_private_la-check_for_gpu.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_global_product.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_v_add_s.lo
PPFC
src/solve_tridi/libelpa_openmp_private_la-mod_solve_secular_equation.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_resort_ev.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_global_gather.lo
PPFC
src/solve_tridi/libelpa_openmp_private_la-mod_transform_columns.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_check_monotony.lo
PPFC
src/solve_tridi/libelpa_openmp_private_la-mod_distribute_global_column.lo
PPFC
src/elpa2/kernels/libelpa_openmp_private_la-mod_single_hh_trafo_real.lo
PPFC src/elpa2/libelpa_openmp_private_la-elpa2_determine_workload.lo
PPFC src/elpa2/libelpa_openmp_private_la-mod_pack_unpack_cpu.lo
PPFC src/elpa2/libelpa_openmp_private_la-mod_pack_unpack_gpu.lo
PPFC src/libelpa_openmp_private_la-elpa_autotune_impl.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-real.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-complex.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-real_simple.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-complex_simple.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-real_simple_block4.lo
PPFC src/elpa2/kernels/libelpa_openmp_private_la-real_simple_block6.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_add_tmp.lo
PPFC src/elpa2/libelpa_openmp_private_la-mod_compute_hh_trafo.lo
PPFC src/elpa2/libelpa_openmp_private_la-mod_redist_band.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_merge_systems.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_merge_recursive.lo
PPFC src/elpa1/libelpa_openmp_private_la-elpa1_compute_private.lo
PPFC src/solve_tridi/libelpa_openmp_private_la-mod_solve_tridi.lo
PPFC src/cholesky/libelpa_openmp_private_la-mod_elpa_cholesky.lo
PPFC src/invert_trm/libelpa_openmp_private_la-mod_elpa_invert_trm.lo
PPFC
src/multiply_a_b/libelpa_openmp_private_la-mod_elpa_multiply_a_b.lo
PPFC src/elpa2/qr/libelpa_openmp_private_la-qr_utils.lo
PPFC src/elpa1/libelpa_openmp_private_la-elpa1_auxiliary.lo
libtool: compile: ../nvcc_wrap -std=c++14 -allow-unsupported-compiler
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real_sm80.cu -o
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real_sm80.o >/dev/null 2>&1
PPFC src/elpa1/libelpa_openmp_private_la-elpa1.lo
PPFC src/elpa2/qr/libelpa_openmp_private_la-elpa_pdlarfb.lo
PPFC src/elpa2/qr/libelpa_openmp_private_la-elpa_pdgeqrf.lo
PPFC src/elpa2/libelpa_openmp_private_la-elpa2_compute.lo
PPFC src/elpa2/libelpa_openmp_private_la-elpa2.lo
PPFC src/libelpa_openmp_private_la-elpa_impl.lo
PPFC src/libelpa_openmp_public_la-elpa.lo
CXXLD libelpa_openmp_private.la
FCLD libelpa_openmp_public.la
PPFC test/shared/libelpatest_openmp_la-test_util.lo
GEN libelpa_openmp.la
PPFC test/shared/libelpatest_openmp_la-test_read_input_parameters.lo
PPFC test/shared/libelpatest_openmp_la-test_setup_mpi.lo
PPFC test/shared/libelpatest_openmp_la-test_analytic.lo
PPFC test/shared/libelpatest_openmp_la-test_check_correctness.lo
PPFC test/shared/libelpatest_openmp_la-test_blacs_infrastructure.lo
PPFC src/elpa2/elpa2_print_kernels_openmp-elpa2_print_kernels.o
FCLD elpa2_print_kernels_openmp
/usr/bin/ld:
./.libs/libelpa_openmp.a(ev_tridi_band_nvidia_gpu_real_sm80.o): in function
`_GLOBAL__sub_I__Z20set_max_shared_bytesPKv':
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x41c):
undefined reference to `std::ios_base::Init::Init()'
/usr/bin/ld:
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x423):
undefined reference to `std::ios_base::Init::~Init()'
collect2: error: ld returned 1 exit status
make[1]: *** [Makefile:69291: elpa2_print_kernels_openmp] Error 1
make[1]: *** Waiting for unfinished jobs....
make[1]: Leaving directory
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'
make: *** [Makefile:68220: all] Error 2
make install-am
make[1]: Entering directory
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'
FCLD elpa2_print_kernels_openmp
/usr/bin/ld:
./.libs/libelpa_openmp.a(ev_tridi_band_nvidia_gpu_real_sm80.o): in function
`_GLOBAL__sub_I__Z20set_max_shared_bytesPKv':
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x41c):
undefined reference to `std::ios_base::Init::Init()'
/usr/bin/ld:
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x423):
undefined reference to `std::ios_base::Init::~Init()'
collect2: error: ld returned 1 exit status
make[1]: *** [Makefile:69291: elpa2_print_kernels_openmp] Error 1
make[1]: Leaving directory
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'
make: *** [Makefile:90711: install] Error 2
Step elpa took 169.00 seconds.
Step ptscotch took 0.00 seconds.
Step superlu took 0.00 seconds.
Step pexsi took 0.00 seconds.
Step quip took 0.00 seconds.
--
You received this message because you are subscribed to the Google Groups "cp2k" group.
To unsubscribe from this group and stop receiving emails from it, send an email to cp2k+unsubscribe at googlegroups.com.
To view this discussion on the web visit https://groups.google.com/d/msgid/cp2k/25358bc6-6eca-43bc-8b5a-eea952d46a8bn%40googlegroups.com.
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <https://lists.cp2k.org/archives/cp2k-user/attachments/20231211/c0e143eb/attachment-0001.htm>
More information about the CP2K-user
mailing list