[CP2K-user] [CP2K:19649] Compilation error of ELPA (cp2k-v2023.2)

Chungwen Liang chungwen.liang at creyonbio.com
Tue Dec 12 04:34:10 UTC 2023


Hi all, 

I encountered the following error when compiling the ELPA library. Could you 
please point me in the right direction? Thanks so much.

==================== Installing ELPA ====================

wget  --quiet https://www.cp2k.org/static/downloads/elpa-2022.11.001.tar.gz

elpa-2022.11.001.tar.gz: OK

Checksum of elpa-2022.11.001.tar.gz Ok

Installing from scratch into 
/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/elpa-2022.11.001/cpu

Installing from scratch into 
/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/elpa-2022.11.001/nvidia

 7974 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 7974 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c: In function 
'gpuFree':

../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c:104:11: 
warning: implicit declaration of function 'cudaFreeFromC' 
[-Wimplicit-function-declaration]

  104 |    return cudaFreeFromC(a);

      |           ^~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 6719 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 6719 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c: In function 
'gpuMemcpy':

../test/shared/GPU/test_gpu_vendor_agnostic_layerFunctions.c:113:11: 
warning: implicit declaration of function 'cudaMemcpyFromC' 
[-Wimplicit-function-declaration]

  113 |    return cudaMemcpyFromC(dest, src, count, dir);

      |           ^~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 5285 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 5285 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 3681 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 3681 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 1872 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 1872 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

  PPFC     src/GPU/CUDA/libelpa_openmp_private_la-mod_cuda.lo

In file included from 
../src/elpa2/kernels/complex_avx_2hv_double_precision.c:54:

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:9043:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 9043 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:9043:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 9043 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 7974 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:7974:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 7974 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 6719 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:6719:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 6719 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 5285 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:5285:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 5285 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 3681 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:3681:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 3681 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:40: 
warning: 'always_inline' function might not be inlinable [-Wattributes]

 1872 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                                        ^~~~~~~~~~~~~~~~~~~~~~~~

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:51:47: 
note: in definition of macro 'CONCAT2_8ARGS'

   51 | #define CONCAT2_8ARGS(a, b, c, d, e, f, g, h) a ## b ## c ## d ## e 
## f ## g ## h

      |                                               ^

../src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c:1872:27: 
note: in expansion of macro 'CONCAT_8ARGS'

 1872 | static __forceinline void 
CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIMD_SET,_,BLOCK,hv_,WORD_LENGTH) 
(DATA_TYPE_PTR q, DATA_TYPE_PTR hh, int nb, int ldq

      |                           ^~~~~~~~~~~~

  PPFC     src/GPU/OpenMP/libelpa_openmp_private_la-mod_openmp_offload.lo

  PPFC     src/GPU/ROCm/libelpa_openmp_private_la-mod_hip.lo

  PPFC     src/helpers/libelpa_openmp_private_la-mod_scalapack_interfaces.lo

  PPFC     src/ftimings/libelpa_openmp_private_la-ftimings_value.lo

  PPFC     
src/invert_trm/GPU/CUDA/libelpa_openmp_private_la-mod_invert_trm_cuda.lo

  PPFC     
src/cholesky/GPU/CUDA/libelpa_openmp_private_la-mod_cholesky_cuda.lo

  PPFC     src/helpers/libelpa_openmp_private_la-mod_blas_interfaces.lo

  PPFC     src/elpa2/GPU/libelpa_openmp_private_la-interface_c_gpu_kernel.lo

  PPFC     src/helpers/libelpa_openmp_private_la-mod_thread_affinity.lo

  PPFC     
test/shared/libelpatest_openmp_la-mod_tests_scalapack_interfaces.lo

  PPFC     test/shared/libelpatest_openmp_la-mod_tests_blas_interfaces.lo

  PPFC     test/shared/GPU/CUDA/libelpatest_openmp_la-test_cuda.lo

  PPFC     src/ftimings/libelpa_openmp_private_la-ftimings.lo

  PPFC     src/cholesky/GPU/libelpa_openmp_private_la-mod_cholesky_gpu.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/GPU/CUDA/elpa_index_nvidia_gpu.cu -o 
src/GPU/CUDA/elpa_index_nvidia_gpu.o >/dev/null 2>&1

  PPFC     
src/invert_trm/GPU/libelpa_openmp_private_la-mod_invert_trm_gpu.lo

  PPFC     src/elpa2/qr/libelpa_openmp_private_la-elpa_qrkernels.lo

  PPFC     test/shared/libelpatest_openmp_la-test_prepare_matrix.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/GPU/CUDA/elpa_explicit_name_nvidia_gpu.cu -o 
src/GPU/CUDA/elpa_explicit_name_nvidia_gpu.o >/dev/null 2>&1

  PPFC     src/GPU/libelpa_openmp_private_la-mod_vendor_agnostic_layer.lo

  PPFC     
test/shared/GPU/libelpatest_openmp_la-test_gpu_vendor_agnostic_layer.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c ../src/GPU/CUDA/cuUtils.cu -o 
src/GPU/CUDA/cuUtils.o >/dev/null 2>&1

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/cholesky/GPU/CUDA/elpa_cholesky_cuda.cu -o 
src/cholesky/GPU/CUDA/elpa_cholesky_cuda.o >/dev/null 2>&1

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_complex.cu -o 
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_complex.o >/dev/null 2>&1

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/invert_trm/GPU/CUDA/elpa_invert_trm_cuda.cu -o 
src/invert_trm/GPU/CUDA/elpa_invert_trm_cuda.o >/dev/null 2>&1

  PPFC     src/general/libelpa_openmp_private_la-elpa_utilities.lo

  PPFC     src/helpers/libelpa_openmp_private_la-matrix_plot.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real.cu -o 
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real.o >/dev/null 2>&1

  PPFC     src/libelpa_openmp_public_la-elpa_api.lo

  PPFC     
src/general/libelpa_openmp_private_la-mod_elpa_skewsymmetric_blas.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c ../src/GPU/CUDA/cudaFunctions.cu 
-o src/GPU/CUDA/cudaFunctions.o >/dev/null 2>&1

  PPFC     src/libelpa_openmp_private_la-elpa_abstract_impl.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../test/shared/GPU/CUDA/test_cudaFunctions.cu -o 
test/shared/GPU/CUDA/test_cudaFunctions.o >/dev/null 2>&1

  PPFC     src/GPU/libelpa_openmp_private_la-check_for_gpu.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_global_product.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_v_add_s.lo

  PPFC     
src/solve_tridi/libelpa_openmp_private_la-mod_solve_secular_equation.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_resort_ev.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_global_gather.lo

  PPFC     
src/solve_tridi/libelpa_openmp_private_la-mod_transform_columns.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_check_monotony.lo

  PPFC     
src/solve_tridi/libelpa_openmp_private_la-mod_distribute_global_column.lo

  PPFC     
src/elpa2/kernels/libelpa_openmp_private_la-mod_single_hh_trafo_real.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-elpa2_determine_workload.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-mod_pack_unpack_cpu.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-mod_pack_unpack_gpu.lo

  PPFC     src/libelpa_openmp_private_la-elpa_autotune_impl.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-real.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-complex.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-real_simple.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-complex_simple.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-real_simple_block4.lo

  PPFC     src/elpa2/kernels/libelpa_openmp_private_la-real_simple_block6.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_add_tmp.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-mod_compute_hh_trafo.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-mod_redist_band.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_merge_systems.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_merge_recursive.lo

  PPFC     src/elpa1/libelpa_openmp_private_la-elpa1_compute_private.lo

  PPFC     src/solve_tridi/libelpa_openmp_private_la-mod_solve_tridi.lo

  PPFC     src/cholesky/libelpa_openmp_private_la-mod_elpa_cholesky.lo

  PPFC     src/invert_trm/libelpa_openmp_private_la-mod_elpa_invert_trm.lo

  PPFC     
src/multiply_a_b/libelpa_openmp_private_la-mod_elpa_multiply_a_b.lo

  PPFC     src/elpa2/qr/libelpa_openmp_private_la-qr_utils.lo

  PPFC     src/elpa1/libelpa_openmp_private_la-elpa1_auxiliary.lo

libtool: compile:  ../nvcc_wrap -std=c++14 -allow-unsupported-compiler 
-arch sm_80 -O2 -I/usr/local/cuda-12.3/include --default-stream per-thread 
-Wl,--allow-multiple-definition -Wl,--enable-new-dtags 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/openblas-0.3.23/lib 
-L/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-Wl,-rpath,/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/install/scalapack-2.2.1/lib 
-L/usr/local/cuda-12.3/lib64 -I./ -I../ -c 
../src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real_sm80.cu -o 
src/elpa2/GPU/CUDA/ev_tridi_band_nvidia_gpu_real_sm80.o >/dev/null 2>&1

  PPFC     src/elpa1/libelpa_openmp_private_la-elpa1.lo

  PPFC     src/elpa2/qr/libelpa_openmp_private_la-elpa_pdlarfb.lo

  PPFC     src/elpa2/qr/libelpa_openmp_private_la-elpa_pdgeqrf.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-elpa2_compute.lo

  PPFC     src/elpa2/libelpa_openmp_private_la-elpa2.lo

  PPFC     src/libelpa_openmp_private_la-elpa_impl.lo

  PPFC     src/libelpa_openmp_public_la-elpa.lo

  CXXLD    libelpa_openmp_private.la

  FCLD     libelpa_openmp_public.la

  PPFC     test/shared/libelpatest_openmp_la-test_util.lo

  GEN      libelpa_openmp.la

  PPFC     test/shared/libelpatest_openmp_la-test_read_input_parameters.lo

  PPFC     test/shared/libelpatest_openmp_la-test_setup_mpi.lo

  PPFC     test/shared/libelpatest_openmp_la-test_analytic.lo

  PPFC     test/shared/libelpatest_openmp_la-test_check_correctness.lo

  PPFC     test/shared/libelpatest_openmp_la-test_blacs_infrastructure.lo

  PPFC     src/elpa2/elpa2_print_kernels_openmp-elpa2_print_kernels.o

  FCLD     elpa2_print_kernels_openmp

/usr/bin/ld: 
./.libs/libelpa_openmp.a(ev_tridi_band_nvidia_gpu_real_sm80.o): in function 
`_GLOBAL__sub_I__Z20set_max_shared_bytesPKv':

tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x41c): 
undefined reference to `std::ios_base::Init::Init()'

/usr/bin/ld: 
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x423): 
undefined reference to `std::ios_base::Init::~Init()'

collect2: error: ld returned 1 exit status

make[1]: *** [Makefile:69291: elpa2_print_kernels_openmp] Error 1

make[1]: *** Waiting for unfinished jobs....

make[1]: Leaving directory 
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'

make: *** [Makefile:68220: all] Error 2

make  install-am

make[1]: Entering directory 
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'

  FCLD     elpa2_print_kernels_openmp

/usr/bin/ld: 
./.libs/libelpa_openmp.a(ev_tridi_band_nvidia_gpu_real_sm80.o): in function 
`_GLOBAL__sub_I__Z20set_max_shared_bytesPKv':

tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x41c): 
undefined reference to `std::ios_base::Init::Init()'

/usr/bin/ld: 
tmpxft_0036498c_00000000-6_ev_tridi_band_nvidia_gpu_real_sm80.cudafe1.cpp:(.text.startup+0x423): 
undefined reference to `std::ios_base::Init::~Init()'

collect2: error: ld returned 1 exit status

make[1]: *** [Makefile:69291: elpa2_print_kernels_openmp] Error 1

make[1]: Leaving directory 
'/home/chungwen_liang_creyonbio_com/PROGRAMS/cp2k-2023/tools/toolchain/build/elpa-2022.11.001/build_nvidia'

make: *** [Makefile:90711: install] Error 2

Step elpa took 169.00 seconds.

Step ptscotch took 0.00 seconds.

Step superlu took 0.00 seconds.

Step pexsi took 0.00 seconds.

Step quip took 0.00 seconds.

-- 
You received this message because you are subscribed to the Google Groups "cp2k" group.
To unsubscribe from this group and stop receiving emails from it, send an email to cp2k+unsubscribe at googlegroups.com.
To view this discussion on the web visit https://groups.google.com/d/msgid/cp2k/25358bc6-6eca-43bc-8b5a-eea952d46a8bn%40googlegroups.com.
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <https://lists.cp2k.org/archives/cp2k-user/attachments/20231211/c0e143eb/attachment-0001.htm>


More information about the CP2K-user mailing list