System: Nehalem CPU with 8 Gbytes main memory, GTX 460 with 2 Gbytes memory, MAGMA 1.0.0 RC3 out of the box and GotoBLAS2 compiled for CORE2 (see other threads).
I get the following output from a run of testing_dgetrf_gpu:
It is crashing on exit, which I have also seen with RC2. I hope this helps figure out what is happening. There are references in the crash dump (the memory map section) to /usr/lib/atlas, which I did not think I was using. I have attached my make.inc in case it holds a clue.
If I next run testing_zgetrf_gpu and then run testing_dgetrf_gpu again, both run without error. I have attached the outputs below.
Best wishes
John
- Code: Select all
fletcher@fletcher-desktop:~/magma_1.0.0-rc3/testing$ ./testing_dgetrf_gpu
device 0: GeForce GTX 460, 1400.0 MHz clock, 2047.2 MB memory
Usage:
testing_dgetrf_gpu -M 1024 -N 1024
M N CPU GFlop/s GPU GFlop/s ||PA-LU||/(||A||*N)
============================================================
960 960 16.48 21.56 nan
1920 1920 25.32 43.90 nan
3072 3072 25.87 60.96 nan
4032 4032 26.53 65.27 nan
4992 4992 25.64 67.47 nan
5952 5952 26.42 68.89 nan
7104 7104 26.90 69.78 nan
8064 8064 27.04 70.76 nan
9024 9024 27.39 71.40 nan
9984 9984 26.71 71.57 nan
*** glibc detected *** ./testing_dgetrf_gpu: munmap_chunk(): invalid pointer: 0x00007fdc337b0010 ***
======= Backtrace: =========
/lib/libc.so.6(+0x775b6)[0x7fdc743785b6]
./testing_dgetrf_gpu[0x402670]
/lib/libc.so.6(__libc_start_main+0xfd)[0x7fdc7431fc4d]
./testing_dgetrf_gpu[0x401b59]
======= Memory map: ========
00400000-0053a000 r-xp 00000000 08:01 10750245 /home/fletcher/magma_1.0.0-rc3/testing/testing_dgetrf_gpu
00739000-0073a000 r--p 00139000 08:01 10750245 /home/fletcher/magma_1.0.0-rc3/testing/testing_dgetrf_gpu
0073a000-0073b000 rw-p 0013a000 08:01 10750245 /home/fletcher/magma_1.0.0-rc3/testing/testing_dgetrf_gpu
00ba4000-02fbc000 rw-p 00000000 00:00 0 [heap]
7fdc03f30000-7fdc337b0000 rw-s 1d2ad8000 00:05 4755 /dev/nvidia0
7fdc337b0000-7fdc63031000 rw-p 00000000 00:00 0
7fdc63031000-7fdc65031000 rw-p 00000000 00:00 0
7fdc67033000-7fdc69033000 rw-p 00000000 00:00 0
7fdc6b031000-7fdc6d031000 rw-p 00000000 00:00 0
7fdc6e82c000-7fdc6ec2e000 rw-s 1d757e000 00:05 4755 /dev/nvidia0
7fdc6ec2e000-7fdc6f030000 rw-s 1d7967000 00:05 4755 /dev/nvidia0
7fdc6f030000-7fdc71030000 rw-p 00000000 00:00 0
7fdc7110f000-7fdc7142c000 rw-p 00000000 00:00 0
7fdc7142c000-7fdc7152c000 rw-s 1d785f000 00:05 4755 /dev/nvidia0
7fdc7152c000-7fdc7162c000 rw-s 1e675b000 00:05 4755 /dev/nvidia0
7fdc7162c000-7fdc7172c000 rw-s 1e665b000 00:05 4755 /dev/nvidia0
7fdc7172c000-7fdc7182c000 rw-s 1e6557000 00:05 4755 /dev/nvidia0
7fdc7182c000-7fdc7182d000 ---p 00000000 00:00 0
7fdc7182d000-7fdc7202d000 rwxp 00000000 00:00 0
7fdc7202d000-7fdc7202e000 ---p 00000000 00:00 0
7fdc7202e000-7fdc7282e000 rwxp 00000000 00:00 0
7fdc7282e000-7fdc7282f000 ---p 00000000 00:00 0
7fdc7282f000-7fdc7302f000 rwxp 00000000 00:00 0
7fdc7302f000-7fdc737c0000 r-xp 00000000 08:01 54401328 /usr/lib/atlas/libblas.so.3gf.0
7fdc737c0000-7fdc739bf000 ---p 00791000 08:01 54401328 /usr/lib/atlas/libblas.so.3gf.0
7fdc739bf000-7fdc739c4000 r--p 00790000 08:01 54401328 /usr/lib/atlas/libblas.so.3gf.0
7fdc739c4000-7fdc739ca000 rw-p 00795000 08:01 54401328 /usr/lib/atlas/libblas.so.3gf.0
7fdc739ca000-7fdc739d1000 r-xp 00000000 08:01 28181369 /lib/librt-2.11.1.so
7fdc739d1000-7fdc73bd0000 ---p 00007000 08:01 28181369 /lib/librt-2.11.1.so
7fdc73bd0000-7fdc73bd1000 r--p 00006000 08:01 28181369 /lib/librt-2.11.1.so
7fdc73bd1000-7fdc73bd2000 rw-p 00007000 08:01 28181369 /lib/librt-2.11.1.so
7fdc73bd2000-7fdc73bd4000 r-xp 00000000 08:01 28181708 /lib/libdl-2.11.1.so
7fdc73bd4000-7fdc73dd4000 ---p 00002000 08:01 28181708 /lib/libdl-2.11.1.so
7fdc73dd4000-7fdc73dd5000 r--p 00002000 08:01 28181708 /lib/libdl-2.11.1.so
7fdc73dd5000-7fdc73dd6000 rw-p 00003000 08:01 28181708 /lib/libdl-2.11.1.so
7fdc73dd6000-7fdc73dec000 r-xp 00000000 08:01 28180674 /lib/libz.so.1.2.3.3
7fdc73dec000-7fdc73feb000 ---p 00016000 08:01 28180674 /lib/libz.so.1.2.3.3
7fdc73feb000-7fdc73fec000 r--p 00015000 08:01 28180674 /lib/libz.so.1.2.3.3
7fdc73fec000-7fdc73fed000 rw-p 00016000 08:01 28180674 /lib/libz.so.1.2.3.3
7fdc73fed000-7fdc740e3000 r-xp 00000000 08:01 50335407 /usr/lib/libstdc++.so.6.0.13
7fdc740e3000-7fdc742e3000 ---p 000f6000 08:01 50335407 /usr/lib/libstdc++.so.6.0.13
7fdc742e3000-7fdc742ea000 r--p 000f6000 08:01 50335407 /usr/lib/libstdc++.so.6.0.13
7fdc742ea000-7fdc742ec000 rw-p 000fd000 08:01 50335407 /usr/lib/libstdc++.so.6.0.13
7fdc742ec000-7fdc74301000 rw-p 00000000 00:00 0
7fdc74301000-7fdc7447b000 r-xp 00000000 08:01 28181446 /lib/libc-2.11.1.so
7fdc7447b000-7fdc7467a000 ---p 0017a000 08:01 28181446 /lib/libc-2.11.1.so
7fdc7467a000-7fdc7467e000 r--p 00179000 08:01 28181446 /lib/libc-2.11.1.so
7fdc7467e000-7fdc7467f000 rw-p 0017d000 08:01 28181446 /lib/libc-2.11.1.so
7fdc7467f000-7fdc74684000 rw-p 00000000 00:00 0
7fdc74684000-7fdc7469a000 r-xp 00000000 08:01 28180559 /lib/libgcc_s.so.1
7fdc7469a000-7fdc74899000 ---p 00016000 08:01 28180559 /lib/libgcc_s.so.1
7fdc74899000-7fdc7489a000 r--p 00015000 08:01 28180559 /lib/libgcc_s.so.1
7fdc7489a000-7fdc7489b000 rw-p 00016000 08:01 28180559 /lib/libgcc_s.so.1
7fdc7489b000-7fdc7491d000 r-xp 00000000 08:01 28180728 /lib/libm-2.11.1.so
7fdc7491d000-7fdc74b1c000 ---p 00082000 08:01 28180728 /lib/libm-2.11.1.so
7fdc74b1c000-7fdc74b1d000 r--p 00081000 08:01 28180728 /lib/libm-2.11.1.so
7fdc74b1d000-7fdc74b1e000 rw-p 00082000 08:01 28180728 /lib/libm-2.11.1.so
7fdc74b1e000-7fdc74c09000 r-xp 00000000 08:01 50339064 /usr/lib/libgfortran.so.3.0.0
7fdc74c09000-7fdc74e08000 ---p 000eb000 08:01 50339064 /usr/lib/libgfortran.so.3.0.0
7fdc74e08000-7fdc74e09000 r--p 000ea000 08:01 50339064 /usr/lib/libgfortran.so.3.0.0
7fdc74e09000-7fdc74e0a000 rw-p 000eb000 08:01 50339064 /usr/lib/libgfortran.so.3.0.0
7fdc74e0a000-7fdc74e0b000 rw-p 00000000 00:00 0
7fdc74e0b000-7fdc75700000 r-xp 00000000 08:01 54401329 /usr/lib/atlas/liblapack.so.3gf.0
7fdc75700000-7fdc758ff000 ---p 008f5000 08:01 54401329 /usr/lib/atlas/liblapack.so.3gf.0
7fdc758ff000-7fdc75900000 r--p 008f4000 08:01 54401329 /usr/lib/atlas/liblapack.so.3gf.0
7fdc75900000-7fdc75905000 rw-p 008f5000 08:01 54401329 /usr/lib/atlas/liblapack.so.3gf.0
7fdc75905000-7fdc75a12000 rw-p 00000000 00:00 0
Aborted
- Code: Select all
#//////////////////////////////////////////////////////////////////////////////
# -- MAGMA (version 1.0) --
# Univ. of Tennessee, Knoxville
# Univ. of California, Berkeley
# Univ. of Colorado, Denver
# November 2010
#//////////////////////////////////////////////////////////////////////////////
#
# GPU_TARGET specifies for which GPU you want to compile MAGMA
# 0: Tesla family
# 1: Fermi Family
#
GPU_TARGET = 1
CUDADIR=/usr/local/cuda
CC = gcc
NVCC=$(CUDADIR)/bin/nvcc
#NVCC = nvcc
FORT = gfortran
ARCH = ar
ARCHFLAGS = cr
RANLIB = ranlib
OPTS = -O3 -DADD_
NVOPTS = --compiler-options -fno-strict-aliasing -DUNIX -O3 -DADD_
LDOPTS = -fPIC -z muldefs
# using GotoBLAS
LIB = -lgoto2 -lpthread -lcublas -lcudart -llapack -lm
# using default BLAS (single thread)
#LIB = -lblas -lpthread -lcublas -lcudart -llapack -lm
LIBDIR = -L/home/fletcher/GotoBLAS2 -L/usr/lib64 -L$(CUDADIR)/lib64
INC = -I$(CUDADIR)/include
LIBMAGMA = ../lib/libmagma.a
LIBMAGMABLAS = ../lib/libmagmablas.a
- Code: Select all
fletcher@fletcher-desktop:~/magma_1.0.0-rc3/testing$ ./testing_zgetrf_gpu
device 0: GeForce GTX 460, 1400.0 MHz clock, 2047.2 MB memory
Usage:
testing_zgetrf_gpu -M 1024 -N 1024
M N CPU GFlop/s GPU GFlop/s ||PA-LU||/(||A||*N)
============================================================
960 960 20.35 45.96 1.102403e-17
1920 1920 27.31 59.75 1.096587e-17
3072 3072 27.25 63.34 1.075028e-17
4032 4032 27.74 67.39 1.033353e-17
4992 4992 24.41 68.40 1.044090e-17
5952 5952 27.30 69.05 1.025062e-17
7104 7104 27.62 69.62 1.020955e-17
8064 8064 27.39 69.86 1.004068e-17
9024 9024 27.27 70.14 9.916281e-18
9984 9984 27.79 70.31 9.820221e-18
fletcher@fletcher-desktop:~/magma_1.0.0-rc3/testing$ ./testing_dgetrf_gpu
device 0: GeForce GTX 460, 1400.0 MHz clock, 2047.2 MB memory
Usage:
testing_dgetrf_gpu -M 1024 -N 1024
M N CPU GFlop/s GPU GFlop/s ||PA-LU||/(||A||*N)
============================================================
960 960 21.77 21.14 4.197521e-18
1920 1920 25.42 43.69 3.620278e-18
3072 3072 25.91 60.80 4.114900e-18
4032 4032 26.32 65.09 3.825857e-18
4992 4992 26.30 67.30 3.645565e-18
5952 5952 26.45 68.77 3.493297e-18
7104 7104 26.68 69.71 3.407056e-18
8064 8064 26.76 70.75 2.707749e-18
9024 9024 26.36 71.40 2.627284e-18
9984 9984 26.34 71.50 2.535688e-18