|
MAGMA
1.2.0
Matrix Algebra on GPU and Multicore Architectures
|
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <math.h>
#include <cuda.h>
#include <cuda_runtime_api.h>
#include <cublas.h>
#include "flops.h"
#include "magma.h"
#include "magma_lapack.h"
#include "testings.h"
Go to the source code of this file.
Macros | |
| #define | PRECISION_z |
| #define | FLOPS(m, n) ( 6. * FMULS_GETRF(m, n) + 2. * FADDS_GETRF(m, n) ) |
Functions | |
| magma_int_t | magma_zgetrf3 (magma_int_t num_gpus, magma_int_t m, magma_int_t n, cuDoubleComplex *a, magma_int_t lda, magma_int_t *ipiv, magma_int_t *info) |
| double | get_LU_error (magma_int_t M, magma_int_t N, cuDoubleComplex *A, magma_int_t lda, cuDoubleComplex *LU, magma_int_t *IPIV) |
| int | main (int argc, char **argv) |
| #define FLOPS(m, n) ( 6. * FMULS_GETRF(m, n) + 2. * FADDS_GETRF(m, n) ) |
Definition at line 36 of file testing_zgetrf.cpp.
| #define PRECISION_z |
Definition at line 34 of file testing_zgetrf.cpp.
| double get_LU_error (magma_int_t M, magma_int_t N, cuDoubleComplex *A, magma_int_t lda, cuDoubleComplex *LU, magma_int_t *IPIV) |
Definition at line 41 of file testing_zgetrf.cpp.
References blasf77_zgemm, L, lapackf77_zlacpy, lapackf77_zlange, lapackf77_zlaswp, MAGMA_Z_MAKE, MAGMA_Z_ONE, MAGMA_Z_SUB, MAGMA_Z_ZERO, MagmaLowerStr, MagmaUpperStr, min, gbstrct_blg::N, TESTING_FREE, TESTING_MALLOC, and codegen::work.
| magma_int_t magma_zgetrf3 (magma_int_t num_gpus, magma_int_t m, magma_int_t n, cuDoubleComplex *a, magma_int_t lda, magma_int_t *ipiv, magma_int_t *info) |
| int main (int argc, char **argv) |
Definition at line 86 of file testing_zgetrf.cpp.
References FLOPS, get_current_time(), get_LU_error(), GetTimerValue(), ISEED, lapackf77_zgetrf, lapackf77_zlacpy, lapackf77_zlarnv, magma_get_zgetrf_nb(), magma_zgetrf(), MagmaUpperLowerStr, min, gbstrct_blg::N, TESTING_CUDA_FINALIZE, TESTING_CUDA_INIT, TESTING_FREE, TESTING_HOSTALLOC, TESTING_HOSTFREE, and TESTING_MALLOC.