|
MAGMA
1.2.0
Matrix Algebra on GPU and Multicore Architectures
|
Go to the source code of this file.
Macros | |
| #define | PRECISION_c |
| #define | MAGMABLAS_CHEMV_MGPU |
| #define | magmablas_chemv_200_mgpu_offset magmablas_chemv_mgpu_offset |
| #define | magmablas_chemv_200_mgpu_32_offset magmablas_chemv_mgpu_32_offset |
| #define | A(i, j) (a+(j)*lda + (i)) |
| #define | W(i, j) (w+(j)*ldw + (i)) |
| #define | dA(id, i, j) (da[(id)]+((j)+loffset)*ldda + (i)+offset) |
| #define | dW(id, i, j) (dw[(id)]+ (j) *lddw + (i)) |
| #define | dW1(id, i, j) (dw[(id)]+ ((j)+nb0) *lddw + (i)) |
| #define | magma_chemv magmablas_chemv |
| #define | magma_cgemv magmablas_cgemv |
| #define | ONGPU |
| #define | dX(id, i) (dx[(id)]+incx*(i)) |
| #define | dY(id, i, j) (dy[(id)]+incy*(i)+n*(j)) |
Functions | |
| magma_int_t | magmablas_chemv_200_mgpu_offset (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex **A, magma_int_t lda, cuFloatComplex **X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **Y, magma_int_t incy, cuFloatComplex **work, magma_int_t lwork, magma_int_t num_gpus, magma_int_t nb, magma_int_t offset, cudaStream_t stream[][10]) |
| magma_int_t | magmablas_chemv_200_mgpu_32_offset (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex **A, magma_int_t lda, cuFloatComplex **X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **Y, magma_int_t incy, cuFloatComplex **work, magma_int_t lwork, magma_int_t num_gpus, magma_int_t nb, magma_int_t offset, cudaStream_t stream[][10]) |
| magma_int_t | magmablas_chemv_mgpu (magma_int_t num_gpus, magma_int_t k, char uplo, magma_int_t n, magma_int_t nb, cuFloatComplex alpha, cuFloatComplex **da, magma_int_t ldda, magma_int_t offset, cuFloatComplex **dx, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **dy, magma_int_t incy, cuFloatComplex **dwork, magma_int_t ldwork, cuFloatComplex *work, cuFloatComplex *w, cudaStream_t stream[][10]) |
| magma_int_t | magmablas_chemv_synch (magma_int_t num_gpus, magma_int_t k, char uplo, magma_int_t n, cuFloatComplex *work, cuFloatComplex *w, cudaStream_t stream[][10]) |
| magma_int_t | magmablas_chemv (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex *A, magma_int_t lda, cuFloatComplex *X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex *Y, magma_int_t incy) |
| void | magmablas_cgemvt (char flag, int m, int n, cuFloatComplex alpha, cuFloatComplex *A, int lda, cuFloatComplex *x, int incx, cuFloatComplex beta, cuFloatComplex *y, int incy) |
| float | magma_clatrd_mgpu (int num_gpus, char uplo, magma_int_t n, magma_int_t nb, magma_int_t nb0, cuFloatComplex *a, magma_int_t lda, float *e, cuFloatComplex *tau, cuFloatComplex *w, magma_int_t ldw, cuFloatComplex **da, magma_int_t ldda, magma_int_t offset, cuFloatComplex **dw, magma_int_t lddw, cuFloatComplex *dwork[4], magma_int_t ldwork, magma_int_t k, cuFloatComplex *dx[4], cuFloatComplex *dy[4], cuFloatComplex *work, cudaStream_t stream[][10]) |
| #define A(i, j) (a+(j)*lda + (i)) |
Definition at line 73 of file clatrd_mgpu.cpp.
| #define dA(id, i, j) (da[(id)]+((j)+loffset)*ldda + (i)+offset) |
Definition at line 76 of file clatrd_mgpu.cpp.
| #define dW(id, i, j) (dw[(id)]+ (j) *lddw + (i)) |
Definition at line 77 of file clatrd_mgpu.cpp.
| #define dW1(id, i, j) (dw[(id)]+ ((j)+nb0) *lddw + (i)) |
Definition at line 79 of file clatrd_mgpu.cpp.
| #define dX(id, i) (dx[(id)]+incx*(i)) |
| #define dY(id, i, j) (dy[(id)]+incy*(i)+n*(j)) |
| #define magma_cgemv magmablas_cgemv |
Definition at line 92 of file clatrd_mgpu.cpp.
| #define magma_chemv magmablas_chemv |
Definition at line 91 of file clatrd_mgpu.cpp.
| #define magmablas_chemv_200_mgpu_32_offset magmablas_chemv_mgpu_32_offset |
Definition at line 24 of file clatrd_mgpu.cpp.
| #define magmablas_chemv_200_mgpu_offset magmablas_chemv_mgpu_offset |
Definition at line 23 of file clatrd_mgpu.cpp.
| #define MAGMABLAS_CHEMV_MGPU |
Definition at line 21 of file clatrd_mgpu.cpp.
| #define ONGPU |
| #define PRECISION_c |
Definition at line 19 of file clatrd_mgpu.cpp.
| #define W(i, j) (w+(j)*ldw + (i)) |
Definition at line 74 of file clatrd_mgpu.cpp.
| float magma_clatrd_mgpu (int num_gpus, char uplo, magma_int_t n, magma_int_t nb, magma_int_t nb0, cuFloatComplex *a, magma_int_t lda, float *e, cuFloatComplex *tau, cuFloatComplex *w, magma_int_t ldw, cuFloatComplex **da, magma_int_t ldda, magma_int_t offset, cuFloatComplex **dw, magma_int_t lddw, cuFloatComplex *dwork[4], magma_int_t ldwork, magma_int_t k, cuFloatComplex *dx[4], cuFloatComplex *dy[4], cuFloatComplex *work, cudaStream_t stream[][10]) |
Definition at line 102 of file clatrd_mgpu.cpp.
References A, blasf77_caxpy(), blasf77_cdotc(), blasf77_cgemv(), blasf77_cscal(), dA, dW, dW1, lapack_testing::f, lapackf77_clacgv(), lapackf77_clarfg(), lapackf77_lsame, MAGMA_C_NEG_ONE, MAGMA_C_ONE, MAGMA_C_REAL, MAGMA_C_SET2REAL, MAGMA_C_ZERO, magma_cgemv, magma_cgetmatrix_async(), magma_cgetvector_async(), magma_chemv, magma_csetvector(), magma_csetvector_async(), magma_event_create(), magma_event_record(), magma_queue_sync(), magma_setdevice(), magmablas_cgemvt(), magmablas_chemv_mgpu(), magmablas_chemv_synch(), magmablasSetKernelStream(), MagmaConjTransStr, MagmaNoTrans, MagmaUpper, min, trace_cpu_end, trace_cpu_start, trace_gpu_end, trace_gpu_start, uplo, and W.
| void magmablas_cgemvt (char flag, int m, int n, cuFloatComplex alpha, cuFloatComplex *A, int lda, cuFloatComplex *x, int incx, cuFloatComplex beta, cuFloatComplex *y, int incy) |
| magma_int_t magmablas_chemv (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex *A, magma_int_t lda, cuFloatComplex *X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex *Y, magma_int_t incy) |
| magma_int_t magmablas_chemv_200_mgpu_32_offset (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex **A, magma_int_t lda, cuFloatComplex **X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **Y, magma_int_t incy, cuFloatComplex **work, magma_int_t lwork, magma_int_t num_gpus, magma_int_t nb, magma_int_t offset, cudaStream_t stream[][10]) |
| magma_int_t magmablas_chemv_200_mgpu_offset (char uplo, magma_int_t n, cuFloatComplex alpha, cuFloatComplex **A, magma_int_t lda, cuFloatComplex **X, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **Y, magma_int_t incy, cuFloatComplex **work, magma_int_t lwork, magma_int_t num_gpus, magma_int_t nb, magma_int_t offset, cudaStream_t stream[][10]) |
| magma_int_t magmablas_chemv_mgpu (magma_int_t num_gpus, magma_int_t k, char uplo, magma_int_t n, magma_int_t nb, cuFloatComplex alpha, cuFloatComplex **da, magma_int_t ldda, magma_int_t offset, cuFloatComplex **dx, magma_int_t incx, cuFloatComplex beta, cuFloatComplex **dy, magma_int_t incy, cuFloatComplex **dwork, magma_int_t ldwork, cuFloatComplex *work, cuFloatComplex *w, cudaStream_t stream[][10]) |
Definition at line 584 of file clatrd_mgpu.cpp.
References dA, dX, dY, MAGMA_C_ONE, magma_cgemv, magma_cgetvector_async(), magma_chemv, magma_setdevice(), magmablasSetKernelStream(), MagmaConjTrans, MagmaLower, MagmaNoTrans, min, trace_gpu_end, and trace_gpu_start.
| magma_int_t magmablas_chemv_synch (magma_int_t num_gpus, magma_int_t k, char uplo, magma_int_t n, cuFloatComplex *work, cuFloatComplex *w, cudaStream_t stream[][10]) |
Definition at line 784 of file clatrd_mgpu.cpp.
References blasf77_caxpy(), MAGMA_C_ONE, magma_queue_sync(), and magma_setdevice().