Eigenvalue SoLvers for Petaflop-Applications (ELPA) 2024.05.001
#include <stdio.h>
#include <math.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <alloca.h>
#include <complex.h>
#include "config-f90.h"
#include "./gpu_vendor_agnostic_layer.h"
Functions
void set_gpu_parameters (int *gpuMemcpyHostToDevice, int *gpuMemcpyDeviceToHost)
int gpuGetDeviceCount (int *count)
int gpuSetDevice (int n)
int gpuMalloc (intptr_t *a, size_t width_height)
int gpuFree (intptr_t *a)
int gpuMemcpy (intptr_t *dest, intptr_t *src, size_t count, int dir)
int gpuDeviceSynchronize ()
int gpuMemset (intptr_t *a, int value, size_t count)
void gpublasDgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double alpha, const double *A, int lda, const double *B, int ldb, double beta, double *C, int ldc)
void gpublasSgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float alpha, const float *A, int lda, const float *B, int ldb, float beta, float *C, int ldc)
void gpublasZgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double _Complex alpha, const double _Complex *A, int lda, const double _Complex *B, int ldb, double _Complex beta, double _Complex *C, int ldc)
void gpublasCgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float _Complex alpha, const float _Complex *A, int lda, const float _Complex *B, int ldb, float _Complex beta, float _Complex *C, int ldc)
void gpublasCgemm (intptr_t *gpuHandle,
                   char transa,
                   char transb,
                   int m,
                   int n,
                   int k,
                   float _Complex alpha,
                   const float _Complex *A,
                   int lda,
                   const float _Complex *B,
                   int ldb,
                   float _Complex beta,
                   float _Complex *C,
                   int ldc)
void gpublasDgemm (intptr_t *gpuHandle,
                   char transa,
                   char transb,
                   int m,
                   int n,
                   int k,
                   double alpha,
                   const double *A,
                   int lda,
                   const double *B,
                   int ldb,
                   double beta,
                   double *C,
                   int ldc)
void gpublasSgemm (intptr_t *gpuHandle,
                   char transa,
                   char transb,
                   int m,
                   int n,
                   int k,
                   float alpha,
                   const float *A,
                   int lda,
                   const float *B,
                   int ldb,
                   float beta,
                   float *C,
                   int ldc)
void gpublasZgemm (intptr_t *gpuHandle,
                   char transa,
                   char transb,
                   int m,
                   int n,
                   int k,
                   double _Complex alpha,
                   const double _Complex *A,
                   int lda,
                   const double _Complex *B,
                   int ldb,
                   double _Complex beta,
                   double _Complex *C,
                   int ldc)
int gpuDeviceSynchronize ()
int gpuFree (intptr_t *a)
int gpuGetDeviceCount (int *count)
int gpuMalloc (intptr_t *a,
               size_t width_height)
int gpuMemcpy (intptr_t *dest,
               intptr_t *src,
               size_t count,
               int dir)
int gpuMemset (intptr_t *a,
               int value,
               size_t count)
int gpuSetDevice (int n)
void set_gpu_parameters (int *gpuMemcpyHostToDevice,
                         int *gpuMemcpyDeviceToHost)