Eigenvalue SoLvers for Petaflop-Applications (ELPA) 2024.05.001
Loading...
Searching...
No Matches
Functions
gpu_vendor_agnostic_layer.c File Reference
#include <stdio.h>
#include <math.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <alloca.h>
#include <complex.h>
#include "config-f90.h"
#include "./gpu_vendor_agnostic_layer.h"

Functions

void set_gpu_parameters (int *gpuMemcpyHostToDevice, int *gpuMemcpyDeviceToHost)
 
int gpuGetDeviceCount (int *count)
 
int gpuSetDevice (int n)
 
int gpuMalloc (intptr_t *a, size_t width_height)
 
int gpuFree (intptr_t *a)
 
int gpuMemcpy (intptr_t *dest, intptr_t *src, size_t count, int dir)
 
int gpuDeviceSynchronize ()
 
int gpuMemset (intptr_t *a, int value, size_t count)
 
void gpublasDgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double alpha, const double *A, int lda, const double *B, int ldb, double beta, double *C, int ldc)
 
void gpublasSgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float alpha, const float *A, int lda, const float *B, int ldb, float beta, float *C, int ldc)
 
void gpublasZgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double _Complex alpha, const double _Complex *A, int lda, const double _Complex *B, int ldb, double _Complex beta, double _Complex *C, int ldc)
 
void gpublasCgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float _Complex alpha, const float _Complex *A, int lda, const float _Complex *B, int ldb, float _Complex beta, float _Complex *C, int ldc)
 

Function Documentation

◆ gpublasCgemm()

void gpublasCgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float _Complex alpha, const float _Complex *A, int lda, const float _Complex *B, int ldb, float _Complex beta, float _Complex *C, int ldc)

◆ gpublasDgemm()

void gpublasDgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double alpha, const double *A, int lda, const double *B, int ldb, double beta, double *C, int ldc)

◆ gpublasSgemm()

void gpublasSgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, float alpha, const float *A, int lda, const float *B, int ldb, float beta, float *C, int ldc)

◆ gpublasZgemm()

void gpublasZgemm (intptr_t *gpuHandle, char transa, char transb, int m, int n, int k, double _Complex alpha, const double _Complex *A, int lda, const double _Complex *B, int ldb, double _Complex beta, double _Complex *C, int ldc)

◆ gpuDeviceSynchronize()

int gpuDeviceSynchronize ( )

◆ gpuFree()

int gpuFree ( intptr_t * a)

◆ gpuGetDeviceCount()

int gpuGetDeviceCount ( int * count)

◆ gpuMalloc()

int gpuMalloc (intptr_t *a, size_t width_height)

◆ gpuMemcpy()

int gpuMemcpy (intptr_t *dest, intptr_t *src, size_t count, int dir)

◆ gpuMemset()

int gpuMemset (intptr_t *a, int value, size_t count)

◆ gpuSetDevice()

int gpuSetDevice ( int n)

◆ set_gpu_parameters()

void set_gpu_parameters (int *gpuMemcpyHostToDevice, int *gpuMemcpyDeviceToHost)