42#include <cuda_runtime.h>
45#include <neko/device/cuda/check.h>
46#include <neko/device/device_config.h>
57 void* X_out_d,
void* X_in_d,
int* n) {
59 const dim3 nthrds(1024, 1, 1);
60 const dim3 nblcks(((*n) + 1024 - 1) / 1024, 1, 1);
75 const dim3 nblcks(((*n) + 1024 - 1) / 1024, 1, 1);
__global__ void heaviside_mapping_apply_kernel(const T beta, const T eta, T *__restrict__ X_out_d, T *__restrict__ X_in_d, const int n)
void cuda_heaviside_mapping_apply_backward(real *beta, real *eta, void *sens_out_d, void *sens_in_d, void *X_in_d, int *n)
void cuda_heaviside_mapping_apply(real *beta, real *eta, void *X_out_d, void *X_in_d, int *n)