Neko-TOP
A portable framework for high-order spectral element flow topology optimization.
Loading...
Searching...
No Matches
mma_kernel.h File Reference
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Functions

template<typename T >
__global__ void mma_sub1_kernel (T *__restrict__ xlow, T *__restrict__ xupp, const T *__restrict__ x, const T *__restrict__ xmin, const T *__restrict__ xmax, const T asyinit, const int n)
 
template<typename T >
__global__ void mma_sub2_kernel (T *__restrict__ low, T *__restrict__ upp, const T *__restrict__ x, const T *__restrict__ xold1, const T *__restrict__ xold2, const T *__restrict__ xmin, const T *__restrict__ xmax, const T asydecr, const T asyincr, const int n)
 
template<typename T >
__global__ void mma_sub3_kernel (const T *__restrict__ x, const T *__restrict__ df0dx, const T *__restrict__ dfdx, T *__restrict__ low, T *__restrict__ upp, const T *__restrict__ xmin, const T *__restrict__ xmax, T *__restrict__ alpha, T *__restrict__ beta, T *__restrict__ p0j, T *__restrict__ q0j, T *__restrict__ pij, T *__restrict__ qij, const int n, const int m)
 
template<typename T >
__global__ void mma_sub4_kernel (const T *__restrict__ x, T *__restrict__ low, T *__restrict__ upp, T *__restrict__ pij, T *__restrict__ qij, T *__restrict__ temp, const int n, const int m)
 
template<typename T >
__global__ void mma_max2_kernel (T *__restrict__ xsi, const T *__restrict__ x, T *__restrict__ alpha, const int n)
 
template<typename T >
__global__ void relambda_kernel (T *__restrict__ temp, const T *__restrict__ x, const T *__restrict__ xupp, const T *__restrict__ xlow, const T *__restrict__ pij, const T *__restrict__ qij, const int n, const int m)
 
template<typename T >
__global__ void sub2cons2_kernel (T *__restrict__ a, const T *__restrict__ b, const T *__restrict__ c, const T *__restrict__ d, const T e, const int n)
 
template<typename T >
__inline__ __device__ T max_reduce_warp (T val)
 
template<typename T >
__global__ void maxval_kernel (const T *__restrict__ a, T *temp, const int n)
 
template<typename T >
__global__ void max_reduce_kernel (T *__restrict__ bufred, const int n)
 
template<typename T >
__global__ void delx_kernel (T *__restrict__ delx, const T *__restrict__ x, const T *__restrict__ xlow, const T *__restrict__ xupp, const T *__restrict__ pij, const T *__restrict__ qij, const T *__restrict__ p0j, const T *__restrict__ q0j, const T *__restrict__ alpha, const T *__restrict__ beta, const T *__restrict__ lambda, const T epsi, const int n, const int m)
 
template<typename T >
__global__ void GG_kernel (T *__restrict__ GG, const T *__restrict__ x, const T *__restrict__ xlow, const T *__restrict__ xupp, const T *__restrict__ pij, const T *__restrict__ qij, const int n, const int m)
 
template<typename T >
__global__ void diagx_kernel (T *__restrict__ diagx, const T *__restrict__ x, const T *__restrict__ xsi, const T *__restrict__ xlow, const T *__restrict__ xupp, const T *__restrict__ p0j, const T *__restrict__ q0j, const T *__restrict__ pij, const T *__restrict__ qij, const T *alpha, const T *beta, const T *eta, const T *lambda, const int n, const int m)
 
template<typename T >
__inline__ __device__ T reduce_warp (T val)
 
template<typename T >
__global__ void mmareduce_kernel (T *__restrict__ bufred, const int n)
 
template<typename T >
__global__ void mmasum_kernel (const T *__restrict__ a, T *__restrict__ buf_h, const int n, const int m, const int k)
 
template<typename T >
__global__ void mmasumbb_kernel (const T *__restrict__ GG, const T *__restrict__ delx, const T *__restrict__ diagx, T *__restrict__ buf_h, const int n, const int m, const int k)
 
template<typename T >
__global__ void mmasumAA_kernel (const T *__restrict__ GG, const T *__restrict__ diagx, T *__restrict__ buf_h, const int n, const int m, const int k0, const int k1)
 
template<typename T >
__global__ void mma_copy_kernel (T *__restrict__ a, const T *__restrict__ b, const int n, const int m)
 
template<typename T >
__global__ void AA_kernel (T *__restrict__ temp, const T *__restrict__ GG, const T *__restrict__ diagx, const int n, const int m)
 
template<typename T >
__global__ void dx_kernel (T *__restrict__ dx, const T *__restrict__ delx, const T *__restrict__ diagx, const T *__restrict__ GG, const T *__restrict__ dlambda, const int n, const int m)
 
template<typename T >
__global__ void dxsi_kernel (T *__restrict__ dxsi, const T *__restrict__ xsi, const T *__restrict__ dx, const T *__restrict__ x, const T *__restrict__ alpha, const T epsi, const int n)
 
template<typename T >
__global__ void deta_kernel (T *__restrict__ deta, const T *__restrict__ eta, const T *__restrict__ dx, const T *__restrict__ x, const T *__restrict__ beta, const T epsi, const int n)
 
template<typename T >
__global__ void RexCalculation_kernel (T *__restrict__ rex, const T *__restrict__ x, const T *__restrict__ xlow, const T *__restrict__ xupp, const T *__restrict__ pij, const T *__restrict__ p0j, const T *__restrict__ qij, const T *__restrict__ q0j, const T *__restrict__ lambda, const T *__restrict__ xsi, const T *__restrict__ eta, const int n, const int m)
 
template<typename T >
__global__ void rey_calculation_kernel (T *__restrict__ rey, const T *__restrict__ c, const T *__restrict__ d, const T *__restrict__ y, const T *__restrict__ lambda, const T *__restrict__ mu, const int n)
 
template<typename T >
__global__ void norm_kernel (const T *__restrict__ a, T *__restrict__ buf_h, const int n)
 
template<typename T >
__global__ void sub2cons_kernel (T *__restrict__ a, const T *__restrict__ b, const T *__restrict__ c, const T d, const int n)
 
template<typename T >
__global__ void dely_kernel (T *__restrict__ dely, const T *__restrict__ c, const T *__restrict__ d, const T *__restrict__ y, const T *__restrict__ lambda, const T epsi, const int n)
 
template<typename T >
__global__ void maxval2_kernel (const T *__restrict__ a, const T *__restrict__ b, T *__restrict__ temp, const T cons, const int n)
 
template<typename T >
__global__ void maxval3_kernel (const T *__restrict__ a, const T *__restrict__ b, const T *__restrict__ c, T *__restrict__ temp, const T cons, const int n)
 
template<typename T >
__global__ void kkt_rex_kernel (T *__restrict__ rex, const T *__restrict__ df0dx, const T *__restrict__ dfdx, const T *__restrict__ xsi, const T *__restrict__ eta, const T *__restrict__ lambda, const int n, const int m)
 
template<typename T >
__global__ void maxcons_kernel (T *__restrict__ a, const T b, const T c, const T *__restrict__ d, const int n)
 
template<typename T >
__global__ void glsum_kernel (const T *a, T *buf_h, const int n)
 
template<typename T >
__global__ void glsc2_kernel (const T *a, const T *b, T *buf_h, const int n)
 
template<typename T >
__global__ void add2inv2_kernel (T *__restrict__ a, const T *__restrict__ b, const T c, const int n)
 
template<typename T >
__global__ void max2_kernel (T *__restrict__ a, const T b, const T *__restrict__ c, const T d, const int n)
 
template<typename T >
__global__ void updatebb_kernel (T *__restrict__ bb, const T *__restrict__ dellambda, const T *__restrict__ dely, const T *__restrict__ d, const T *__restrict__ mu, const T *__restrict__ y, const T delz, const int m)
 
template<typename T >
__global__ void updateAA_kernel (T *__restrict__ AA, const T *__restrict__ globaltmp_mm, const T *__restrict__ s, const T *__restrict__ lambda, const T *__restrict__ d, const T *__restrict__ mu, const T *__restrict__ y, const T *__restrict__ a, const T zeta, const T z, const int m)
 
template<typename T >
__global__ void dy_kernel (T *__restrict__ dy, const T *__restrict__ dely, const T *__restrict__ dlambda, const T *__restrict__ d, const T *__restrict__ mu, const T *__restrict__ y, const int n)
 

Function Documentation

◆ AA_kernel()

template<typename T >
__global__ void AA_kernel ( T *__restrict__  temp,
const T *__restrict__  GG,
const T *__restrict__  diagx,
const int  n,
const int  m 
)

Definition at line 398 of file mma_kernel.h.

Here is the call graph for this function:

◆ add2inv2_kernel()

template<typename T >
__global__ void add2inv2_kernel ( T *__restrict__  a,
const T *__restrict__  b,
const T  c,
const int  n 
)

Definition at line 693 of file mma_kernel.h.

Here is the call graph for this function:

◆ delx_kernel()

template<typename T >
__global__ void delx_kernel ( T *__restrict__  delx,
const T *__restrict__  x,
const T *__restrict__  xlow,
const T *__restrict__  xupp,
const T *__restrict__  pij,
const T *__restrict__  qij,
const T *__restrict__  p0j,
const T *__restrict__  q0j,
const T *__restrict__  alpha,
const T *__restrict__  beta,
const T *__restrict__  lambda,
const T  epsi,
const int  n,
const int  m 
)

Definition at line 196 of file mma_kernel.h.

Here is the call graph for this function:

◆ dely_kernel()

template<typename T >
__global__ void dely_kernel ( T *__restrict__  dely,
const T *__restrict__  c,
const T *__restrict__  d,
const T *__restrict__  y,
const T *__restrict__  lambda,
const T  epsi,
const int  n 
)

Definition at line 526 of file mma_kernel.h.

Here is the call graph for this function:

◆ deta_kernel()

template<typename T >
__global__ void deta_kernel ( T *__restrict__  deta,
const T *__restrict__  eta,
const T *__restrict__  dx,
const T *__restrict__  x,
const T *__restrict__  beta,
const T  epsi,
const int  n 
)

Definition at line 439 of file mma_kernel.h.

Here is the call graph for this function:

◆ diagx_kernel()

template<typename T >
__global__ void diagx_kernel ( T *__restrict__  diagx,
const T *__restrict__  x,
const T *__restrict__  xsi,
const T *__restrict__  xlow,
const T *__restrict__  xupp,
const T *__restrict__  p0j,
const T *__restrict__  q0j,
const T *__restrict__  pij,
const T *__restrict__  qij,
const T *alpha,
const T *beta,
const T *eta,
const T *lambda,
const int  n,
const int  m 
)

Definition at line 231 of file mma_kernel.h.

Here is the call graph for this function:

◆ dx_kernel()

template<typename T >
__global__ void dx_kernel ( T *__restrict__  dx,
const T *__restrict__  delx,
const T *__restrict__  diagx,
const T *__restrict__  GG,
const T *__restrict__  dlambda,
const int  n,
const int  m 
)

Definition at line 413 of file mma_kernel.h.

Here is the call graph for this function:

◆ dxsi_kernel()

template<typename T >
__global__ void dxsi_kernel ( T *__restrict__  dxsi,
const T *__restrict__  xsi,
const T *__restrict__  dx,
const T *__restrict__  x,
const T *__restrict__  alpha,
const T  epsi,
const int  n 
)

Definition at line 428 of file mma_kernel.h.

Here is the call graph for this function:

◆ dy_kernel()

template<typename T >
__global__ void dy_kernel ( T *__restrict__  dy,
const T *__restrict__  dely,
const T *__restrict__  dlambda,
const T *__restrict__  d,
const T *__restrict__  mu,
const T *__restrict__  y,
const int  n 
)

Definition at line 743 of file mma_kernel.h.

Here is the call graph for this function:

◆ GG_kernel()

template<typename T >
__global__ void GG_kernel ( T *__restrict__  GG,
const T *__restrict__  x,
const T *__restrict__  xlow,
const T *__restrict__  xupp,
const T *__restrict__  pij,
const T *__restrict__  qij,
const int  n,
const int  m 
)

Definition at line 218 of file mma_kernel.h.

Here is the call graph for this function:

◆ glsc2_kernel()

template<typename T >
__global__ void glsc2_kernel ( const T *a,
const T *b,
T *buf_h,
const int  n 
)

Definition at line 657 of file mma_kernel.h.

Here is the call graph for this function:

◆ glsum_kernel()

template<typename T >
__global__ void glsum_kernel ( const T *a,
T *buf_h,
const int  n 
)

Definition at line 629 of file mma_kernel.h.

Here is the call graph for this function:

◆ kkt_rex_kernel()

template<typename T >
__global__ void kkt_rex_kernel ( T *__restrict__  rex,
const T *__restrict__  df0dx,
const T *__restrict__  dfdx,
const T *__restrict__  xsi,
const T *__restrict__  eta,
const T *__restrict__  lambda,
const int  n,
const int  m 
)

Definition at line 602 of file mma_kernel.h.

Here is the call graph for this function:

◆ max2_kernel()

template<typename T >
__global__ void max2_kernel ( T *__restrict__  a,
const T  b,
const T *__restrict__  c,
const T  d,
const int  n 
)

Definition at line 702 of file mma_kernel.h.

Here is the call graph for this function:

◆ max_reduce_kernel()

template<typename T >
__global__ void max_reduce_kernel ( T *__restrict__  bufred,
const int  n 
)

Definition at line 168 of file mma_kernel.h.

Here is the call graph for this function:

◆ max_reduce_warp()

template<typename T >
__inline__ __device__ T max_reduce_warp ( T  val)

Definition at line 127 of file mma_kernel.h.

Here is the call graph for this function:

◆ maxcons_kernel()

template<typename T >
__global__ void maxcons_kernel ( T *__restrict__  a,
const T  b,
const T  c,
const T *__restrict__  d,
const int  n 
)

Definition at line 618 of file mma_kernel.h.

Here is the call graph for this function:

◆ maxval2_kernel()

template<typename T >
__global__ void maxval2_kernel ( const T *__restrict__  a,
const T *__restrict__  b,
T *__restrict__  temp,
const T  cons,
const int  n 
)

Definition at line 538 of file mma_kernel.h.

Here is the call graph for this function:

◆ maxval3_kernel()

template<typename T >
__global__ void maxval3_kernel ( const T *__restrict__  a,
const T *__restrict__  b,
const T *__restrict__  c,
T *__restrict__  temp,
const T  cons,
const int  n 
)

Definition at line 570 of file mma_kernel.h.

Here is the call graph for this function:

◆ maxval_kernel()

template<typename T >
__global__ void maxval_kernel ( const T *__restrict__  a,
T *temp,
const int  n 
)

Definition at line 139 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_copy_kernel()

template<typename T >
__global__ void mma_copy_kernel ( T *__restrict__  a,
const T *__restrict__  b,
const int  n,
const int  m 
)

Definition at line 388 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_max2_kernel()

template<typename T >
__global__ void mma_max2_kernel ( T *__restrict__  xsi,
const T *__restrict__  x,
T *__restrict__  alpha,
const int  n 
)

Definition at line 91 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_sub1_kernel()

template<typename T >
__global__ void mma_sub1_kernel ( T *__restrict__  xlow,
T *__restrict__  xupp,
const T *__restrict__  x,
const T *__restrict__  xmin,
const T *__restrict__  xmax,
const T  asyinit,
const int  n 
)

Definition at line 4 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_sub2_kernel()

template<typename T >
__global__ void mma_sub2_kernel ( T *__restrict__  low,
T *__restrict__  upp,
const T *__restrict__  x,
const T *__restrict__  xold1,
const T *__restrict__  xold2,
const T *__restrict__  xmin,
const T *__restrict__  xmax,
const T  asydecr,
const T  asyincr,
const int  n 
)

Definition at line 17 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_sub3_kernel()

template<typename T >
__global__ void mma_sub3_kernel ( const T *__restrict__  x,
const T *__restrict__  df0dx,
const T *__restrict__  dfdx,
T *__restrict__  low,
T *__restrict__  upp,
const T *__restrict__  xmin,
const T *__restrict__  xmax,
T *__restrict__  alpha,
T *__restrict__  beta,
T *__restrict__  p0j,
T *__restrict__  q0j,
T *__restrict__  pij,
T *__restrict__  qij,
const int  n,
const int  m 
)

Definition at line 46 of file mma_kernel.h.

Here is the call graph for this function:

◆ mma_sub4_kernel()

template<typename T >
__global__ void mma_sub4_kernel ( const T *__restrict__  x,
T *__restrict__  low,
T *__restrict__  upp,
T *__restrict__  pij,
T *__restrict__  qij,
T *__restrict__  temp,
const int  n,
const int  m 
)

Definition at line 77 of file mma_kernel.h.

Here is the call graph for this function:

◆ mmareduce_kernel()

template<typename T >
__global__ void mmareduce_kernel ( T *__restrict__  bufred,
const int  n 
)

Definition at line 264 of file mma_kernel.h.

Here is the call graph for this function:

◆ mmasum_kernel()

template<typename T >
__global__ void mmasum_kernel ( const T *__restrict__  a,
T *__restrict__  buf_h,
const int  n,
const int  m,
const int  k 
)

Definition at line 293 of file mma_kernel.h.

Here is the call graph for this function:

◆ mmasumAA_kernel()

template<typename T >
__global__ void mmasumAA_kernel ( const T *__restrict__  GG,
const T *__restrict__  diagx,
T *__restrict__  buf_h,
const int  n,
const int  m,
const int  k0,
const int  k1 
)

Definition at line 355 of file mma_kernel.h.

Here is the call graph for this function:

◆ mmasumbb_kernel()

template<typename T >
__global__ void mmasumbb_kernel ( const T *__restrict__  GG,
const T *__restrict__  delx,
const T *__restrict__  diagx,
T *__restrict__  buf_h,
const int  n,
const int  m,
const int  k 
)

Definition at line 323 of file mma_kernel.h.

Here is the call graph for this function:

◆ norm_kernel()

template<typename T >
__global__ void norm_kernel ( const T *__restrict__  a,
T *__restrict__  buf_h,
const int  n 
)

Definition at line 482 of file mma_kernel.h.

Here is the call graph for this function:

◆ reduce_warp()

template<typename T >
__inline__ __device__ T reduce_warp ( T  val)

Definition at line 254 of file mma_kernel.h.

Here is the call graph for this function:

◆ relambda_kernel()

template<typename T >
__global__ void relambda_kernel ( T *__restrict__  temp,
const T *__restrict__  x,
const T *__restrict__  xupp,
const T *__restrict__  xlow,
const T *__restrict__  pij,
const T *__restrict__  qij,
const int  n,
const int  m 
)

Definition at line 102 of file mma_kernel.h.

Here is the call graph for this function:

◆ RexCalculation_kernel()

template<typename T >
__global__ void RexCalculation_kernel ( T *__restrict__  rex,
const T *__restrict__  x,
const T *__restrict__  xlow,
const T *__restrict__  xupp,
const T *__restrict__  pij,
const T *__restrict__  p0j,
const T *__restrict__  qij,
const T *__restrict__  q0j,
const T *__restrict__  lambda,
const T *__restrict__  xsi,
const T *__restrict__  eta,
const int  n,
const int  m 
)

Definition at line 451 of file mma_kernel.h.

Here is the call graph for this function:

◆ rey_calculation_kernel()

template<typename T >
__global__ void rey_calculation_kernel ( T *__restrict__  rey,
const T *__restrict__  c,
const T *__restrict__  d,
const T *__restrict__  y,
const T *__restrict__  lambda,
const T *__restrict__  mu,
const int  n 
)

Definition at line 471 of file mma_kernel.h.

Here is the call graph for this function:

◆ sub2cons2_kernel()

template<typename T >
__global__ void sub2cons2_kernel ( T *__restrict__  a,
const T *__restrict__  b,
const T *__restrict__  c,
const T *__restrict__  d,
const T  e,
const int  n 
)

Definition at line 117 of file mma_kernel.h.

Here is the call graph for this function:

◆ sub2cons_kernel()

template<typename T >
__global__ void sub2cons_kernel ( T *__restrict__  a,
const T *__restrict__  b,
const T *__restrict__  c,
const T  d,
const int  n 
)

Definition at line 515 of file mma_kernel.h.

Here is the call graph for this function:

◆ updateAA_kernel()

template<typename T >
__global__ void updateAA_kernel ( T *__restrict__  AA,
const T *__restrict__  globaltmp_mm,
const T *__restrict__  s,
const T *__restrict__  lambda,
const T *__restrict__  d,
const T *__restrict__  mu,
const T *__restrict__  y,
const T *__restrict__  a,
const T  zeta,
const T  z,
const int  m 
)

Definition at line 725 of file mma_kernel.h.

Here is the call graph for this function:

◆ updatebb_kernel()

template<typename T >
__global__ void updatebb_kernel ( T *__restrict__  bb,
const T *__restrict__  dellambda,
const T *__restrict__  dely,
const T *__restrict__  d,
const T *__restrict__  mu,
const T *__restrict__  y,
const T  delz,
const int  m 
)

Definition at line 711 of file mma_kernel.h.

Here is the call graph for this function: