// File: punica-sgmv/sgmv/sgmv_cutlass.cu
// Last commit: 5a84343 "Add Punica sgmv kernels" (danieldk, HF Staff)
// Size: 649 bytes
#include <cuda_bf16.h>
#include <cuda_fp16.h>
#include "sgmv_cutlass.cuh"
// Explicit instantiation definitions of the `sgmv` function template for the
// element types built by this translation unit. The template itself is not
// defined in this file (presumably it comes from "sgmv_cutlass.cuh" -- confirm).
//
// Both instantiations share one parameter list and differ only in the element
// type T, so the list is spelled once in a file-local macro.
#define SGMV_INSTANTIATE(T)                                   \
  template bool sgmv<T>(T *y, T *x, T **w,                    \
                        int32_t *s_start, int32_t *s_end,     \
                        void *tmp_d, int num_problems,        \
                        int d_in, int d_out,                  \
                        int layer_idx, cudaStream_t stream)

SGMV_INSTANTIATE(nv_half);      // sgmv<nv_half>
SGMV_INSTANTIATE(nv_bfloat16);  // sgmv<nv_bfloat16>

// Keep the helper macro from leaking past this point.
#undef SGMV_INSTANTIATE