// Explicit instantiation definition of sgmv for nv_half. This forces the
// compiler to emit the nv_half specialization in this translation unit; the
// primary template's definition must be visible above this point.
// NOTE(review): the parameter list must match the primary template exactly;
// the roles of the individual arguments are not visible from here — see the
// template definition.
template bool sgmv<nv_half>(nv_half *y, nv_half *x, nv_half **w,
                            int32_t *s_start, int32_t *s_end,
                            void *tmp_d, int num_problems, int d_in, int d_out,
                            int layer_idx, cudaStream_t stream);
// Explicit instantiation definition of sgmv for nv_bfloat16. This forces the
// compiler to emit the nv_bfloat16 specialization in this translation unit;
// the primary template's definition must be visible above this point.
// NOTE(review): the parameter list must match the primary template exactly;
// the roles of the individual arguments are not visible from here — see the
// template definition.
template bool sgmv<nv_bfloat16>(nv_bfloat16 *y, nv_bfloat16 *x, nv_bfloat16 **w,
                                int32_t *s_start, int32_t *s_end,
                                void *tmp_d, int num_problems, int d_in, int d_out,
                                int layer_idx, cudaStream_t stream);