TinyChatEngine
Loading...
Searching...
No Matches
llm
include
ops
BMM_S8T_S8N_F32T.h
1
#include "common.h"
2
3
/// Construction parameters for the BMM_S8T_S8N_F32T operator.
///
/// Plain aggregate with a single field, so it can be brace-initialized
/// (e.g. `BMM_S8T_S8N_F32T_params p{0.5f};`).
struct BMM_S8T_S8N_F32T_params {
    /// Scalar coefficient handed to the operator.
    /// NOTE(review): presumably the scale applied to the int8 product before
    /// it is written as float — confirm against the implementation file.
    float alpha;
};
6
7
class
BMM_S8T_S8N_F32T
{
8
public
:
9
BMM_S8T_S8N_F32T
(
BMM_S8T_S8N_F32T_params
¶ms_);
10
BMM_S8T_S8N_F32T
(){};
11
void
forward(
const
Matrix3D<int8_t>
&x,
const
Matrix3D<int8_t>
&weight,
Matrix3D<float>
&output);
12
struct
matmul_params
params;
13
float
alpha;
14
15
private
:
16
std::string profile_name =
"BMM_S8T_S8N_F32T"
;
17
};
18
19
/// Populates an existing BMM_S8T_S8N_F32T operator.
/// @param op     Operator to fill in; passed by mutable reference.
/// @param prefix String passed by value.
///               NOTE(review): presumably a path/name prefix used to locate
///               the stored parameters — confirm against the definition.
void load_BMM_S8T_S8N_F32T(BMM_S8T_S8N_F32T &op, std::string prefix);
BMM_S8T_S8N_F32T
Definition
BMM_S8T_S8N_F32T.h:7
Matrix3D
Definition
common.h:34
BMM_S8T_S8N_F32T_params
Definition
BMM_S8T_S8N_F32T.h:3
matmul_params
Definition
matmul.h:78
Generated by
Doxygen 1.11.0