TinyChatEngine
Loading...
Searching...
No Matches
llm
include
ops
W8A8B8O8Linear.h
1
#include "common.h"
2
3
struct
W8A8B8O8Linear_params
{
4
Matrix3D<int8_t>
weight;
5
Matrix3D<int8_t>
bias;
6
float
alpha;
7
float
beta;
8
};
9
10
class
W8A8B8O8Linear
{
11
public
:
12
W8A8B8O8Linear
(
W8A8B8O8Linear_params
¶ms_);
13
W8A8B8O8Linear
(){};
14
void
forward(
const
Matrix3D<int8_t>
&x,
Matrix3D<int8_t>
&output);
15
struct
matmul_params
params;
16
float
alpha;
17
float
beta;
18
19
private
:
20
std::string profile_name =
"W8A8B8O8Linear"
;
21
};
22
23
/// Declaration only; the definition lives elsewhere.
/// NOTE(review): presumably fills `op` from storage identified by `prefix` --
/// confirm against the definition.
/// @param op     Operator instance, passed by non-const reference.
/// @param prefix String passed by value.
void load_W8A8B8O8Linear_params(W8A8B8O8Linear &op, std::string prefix);
Matrix3D
Definition
common.h:34
W8A8B8O8Linear
Definition
W8A8B8O8Linear.h:10
W8A8B8O8Linear_params
Definition
W8A8B8O8Linear.h:3
matmul_params
Definition
matmul.h:78
Generated by
1.11.0