TinyChatEngine
Loading...
Searching...
No Matches
llm
include
ops
W8A8BFP32OFP32Linear.h
1
#include "common.h"
2
3
struct
W8A8BFP32OFP32Linear_params
{
4
Matrix3D<int8_t>
weight;
5
Matrix3D<float>
bias;
6
float
alpha;
7
};
8
9
class
W8A8BFP32OFP32Linear
{
10
public
:
11
W8A8BFP32OFP32Linear
(
W8A8BFP32OFP32Linear_params
¶ms_);
12
W8A8BFP32OFP32Linear
(){};
13
void
forward(
const
Matrix3D<int8_t>
&x,
Matrix3D<float>
&output);
14
struct
matmul_params
params;
15
float
alpha;
16
17
private
:
18
std::string profile_name =
"W8A8BFP32OFP32Linear"
;
19
};
20
21
/// Declaration only; the definition is not part of this header.
/// NOTE(review): presumably fills `op` with parameters located via `prefix`;
/// confirm against the definition.
/// @param op     Operator instance, passed by non-const reference.
/// @param prefix String passed by value.
void load_W8A8BFP32OFP32Linear_params(W8A8BFP32OFP32Linear &op, std::string prefix);
Matrix3D
Definition
common.h:34
W8A8BFP32OFP32Linear
Definition
W8A8BFP32OFP32Linear.h:9
W8A8BFP32OFP32Linear_params
Definition
W8A8BFP32OFP32Linear.h:3
matmul_params
Definition
matmul.h:78
Generated by Doxygen 1.11.0