TinyChatEngine
|
This is the complete list of members for Int8OPTDecoderLayer, including all inherited members.
attn (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
embed_dim (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
fc1 (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
fc2 (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
final_layer_norm (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
forward(const struct Int8OPTDecoderLayer_input &input) (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
hidden_dim (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
Int8OPTDecoderLayer(std::string param_path, const struct model_config config, int layer_idx, LayerNormQ self_attn_layer_norm, LayerNormQ final_layer_norm, W8A8B8O8LinearReLU fc1, W8A8BFP32OFP32Linear fc2, BMM_S8T_S8N_F32T qk_bmm, BMM_S8T_S8N_S8T pv_bmm, W8A8B8O8Linear k_proj, W8A8B8O8Linear v_proj, W8A8B8O8Linear q_proj, W8A8BFP32OFP32Linear out_proj) (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
layer_idx (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
num_attention_heads (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
profile_name (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |
self_attn_layer_norm (defined in Int8OPTDecoderLayer) | Int8OPTDecoderLayer | |