| Type | Member |
| --- | --- |
| int | voc_size |
| int | embed_dim |
| int | padding_idx |
| int | hidden_dim |
| int | num_heads |
| float | rms_norm_eps |
| std::vector< Int4llamaDecoderLayer > | layers |
| std::string | profile_name = "Int4llamaDecoder" |
| Embedding | embed_tokens |
| LlamaRMSNorm | norm |
| float * | attention_mask_buf |
| float * | pos_embeds_buf |
| float * | last_hidden_states_buf |
| float * | hidden_states_buf |
| float * | inputs_embeds_buf |
| float * | first_input_ids_buf |
| float * | image_embed_buf |
| float * | second_input_ids_buf |
| float * | norm_weight_ptr = nullptr |

The documentation for this class was generated from the following files: