| Type | Member |
| --- | --- |
| `int` | `voc_size` |
| `int` | `embed_dim` |
| `int` | `padding_idx` |
| `int` | `hidden_dim` |
| `int` | `num_heads` |
| `float` | `rms_norm_eps` |
| `std::vector< Int4llamaDecoderLayer >` | `layers` |
| `std::string` | `profile_name = "Int4llamaDecoder"` |
| `Embedding` | `embed_tokens` |
| `LlamaRMSNorm` | `norm` |
| `float *` | `attention_mask_buf` |
| `float *` | `pos_embeds_buf` |
| `float *` | `last_hidden_states_buf` |
| `float *` | `hidden_states_buf` |
| `float *` | `inputs_embeds_buf` |
| `float *` | `first_input_ids_buf` |
| `float *` | `image_embed_buf` |
| `float *` | `second_input_ids_buf` |
| `float *` | `norm_weight_ptr = nullptr` |

The documentation for this class was generated from the following files: