TinyChatEngine
Public Member Functions
| Int4llamaAttention (std::string param_path, const struct model_config config, int layer_idx) | |
| struct Int4llamaAttention_output | forward (std::string param_path, const struct Int4llamaAttention_input &input) |
Static Public Member Functions
| static void | initialized_memory (const struct model_config config) |
Public Attributes
| int * | q_weight = nullptr |
| int * | k_weight = nullptr |
| int * | v_weight = nullptr |
| int * | o_weight = nullptr |
| int * | qkv_weight = nullptr |
| float * | cos_buf = nullptr |
| float * | sin_buf = nullptr |