AUTO-GENERATED: qwen2_0.5b_decode Memory Layout. More...
Go to the source code of this file.
Data Structures | |
| struct | QWEN2_0_5B_DECODECanary |
| struct | QWEN2_0_5B_DECODEFooterOffsets |
| struct | QWEN2_0_5B_DECODEGlobalOffsets |
| struct | QWEN2_0_5B_DECODEHeaderOffsets |
| struct | QWEN2_0_5B_DECODELayerOffsets |
| struct | QWEN2_0_5B_DECODEModel |
Functions | |
| void | qwen2_0_5b_decode_decode (QWEN2_0_5B_DECODEModel *model, const int *token, int token_index) |
| void | qwen2_0_5b_decode_forward (QWEN2_0_5B_DECODEModel *model, const int *tokens, int num_tokens) |
| int | qwen2_0_5b_decode_model_allocate (QWEN2_0_5B_DECODEModel *model) |
| void | qwen2_0_5b_decode_model_free (QWEN2_0_5B_DECODEModel *model) |
| int | qwen2_0_5b_decode_verify_canaries (QWEN2_0_5B_DECODEModel *model) |
Variables | |
| static const QWEN2_0_5B_DECODECanary | QWEN2_0_5B_DECODE_CANARIES [] |
| static const QWEN2_0_5B_DECODEFooterOffsets | QWEN2_0_5B_DECODE_FOOTER |
| static const QWEN2_0_5B_DECODEGlobalOffsets | QWEN2_0_5B_DECODE_GLOBALS |
| static const QWEN2_0_5B_DECODEHeaderOffsets | QWEN2_0_5B_DECODE_HEADER |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_W1_DTYPE [] |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_W2_DTYPE [] |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_WK_DTYPE [] |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_WO_DTYPE [] |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_WQ_DTYPE [] |
| static const CKDataType | QWEN2_0_5B_DECODE_LAYER_WV_DTYPE [] |
| static const QWEN2_0_5B_DECODELayerOffsets | QWEN2_0_5B_DECODE_LAYERS [24] |
AUTO-GENERATED: qwen2_0.5b_decode Memory Layout.
Generated: 2026-01-15T19:23:13.597715 UTC. Total Memory: 3.65 GB.
DO NOT EDIT - Regenerate with build_ir_v3.py
Definition in file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_ACTIVATION_BYTES 3256082944ULL |
Definition at line 39 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_COUNT 566 |
Definition at line 1289 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_SIZE 64 |
Definition at line 43 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_VALUE 0xDEADBEEFUL |
Definition at line 42 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_DTYPE_BYTES 4 |
Definition at line 35 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_EMBED_DIM 896 |
Definition at line 25 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_HEAD_DIM 64 |
Definition at line 28 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_INTERMEDIATE 4864 |
Definition at line 29 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_LAYER(layer_id) (&QWEN2_0_5B_DECODE_LAYERS[layer_id]) |
Definition at line 1310 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_LAYER_STRIDE 0x08A688C0ULL |
Definition at line 648 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_MAGIC 0x434B454EUL |
Definition at line 41 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_MAX_SEQ_LEN 131072 |
Definition at line 32 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_HEADS 14 |
Definition at line 26 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_KV_HEADS 2 |
Definition at line 27 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_LAYERS 24 |
Definition at line 30 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_MERGES 0 |
Definition at line 33 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_PTR(model, offset) ((float*)((char*)(model)->base + (offset))) |
Definition at line 1304 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_PTR_BF16(model, offset) ((uint16_t*)((char*)(model)->base + (offset))) |
Definition at line 1307 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_TOTAL_BYTES 3651931008ULL |
Definition at line 37 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_TOTAL_VOCAB_BYTES 0 |
Definition at line 34 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_VOCAB_SIZE 151936 |
Definition at line 31 of file v6.6/generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_WEIGHT_BYTES 395811776ULL |
Definition at line 38 of file v6.6/generated/ck-kernel-inference.h.
| void qwen2_0_5b_decode_decode(QWEN2_0_5B_DECODEModel *model, const int *token, int token_index) |
Definition at line 8022 of file v6.5/test_generated/ck-kernel-inference.c.
| void qwen2_0_5b_decode_forward(QWEN2_0_5B_DECODEModel *model, const int *tokens, int num_tokens) |
Definition at line 8013 of file v6.5/test_generated/ck-kernel-inference.c.
| int qwen2_0_5b_decode_model_allocate(QWEN2_0_5B_DECODEModel *model) |
Definition at line 88 of file v6.5/test_generated/ck-kernel-inference.c.
| void qwen2_0_5b_decode_model_free(QWEN2_0_5B_DECODEModel *model) |
Definition at line 141 of file v6.5/test_generated/ck-kernel-inference.c.
| int qwen2_0_5b_decode_verify_canaries(QWEN2_0_5B_DECODEModel *model) |
Definition at line 152 of file v6.5/test_generated/ck-kernel-inference.c.
| static const QWEN2_0_5B_DECODECanary QWEN2_0_5B_DECODE_CANARIES[] |
Definition at line 721 of file v6.6/generated/ck-kernel-inference.h.
| static const QWEN2_0_5B_DECODEFooterOffsets QWEN2_0_5B_DECODE_FOOTER |
Definition at line 691 of file v6.6/generated/ck-kernel-inference.h.
| static const QWEN2_0_5B_DECODEGlobalOffsets QWEN2_0_5B_DECODE_GLOBALS |
Definition at line 707 of file v6.6/generated/ck-kernel-inference.h.
| static const QWEN2_0_5B_DECODEHeaderOffsets QWEN2_0_5B_DECODE_HEADER |
Definition at line 57 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_W1_DTYPE[] |
Definition at line 672 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_W2_DTYPE[] |
Definition at line 676 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_WK_DTYPE[] |
Definition at line 660 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_WO_DTYPE[] |
Definition at line 668 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_WQ_DTYPE[] |
Definition at line 656 of file v6.6/generated/ck-kernel-inference.h.
| static const CKDataType QWEN2_0_5B_DECODE_LAYER_WV_DTYPE[] |
Definition at line 664 of file v6.6/generated/ck-kernel-inference.h.
| static const QWEN2_0_5B_DECODELayerOffsets QWEN2_0_5B_DECODE_LAYERS[24] |
Definition at line 93 of file v6.6/generated/ck-kernel-inference.h.