AUTO-GENERATED: qwen2_0.5b_decode Memory Layout. More...
#include <stddef.h>
#include <stdint.h>
Go to the source code of this file.
Data Structures | |
| struct | QWEN2_0_5B_DECODECanary |
| struct | QWEN2_0_5B_DECODEFooterOffsets |
| struct | QWEN2_0_5B_DECODEGlobalOffsets |
| struct | QWEN2_0_5B_DECODEHeaderOffsets |
| struct | QWEN2_0_5B_DECODELayerOffsets |
| struct | QWEN2_0_5B_DECODEModel |
Functions | |
| void | qwen2_0_5b_decode_decode (QWEN2_0_5B_DECODEModel *model, const int *token, int token_index) |
| void | qwen2_0_5b_decode_forward (QWEN2_0_5B_DECODEModel *model, const int *tokens, int num_tokens) |
| int | qwen2_0_5b_decode_model_allocate (QWEN2_0_5B_DECODEModel *model) |
| void | qwen2_0_5b_decode_model_free (QWEN2_0_5B_DECODEModel *model) |
| int | qwen2_0_5b_decode_verify_canaries (QWEN2_0_5B_DECODEModel *model) |
Variables | |
| static const QWEN2_0_5B_DECODECanary | QWEN2_0_5B_DECODE_CANARIES [] |
| static const QWEN2_0_5B_DECODEFooterOffsets | QWEN2_0_5B_DECODE_FOOTER |
| static const QWEN2_0_5B_DECODEGlobalOffsets | QWEN2_0_5B_DECODE_GLOBALS |
| static const QWEN2_0_5B_DECODEHeaderOffsets | QWEN2_0_5B_DECODE_HEADER |
| static const QWEN2_0_5B_DECODELayerOffsets | QWEN2_0_5B_DECODE_LAYERS [24] |
AUTO-GENERATED: qwen2_0.5b_decode Memory Layout.
Generated: 2026-01-12T04:06:36.660353 UTC
Total Memory: 3.57 GB
DO NOT EDIT - Regenerate with build_ir_v3.py
Definition in file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_ACTIVATION_BYTES 3256169984ULL |
Definition at line 39 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_COUNT 566 |
Definition at line 1259 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_SIZE 64 |
Definition at line 43 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_CANARY_VALUE 0xDEADBEEFUL |
Definition at line 42 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_DTYPE_BYTES 4 |
Definition at line 35 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_EMBED_DIM 896 |
Definition at line 25 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_HEAD_DIM 64 |
Definition at line 28 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_INTERMEDIATE 4864 |
Definition at line 29 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_LAYER(layer_id) (&QWEN2_0_5B_DECODE_LAYERS[layer_id]) |
Definition at line 1280 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_LAYER_STRIDE 0x0892CC00ULL |
Definition at line 648 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_MAGIC 0x434B454EUL |
Definition at line 41 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_MAX_SEQ_LEN 131072 |
Definition at line 32 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_HEADS 14 |
Definition at line 26 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_KV_HEADS 2 |
Definition at line 27 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_LAYERS 24 |
Definition at line 30 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_NUM_MERGES 0 |
Definition at line 33 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_PTR(model, offset) ((float*)((char*)(model)->base + (offset))) |
Definition at line 1274 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_PTR_BF16(model, offset) ((uint16_t*)((char*)(model)->base + (offset))) |
Definition at line 1277 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_TOTAL_BYTES 3573889600ULL |
Definition at line 37 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_TOTAL_VOCAB_BYTES 0 |
Definition at line 34 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_VOCAB_SIZE 151936 |
Definition at line 31 of file v6.5/test_generated/ck-kernel-inference.h.
| #define QWEN2_0_5B_DECODE_WEIGHT_BYTES 317683328ULL |
Definition at line 38 of file v6.5/test_generated/ck-kernel-inference.h.
| void qwen2_0_5b_decode_decode (QWEN2_0_5B_DECODEModel *model, const int *token, int token_index) |
Definition at line 8022 of file v6.5/test_generated/ck-kernel-inference.c.
| void qwen2_0_5b_decode_forward (QWEN2_0_5B_DECODEModel *model, const int *tokens, int num_tokens) |
Definition at line 8013 of file v6.5/test_generated/ck-kernel-inference.c.
| int qwen2_0_5b_decode_model_allocate (QWEN2_0_5B_DECODEModel *model) |
Definition at line 88 of file v6.5/test_generated/ck-kernel-inference.c.
| void qwen2_0_5b_decode_model_free (QWEN2_0_5B_DECODEModel *model) |
Definition at line 141 of file v6.5/test_generated/ck-kernel-inference.c.
| int qwen2_0_5b_decode_verify_canaries (QWEN2_0_5B_DECODEModel *model) |
Definition at line 152 of file v6.5/test_generated/ck-kernel-inference.c.
| static const QWEN2_0_5B_DECODECanary QWEN2_0_5B_DECODE_CANARIES [] |
Definition at line 691 of file v6.5/test_generated/ck-kernel-inference.h.
Referenced by qwen2_0_5b_decode_model_allocate(), and qwen2_0_5b_decode_verify_canaries().
| static const QWEN2_0_5B_DECODEFooterOffsets QWEN2_0_5B_DECODE_FOOTER |
Definition at line 661 of file v6.5/test_generated/ck-kernel-inference.h.
Referenced by ck_model_get_logits(), qwen2_0_5b_decode_decode_token(), and qwen2_0_5b_decode_forward_prefill_impl().
| static const QWEN2_0_5B_DECODEGlobalOffsets QWEN2_0_5B_DECODE_GLOBALS |
Definition at line 677 of file v6.5/test_generated/ck-kernel-inference.h.
Referenced by qwen2_0_5b_decode_layer_0_decode(), qwen2_0_5b_decode_layer_0_prefill(), qwen2_0_5b_decode_layer_10_decode(), qwen2_0_5b_decode_layer_10_prefill(), qwen2_0_5b_decode_layer_11_decode(), qwen2_0_5b_decode_layer_11_prefill(), qwen2_0_5b_decode_layer_12_decode(), qwen2_0_5b_decode_layer_12_prefill(), qwen2_0_5b_decode_layer_13_decode(), qwen2_0_5b_decode_layer_13_prefill(), qwen2_0_5b_decode_layer_14_decode(), qwen2_0_5b_decode_layer_14_prefill(), qwen2_0_5b_decode_layer_15_decode(), qwen2_0_5b_decode_layer_15_prefill(), qwen2_0_5b_decode_layer_16_decode(), qwen2_0_5b_decode_layer_16_prefill(), qwen2_0_5b_decode_layer_17_decode(), qwen2_0_5b_decode_layer_17_prefill(), qwen2_0_5b_decode_layer_18_decode(), qwen2_0_5b_decode_layer_18_prefill(), qwen2_0_5b_decode_layer_19_decode(), qwen2_0_5b_decode_layer_19_prefill(), qwen2_0_5b_decode_layer_1_decode(), qwen2_0_5b_decode_layer_1_prefill(), qwen2_0_5b_decode_layer_20_decode(), qwen2_0_5b_decode_layer_20_prefill(), qwen2_0_5b_decode_layer_21_decode(), qwen2_0_5b_decode_layer_21_prefill(), qwen2_0_5b_decode_layer_22_decode(), qwen2_0_5b_decode_layer_22_prefill(), qwen2_0_5b_decode_layer_23_decode(), qwen2_0_5b_decode_layer_23_prefill(), qwen2_0_5b_decode_layer_2_decode(), qwen2_0_5b_decode_layer_2_prefill(), qwen2_0_5b_decode_layer_3_decode(), qwen2_0_5b_decode_layer_3_prefill(), qwen2_0_5b_decode_layer_4_decode(), qwen2_0_5b_decode_layer_4_prefill(), qwen2_0_5b_decode_layer_5_decode(), qwen2_0_5b_decode_layer_5_prefill(), qwen2_0_5b_decode_layer_6_decode(), qwen2_0_5b_decode_layer_6_prefill(), qwen2_0_5b_decode_layer_7_decode(), qwen2_0_5b_decode_layer_7_prefill(), qwen2_0_5b_decode_layer_8_decode(), qwen2_0_5b_decode_layer_8_prefill(), qwen2_0_5b_decode_layer_9_decode(), qwen2_0_5b_decode_layer_9_prefill(), and qwen2_0_5b_decode_precompute_rope().
| static const QWEN2_0_5B_DECODEHeaderOffsets QWEN2_0_5B_DECODE_HEADER |
Definition at line 57 of file v6.5/test_generated/ck-kernel-inference.h.
Referenced by qwen2_0_5b_decode_decode_token(), qwen2_0_5b_decode_forward_prefill_impl(), qwen2_0_5b_decode_layer_0_decode(), and qwen2_0_5b_decode_layer_0_prefill().
| static const QWEN2_0_5B_DECODELayerOffsets QWEN2_0_5B_DECODE_LAYERS [24] |
Definition at line 93 of file v6.5/test_generated/ck-kernel-inference.h.
Referenced by qwen2_0_5b_decode_decode_token(), qwen2_0_5b_decode_forward_prefill_impl(), qwen2_0_5b_decode_layer_0_decode(), qwen2_0_5b_decode_layer_0_prefill(), qwen2_0_5b_decode_layer_10_decode(), qwen2_0_5b_decode_layer_10_prefill(), qwen2_0_5b_decode_layer_11_decode(), qwen2_0_5b_decode_layer_11_prefill(), qwen2_0_5b_decode_layer_12_decode(), qwen2_0_5b_decode_layer_12_prefill(), qwen2_0_5b_decode_layer_13_decode(), qwen2_0_5b_decode_layer_13_prefill(), qwen2_0_5b_decode_layer_14_decode(), qwen2_0_5b_decode_layer_14_prefill(), qwen2_0_5b_decode_layer_15_decode(), qwen2_0_5b_decode_layer_15_prefill(), qwen2_0_5b_decode_layer_16_decode(), qwen2_0_5b_decode_layer_16_prefill(), qwen2_0_5b_decode_layer_17_decode(), qwen2_0_5b_decode_layer_17_prefill(), qwen2_0_5b_decode_layer_18_decode(), qwen2_0_5b_decode_layer_18_prefill(), qwen2_0_5b_decode_layer_19_decode(), qwen2_0_5b_decode_layer_19_prefill(), qwen2_0_5b_decode_layer_1_decode(), qwen2_0_5b_decode_layer_1_prefill(), qwen2_0_5b_decode_layer_20_decode(), qwen2_0_5b_decode_layer_20_prefill(), qwen2_0_5b_decode_layer_21_decode(), qwen2_0_5b_decode_layer_21_prefill(), qwen2_0_5b_decode_layer_22_decode(), qwen2_0_5b_decode_layer_22_prefill(), qwen2_0_5b_decode_layer_23_decode(), qwen2_0_5b_decode_layer_23_prefill(), qwen2_0_5b_decode_layer_2_decode(), qwen2_0_5b_decode_layer_2_prefill(), qwen2_0_5b_decode_layer_3_decode(), qwen2_0_5b_decode_layer_3_prefill(), qwen2_0_5b_decode_layer_4_decode(), qwen2_0_5b_decode_layer_4_prefill(), qwen2_0_5b_decode_layer_5_decode(), qwen2_0_5b_decode_layer_5_prefill(), qwen2_0_5b_decode_layer_6_decode(), qwen2_0_5b_decode_layer_6_prefill(), qwen2_0_5b_decode_layer_7_decode(), qwen2_0_5b_decode_layer_7_prefill(), qwen2_0_5b_decode_layer_8_decode(), qwen2_0_5b_decode_layer_8_prefill(), qwen2_0_5b_decode_layer_9_decode(), and qwen2_0_5b_decode_layer_9_prefill().