#include <ckernel_orchestration.h>
Data Fields
| Type | Name |
| --- | --- |
| int | aligned_context_window |
| int | aligned_embed_dim |
| int | aligned_head_dim |
| int | aligned_intermediate_dim |
| float * | attn_out |
| const float * | b1 |
| const float * | b2 |
| const float * | bk |
| const float * | bo |
| const float * | bq |
| const float * | bv |
| int | embed_dim |
| float | eps |
| float * | fc1_out |
| int | head_dim |
| const float * | input |
| int | intermediate_dim |
| float * | k |
| const float * | ln1_gamma |
| float * | ln1_out |
| float * | ln1_rstd |
| const float * | ln2_gamma |
| float * | ln2_out |
| float * | ln2_rstd |
| float * | mlp_out |
| int | num_heads |
| int | num_kv_heads |
| float * | output |
| float * | proj_scratch |
| float * | proj_tmp |
| float * | q |
| float * | residual1 |
| const float * | rope_cos |
| int | rope_pos_offset |
| const float * | rope_sin |
| float * | scores |
| float * | swiglu_out |
| int | tokens |
| float * | v |
| const void * | w1 |
| CKDataType | w1_dtype |
| const void * | w2 |
| CKDataType | w2_dtype |
| const void * | wk |
| CKDataType | wk_dtype |
| const void * | wo |
| CKDataType | wo_dtype |
| const void * | wq |
| CKDataType | wq_dtype |
| const void * | wv |
| CKDataType | wv_dtype |
Definition at line 318 of file ckernel_orchestration.h.
| int CKLayerForwardParamsQ4K::aligned_context_window |
Definition at line 326 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_q4_k() and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::aligned_embed_dim |
Definition at line 321 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::aligned_head_dim |
Definition at line 325 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::aligned_intermediate_dim |
Definition at line 328 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::attn_out |
Definition at line 360 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_q4_k() and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::b1 |
Definition at line 350 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::b2 |
Definition at line 352 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::bk |
Definition at line 342 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::bo |
Definition at line 347 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::bq |
Definition at line 340 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::bv |
Definition at line 344 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::embed_dim |
Definition at line 320 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float CKLayerForwardParamsQ4K::eps |
Definition at line 329 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::fc1_out |
Definition at line 366 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::head_dim |
Definition at line 324 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::input |
Definition at line 332 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::intermediate_dim |
Definition at line 327 of file ckernel_orchestration.h.
| float* CKLayerForwardParamsQ4K::k |
Definition at line 357 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::ln1_gamma |
Definition at line 333 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::ln1_out |
Definition at line 354 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::ln1_rstd |
Definition at line 355 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::ln2_gamma |
Definition at line 334 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::ln2_out |
Definition at line 364 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::ln2_rstd |
Definition at line 365 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::mlp_out |
Definition at line 368 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::num_heads |
Definition at line 322 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::num_kv_heads |
Definition at line 323 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::output |
Definition at line 369 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::proj_scratch |
Definition at line 362 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::proj_tmp |
Definition at line 361 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::q |
Definition at line 356 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_q4_k() and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::residual1 |
Definition at line 363 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::rope_cos |
Definition at line 336 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::rope_pos_offset |
Definition at line 330 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const float* CKLayerForwardParamsQ4K::rope_sin |
Definition at line 337 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::scores |
Definition at line 359 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_q4_k() and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::swiglu_out |
Definition at line 367 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| int CKLayerForwardParamsQ4K::tokens |
Definition at line 319 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_q4_k() and ck_layer_forward_rmsnorm_swiglu_quant().
| float* CKLayerForwardParamsQ4K::v |
Definition at line 358 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::w1 |
Definition at line 349 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::w1_dtype |
Definition at line 375 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::w2 |
Definition at line 351 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::w2_dtype |
Definition at line 376 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::wk |
Definition at line 341 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::wk_dtype |
Definition at line 372 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::wo |
Definition at line 346 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::wo_dtype |
Definition at line 374 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::wq |
Definition at line 339 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::wq_dtype |
Definition at line 371 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().
| const void* CKLayerForwardParamsQ4K::wv |
Definition at line 343 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_q4_k(), ck_layer_forward_rmsnorm_swiglu_decode_quant(), ck_layer_forward_rmsnorm_swiglu_q4_k(), and ck_layer_forward_rmsnorm_swiglu_quant().
| CKDataType CKLayerForwardParamsQ4K::wv_dtype |
Definition at line 373 of file ckernel_orchestration.h.
Referenced by ck_layer_forward_rmsnorm_swiglu_decode_quant() and ck_layer_forward_rmsnorm_swiglu_quant().