#include <ck_model_api.h>
| Data Fields | |
|---|---|
| size_t | activation_bytes |
| int | context_window |
| int | embed_dim |
| int | head_dim |
| int | hidden_size |
| int | intermediate_size |
| int | max_seq_len |
| const char * | model_family |
| const char * | model_name |
| int | num_heads |
| int | num_kv_heads |
| int | num_layers |
| float | rms_norm_eps |
| float | rope_theta |
| size_t | total_bytes |
| int | vocab_size |
| size_t | weight_bytes |
Minimal HF-style model config extracted from config.json.
Design note:
This header focuses on the basic decoder-only transformer parameters and node-level IR that higher layers (codegen, memory planner, etc.) will build on.
Definition at line 32 of file ck_model_api.h.
| size_t CKModelConfig::activation_bytes |
Definition at line 43 of file ck_model_api.h.
| int CKModelConfig::context_window |
Definition at line 30 of file ckernel_ir.h.
Referenced by build_plan(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_lower_emit_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_align(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_model_load_weights_flat(), compute_align(), emit_library_api(), layout_transformer_from_ir(), and resolve_dim().
| int CKModelConfig::embed_dim |
Definition at line 33 of file ck_model_api.h.
Referenced by main() and run_benchmark().
| int CKModelConfig::head_dim |
Definition at line 36 of file ck_model_api.h.
| int CKModelConfig::hidden_size |
Definition at line 25 of file ckernel_ir.h.
Referenced by build_plan(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_align(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_model_load_weights_flat(), compute_align(), emit_library_api(), layout_transformer_from_ir(), and resolve_dim().
| int CKModelConfig::intermediate_size |
Definition at line 37 of file ck_model_api.h.
Referenced by build_plan(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_align(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_model_load_weights_flat(), compute_align(), emit_library_api(), layout_transformer_from_ir(), main(), and resolve_dim().
| int CKModelConfig::max_seq_len |
Definition at line 40 of file ck_model_api.h.
Referenced by main().
| const char* CKModelConfig::model_family |
Definition at line 45 of file ck_model_api.h.
Referenced by main().
| const char* CKModelConfig::model_name |
Definition at line 44 of file ck_model_api.h.
Referenced by main() and run_benchmark().
| int CKModelConfig::num_heads |
Definition at line 34 of file ck_model_api.h.
Referenced by build_plan(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_align(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), compute_align(), emit_library_api(), main(), resolve_dim(), and run_benchmark().
| int CKModelConfig::num_kv_heads |
Definition at line 35 of file ck_model_api.h.
Referenced by ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), emit_library_api(), main(), resolve_dim(), and run_benchmark().
| int CKModelConfig::num_layers |
Definition at line 38 of file ck_model_api.h.
Referenced by ck_build_decoder_ir(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_build_decoder(), ck_ir_v2_build_decoder_backward(), ck_ir_v2_parse_json(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_model_load_weights_flat(), emit_library_api(), layout_transformer_from_ir(), main(), and run_benchmark().
| float CKModelConfig::rms_norm_eps |
Definition at line 31 of file ckernel_ir.h.
Referenced by ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), and emit_library_api().
| float CKModelConfig::rope_theta |
Definition at line 32 of file ckernel_ir.h.
Referenced by buffer_enabled(), ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_plan_step_enabled(), and emit_library_api().
| size_t CKModelConfig::total_bytes |
Definition at line 41 of file ck_model_api.h.
Referenced by main().
| int CKModelConfig::vocab_size |
Definition at line 39 of file ck_model_api.h.
Referenced by ck_codegen_c_skeleton(), ck_codegen_emit_runtime(), ck_codegen_v2_emit_sections(), ck_ir_dump(), ck_ir_parse_json(), ck_ir_serialize_json(), ck_ir_v2_parse_json(), ck_ir_v2_resolve_dim_value(), ck_ir_v2_serialize_json_internal(), ck_model_config_from_hf_json(), ck_model_load_weights_flat(), emit_library_api(), layout_transformer_from_ir(), main(), resolve_dim(), run_benchmark(), and run_generation_test().
| size_t CKModelConfig::weight_bytes |
Definition at line 42 of file ck_model_api.h.
Referenced by load_weights_from_bump() and main().