Go to the source code of this file.
Data Structures | |
| struct | CKIRV2Binding |
| struct | CKIRV2Buffer |
| struct | CKIRV2Graph |
| struct | CKIRV2Node |
Macros | |
| #define | CK_IR_V2_MAX_BINDINGS 24 |
| #define | CK_IR_V2_MAX_DIMS 4 |
| #define | CK_IR_V2_MAX_INPUTS 8 |
| #define | CK_IR_V2_MAX_OUTPUTS 4 |
Enumerations | |
| enum | CKIRV2NodeFlags { CK_IR_V2_NODE_NONE = 0, CK_IR_V2_NODE_FUSED = 1 << 0, CK_IR_V2_NODE_INFERENCE_ONLY = 1 << 1 } |
Functions | |
| int | ck_ir_v2_apply_meta (const char *path, CKIRV2Graph *graph) |
| int | ck_ir_v2_build_decoder (const CKModelConfig *cfg, CKIRV2Graph *graph) |
| int | ck_ir_v2_build_decoder_backward (const CKIRV2Graph *forward, CKIRV2Graph *backward) |
| void | ck_ir_v2_free (CKIRV2Graph *graph) |
| int | ck_ir_v2_parse_json (const char *path, CKIRV2Graph *graph) |
| int | ck_ir_v2_serialize_json (const CKIRV2Graph *graph, const char *path) |
| int | ck_ir_v2_serialize_json_with_plan (const CKIRV2Graph *graph, const struct CKMemPlan *plan, const char *mode, int tokens_override, int base_context_window, const char *path) |
`#define CK_IR_V2_MAX_BINDINGS 24`
Definition at line 16 of file ckernel_ir_v2.h.
`#define CK_IR_V2_MAX_DIMS 4`
Definition at line 13 of file ckernel_ir_v2.h.
`#define CK_IR_V2_MAX_INPUTS 8`
Definition at line 14 of file ckernel_ir_v2.h.
`#define CK_IR_V2_MAX_OUTPUTS 4`
Definition at line 15 of file ckernel_ir_v2.h.
`enum CKIRV2NodeFlags`

| Enumerator | Value |
|---|---|
| CK_IR_V2_NODE_NONE | 0 |
| CK_IR_V2_NODE_FUSED | 1 << 0 |
| CK_IR_V2_NODE_INFERENCE_ONLY | 1 << 1 |
Definition at line 18 of file ckernel_ir_v2.h.
`int ck_ir_v2_apply_meta(const char *path, CKIRV2Graph *graph)`
Definition at line 220 of file ckernel_ir_v2_builder.c.
References CKIRV2Buffer::alias_of, CKIRV2Graph::buffers, ck_ir_v2_apply_weight_dtypes(), ck_ir_v2_find_buffer_index(), ck_ir_v2_parse_bool(), ck_ir_v2_strdup(), end, CKIRV2Graph::fused_qkv, CKIRV2Graph::gated_mlp, CKIRV2Graph::has_pos_emb, and CKIRV2Graph::tie_word_embeddings.
Referenced by main().
`int ck_ir_v2_build_decoder(const CKModelConfig *cfg, CKIRV2Graph *graph)`
Definition at line 285 of file ckernel_ir_v2_builder.c.
References CKIRV2Binding::arg, CKPlanBinding::arg, CKIRV2Node::bindings, CKPlanStepV2::bindings, CKIRV2Binding::buffer, CKPlanBinding::buffer, CKIRV2Graph::buffers, ck_decoder_buffer_count, ck_decoder_buffers, ck_decoder_forward_plan_v2, ck_decoder_forward_plan_v2_count, CK_DT_FP32, ck_ir_v2_copy_buffer_spec(), ck_ir_v2_find_buffer_index(), ck_ir_v2_find_kernel_spec(), ck_ir_v2_free(), CK_IR_V2_MAX_BINDINGS, ck_ir_v2_select_kernel(), ck_ir_v2_strdup(), CKIRV2Buffer::condition, CKIRV2Node::condition, CKPlanStepV2::condition, CKIRV2Graph::config, CKKernelSpec::default_dtype, CKIRV2Node::flags, CKIRV2Graph::fused_qkv, CKIRV2Graph::gated_mlp, CKIRV2Graph::has_pos_emb, CKIRV2Node::kernel, CKPlanStepV2::kernel, CKIRV2Node::kernel_dtype, CKIRV2Node::layer, CKIRV2Node::n_bindings, CKIRV2Node::n_inputs, CKIRV2Node::n_outputs, CKIRV2Buffer::name, CKIRV2Graph::nodes, CKPlanStepV2::num_bindings, CKIRV2Graph::num_buffers, CKModelConfig::num_layers, CKIRV2Graph::num_nodes, CKIRV2Node::op, and CKIRV2Graph::tie_word_embeddings.
Referenced by main().
`int ck_ir_v2_build_decoder_backward(const CKIRV2Graph *forward, CKIRV2Graph *backward)`
Definition at line 356 of file ckernel_ir_v2_builder.c.
References CKIRV2Buffer::alias_of, CKBufferSpec::alias_of, CKIRV2Binding::arg, CKPlanBinding::arg, CKIRV2Node::bindings, CKPlanStepV2::bindings, CKIRV2Binding::buffer, CKPlanBinding::buffer, CKIRV2Graph::buffers, ck_decoder_backward_plan_v2, ck_decoder_backward_plan_v2_count, CK_DT_FP32, ck_ir_v2_copy_buffer_spec(), ck_ir_v2_find_buffer_index(), ck_ir_v2_find_kernel_spec(), ck_ir_v2_free(), CK_IR_V2_MAX_BINDINGS, ck_ir_v2_select_kernel(), ck_ir_v2_strdup(), CKIRV2Buffer::condition, CKIRV2Node::condition, CKBufferSpec::condition, CKPlanStepV2::condition, CKIRV2Graph::config, CKKernelSpec::default_dtype, CKIRV2Buffer::dtype, CKBufferSpec::dtype, CKIRV2Node::flags, CKIRV2Node::kernel, CKPlanStepV2::kernel, CKIRV2Node::kernel_dtype, CKIRV2Node::layer, CKIRV2Node::n_bindings, CKIRV2Node::n_inputs, CKIRV2Node::n_outputs, CKIRV2Buffer::name, CKBufferSpec::name, CKIRV2Graph::nodes, CKPlanStepV2::num_bindings, CKIRV2Graph::num_buffers, CKModelConfig::num_layers, CKIRV2Graph::num_nodes, CKIRV2Node::op, CKIRV2Buffer::optional, CKBufferSpec::optional, CKIRV2Buffer::role, CKBufferSpec::role, CKIRV2Buffer::scope, CKBufferSpec::scope, CKIRV2Buffer::shape, and CKBufferSpec::shape.
Referenced by main().
`void ck_ir_v2_free(CKIRV2Graph *graph)`
Definition at line 34 of file ckernel_ir_v2.c.
References CKIRV2Graph::buffers, ck_ir_v2_free_buffer(), ck_ir_v2_free_node(), CKIRV2Graph::nodes, CKIRV2Graph::num_buffers, and CKIRV2Graph::num_nodes.
Referenced by ck_ir_v2_build_decoder(), ck_ir_v2_build_decoder_backward(), ck_ir_v2_lower_emit_json(), ck_ir_v2_lower_graph(), ck_ir_v2_parse_json(), and main().
`int ck_ir_v2_parse_json(const char *path, CKIRV2Graph *graph)`
Definition at line 1100 of file ckernel_ir_v2.c.
References ck_ir_v2_find_key(), ck_ir_v2_free(), ck_ir_v2_next_object(), ck_ir_v2_parse_bool(), ck_ir_v2_parse_buffers(), ck_ir_v2_parse_float(), ck_ir_v2_parse_int(), ck_ir_v2_parse_nodes(), CKIRV2Graph::config, CKModelConfig::context_window, end, CKIRV2Graph::fused_qkv, CKIRV2Graph::gated_mlp, CKIRV2Graph::has_pos_emb, CKModelConfig::hidden_size, CKModelConfig::intermediate_size, CKModelConfig::num_heads, CKModelConfig::num_kv_heads, CKModelConfig::num_layers, CKModelConfig::rms_norm_eps, CKModelConfig::rope_theta, CKIRV2Graph::tie_word_embeddings, and CKModelConfig::vocab_size.
Referenced by main().
`int ck_ir_v2_serialize_json(const CKIRV2Graph *graph, const char *path)`
Definition at line 511 of file ckernel_ir_v2.c.
References ck_ir_v2_serialize_json_internal().
Referenced by main().
`int ck_ir_v2_serialize_json_with_plan(const CKIRV2Graph *graph, const struct CKMemPlan *plan, const char *mode, int tokens_override, int base_context_window, const char *path)`
Referenced by ck_ir_v2_lower_emit_json().