#include <stdint.h>
#include <stddef.h>
Go to the source code of this file.
Functions | |
| static void | bf16_tensor_to_float (const uint16_t *src, float *dst, size_t count) |
| static float | bf16_to_float (uint16_t v) |
| static void | float_tensor_to_bf16 (const float *src, uint16_t *dst, size_t count) |
| static uint16_t | float_to_bf16 (float f) |
| static void bf16_tensor_to_float (const uint16_t *src, float *dst, size_t count) | inline, static |
Definition at line 250 of file bf16_utils.h.
References bf16_to_float().
Referenced by backward_causal_softmax_head_major_bf16(), causal_softmax_head_major_bf16(), convert_bf16_tensor_to_buf(), geglu_forward_bf16(), gelu_backward_exact_bf16(), gelu_backward_fast_bf16(), gelu_fast_inplace_bf16(), layernorm_backward_kernel_bf16(), layernorm_forward_rolled_slice_bf16(), layernorm_forward_unrolled_slice_bf16(), mlp_token_parallel_bf16_fp32act(), rope_backward_bf16(), rope_forward_bf16(), sigmoid_backward_bf16(), sigmoid_forward_bf16(), and softmax_cross_entropy_loss_bf16().
| static float bf16_to_float (uint16_t v) | inline, static |
Definition at line 38 of file bf16_utils.h.
Referenced by __attribute__(), adamw_update_bf16(), add_forward_2d_bf16(), add_forward_bf16(), add_inplace_bf16(), add_scaled_forward_bf16(), add_scaled_inplace_bf16(), bf16_tensor_to_float(), embedding_backward_bf16(), embedding_forward_bf16(), gemm_bf16_fp32out(), gemm_nn_bf16(), gemm_tn_bf16(), gradient_accumulate_bf16(), gradient_clip_norm_bf16(), gradient_scale_bf16(), mlp_token_parallel_bf16(), patch2im_bf16(), relu_backward_bf16(), relu_forward_bf16(), relu_forward_inplace_bf16(), rmsnorm_backward_bf16(), rmsnorm_forward_bf16(), sgd_momentum_update_bf16(), swiglu_backward_bf16(), and swiglu_forward_bf16().
| static void float_tensor_to_bf16 (const float *src, uint16_t *dst, size_t count) | inline, static |
Definition at line 271 of file bf16_utils.h.
References float_to_bf16().
Referenced by backward_causal_softmax_head_major_bf16(), causal_softmax_head_major_bf16(), geglu_forward_bf16(), gelu_backward_exact_bf16(), gelu_backward_fast_bf16(), gelu_fast_inplace_bf16(), layernorm_backward_kernel_bf16(), layernorm_forward_rolled_slice_bf16(), layernorm_forward_unrolled_slice_bf16(), mlp_token_parallel_bf16_fp32act(), rope_backward_bf16(), rope_forward_bf16(), sigmoid_backward_bf16(), sigmoid_forward_bf16(), and softmax_cross_entropy_loss_bf16().
| static uint16_t float_to_bf16 (float f) | inline, static |
Definition at line 90 of file bf16_utils.h.
Referenced by __attribute__(), adamw_update_bf16(), add_forward_2d_bf16(), add_forward_bf16(), add_inplace_bf16(), add_scaled_forward_bf16(), add_scaled_inplace_bf16(), embedding_backward_bf16(), embedding_forward_bf16(), float_tensor_to_bf16(), gemm_nn_bf16(), gemm_tn_bf16(), gradient_accumulate_bf16(), gradient_scale_bf16(), mlp_token_parallel_bf16(), patch2im_bf16(), relu_backward_bf16(), relu_forward_bf16(), relu_forward_inplace_bf16(), rmsnorm_backward_bf16(), rmsnorm_forward_bf16(), sgd_momentum_update_bf16(), swiglu_backward_bf16(), and swiglu_forward_bf16().