| Name | Last modified | Size | Description | |
|---|---|---|---|---|
| Parent Directory | - | |||
| feature-tests/ | 2026-02-03 17:07 | - | ||
| reglu.comp | 2026-02-03 17:07 | 126 | ||
| swiglu.comp | 2026-02-03 17:07 | 134 | ||
| rte.glsl | 2026-02-03 17:07 | 154 | ||
| generic_head.glsl | 2026-02-03 17:07 | 196 | ||
| geglu_quick.comp | 2026-02-03 17:07 | 200 | ||
| dequant_head.glsl | 2026-02-03 17:07 | 249 | ||
| swiglu_oai.comp | 2026-02-03 17:07 | 288 | ||
| geglu.comp | 2026-02-03 17:07 | 327 | ||
| rope_neox.comp | 2026-02-03 17:07 | 346 | ||
| rope_norm.comp | 2026-02-03 17:07 | 346 | ||
| rope_multi.comp | 2026-02-03 17:07 | 347 | ||
| rope_vision.comp | 2026-02-03 17:07 | 348 | ||
| fill.comp | 2026-02-03 17:07 | 363 | ||
| cos.comp | 2026-02-03 17:07 | 374 | ||
| sin.comp | 2026-02-03 17:07 | 374 | ||
| sqrt.comp | 2026-02-03 17:07 | 375 | ||
| square.comp | 2026-02-03 17:07 | 375 | ||
| log.comp | 2026-02-03 17:07 | 384 | ||
| arange.comp | 2026-02-03 17:07 | 422 | ||
| clamp.comp | 2026-02-03 17:07 | 427 | ||
| dequant_f32.comp | 2026-02-03 17:07 | 442 | ||
| glu_head.glsl | 2026-02-03 17:07 | 457 | ||
| rope_params.glsl | 2026-02-03 17:07 | 514 | ||
| neg.comp | 2026-02-03 17:07 | 520 | ||
| abs.comp | 2026-02-03 17:07 | 525 | ||
| relu.comp | 2026-02-03 17:07 | 528 | ||
| sigmoid.comp | 2026-02-03 17:07 | 541 | ||
| exp.comp | 2026-02-03 17:07 | 544 | ||
| tanh.comp | 2026-02-03 17:07 | 544 | ||
| ceil.comp | 2026-02-03 17:07 | 549 | ||
| floor.comp | 2026-02-03 17:07 | 550 | ||
| trunc.comp | 2026-02-03 17:07 | 550 | ||
| silu.comp | 2026-02-03 17:07 | 565 | ||
| step.comp | 2026-02-03 17:07 | 565 | ||
| hardsigmoid.comp | 2026-02-03 17:07 | 581 | ||
| hardswish.comp | 2026-02-03 17:07 | 585 | ||
| leaky_relu.comp | 2026-02-03 17:07 | 586 | ||
| sum_rows.glsl | 2026-02-03 17:07 | 592 | ||
| rope_head.glsl | 2026-02-03 17:07 | 607 | ||
| softplus.comp | 2026-02-03 17:07 | 611 | ||
| opt_step_sgd.comp | 2026-02-03 17:07 | 612 | ||
| copy.comp | 2026-02-03 17:07 | 619 | ||
| scale.comp | 2026-02-03 17:07 | 625 | ||
| gelu_quick.comp | 2026-02-03 17:07 | 631 | ||
| add1.comp | 2026-02-03 17:07 | 702 | ||
| round.comp | 2026-02-03 17:07 | 728 | ||
| utils.glsl | 2026-02-03 17:07 | 752 | ||
| silu_back.comp | 2026-02-03 17:07 | 761 | ||
| gelu.comp | 2026-02-03 17:07 | 767 | ||
| div.comp | 2026-02-03 17:07 | 776 | ||
| mul.comp | 2026-02-03 17:07 | 776 | ||
| count_equal.comp | 2026-02-03 17:07 | 796 | ||
| diag_mask_inf.comp | 2026-02-03 17:07 | 799 | ||
| repeat.comp | 2026-02-03 17:07 | 809 | ||
| sub.comp | 2026-02-03 17:07 | 826 | ||
| xielu.comp | 2026-02-03 17:07 | 836 | ||
| dequant_q8_0.comp | 2026-02-03 17:07 | 839 | ||
| glu_main.glsl | 2026-02-03 17:07 | 859 | ||
| dequant_q4_0.comp | 2026-02-03 17:07 | 861 | ||
| geglu_erf.comp | 2026-02-03 17:07 | 882 | ||
| dequant_q4_1.comp | 2026-02-03 17:07 | 892 | ||
| diag.comp | 2026-02-03 17:07 | 902 | ||
| dequant_iq4_nl.comp | 2026-02-03 17:07 | 909 | ||
| dequant_mxfp4.comp | 2026-02-03 17:07 | 941 | ||
| acc.comp | 2026-02-03 17:07 | 946 | ||
| add_id.comp | 2026-02-03 17:07 | 1.0K | ||
| timestep_embedding.comp | 2026-02-03 17:07 | 1.0K | ||
| dequant_q5_1.comp | 2026-02-03 17:07 | 1.0K | ||
| dequant_q5_0.comp | 2026-02-03 17:07 | 1.0K | ||
| mul_mat_vec_iface.glsl | 2026-02-03 17:07 | 1.1K | ||
| dequant_iq4_xs.comp | 2026-02-03 17:07 | 1.1K | ||
| CMakeLists.txt | 2026-02-03 17:07 | 1.1K | ||
| dequant_iq1_s.comp | 2026-02-03 17:07 | 1.1K | ||
| count_experts.comp | 2026-02-03 17:07 | 1.2K | ||
| opt_step_adamw.comp | 2026-02-03 17:07 | 1.2K | ||
| repeat_back.comp | 2026-02-03 17:07 | 1.2K | ||
| l2_norm.comp | 2026-02-03 17:07 | 1.2K | ||
| get_rows.comp | 2026-02-03 17:07 | 1.2K | ||
| ssm_conv.comp | 2026-02-03 17:07 | 1.2K | ||
| norm.comp | 2026-02-03 17:07 | 1.3K | ||
| soft_max_large_common.glsl | 2026-02-03 17:07 | 1.3K | ||
| mul_mat_split_k_reduce.comp | 2026-02-03 17:07 | 1.3K | ||
| tri.comp | 2026-02-03 17:07 | 1.3K | ||
| gelu_erf.comp | 2026-02-03 17:07 | 1.3K | ||
| sum_rows.comp | 2026-02-03 17:07 | 1.4K | ||
| argmax.comp | 2026-02-03 17:07 | 1.4K | ||
| copy_from_quant.comp | 2026-02-03 17:07 | 1.4K | ||
| dequant_q6_k.comp | 2026-02-03 17:07 | 1.4K | ||
| roll.comp | 2026-02-03 17:07 | 1.4K | ||
| dequant_q2_k.comp | 2026-02-03 17:07 | 1.4K | ||
| concat.comp | 2026-02-03 17:07 | 1.5K | ||
| mul_mmq_shmem_types.glsl | 2026-02-03 17:07 | 1.5K | ||
| contig_copy.comp | 2026-02-03 17:07 | 1.5K | ||
| dequant_iq1_m.comp | 2026-02-03 17:07 | 1.5K | ||
| dequant_iq3_s.comp | 2026-02-03 17:07 | 1.5K | ||
| soft_max_back.comp | 2026-02-03 17:07 | 1.5K | ||
| get_rows_quant.comp | 2026-02-03 17:07 | 1.5K | ||
| soft_max_large1.comp | 2026-02-03 17:07 | 1.6K | ||
| dequant_q3_k.comp | 2026-02-03 17:07 | 1.7K | ||
| group_norm.comp | 2026-02-03 17:07 | 1.7K | ||
| soft_max_large3.comp | 2026-02-03 17:07 | 1.7K | ||
| pool2d.comp | 2026-02-03 17:07 | 1.7K | ||
| rms_norm_back.comp | 2026-02-03 17:07 | 1.8K | ||
| dequant_iq2_xs.comp | 2026-02-03 17:07 | 1.8K | ||
| cumsum_multipass2.comp | 2026-02-03 17:07 | 1.9K | ||
| dequant_iq2_s.comp | 2026-02-03 17:07 | 1.9K | ||
| cumsum_multipass1.comp | 2026-02-03 17:07 | 1.9K | ||
| dequant_iq2_xxs.comp | 2026-02-03 17:07 | 2.0K | ||
| add.comp | 2026-02-03 17:07 | 2.0K | ||
| dequant_iq3_xxs.comp | 2026-02-03 17:07 | 2.1K | ||
| soft_max_large2.comp | 2026-02-03 17:07 | 2.1K | ||
| mul_mm_id_funcs.glsl | 2026-02-03 17:07 | 2.1K | ||
| rms_norm_partials.comp | 2026-02-03 17:07 | 2.2K | ||
| generic_binary_head.glsl | 2026-02-03 17:07 | 2.2K | ||
| copy_transpose.comp | 2026-02-03 17:07 | 2.2K | ||
| pad.comp | 2026-02-03 17:07 | 2.4K | ||
| argsort.comp | 2026-02-03 17:07 | 2.5K | ||
| solve_tri.comp | 2026-02-03 17:07 | 2.6K | ||
| dequant_q4_k.comp | 2026-02-03 17:07 | 2.6K | ||
| wkv6.comp | 2026-02-03 17:07 | 2.7K | ||
| cumsum.comp | 2026-02-03 17:07 | 2.8K | ||
| wkv7.comp | 2026-02-03 17:07 | 2.9K | ||
| im2col.comp | 2026-02-03 17:07 | 3.0K | ||
| conv_transpose_1d.comp | 2026-02-03 17:07 | 3.0K | ||
| dequant_q5_k.comp | 2026-02-03 17:07 | 3.1K | ||
| quantize_q8_1.comp | 2026-02-03 17:07 | 3.1K | ||
| conv2d_dw.comp | 2026-02-03 17:07 | 3.1K | ||
| generic_unary_head.glsl | 2026-02-03 17:07 | 3.3K | ||
| flash_attn_split_k_reduce.comp | 2026-02-03 17:07 | 3.3K | ||
| im2col_3d.comp | 2026-02-03 17:07 | 3.6K | ||
| mul_mat_vec_nc.comp | 2026-02-03 17:07 | 3.6K | ||
| mul_mat_vec_iq1_s.comp | 2026-02-03 17:07 | 3.6K | ||
| mul_mat_vec_iq2_xxs.comp | 2026-02-03 17:07 | 3.7K | ||
| mul_mat_vec_iq3_xxs.comp | 2026-02-03 17:07 | 3.8K | ||
| mul_mat_vec_iq3_s.comp | 2026-02-03 17:07 | 3.8K | ||
| mul_mat_vec_iq2_s.comp | 2026-02-03 17:07 | 3.8K | ||
| argsort_large.comp | 2026-02-03 17:07 | 3.9K | ||
| ssm_scan.comp | 2026-02-03 17:07 | 3.9K | ||
| topk_argsort.comp | 2026-02-03 17:07 | 4.0K | ||
| mul_mat_vec_p021.comp | 2026-02-03 17:07 | 4.5K | ||
| mul_mat_vec_iq2_xs.comp | 2026-02-03 17:07 | 4.5K | ||
| rms_norm.comp | 2026-02-03 17:07 | 4.8K | ||
| mul_mat_vecq.comp | 2026-02-03 17:07 | 4.9K | ||
| mul_mat_vec_iq1_m.comp | 2026-02-03 17:07 | 5.1K | ||
| soft_max.comp | 2026-02-03 17:07 | 5.2K | ||
| mul_mat_vec.comp | 2026-02-03 17:07 | 5.3K | ||
| mul_mat_vec_q6_k.comp | 2026-02-03 17:07 | 5.6K | ||
| upscale.comp | 2026-02-03 17:07 | 5.9K | ||
| mul_mat_vec_q2_k.comp | 2026-02-03 17:07 | 6.2K | ||
| mul_mat_vec_q4_k.comp | 2026-02-03 17:07 | 6.4K | ||
| mul_mat_vec_q3_k.comp | 2026-02-03 17:07 | 6.4K | ||
| topk_moe.comp | 2026-02-03 17:07 | 6.7K | ||
| multi_add.comp | 2026-02-03 17:07 | 7.2K | ||
| flash_attn_base.glsl | 2026-02-03 17:07 | 7.4K | ||
| rope_funcs.glsl | 2026-02-03 17:07 | 7.6K | ||
| mul_mat_vec_q5_k.comp | 2026-02-03 17:07 | 7.7K | ||
| copy_to_quant.comp | 2026-02-03 17:07 | 7.8K | ||
| mul_mat_vec_base.glsl | 2026-02-03 17:07 | 8.0K | ||
| topk_nary_search.comp | 2026-02-03 17:07 | 8.9K | ||
| mul_mmq.comp | 2026-02-03 17:07 | 9.2K | ||
| conv2d_mm.comp | 2026-02-03 17:07 | 12K | ||
| flash_attn.comp | 2026-02-03 17:07 | 14K | ||
| flash_attn_cm2.comp | 2026-02-03 17:07 | 14K | ||
| mul_mm.comp | 2026-02-03 17:07 | 17K | ||
| mul_mmq_funcs.glsl | 2026-02-03 17:07 | 17K | ||
| mul_mat_vecq_funcs.glsl | 2026-02-03 17:07 | 21K | ||
| flash_attn_cm1.comp | 2026-02-03 17:07 | 24K | ||
| dequant_funcs_cm2.glsl | 2026-02-03 17:07 | 24K | ||
| dequant_funcs.glsl | 2026-02-03 17:07 | 24K | ||
| mul_mm_cm2.comp | 2026-02-03 17:07 | 25K | ||
| mul_mm_funcs.glsl | 2026-02-03 17:07 | 30K | ||
| vulkan-shaders-gen.cpp | 2026-02-03 17:07 | 63K | ||
| types.glsl | 2026-02-03 17:07 | 120K | ||