File tree Expand file tree Collapse file tree 23 files changed +72
-24
lines changed Expand file tree Collapse file tree 23 files changed +72
-24
lines changed Original file line number Diff line number Diff line change 16
16
#include " ck_tile/host/host_tensor.hpp"
17
17
#include " ck_tile/host/joinable_thread.hpp"
18
18
#include " ck_tile/host/kernel_launch.hpp"
19
+ #include " ck_tile/host/permute_pk_int4.hpp"
19
20
#include " ck_tile/host/ranges.hpp"
20
21
#include " ck_tile/host/reference/reference_batched_dropout.hpp"
21
22
#include " ck_tile/host/reference/reference_batched_dropout_randval.hpp"
Original file line number Diff line number Diff line change 9
9
#include " ck_tile/ops/add_rmsnorm2d_rdquant/pipeline/add_rmsnorm2d_rdquant_fwd_pipeline_problem.hpp"
10
10
#include " ck_tile/ops/add_rmsnorm2d_rdquant/pipeline/add_rmsnorm2d_rdquant_fwd_pipeline_three_pass.hpp"
11
11
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
12
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
13
+ #include " ck_tile/ops/common/streamk_common.hpp"
12
14
#include " ck_tile/ops/common/tensor_layout.hpp"
13
15
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 12
12
#include " ck_tile/ops/batched_transpose/pipeline/batched_transpose_policy.hpp"
13
13
#include " ck_tile/ops/batched_transpose/pipeline/batched_transpose_problem.hpp"
14
14
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
15
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
16
+ #include " ck_tile/ops/common/streamk_common.hpp"
15
17
#include " ck_tile/ops/common/tensor_layout.hpp"
16
18
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 4
4
#pragma once
5
5
6
6
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
7
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
8
+ #include " ck_tile/ops/common/streamk_common.hpp"
7
9
#include " ck_tile/ops/common/tensor_layout.hpp"
8
10
#include " ck_tile/ops/common/utils.hpp"
9
- #include " ck_tile/ops/common/streamk_common.hpp"
Original file line number Diff line number Diff line change 10
10
#include " ck_tile/ops/elementwise/pipeline/elementwise_shape.hpp"
11
11
#include " ck_tile/ops/elementwise/unary_element_wise_operation.hpp"
12
12
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
13
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
14
+ #include " ck_tile/ops/common/streamk_common.hpp"
13
15
#include " ck_tile/ops/common/tensor_layout.hpp"
14
16
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 8
8
#include " ck_tile/ops/epilogue/default_2d_epilogue.hpp"
9
9
#include " ck_tile/ops/epilogue/dynamic_quant_epilogue.hpp"
10
10
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
11
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
12
+ #include " ck_tile/ops/common/streamk_common.hpp"
11
13
#include " ck_tile/ops/common/tensor_layout.hpp"
12
14
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 14
14
#include " ck_tile/ops/flatmm/pipeline/flatmm_pipeline_agmem_bgmem_creg_v1_policy.hpp"
15
15
#include " ck_tile/ops/flatmm/pipeline/tile_flatmm_shape.hpp"
16
16
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
17
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
18
+ #include " ck_tile/ops/common/streamk_common.hpp"
17
19
#include " ck_tile/ops/common/tensor_layout.hpp"
18
20
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 60
60
#include " ck_tile/ops/fmha/pipeline/tile_fmha_shape.hpp"
61
61
#include " ck_tile/ops/fmha/pipeline/tile_fmha_traits.hpp"
62
62
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
63
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
64
+ #include " ck_tile/ops/common/streamk_common.hpp"
63
65
#include " ck_tile/ops/common/tensor_layout.hpp"
64
66
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 16
16
#include " ck_tile/ops/fused_moe/pipeline/moe_sorting_pipeline.hpp"
17
17
#include " ck_tile/ops/fused_moe/pipeline/moe_sorting_policy.hpp"
18
18
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
19
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
20
+ #include " ck_tile/ops/common/streamk_common.hpp"
19
21
#include " ck_tile/ops/common/tensor_layout.hpp"
20
22
#include " ck_tile/ops/common/utils.hpp"
Original file line number Diff line number Diff line change 30
30
#include " ck_tile/ops/gemm/block/block_wp_asmem_bsmem_creg_v1_custom_policy.hpp"
31
31
#include " ck_tile/ops/gemm/kernel/batched_gemm_kernel.hpp"
32
32
#include " ck_tile/ops/gemm/kernel/gemm_kernel.hpp"
33
- #include " ck_tile/ops/gemm/kernel/gemm_multi_d_kernel.hpp"
34
33
#include " ck_tile/ops/gemm/kernel/gemm_multi_abd_kernel.hpp"
34
+ #include " ck_tile/ops/gemm/kernel/gemm_multi_d_kernel.hpp"
35
35
#include " ck_tile/ops/gemm/kernel/gemm_tile_partitioner.hpp"
36
36
#include " ck_tile/ops/gemm/kernel/grouped_gemm_kernel.hpp"
37
37
#include " ck_tile/ops/gemm/kernel/streamk_gemm_kernel.hpp"
70
70
#include " ck_tile/ops/gemm/warp/warp_gemm_smfmac_impl.hpp"
71
71
#include " ck_tile/ops/gemm/warp/warp_wmma_gemm.hpp"
72
72
#include " ck_tile/ops/common/generic_2d_block_shape.hpp"
73
+ #include " ck_tile/ops/common/load_interleaved_pk_type.hpp"
74
+ #include " ck_tile/ops/common/streamk_common.hpp"
73
75
#include " ck_tile/ops/common/tensor_layout.hpp"
74
76
#include " ck_tile/ops/common/utils.hpp"
You can’t perform that action at this time.
0 commit comments