diff --git a/example/ck_tile/15_fused_moe/instances/fused_moegemm_api_internal.hpp b/example/ck_tile/15_fused_moe/instances/fused_moegemm_api_internal.hpp index 92d7cbfec1..fa21716344 100644 --- a/example/ck_tile/15_fused_moe/instances/fused_moegemm_api_internal.hpp +++ b/example/ck_tile/15_fused_moe/instances/fused_moegemm_api_internal.hpp @@ -16,11 +16,11 @@ float fused_moegemm_(const ck_tile::stream_config& s, fused_moegemm_args a) { using f_traits = ck_tile::FusedMoeGemmTraits; using f_shape = ck_tile::FusedMoeGemmShape; + typename Ts_::WarpPerBlock_0, + typename Ts_::WarpTile_0, + typename Ts_::BlockTile_1, + typename Ts_::WarpPerBlock_0, + typename Ts_::WarpTile_0>; using f_problem = ck_tile::FusedMoeGemmPipelineProblem(kargs.o_ptr); auto o_view_ = make_naive_tensor_view( + memory_operation_enum::atomic_add>( o_ptr, make_tuple(kargs.num_tokens, kargs.hidden_size), make_tuple(kargs.stride_token, 1),