diff --git a/cinn/auto_schedule/search_space/auto_gen_rule/CMakeLists.txt b/cinn/auto_schedule/search_space/auto_gen_rule/CMakeLists.txt index 5105ed66dc..510d445adf 100644 --- a/cinn/auto_schedule/search_space/auto_gen_rule/CMakeLists.txt +++ b/cinn/auto_schedule/search_space/auto_gen_rule/CMakeLists.txt @@ -21,4 +21,4 @@ endif() cc_test(test_auto_inline SRCS auto_inline_test.cc DEPS cinncore auto_gen_rule_test_helper) cc_test(test_skip_rule SRCS skip_rule_test.cc DEPS cinncore) -cc_test(test_auto_unroll SRCS auto_unroll_test.cc DEPS cinncore) +cc_test(test_auto_unroll SRCS auto_unroll_test.cc DEPS cinncore auto_gen_rule_test_helper test_program_builder) diff --git a/cinn/auto_schedule/search_space/auto_gen_rule/auto_unroll_test.cc b/cinn/auto_schedule/search_space/auto_gen_rule/auto_unroll_test.cc index 99688a2da6..a671c8e0d1 100644 --- a/cinn/auto_schedule/search_space/auto_gen_rule/auto_unroll_test.cc +++ b/cinn/auto_schedule/search_space/auto_gen_rule/auto_unroll_test.cc @@ -17,8 +17,11 @@ #include #include +#include "cinn/auto_schedule/search_space/auto_gen_rule/test_helper.h" #include "cinn/cinn.h" #include "cinn/lang/lower.h" +#include "tests/concrete_program_builder.h" +#include "tests/program_builder.h" namespace cinn { namespace auto_schedule { @@ -103,5 +106,94 @@ TEST(AutoUnroll, UnrollableApply) { test_func(&states[0]->ir_schedule); } +#ifdef CINN_WITH_CUDA +class TestAutoUnroll : public TestAutoGenRuleBase { + public: + std::vector default_input_names = {"X", "Y"}; + std::vector default_output_names = {"temp_matmul_out"}; +}; + +/* Applies AutoUnroll to a 4x4 matmul and checks the attribute set on its output block. Before AutoUnroll: + * for (i=0; i < 4; i++): + * for(j=0; j < 4; j++): + * for(k=0; k < 4; k++): + * C(i, j) = C(i, j) + A(i, k) * B(k, j) + * + * After AutoUnroll on 'k', the third loop is unrolled. 
+ * for(i=0; i < 4; i++): + * for(j=0; j < 4; j++): + * C(i, j) = C(i, j) + A(i, 0) * B(0, j) + * C(i, j) = C(i, j) + A(i, 1) * B(1, j) + * C(i, j) = C(i, j) + A(i, 2) * B(2, j) + * C(i, j) = C(i, j) + A(i, 3) * B(3, j) + */ +TEST_F(TestAutoUnroll, ApplyOnMatmulWithUnroll) { + frontend::Program matmul_op = tests::OpBuilder("matmul").Build({{"X", {4, 4}}, {"Y", {4, 4}}}); + Initialize(common::DefaultNVGPUTarget()); + ir::IRSchedule ir_schedule = MakeIRSchedule(matmul_op); + std::vector func_bodys = ir_schedule.GetModule().GetExprs(); + ASSERT_EQ(func_bodys.size(), 1UL); + VLOG(6) << "Original Expr:\n" << func_bodys[0]; + + // Apply the AutoUnroll rule on the matmul output block; stop here if the rule reports it is not applicable + AutoUnroll auto_unroll(target_); + SearchState state(ir_schedule, 0, {}); + const std::string& applied_block_name = default_output_names.back(); + ASSERT_EQ(auto_unroll.AnalyseApplyType(state, applied_block_name), RuleApplyType::kApplyAndPruneOtherRules); + auto new_states = auto_unroll.ApplyOnBlock(state, applied_block_name); + std::vector exprs = new_states[0]->ir_schedule.GetModule().GetExprs(); + ASSERT_EQ(exprs.size(), 1UL); + + // Check if the block has an 'auto_unroll_max_step' attribute; fatal assertions guard the lookup and the pointer dereference below + auto* applied_block_realize = exprs.front().As()->stmts.front().As(); + auto* applied_schedule_block = applied_block_realize->schedule_block.As(); + ASSERT_FALSE(applied_schedule_block->attrs.empty()); + ASSERT_EQ(applied_schedule_block->attrs.count(ir::attr::auto_unroll_max_step), 1UL); + const auto& attr_value = applied_schedule_block->attrs.at(ir::attr::auto_unroll_max_step); + const int* max_step = absl::get_if(&attr_value); + ASSERT_NE(max_step, nullptr); + EXPECT_LE(*max_step, 128); + VLOG(6) << "Expr after AutoUnroll applied on block:max_step=" << *max_step << ", Ast:\n" << exprs.front(); + + // build ir::Module and debug source code + auto build_module = BuildIRModule(new_states[0]->ir_schedule); + auto source_code = GenSourceCode(build_module); + VLOG(6) << " auto-schedule source 
code:\n" << source_code; + // execute and check precision + CheckResult(GenExecutableKernel(build_module), + GenExecutableKernel(BuildIRModule(MakeIRSchedule(matmul_op, -1, true))), + default_input_names, + default_output_names, + {{4, 4}, {4, 4}}, + {{4, 4}}, + target_); +} + +/* Operators of type elementwise or injective cannot be auto-unrolled: every output block must be reported as kCannotApply. */ +TEST_F(TestAutoUnroll, PureSpatial) { + Target target = common::DefaultNVGPUTarget(); + Initialize(target); + std::vector input_names = {"x", "y"}; + std::vector output_names = { + "var_6", "var_4", "constant_idx_last", "constant_idx_first", "var_2", "var_5"}; + std::vector input_shape{256, 256}; + std::vector inputs_varinfo({{"x", input_shape}, {"y", input_shape}}); + + // Construct the computation graph and convert it to ir::Expr + Context::Global().ResetNameId(); + ir::IRSchedule ir_schedule = MakeIRSchedule(tests::GatherAddSubBuilder().Build(inputs_varinfo)); + SearchState state(ir_schedule, 0, {}); + std::vector func_bodys = ir_schedule.GetModule().GetExprs(); + ASSERT_EQ(func_bodys.size(), 1UL); + VLOG(6) << "Original Expr:\n" << func_bodys[0]; + + // Analyzes whether the block can be unrolled + AutoUnroll auto_unroll(target_); + for (const auto& applied_block_name : output_names) { + EXPECT_EQ(auto_unroll.AnalyseApplyType(state, applied_block_name), RuleApplyType::kCannotApply); + } +} +#endif + } // namespace auto_schedule } // namespace cinn