diff --git a/src/s_tir/meta_schedule/schedule_rule/schedule_rule.cc b/src/s_tir/meta_schedule/schedule_rule/schedule_rule.cc index aa280b2e5b91..04a9a99eba5d 100644 --- a/src/s_tir/meta_schedule/schedule_rule/schedule_rule.cc +++ b/src/s_tir/meta_schedule/schedule_rule/schedule_rule.cc @@ -166,7 +166,7 @@ ffi::Array ScheduleRule::DefaultCUDA() { ScheduleRule::ParallelizeVectorizeUnroll( /*max_jobs_per_core=*/-1, /*max_vectorize_extent=*/-1, - /*unroll_max_steps=*/ffi::Array{0, 16, 64, 512, 1024}, + /*unroll_max_steps=*/ffi::Array{0, 16, 32, 64, 128, 256, 512, 1024}, /*unroll_explicit=*/true), ScheduleRule::AutoBind( /*max_threadblocks=*/256,