From e0628129692a9ac29267c75ac47c7f0e83c7670a Mon Sep 17 00:00:00 2001
From: Philippe Tillet
Date: Fri, 17 Dec 2021 12:44:47 -0800
Subject: [PATCH] [CODEGEN] Disabled peephole for masked load + select -- masked_load doesn't work as expected when vectorized

---
 lib/codegen/transform/peephole.cc | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/lib/codegen/transform/peephole.cc b/lib/codegen/transform/peephole.cc
index ac0220ebc..f7ebdad80 100644
--- a/lib/codegen/transform/peephole.cc
+++ b/lib/codegen/transform/peephole.cc
@@ -284,7 +284,8 @@ void peephole::run(ir::module &mod) {
  // was_modified = was_modified || rewrite_trans_phi(i, builder);
  was_modified = was_modified || rewrite_unit_red(i, builder);
  was_modified = was_modified || rewrite_gep_ptr_min_off_plus_off(i, builder);
- was_modified = was_modified || rewrite_select_masked_load(i, builder);
+ // TODO: DOESN'T WORK FOR VECTORIZED MASKED LOAD
+// was_modified = was_modified || rewrite_select_masked_load(i, builder);
  was_modified = was_modified || rewrite_cvt_layout(i, builder);
  if(tgt_->as_nvidia() && tgt_->as_nvidia()->sm() >= 80)
  was_modified = was_modified || rewrite_load_to_shared(i, builder);