[CODEGEN] Fixed performance regression on vectorized loads (#259)

2021-09-02 01:07:31 -07:00
parent 768e0ded28
commit 8a882b215f
1 changed file with 6 additions and 3 deletions
--- a/lib/codegen/selection/generator.cc
+++ b/lib/codegen/selection/generator.cc
@@ -586,11 +586,14 @@ void generator::visit_load_inst(ir::load_inst* x){
  Type* ty  = cvt(op->get_type()->get_scalar_ty()->get_pointer_element_ty());
  // compute vector width
  size_t vec = 1;
-  if(op->get_type()->is_block_ty() && op->get_type()->get_tile_rank() > 1){
+  if(op->get_type()->is_block_ty()){
    auto   ord = ords_.at(op);
    size_t aln = alignment_->get(op, ord[0]);
-    size_t nts = layouts_->get(x)->to_scanline()->nts(ord[0]);
-    vec = std::min(nts, aln);
+    auto layout = layouts_->get(x)->to_scanline();
+    if(layout){
+      size_t nts = layout->nts(ord[0]);
+      vec = std::min(nts, aln);
+    }
  }
  // code generation
  auto idxs = idxs_.at(x);