| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | #include <algorithm>
 | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  | #include <iostream>
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | #include "triton/ir/module.h"
 | 
					
						
							|  |  |  | #include "triton/ir/function.h"
 | 
					
						
							|  |  |  | #include "triton/codegen/transform/peephole.h"
 | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  | #include "triton/codegen/analysis/layout.h"
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  | namespace triton { | 
					
						
							|  |  |  | namespace codegen{ | 
					
						
							|  |  |  | namespace transform{ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ir::value* rewrite_trans_phi_impl(ir::value *value, ir::builder &builder, | 
					
						
							|  |  |  |                                  const std::vector<int>& perm) { | 
					
						
							|  |  |  |   if(auto phi = dynamic_cast<ir::phi_node*>(value)) { | 
					
						
							|  |  |  |     // transpose operands
 | 
					
						
							|  |  |  |     std::vector<ir::value*> incs; | 
					
						
							|  |  |  |     for(unsigned n = 0; n < phi->get_num_incoming(); n++) | 
					
						
							|  |  |  |       incs.push_back(rewrite_trans_phi_impl(phi->get_incoming_value(n), builder, perm)); | 
					
						
							|  |  |  |     // create phi for transposed values
 | 
					
						
							|  |  |  |     builder.set_insert_point(phi); | 
					
						
							|  |  |  |     ir::phi_node* result = builder.create_phi(incs[0]->get_type(), incs.size()); | 
					
						
							|  |  |  |     for(unsigned n = 0; n < phi->get_num_incoming(); n++) | 
					
						
							|  |  |  |       result->add_incoming(incs[n], phi->get_incoming_block(n)); | 
					
						
							|  |  |  |     return result; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   else if(auto i = dynamic_cast<ir::instruction*>(value)){ | 
					
						
							|  |  |  |     ir::basic_block* block = i->get_parent(); | 
					
						
							|  |  |  |     auto it = std::find(block->begin(), block->end(), i); | 
					
						
							|  |  |  |     it++; | 
					
						
							|  |  |  |     builder.set_insert_point(it); | 
					
						
							|  |  |  |     ir::instruction *trans = (ir::instruction*)builder.create_trans(i, perm); | 
					
						
							|  |  |  |     trans->set_operand(0, i); | 
					
						
							|  |  |  |     return trans; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   return nullptr; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool peephole::rewrite_trans_phi(ir::instruction* value, ir::builder& builder) { | 
					
						
							|  |  |  |   auto trans = dynamic_cast<ir::trans_inst*>(value); | 
					
						
							|  |  |  |   if(!trans) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   auto users = trans->get_users(); | 
					
						
							|  |  |  |   auto ops = trans->ops(); | 
					
						
							|  |  |  |   if(users.size() > 1 || ops.size() > 1) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   ir::value* op = *ops.begin(); | 
					
						
							|  |  |  |   // trans(phi) -> phi(trans(), trans()...)
 | 
					
						
							|  |  |  |   auto* phi = dynamic_cast<ir::phi_node*>(op); | 
					
						
							|  |  |  |   if(!phi) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   ir::value* new_phi = rewrite_trans_phi_impl(phi, builder, trans->get_perm()); | 
					
						
							|  |  |  |   if(!new_phi) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   trans->replace_all_uses_with(new_phi); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   return true; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool peephole::rewrite_dot(ir::instruction *value, ir::builder& builder){ | 
					
						
							| 
									
										
										
										
											2021-04-20 22:29:40 -04:00
										 |  |  |   // dot(a, b, c) + d -> dot(a, b, c + d)
 | 
					
						
							|  |  |  |   // d + dot(a, b, c) -> dot(a, b, c + d)
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |   auto add = dynamic_cast<ir::binary_operator*>(value); | 
					
						
							| 
									
										
										
										
											2022-01-28 01:12:44 +08:00
										 |  |  |   if(add && (add->get_op() == ir::binary_op_t::FAdd || add->get_op() == ir::binary_op_t::Add)) { | 
					
						
							|  |  |  |     bool is_int_dot = add->get_op() == ir::binary_op_t::Add; | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |     ir::value *lhs = add->get_operand(0); | 
					
						
							|  |  |  |     ir::value *rhs = add->get_operand(1); | 
					
						
							|  |  |  |     ir::dot_inst *lhs_dot = dynamic_cast<ir::dot_inst*>(lhs); | 
					
						
							|  |  |  |     ir::dot_inst *rhs_dot = dynamic_cast<ir::dot_inst*>(rhs); | 
					
						
							|  |  |  |     if(!lhs_dot && !rhs_dot) | 
					
						
							|  |  |  |       return false; | 
					
						
							|  |  |  |     ir::dot_inst *dot = lhs_dot ? lhs_dot : rhs_dot; | 
					
						
							|  |  |  |     ir::value *other = (dot == lhs) ? rhs : lhs; | 
					
						
							|  |  |  |     ir::value *acc = dot->get_operand(2); | 
					
						
							|  |  |  |     ir::splat_inst *splat = dynamic_cast<ir::splat_inst*>(acc); | 
					
						
							| 
									
										
										
										
											2022-01-28 01:12:44 +08:00
										 |  |  |     ir::constant *_0 = nullptr; | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |     if(splat) | 
					
						
							| 
									
										
										
										
											2022-01-28 01:12:44 +08:00
										 |  |  |       _0 = dynamic_cast<ir::constant*>(splat->get_operand(0)); | 
					
						
							|  |  |  |     if(!_0) | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |       return false; | 
					
						
							| 
									
										
										
										
											2022-01-28 01:12:44 +08:00
										 |  |  |     if (auto *fp_0 = dynamic_cast<ir::constant_fp*>(_0)) | 
					
						
							|  |  |  |       if (fp_0->get_value() != 0.0) | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     if (auto *int_0 = dynamic_cast<ir::constant_int*>(_0)) | 
					
						
							|  |  |  |       if (int_0->get_value() != 0) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |     ir::value *a = dot->get_operand(0); | 
					
						
							|  |  |  |     ir::value *b = dot->get_operand(1); | 
					
						
							|  |  |  |     builder.set_insert_point(add); | 
					
						
							| 
									
										
										
										
											2022-01-12 02:20:31 +08:00
										 |  |  |     ir::value * new_dot = builder.insert(ir::dot_inst::create_nn(a, b, other, dot->allow_tf32(), dot->get_name())); | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |     add->replace_all_uses_with(new_dot); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							| 
									
										
										
										
											2020-05-11 11:07:21 -04:00
										 |  |  |   return false; | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-05-11 00:26:03 -04:00
										 |  |  | //bool peephole::rewrite_cts_cfs(ir::instruction *value, ir::builder &builder){
 | 
					
						
							|  |  |  | //  auto cfs = dynamic_cast<ir::copy_from_shared_inst*>(value);
 | 
					
						
							|  |  |  | //  if(cfs) {
 | 
					
						
							|  |  |  | //    ir::value *arg = cfs->get_operand(0);
 | 
					
						
							|  |  |  | //    ir::copy_to_shared_inst* cts = dynamic_cast<ir::copy_to_shared_inst*>(arg);
 | 
					
						
							|  |  |  | //    if(!cts)
 | 
					
						
							|  |  |  | //      return false;
 | 
					
						
							|  |  |  | //    cfs->replace_all_uses_with(cts->get_operand(0));
 | 
					
						
							|  |  |  | //    return true;
 | 
					
						
							|  |  |  | //  }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | //}
 | 
					
						
							| 
									
										
										
										
											2020-03-31 18:55:31 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-11 19:20:34 -05:00
										 |  |  | bool peephole::rewrite_load_to_shared(ir::instruction *value, ir::builder& builder){ | 
					
						
							|  |  |  |   auto copy_to_shared = dynamic_cast<ir::copy_to_shared_inst*>(value); | 
					
						
							|  |  |  |   if(!copy_to_shared) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   ir::value *arg = copy_to_shared->get_operand(0); | 
					
						
							|  |  |  |   ir::masked_load_inst* ld = dynamic_cast<ir::masked_load_inst*>(arg); | 
					
						
							|  |  |  |   if(!ld) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   builder.set_insert_point(copy_to_shared); | 
					
						
							|  |  |  |   ir::value *ptr = ld->get_pointer_operand(); | 
					
						
							|  |  |  |   ir::value *msk = ld->get_mask_operand(); | 
					
						
							|  |  |  |   ir::value *val = ld->get_false_value_operand(); | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  |   analysis::scanline_layout* layout = layouts_->get(ptr)->to_scanline(); | 
					
						
							|  |  |  |   int nts = layout->nts(layout->get_order()[0]); | 
					
						
							|  |  |  |   int dtsize = value->get_type()->get_scalar_ty()->get_primitive_size_in_bits() / 8; | 
					
						
							|  |  |  |   if(nts*dtsize >= 4){ | 
					
						
							| 
									
										
										
										
											2021-10-18 13:14:04 +08:00
										 |  |  |     ir::value* new_load = builder.create_masked_load_async(ptr, msk, val, ld->get_cache_modifier()); | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  |     copy_to_shared->replace_all_uses_with(new_load); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   return false; | 
					
						
							|  |  |  | //  analysis::scanline_layout* layout = layouts_->get(ptr)->to_scanline();
 | 
					
						
							|  |  |  | //  std::cout << layout->nts(layout->get_order(0)) << std::endl;
 | 
					
						
							|  |  |  | //  return true;
 | 
					
						
							| 
									
										
										
										
											2021-01-11 19:20:34 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | bool peephole::rewrite_unit_red(ir::instruction *value, ir::builder& builder){ | 
					
						
							|  |  |  |   auto x = dynamic_cast<ir::reduce_inst*>(value); | 
					
						
							|  |  |  |   if(!x) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   ir::value *arg = x->get_operand(0); | 
					
						
							| 
									
										
										
										
											2021-04-20 22:29:40 -04:00
										 |  |  |   auto shapes = arg->get_type()->get_block_shapes(); | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |   if(shapes[x->get_axis()] == 1){ | 
					
						
							|  |  |  |     builder.set_insert_point(x); | 
					
						
							| 
									
										
										
										
											2021-04-20 22:29:40 -04:00
										 |  |  |     ir::value* new_red = builder.create_reshape(arg, x->get_type()->get_block_shapes()); | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |     x->replace_all_uses_with(new_red); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   return false; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool peephole::rewrite_mult(ir::instruction *value, ir::builder& builder) { | 
					
						
							|  |  |  |     auto binop = dynamic_cast<ir::binary_operator*>(value); | 
					
						
							|  |  |  |     if(binop && binop->get_op() == ir::binary_op_t::Mul) { | 
					
						
							|  |  |  |       ir::value *lhs = binop->get_operand(0); | 
					
						
							|  |  |  |       ir::value *rhs = binop->get_operand(1); | 
					
						
							|  |  |  |       ir::constant_int *_1_lhs = nullptr; | 
					
						
							| 
									
										
										
										
											2020-02-18 23:04:46 -05:00
										 |  |  |       if(ir::splat_inst *splat = dynamic_cast<ir::splat_inst*>(lhs)){ | 
					
						
							|  |  |  |         auto *cst = dynamic_cast<ir::constant_int*>(splat->get_operand(0)); | 
					
						
							|  |  |  |         if(cst && cst->get_value() == 1) | 
					
						
							|  |  |  |           _1_lhs = cst; | 
					
						
							|  |  |  |       } | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |       ir::constant_int *_1_rhs = nullptr; | 
					
						
							| 
									
										
										
										
											2020-02-18 23:04:46 -05:00
										 |  |  |       if(ir::splat_inst *splat = dynamic_cast<ir::splat_inst*>(rhs)){ | 
					
						
							|  |  |  |         auto *cst = dynamic_cast<ir::constant_int*>(splat->get_operand(0)); | 
					
						
							|  |  |  |         if(cst && cst->get_value() == 1) | 
					
						
							|  |  |  |           _1_rhs = cst; | 
					
						
							|  |  |  |       } | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |       if(_1_lhs){ | 
					
						
							|  |  |  |         binop->replace_all_uses_with(rhs); | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |       else if(_1_rhs){ | 
					
						
							|  |  |  |         binop->replace_all_uses_with(lhs); | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool peephole::rewrite_gep_ptr_min_off_plus_off(ir::instruction *value, ir::builder& builder) { | 
					
						
							|  |  |  |   auto x = dynamic_cast<ir::getelementptr_inst*>(value); | 
					
						
							|  |  |  |   if(!x) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   auto y = dynamic_cast<ir::getelementptr_inst*>(x->get_pointer_operand()); | 
					
						
							|  |  |  |   if(!y) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   auto idx = *y->idx_begin(); | 
					
						
							|  |  |  |   auto z = dynamic_cast<ir::binary_operator*>(idx); | 
					
						
							|  |  |  |   if(!z) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   bool is_sub = z->get_op() == ir::binary_op_t::Sub; | 
					
						
							|  |  |  |   auto *lhs = dynamic_cast<ir::constant_int*>(z->get_operand(0)); | 
					
						
							|  |  |  |   bool is_lhs_0 = lhs && (lhs->get_value()==0); | 
					
						
							|  |  |  |   bool is_rhs_eq_x_rhs = z->get_operand(1) == *x->idx_begin(); | 
					
						
							|  |  |  |   if(is_sub && is_lhs_0 && is_rhs_eq_x_rhs){ | 
					
						
							|  |  |  |     x->replace_all_uses_with(y->get_pointer_operand()); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   return false; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-03-07 14:53:48 -05:00
										 |  |  | bool peephole::rewrite_select_masked_load(ir::instruction *value, ir::builder& builder){ | 
					
						
							|  |  |  |   auto select = dynamic_cast<ir::select_inst*>(value); | 
					
						
							|  |  |  |   if(!select) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   auto if_value = dynamic_cast<ir::masked_load_inst*>(select->get_if_value_op()); | 
					
						
							|  |  |  |   if(!if_value) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   if(select->get_pred_op() != if_value->get_mask_operand()) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   builder.set_insert_point(select); | 
					
						
							|  |  |  |   ir::value* new_load = builder.create_masked_load(if_value->get_pointer_operand(), | 
					
						
							|  |  |  |                                                    if_value->get_mask_operand(), | 
					
						
							| 
									
										
										
										
											2021-10-18 13:14:04 +08:00
										 |  |  |                                                    select->get_else_value_op(), | 
					
						
							| 
									
										
										
										
											2021-12-30 22:33:24 -08:00
										 |  |  |                                                    if_value->get_cache_modifier(), | 
					
						
							|  |  |  |                                                    if_value->get_is_volatile()); | 
					
						
							| 
									
										
										
										
											2021-03-07 14:53:48 -05:00
										 |  |  |   select->replace_all_uses_with(new_load); | 
					
						
							|  |  |  |   return true; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-08-30 11:50:35 -07:00
										 |  |  | bool peephole::rewrite_cvt_layout(ir::instruction *value, ir::builder& builder){ | 
					
						
							|  |  |  |   auto cvt = dynamic_cast<ir::cvt_layout_inst*>(value); | 
					
						
							|  |  |  |   if(!cvt) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   ir::instruction* op = dynamic_cast<ir::instruction*>(cvt->get_operand(0)); | 
					
						
							|  |  |  |   if(!op) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   // convert(elementwise(x, y)) = elementwise(convert(x), convert(y))
 | 
					
						
							|  |  |  |   if(op->get_id() == ir::INST_BINOP){ | 
					
						
							|  |  |  |     for(size_t i = 0; i < op->get_num_operands(); i++){ | 
					
						
							|  |  |  |       ir::value* arg_i = op->get_operand(i); | 
					
						
							|  |  |  |       builder.set_insert_point(op); | 
					
						
							|  |  |  |       // create new layout transform
 | 
					
						
							|  |  |  |       ir::instruction* new_arg_i = cvt->clone(); | 
					
						
							|  |  |  |       layouts_->copy(new_arg_i, op); | 
					
						
							|  |  |  |       builder.insert(new_arg_i); | 
					
						
							|  |  |  |       // set the right args
 | 
					
						
							|  |  |  |       new_arg_i->replace_uses_of_with(new_arg_i->get_operand(0), arg_i); | 
					
						
							|  |  |  |       op->replace_uses_of_with(arg_i, new_arg_i); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     cvt->replace_all_uses_with(op); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   auto cvt_op = dynamic_cast<ir::cvt_layout_inst*>(op); | 
					
						
							|  |  |  |   if(!cvt_op) | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  |   // convert1(convert2(x)) if convert1 is the inverse of convert2
 | 
					
						
							|  |  |  |   ir::value* op_op = cvt_op->get_operand(0); | 
					
						
							|  |  |  |   if(layouts_->has(cvt) && layouts_->has(op_op) && | 
					
						
							|  |  |  |      layouts_->get(cvt) && layouts_->get(op_op)){ | 
					
						
							|  |  |  |     cvt->replace_all_uses_with(op_op); | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  |   return false; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  | void peephole::run(ir::module &mod) { | 
					
						
							|  |  |  |   ir::builder &builder = mod.get_builder(); | 
					
						
							|  |  |  |   // keep track of whether any modification was made
 | 
					
						
							|  |  |  |   std::set<ir::value*> seen; | 
					
						
							|  |  |  |   size_t n_seen; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   // rewrite dots first
 | 
					
						
							|  |  |  |   do{ | 
					
						
							|  |  |  |     n_seen = seen.size(); | 
					
						
							|  |  |  |     for(ir::function *fn: mod.get_function_list()) | 
					
						
							|  |  |  |     for(ir::basic_block *block: fn->blocks()) | 
					
						
							|  |  |  |     for(ir::instruction* i: block->get_inst_list()){ | 
					
						
							|  |  |  |       if(seen.find(i) != seen.end()) | 
					
						
							|  |  |  |         continue; | 
					
						
							|  |  |  |       bool was_modified = rewrite_dot(i, builder); | 
					
						
							|  |  |  |       if(was_modified){ | 
					
						
							|  |  |  |         seen.insert(i); | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   }while(seen.size() != n_seen); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   // rewrite other ops
 | 
					
						
							|  |  |  |   seen.clear(); | 
					
						
							|  |  |  |   do{ | 
					
						
							|  |  |  |     n_seen = seen.size(); | 
					
						
							|  |  |  |     for(ir::function *fn: mod.get_function_list()) | 
					
						
							|  |  |  |     for(ir::basic_block *block: fn->blocks()) | 
					
						
							|  |  |  |     for(ir::instruction* i: block->get_inst_list()){ | 
					
						
							|  |  |  |       if(seen.find(i) != seen.end()) | 
					
						
							|  |  |  |         continue; | 
					
						
							|  |  |  |       bool was_modified = false; | 
					
						
							|  |  |  |       was_modified = was_modified || rewrite_mult(i, builder); | 
					
						
							| 
									
										
										
										
											2021-01-11 19:20:34 -05:00
										 |  |  |       // was_modified = was_modified || rewrite_cts_cfs(i, builder);
 | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  | //      was_modified = was_modified || rewrite_trans_phi(i, builder);
 | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |       was_modified = was_modified || rewrite_unit_red(i, builder); | 
					
						
							|  |  |  |       was_modified = was_modified || rewrite_gep_ptr_min_off_plus_off(i, builder); | 
					
						
							| 
									
										
										
										
											2021-12-17 12:44:47 -08:00
										 |  |  |       // TODO: DOESN'T WORK FOR VECTORIZED MASKED LOAD
 | 
					
						
							|  |  |  | //      was_modified = was_modified || rewrite_select_masked_load(i, builder);
 | 
					
						
							| 
									
										
										
										
											2021-08-30 11:50:35 -07:00
										 |  |  |       was_modified = was_modified || rewrite_cvt_layout(i, builder); | 
					
						
							| 
									
										
										
										
											2021-09-09 13:46:55 -07:00
										 |  |  |       if(tgt_->as_nvidia() && tgt_->as_nvidia()->sm() >= 80) | 
					
						
							| 
									
										
										
										
											2021-02-21 15:19:39 -08:00
										 |  |  |         was_modified = was_modified || rewrite_load_to_shared(i, builder); | 
					
						
							| 
									
										
										
										
											2021-07-27 12:38:38 -07:00
										 |  |  |       if(was_modified) | 
					
						
							|  |  |  |         seen.insert(i); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   }while(seen.size() != n_seen); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | } |