- A100 support via mma.16816
- Thread swizzling for conflict-free shared memory accesses without padding
- Complete overhaul of the LLVM code generation in codegen/selection/generator.cc to remove overengineering
- Added debugging capabilities in the Python binding
- Compilation error for kernels that spill
83 lines
2.4 KiB
C++
83 lines
2.4 KiB
C++
#include <iostream>
|
|
#include "triton/ir/basic_block.h"
|
|
#include "triton/ir/module.h"
|
|
#include "triton/ir/type.h"
|
|
#include "triton/ir/constant.h"
|
|
#include "triton/ir/function.h"
|
|
#include "triton/ir/instructions.h"
|
|
#include "triton/ir/print.h"
|
|
|
|
namespace triton{
|
|
namespace ir{
|
|
|
|
// Returns the printable name of `v`.
// If `v` has no name yet, it is first given the name "%<i>" (stored on the
// value through set_name), so calling this function may mutate `v`.
std::string get_name(ir::value *v, unsigned i) {
  const bool is_unnamed = v->get_name().empty();
  if(is_unnamed){
    std::string generated = "%";
    generated += std::to_string(i);
    v->set_name(generated);
  }
  return v->get_name();
}
|
|
|
|
|
|
// Writes a textual dump of every function in `mod` to `os`.
//
// For each function this emits:
//   def <return type> <name>(<arg type> <arg name> <attributes>, ...)
//   {
//   <block name>: ; preds = <pred>, <pred>
//    [<name> = ]<instruction repr> <type> <operand>, <operand>;
//   }
//
// Constant operands are printed through their repr(); every other operand and
// every non-void instruction is printed by name via get_name().
// Side effect: get_name() assigns a "%<n>" name to any value that is still
// unnamed, so printing can mutate the names stored in the IR.
void print(module &mod, std::ostream& os) {
  // Index handed to get_name(); it advances on every call, including calls
  // for values that already carry a name.
  unsigned cnt = 0;
  for(ir::function *fn: mod.get_function_list()){
    // Function header
    os << "def " << fn->get_fn_type()->get_return_ty()->repr() << " " << fn->get_name() << "(" ;
    for(ir::argument* arg: fn->args()) {
      if(arg->get_arg_no() > 0)
        os << ", ";
      os << arg->get_type()->repr() << " " << arg->get_name();
      auto attrs = fn->get_attributes(arg);
      if(attrs.size() > 0)
        os << " ";
      for(ir::attribute attr: attrs)
        os << attr.repr() << " ";
    }
    os << ")" << std::endl;
    os << "{" << std::endl;
    // Function body
    for(ir::basic_block *block: fn->blocks()){
      auto const &predecessors = block->get_predecessors();
      os << block->get_name() << ":";
      if(!predecessors.empty()){
        os << " ";
        os << "; preds = ";
        // Emit the separator *before* every entry but the first. Comparing
        // each entry against back() would drop separators whenever the last
        // predecessor also appears earlier in the list.
        const char *pred_sep = "";
        for(ir::basic_block *pred: predecessors){
          os << pred_sep << pred->get_name();
          pred_sep = ", ";
        }
      }
      os << std::endl;
      for(ir::instruction *inst: block->get_inst_list()){
        ir::type* type = inst->get_type();
        os << " ";
        // Only instructions that produce a value get a "<name> = " prefix.
        if(!type->is_void_ty()){
          os << get_name(inst, cnt++);
          os << " = ";
        }
        os << inst->repr() << " " << type->repr();
        // Bind by const reference: avoids copying the operand list when ops()
        // returns a reference, and extends the lifetime if it returns a value.
        const ir::instruction::ops_t &ops = inst->ops();
        size_t num_ops = inst->get_num_operands();
        if(num_ops > 0)
          os << " ";
        const char *op_sep = "";
        for(size_t i = 0; i < num_ops; i++){
          os << op_sep;
          if(auto *x = dynamic_cast<ir::constant*>(ops[i]))
            os << x->repr();
          else
            os << get_name(ops[i], cnt++);
          op_sep = ", ";
        }
        os << ";";
        // Optional dump of the instruction's users, disabled by default:
        // os << " (";
        // for(ir::user* usr: inst->get_users())
        //   os << get_name(usr, cnt++) << ", " ;
        // os << " )";
        os << std::endl;
      }
    }
    os << "}" << std::endl;
  }
}
|
|
|
|
|
|
}
|
|
}
|