Files
triton/scripts/amd/test.sh
Michael Melesse 4464dfcc18 save scripts
2022-10-26 17:42:58 +00:00

137 lines
9.1 KiB
Bash
Executable File

# clear
rm -rf triton_rocm_kernels
# export TRITON_LIBHIP=/opt/rocm/lib/libamdhip64.so
# export AMD_OCL_WAIT_COMMAND=1
# export AMD_LOG_LEVEL=3
# export HIP_LAUNCH_BLOCKING=1
# remove cache to avoid segfaults
# TODO: inform triton dev the cache cause segfault
rm -rf /tmp/triton
# pytest python/test
# pytest python/test/test_blocksparse.py
# pytest --verbose python/test/test_conv.py
# pytest --verbose python/test/test_blocksparse.py::test_matmul[sdd-False-False-16-float16]
# pytest --verbose python/test/test_blocksparse.py::test_attention_fwd_bwd
# python python/test/test_conv.py
# gdb -ex "set breakpoint pending on" \
# -ex 'break add_passes_to_emit_bin' \
# --args python python/test/test_add.py
# python python/test/test_empty.py
# -ex 'ignore 1 472' \
# pytest --verbose python/test/unit/language/test_core.py 2>&1 | tee /dockerx/triton/test_core.log
# pytest --verbose python/test/unit/language/test_core.py::test_empty_kernel[float32] 2>&1 | tee /dockerx/triton/test_empty_kernel.log
# pytest --verbose python/test/unit/language/test_core.py::test_bin_op[int32-uint32-+] 2>&1 | tee /dockerx/triton/test_bin_op.log
pytest --verbose python/test/unit/language/test_core.py::test_atomic_rmw[add-float16-all_neg] 2>&1 | tee /dockerx/triton/test_bin_op.log
# pytest --capture=tee-sys --verbose python/test/regression/test_performance.py | tee /dockerx/triton/test_performance.log
# pytest --capture=tee-sys --verbose python/test/regression/test_performance.py::test_matmul | tee /dockerx/triton/test_performance_matmul.log
# pytest --capture=tee-sys --verbose python/test/regression/test_performance.py::test_elementwise | tee /dockerx/triton/test_performance_elementwise.log
# pytest --capture=tee-sys --verbose python/test/regression/test_performance.py::test_matmul[256-256-256]
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_empty_kernel[float32]
# pytest --verbose python/test/unit/language/test_core.py::test_load_and_store_op[float32-2]
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_load_and_store_op_with_mask
# pytest --verbose python/test/unit/language/test_core.py::test_program_id[float32]
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_num_programs[float32]
# pytest --verbose python/test/unit/language/test_core.py::test_unary_op
# pytest --verbose python/test/unit/language/test_core.py::test_bin_op
# pytest --verbose "python/test/unit/language/test_core.py::test_dot"
# pytest --verbose python/test/unit/language/test_core.py::test_cast
# pytest --verbose python/test/unit/language/test_core.py::test_reduce1d
# pytest --verbose python/test/unit/language/test_core.py::test_reduce2d
# pytest --verbose python/test/unit/language/test_core.py::test_math_op
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_atomic_rmw
# pytest --verbose python/test/unit/operators/test_blocksparse.py::test_matmul
# pytest --verbose python/test/unit/operators/test_blocksparse.py::test_matmul[DTYPE0-16-False-False-dds]
# pytest --verbose python/test/unit/operators/test_blocksparse.py::test_matmul[DTYPE0-64-False-False-dds]
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_matmul
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_load_and_store_op_with_mask
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_masked_load_shared_memory"
# pytest --verbose "python/test/unit/operators/test_blocksparse.py::test_softmax[DTYPE0-256-16]"
# pytest --verbose "python/test/unit/operators/test_blocksparse.py::test_softmax" #|& tee /dockerx/triton/test_softmax.log
# pytest --verbose "python/test/unit/operators/test_blocksparse.py::test_softmax[DTYPE0-1024-16]" # PASSED [ 29%]
# pytest --verbose "python/test/unit/operators/test_blocksparse.py::test_softmax[DTYPE0-1024-32]" # FAILED
# pytest --verbose python/test/unit/language/test_core.py::test_permute
# pytest --verbose python/test/unit/language/test_core.py::test_load_cache_modifier
# pytest --verbose python/test/unit/language/test_core.py::test_math_op[log]
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_load_and_store_op[float64]
# pytest --verbose "python/test/unit/language/test_core.py::test_bin_op[int8-int64- x % y]"
# pytest --verbose "python/test/unit/language/test_core.py::test_dot[none]" |& tee /dockerx/triton/test_dot_none.log
# pytest --verbose "python/test/unit/language/test_core.py::test_dot[add-rows]"
# pytest --verbose "python/test/unit/language/test_core.py::test_dot[add-cols]"
# pytest --verbose "python/test/unit/language/test_core.py::test_cast[float32-float16-False]"
# pytest --verbose python/test/unit/operators/test_blocksparse.py::test_matmul[DTYPE0-32-False-False-sdd]
# pytest --capture=tee-sys --verbose python/test/unit/operators/test_blocksparse.py::test_softmax[DTYPE0-256-32]
# pytest --verbose python/test/unit/operators/test_blocksparse.py
# pytest --verbose python/test/unit/operators/test_blocksparse.py::test_matmul[DTYPE0-32-False-False-sdd]
# pytest --verbose scripts/amd/test_fptrunc.py
# pytest --verbose scripts/amd/test_fptrunc.py::test_fptrunc[float32-float32-False]
# pytest --verbose "python/test/unit/language/test_core.py::test_cast"
# pytest --verbose "python/test/unit/language/test_core.py::test_cast[float32-float16-False]"
# pytest --verbose "python/test/unit/language/test_core.py::test_cast[float32-bfloat16-False]"
# python python/test/unit/language/test_core.py
# pytest --capture=tee-sys --verbose python/test/unit/language/test_core.py::test_empty_kernel
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_bin_op[int8-int64- x % y]"
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_bin_op[int8-float32- x % y]"
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_bin_op[int8-float16- x % y]"
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_bin_op[float32-float64- x % y]"
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_math_op[exp]"
# pytest --verbose "python/test/unit/operators/test_blocksparse.py"
# pytest --capture=tee-sys --verbose "python/test/unit/operators/test_blocksparse.py::test_matmul[sdd-False-False-16-float16]"
# pytest --capture=tee-sys --verbose "python/test/unit/language/test_core.py::test_arange"
# pytest --verbose "python/test/unit/language/test_core.py::test_masked_load_shared_memory"
# pytest --verbose "python/test/unit/language/test_core.py::test_dot_without_load"
# pytest --verbose "python/test/unit/language/test_core.py::test_fmadot"
# FAILING TESTS
# pytest --verbose "python/test/unit/language/test_core.py::test_bin_op[int8-float16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int8-float32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int8-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int16-float16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int16-float32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int16-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int32-float16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int32-float32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int32-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int64-float16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int64-float32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[int64-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float16-int8- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float16-int16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float16-int32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float16-int64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float16-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float32-int8- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float32-int16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float32-int32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float32-int64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float32-float64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-int8- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-int16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-int32- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-int64- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-float16- x % y]" \
# "python/test/unit/language/test_core.py::test_bin_op[float64-float32- x % y]"
# do post test steps
# bash scripts/amd/post.sh # it should be run in the run script