Files
ROCm/python/triton/language/__init__.py
Jason Furmanek 5c87f363e4 Merge commit 'cb3d79a185e40c9d8a579bea07747a8a8d157d52' into ifu-231117
Conflicts:
	lib/Conversion/TritonGPUToLLVM/ElementwiseOpToLLVM.cpp
	lib/Conversion/TritonGPUToLLVM/TritonGPUToLLVM.cpp
	lib/Dialect/TritonGPU/IR/Dialect.cpp
	python/setup.py
	python/test/unit/language/assert_helper.py
	python/test/unit/operators/test_flash_attention.py
	python/test/unit/runtime/test_subproc.py
	python/triton/compiler/compiler.py
	python/triton/language/semantic.py
	python/triton/runtime/autotuner.py
	python/triton/runtime/jit.py
	python/tutorials/03-matrix-multiplication.py
	python/tutorials/05-layer-norm.py
	python/tutorials/06-fused-attention.py
	python/tutorials/11-grouped-gemm.py
	test/Conversion/tritongpu_to_llvm.mlir
2023-11-17 20:42:12 +00:00

219 lines
3.2 KiB
Python

"""isort:skip_file"""
# Import order is significant here.
from . import math
from . import extra
from .standard import (
argmax,
argmin,
cdiv,
cumprod,
cumsum,
max,
maximum,
min,
minimum,
sigmoid,
softmax,
sum,
ravel,
swizzle2d,
xor_sum,
zeros,
zeros_like,
)
from .core import (
TRITON_MAX_TENSOR_NUMEL,
abs,
advance,
arange,
associative_scan,
atomic_add,
atomic_and,
atomic_cas,
atomic_max,
atomic_min,
atomic_or,
atomic_xchg,
atomic_xor,
bfloat16,
block_type,
broadcast,
broadcast_to,
cat,
constexpr,
cos,
debug_barrier,
device_assert,
device_print,
dot,
dtype,
exp,
expand_dims,
full,
fdiv,
float16,
float32,
float64,
float8e4b15,
float8e4b15x4,
float8e4nv,
float8e4b8,
float8e5,
float8e5b16,
function_type,
inline_asm_elementwise,
int1,
int16,
int32,
int64,
int8,
load,
log,
make_block_ptr,
max_constancy,
max_contiguous,
multiple_of,
num_programs,
pi32_t,
pointer_type,
program_id,
reduce,
reshape,
sin,
sqrt,
static_assert,
static_print,
store,
static_range,
tensor,
trans,
# triton,
uint16,
uint32,
uint64,
uint8,
umulhi,
view,
void,
where,
)
from .random import (
pair_uniform_to_normal,
philox,
philox_impl,
rand,
rand4x,
randint,
randint4x,
randn,
randn4x,
uint32_to_uniform_float,
)
# Public API of this package: the names exported by a star-import.
#
# Every entry must be bound in this module by the imports above; a listed
# name that is neither a module attribute nor an importable submodule makes
# the star-import raise AttributeError.  Keep the list sorted and in sync
# with the import statements.
__all__ = [
    "TRITON_MAX_TENSOR_NUMEL",
    "abs",
    "advance",
    "arange",
    "argmax",
    "argmin",
    "associative_scan",
    "atomic_add",
    "atomic_and",
    "atomic_cas",
    "atomic_max",
    "atomic_min",
    "atomic_or",
    "atomic_xchg",
    "atomic_xor",
    "bfloat16",
    "block_type",
    "broadcast",
    "broadcast_to",
    "cat",
    "cdiv",
    "constexpr",
    "cos",
    "cumprod",
    "cumsum",
    "debug_barrier",
    "device_assert",
    "device_print",
    "dot",
    "dtype",
    "exp",
    "expand_dims",
    "extra",
    "fdiv",
    "float16",
    "float32",
    "float64",
    "float8e4b15",
    "float8e4b15x4",
    "float8e4b8",
    "float8e4nv",
    "float8e5",
    "float8e5b16",
    "full",
    "function_type",
    "inline_asm_elementwise",
    "int1",
    "int16",
    "int32",
    "int64",
    "int8",
    "load",
    "log",
    "make_block_ptr",
    "math",
    "max",
    "max_constancy",
    "max_contiguous",
    "maximum",
    "min",
    "minimum",
    "multiple_of",
    "num_programs",
    "pair_uniform_to_normal",
    "philox",
    "philox_impl",
    "pi32_t",
    "pointer_type",
    "program_id",
    "rand",
    "rand4x",
    "randint",
    "randint4x",
    "randn",
    "randn4x",
    "ravel",
    "reduce",
    "reshape",
    "sigmoid",
    "sin",
    "softmax",
    "sqrt",
    "static_assert",
    "static_print",
    "static_range",
    "store",
    "sum",
    "swizzle2d",
    "tensor",
    "trans",
    "uint16",
    "uint32",
    "uint32_to_uniform_float",
    "uint64",
    "uint8",
    "umulhi",
    "view",
    "void",
    "where",
    "xor_sum",
    "zeros",
    "zeros_like",
]