Python API
- aitemplate.compiler
- aitemplate.compiler.ops
EpilogueOp
FuncEnum
JaggedDim
JaggedIntVar
argmax
avg_pool2d
batch_gather
batch_layernorm_sigmoid_mul
batched_dense_vec_jagged_2d_mul
batched_nms
bert_embeddings
bmm_ccc
bmm_ccc_add
bmm_ccr
bmm_ccr_add
bmm_crc
bmm_crc_add
bmm_crr
bmm_crr_add
bmm_rcc
bmm_rcc_add
bmm_rcr
bmm_rcr_add
bmm_rcr_n1
bmm_rcr_permute
bmm_rcr_softmax
bmm_rrc
bmm_rrc_add
bmm_rrr
bmm_rrr_add
bmm_rrr_k1_tanh
bmm_rrr_permute
bmm_softmax_bmm
bmm_softmax_bmm_permute
cast
chunk
clamp
classic_b2b_bmm
concatenate
concatenate_tanh
conv2d
conv2d_bias
conv2d_bias_add
conv2d_bias_add_hardswish
conv2d_bias_add_relu
conv2d_bias_few_channels
conv2d_bias_hardswish
conv2d_bias_hardswish_few_channels
conv2d_bias_relu
conv2d_bias_relu_few_channels
conv2d_bias_sigmoid
conv2d_depthwise
conv2d_depthwise_bias
conv3d
conv3d_bias
convert_shape_to_IntVar()
depthwise_conv3d
dual_bmm_rrr_div
dual_gemm_rcr_fast_gelu
dual_gemm_rcr_silu
dynamic_slice
efficient_nms
elementwise
eq
expand
flash_attention
flatten
fmha_style_b2b_bmm
full
fused_elementwise
gather
ge
gemm_rcr
gemm_rcr_bias
gemm_rcr_bias_add
gemm_rcr_bias_add_add
gemm_rcr_bias_add_add_relu
gemm_rcr_bias_add_relu
gemm_rcr_bias_fast_gelu
gemm_rcr_bias_gelu
gemm_rcr_bias_hardswish
gemm_rcr_bias_mul
gemm_rcr_bias_mul_add
gemm_rcr_bias_mul_tanh
gemm_rcr_bias_permute
gemm_rcr_bias_relu
gemm_rcr_bias_sigmoid
gemm_rcr_bias_sigmoid_mul
gemm_rcr_bias_sigmoid_mul_tanh
gemm_rcr_bias_softmax
gemm_rcr_bias_swish
gemm_rcr_bias_tanh
gemm_rcr_fast_gelu
gemm_rcr_permute
gemm_rcr_permute_elup1
gemm_rcr_softmax
gemm_rrr
gemm_rrr_bias
gemm_rrr_bias_permute
gemm_rrr_permute
gemm_rrr_small_nk
gen_int_var_min_max()
getitem
group_gemm_rcr
group_gemm_rcr_bias
group_gemm_rcr_bias_relu
group_gemm_rcr_bias_sigmoid
group_layernorm
group_layernorm_sigmoid_mul
group_norm
group_norm_swish
grouped_classic_b2b_bmm
grouped_fmha_style_b2b_bmm
gt
identity
index_select
int_elementwise
is_symbolic()
jagged_lengths_to_offsets
jagged_lengths_to_presences
jagged_to_padded_dense
layernorm
layernorm_sigmoid_mul
le
list_construct
lt
make_jagged
masked_select
max_pool2d
mem_eff_attention
multi_level_roi_align
ndhwc3to8
ne
nhwc3to4
nhwc3to8
nms
normalize_dtype()
pad_last_dim
padded_dense_to_jagged
perm021fc_ccr
perm021fc_ccr_bias
perm021fc_ccr_bias_permute
perm021fc_crc
perm021fc_crc_bias
perm102_bmm_rcr
perm102_bmm_rcr_bias
perm102_bmm_rrr
perm102_bmm_rrr_bias
permute
permute021
permute0213
permute102
permute210
reduce_max
reduce_mean
reduce_min
reduce_sum
reshape
roi_align
simplify_intvar_values()
size
slice_reshape_scatter
slice_scatter
softmax
split
squeeze
topk
transpose
transposed_conv2d
transposed_conv2d_bias
transposed_conv2d_bias_relu
tuple_construct
unsqueeze
upsampling2d
upsampling2d_add
var
vector_norm
where
- aitemplate.compiler.transform
- apply_padding
- bind_constants
- constant_folding
- fuse_conv_elementwise
- fuse_group_ops
- fuse_mm_elementwise
- fuse_ops
- fuse_parallel_gemms
- fuse_permute_bmm
- fuse_split
- mark_param_tensor
- memory_planning
- name_graph
- optimize_graph
- profile
- refine_graph
- remove_no_ops
- remove_unused_ops
- toposort
- transform_memory_ops
- transform_odd_alignment
- transform_special_ops
- transform_strided_op_and_view_op
- transform_strided_ops
- transform_strided_slice
- aitemplate.backend
- aitemplate.backend.cuda
- aitemplate.backend.rocm
- aitemplate.frontend
AvgPool2d
BertEmbeddings
Conv1d
Conv2d
Conv2dBias
Conv2dBiasAddHardswish
Conv2dBiasAddRelu
Conv2dBiasFewChannels
Conv2dBiasHardswish
Conv2dBiasHardswishFewChannels
Conv2dBiasRelu
Conv2dBiasReluFewChannels
Conv2dBiasSigmoid
Conv2dDepthwise
Conv2dDepthwiseBias
Conv3d
ConvTranspose2dBias
ConvTranspose2dBiasRelu
CrossAttention
DropPath
Dropout
Embedding
FPNProposal
FPNRoiAlign
FlashAttention
Flatten
GroupNorm
Identity
LayerNorm
Linear
MaxPool2d
Module
ModuleDict
ModuleList
MultiScaleBlock
MultiheadAttention
Ndhwc3to8
Nhwc3to8
Proposal
Reshape
RoiAlign
ScaledDotProductAttention
Sequential
T5DenseGatedGeluDense
Tensor
Upsampling2d
Upsampling2dAdd
VanillaCrossAttention
VanillaMultiheadAttention
View
avg_pool2d
conv3d
conv3d_bias
depthwise_conv3d
detect_target()
flatten
max_pool2d
multi_level_roi_align
ndhwc3to8
nhwc3to8
reshape
roi_align
squeeze
unsqueeze
upsampling2d
upsampling2d_add
vanilla_attention()
- aitemplate.testing
- aitemplate.utils