MANIFEST.in
setup.py
build_tools/VERSION.txt
build_tools/__init__.py
build_tools/build_ext.py
build_tools/jax.py
build_tools/paddle.py
build_tools/pytorch.py
build_tools/te_version.py
build_tools/utils.py
build_tools/__pycache__/__init__.cpython-310.pyc
build_tools/__pycache__/__init__.cpython-38.pyc
build_tools/__pycache__/build_ext.cpython-310.pyc
build_tools/__pycache__/build_ext.cpython-38.pyc
build_tools/__pycache__/pytorch.cpython-38.pyc
build_tools/__pycache__/te_version.cpython-310.pyc
build_tools/__pycache__/te_version.cpython-38.pyc
build_tools/__pycache__/utils.cpython-310.pyc
build_tools/__pycache__/utils.cpython-38.pyc
build_tools/wheel_utils/Dockerfile.aarch
build_tools/wheel_utils/Dockerfile.x86
build_tools/wheel_utils/build_wheels.sh
build_tools/wheel_utils/launch_aarch.sh
build_tools/wheel_utils/launch_x86.sh
common_headers/common/common.h
common_headers/common/nvtx.h
common_headers/common/utils.cuh
common_headers/common/activation/activation_template.h
common_headers/common/fused_attn/fused_attn_f16_arbitrary_seqlen.h
common_headers/common/fused_attn/fused_attn_f16_max512_seqlen.h
common_headers/common/fused_attn/fused_attn_fp8.h
common_headers/common/fused_attn/utils.h
common_headers/common/include/transformer_engine/activation.h
common_headers/common/include/transformer_engine/cast.h
common_headers/common/include/transformer_engine/cast_transpose_noop.h
common_headers/common/include/transformer_engine/fused_attn.h
common_headers/common/include/transformer_engine/fused_rope.h
common_headers/common/include/transformer_engine/gemm.h
common_headers/common/include/transformer_engine/layer_norm.h
common_headers/common/include/transformer_engine/padding.h
common_headers/common/include/transformer_engine/permutation.h
common_headers/common/include/transformer_engine/recipe.h
common_headers/common/include/transformer_engine/rmsnorm.h
common_headers/common/include/transformer_engine/softmax.h
common_headers/common/include/transformer_engine/transformer_engine.h
common_headers/common/include/transformer_engine/transpose.h
common_headers/common/layer_norm/ln.h
common_headers/common/layer_norm/ln_bwd_kernels.cuh
common_headers/common/layer_norm/ln_fwd_kernels.cuh
common_headers/common/layer_norm/ln_kernel_traits.h
common_headers/common/rmsnorm/rmsnorm.h
common_headers/common/rmsnorm/rmsnorm_bwd_kernels.cuh
common_headers/common/rmsnorm/rmsnorm_fwd_kernels.cuh
common_headers/common/rmsnorm/rmsnorm_kernel_traits.h
common_headers/common/util/cuda_driver.h
common_headers/common/util/cuda_runtime.h
common_headers/common/util/logging.h
common_headers/common/util/math.h
common_headers/common/util/rtc.h
common_headers/common/util/string.h
common_headers/common/util/system.h
common_headers/common/util/vectorized_pointwise.h
csrc/comm_gemm_overlap.h
csrc/common.cu
csrc/common.h
csrc/extensions.h
csrc/multi_tensor_apply.cuh
csrc/ts_fp8_op.cpp
csrc/type_shim.h
csrc/extensions/activation.cu
csrc/extensions/apply_rope.cu
csrc/extensions/attention.cu
csrc/extensions/cast.cu
csrc/extensions/gemm.cu
csrc/extensions/misc.cu
csrc/extensions/normalization.cu
csrc/extensions/padding.cu
csrc/extensions/permutation.cu
csrc/extensions/pybind.cpp
csrc/extensions/recipe.cu
csrc/extensions/softmax.cu
csrc/extensions/transpose.cu
csrc/extensions/multi_tensor/multi_tensor_adam.cu
csrc/extensions/multi_tensor/multi_tensor_l2norm_kernel.cu
csrc/extensions/multi_tensor/multi_tensor_scale_kernel.cu
csrc/extensions/multi_tensor/multi_tensor_sgd_kernel.cu
csrc/userbuffers/ipcsocket.cc
csrc/userbuffers/ipcsocket.h
csrc/userbuffers/userbuffers-host.cpp
csrc/userbuffers/userbuffers.cu
csrc/userbuffers/userbuffers.h
transformer_engine_torch.egg-info/PKG-INFO
transformer_engine_torch.egg-info/SOURCES.txt
transformer_engine_torch.egg-info/dependency_links.txt
transformer_engine_torch.egg-info/requires.txt
transformer_engine_torch.egg-info/top_level.txt