git: 639e0f24c626 - main - misc/pytorch: Tensors and dynamic neural networks in Python (C++ library)

From: Yuri Victorovich <yuri_at_FreeBSD.org>
Date: Fri, 30 Dec 2022 19:52:06 UTC
The branch main has been updated by yuri:

URL: https://cgit.FreeBSD.org/ports/commit/?id=639e0f24c6263bb648f4dab0094b020242e74212

commit 639e0f24c6263bb648f4dab0094b020242e74212
Author:     Yuri Victorovich <yuri@FreeBSD.org>
AuthorDate: 2022-12-30 18:27:07 +0000
Commit:     Yuri Victorovich <yuri@FreeBSD.org>
CommitDate: 2022-12-30 19:50:05 +0000

    misc/pytorch: Tensors and dynamic neural networks in Python (C++ library)
---
 misc/Makefile                                      |    1 +
 misc/pytorch/Makefile                              |   63 +
 misc/pytorch/distinfo                              |    3 +
 .../files/patch-aten_src_ATen_native_SoftMax.cpp   |   11 +
 ...native_sparse_ValidateCompressedIndicesCommon.h |   80 +
 ...aten_src_ATen_native_transformers_attention.cpp |   11 +
 misc/pytorch/files/patch-cmake_Dependencies.cmake  |   11 +
 misc/pytorch/files/patch-cmake_public_mkldnn.cmake |   11 +
 .../patch-third__party_cpuinfo_CMakeLists.txt      |   11 +
 ...third__party_asmjit_src_asmjit_core_virtmem.cpp |   10 +
 ...hird__party_kineto_libkineto_src_ThreadUtil.cpp |   11 +
 misc/pytorch/pkg-descr                             |    3 +
 misc/pytorch/pkg-plist                             | 8950 ++++++++++++++++++++
 13 files changed, 9176 insertions(+)

diff --git a/misc/Makefile b/misc/Makefile
index 3fce38632444..a3744390b899 100644
--- a/misc/Makefile
+++ b/misc/Makefile
@@ -445,6 +445,7 @@
     SUBDIR += py-wurlitzer
     SUBDIR += py-xgboost
     SUBDIR += pyobd
+    SUBDIR += pytorch
     SUBDIR += qbrew
     SUBDIR += qlas
     SUBDIR += qt5-doc
diff --git a/misc/pytorch/Makefile b/misc/pytorch/Makefile
new file mode 100644
index 000000000000..253304abf2de
--- /dev/null
+++ b/misc/pytorch/Makefile
@@ -0,0 +1,63 @@
+PORTNAME=	pytorch
+DISTVERSIONPREFIX=	v
+DISTVERSION=	1.13.1
+CATEGORIES=	misc # machine-learning
+MASTER_SITES=	https://github.com/pytorch/pytorch/releases/download/${DISTVERSIONFULL}/ # tracks DISTVERSIONPREFIX + DISTVERSION
+DIST_SUBDIR=	${PORTNAME}
+
+MAINTAINER=	yuri@FreeBSD.org
+COMMENT=	Tensors and dynamic neural networks in Python (C++ library)
+WWW=		https://pytorch.org/
+
+LICENSE=	BSD3CLAUSE
+
+BUILD_DEPENDS=	gmake:devel/gmake \
+		${LOCALBASE}/include/fxdiv.h:devel/fxdiv
+LIB_DEPENDS=	libopenblas.so:math/openblas \
+		libmpi.so:net/openmpi \
+		libpthreadpool.so:devel/pthreadpool \
+		libonnx.so:misc/onnx \
+		libprotobuf.so:devel/protobuf \
+		libsleef.so:math/sleef
+
+USES=		compiler:c++14-lang cmake localbase:ldflags python # python is required even when the PYTHON option is off
+
+CMAKE_OFF=	BUILD_CUSTOM_PROTOBUF USE_CUDA USE_ROCM  USE_NNPACK USE_QNNPACK USE_PYTORCH_QNNPACK \
+		USE_FBGEMM # workaround recommended by upstream, see https://github.com/pytorch/pytorch/issues/28337
+CMAKE_ON=	USE_SYSTEM_PYBIND11 \
+		USE_SYSTEM_SLEEF \
+		USE_SYSTEM_ONNX # further USE_SYSTEM_xx switches are listed in CMakeLists.txt
+CMAKE_ARGS=	-DPSIMD_SOURCE_DIR=${WRKSRC}/third_party/psimd \
+		-DFREEBSD_PYTHON_VER=${PYTHON_VER} \
+		-DPYTHON_EXECUTABLE:STRING=${PYTHON_CMD}
+
+MAKE_ENV=	USE_NINJA=no # ninja breaks for some reason
+LDFLAGS+=	-lexecinfo
+
+BINARY_ALIAS=	make=${GMAKE} git=true
+
+OPTIONS_DEFINE=		PYTHON # the PYTHON option only provides the python support used by the py-PyTorch port - it is not a python binding by itself
+OPTIONS_DEFAULT=	PYTHON
+OPTIONS_SUB=		yes
+
+PYTHON_CMAKE_BOOL=	BUILD_PYTHON
+PYTHON_PY_DEPENDS=	${PYNUMPY} \
+			${PYTHON_PKGNAMEPREFIX}typing-extensions>0:devel/py-typing-extensions@${PY_FLAVOR} \
+			${PYTHON_PKGNAMEPREFIX}yaml>0:devel/py-yaml@${PY_FLAVOR}
+PYTHON_BUILD_DEPENDS=	${PYTHON_PY_DEPENDS} \
+			pybind11>0:devel/pybind11
+PYTHON_RUN_DEPENDS=	${PYTHON_PY_DEPENDS}
+
+post-patch:
+	# replace <malloc.h> with <stdlib.h> in every C/C++ source and header that includes it (REINPLACE_CMD already carries sed's in-place flag, so none is added here)
+	@cd ${WRKSRC} && for f in $$(${GREP} -rl "include <malloc\.h>" * | ${GREP} -E "\.(c|cpp|h|hpp)$$"); do \
+	  ${REINPLACE_CMD} -E "s|include <malloc\.h>|include <stdlib.h>|" $$f; \
+	done
+
+post-install:
+	# remove every staged functorch.so: it is installed back into the source directory, see https://github.com/pytorch/pytorch/issues/91524
+	@${RM} $$(${FIND} ${STAGEDIR} -name functorch.so)
+	# prune the empty directories left in the stage directory, see https://github.com/pytorch/pytorch/issues/24417
+	@${FIND} ${STAGEDIR} -type d -empty -delete
+
+.include <bsd.port.mk>
diff --git a/misc/pytorch/distinfo b/misc/pytorch/distinfo
new file mode 100644
index 000000000000..2b0b01afc7df
--- /dev/null
+++ b/misc/pytorch/distinfo
@@ -0,0 +1,3 @@
+TIMESTAMP = 1672353185
+SHA256 (pytorch/pytorch-v1.13.1.tar.gz) = dbc229ee9750b02b514937d017744443a269ea0241ed3f32b9af0703589d25d4
+SIZE (pytorch/pytorch-v1.13.1.tar.gz) = 234057741
diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp b/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp
new file mode 100644
index 000000000000..6f66aece26dc
--- /dev/null
+++ b/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp
@@ -0,0 +1,11 @@
+--- aten/src/ATen/native/SoftMax.cpp.orig	2022-12-29 23:05:30 UTC
++++ aten/src/ATen/native/SoftMax.cpp
+@@ -132,7 +132,7 @@ void host_softmax(
+     const Tensor& input,
+     const int64_t dim,
+     bool* mask = nullptr,
+-    const c10::optional<int64_t> mask_type_ = NULL) {
++    const c10::optional<int64_t> mask_type_ = 0) {
+ 
+   if (MaskedSoftMax) {
+     TORCH_CHECK(mask_type_.has_value(), "Mask Type should be defined");
diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h b/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h
new file mode 100644
index 000000000000..3eba700c307c
--- /dev/null
+++ b/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h
@@ -0,0 +1,80 @@
+--- aten/src/ATen/native/sparse/ValidateCompressedIndicesCommon.h.orig	2022-12-29 23:09:42 UTC
++++ aten/src/ATen/native/sparse/ValidateCompressedIndicesCommon.h
+@@ -38,7 +38,7 @@ namespace {
+ // respectively.
+ 
+ INVARIANT_CHECK_FUNC_API
+-_assert(const bool cond, const char* const message) {
++__assert__(const bool cond, const char* const message) {
+ #ifdef GPUCC
+   CUDA_KERNEL_ASSERT(cond && message);
+ #else
+@@ -58,10 +58,10 @@ INVARIANT_CHECK_FUNC_API
+ _check_first_cidx_is_zero(const index_t& cidx, const index_t& zero) {
+   const bool invariant = cidx == zero;
+   if (cdim_name == CDimName::CRow) {
+-    _assert(invariant, "`crow_indices[..., 0] == 0` is not satisfied.");
++    __assert__(invariant, "`crow_indices[..., 0] == 0` is not satisfied.");
+   }
+   else {
+-    _assert(invariant, "`ccol_indices[..., 0] == 0` is not satisfied.");
++    __assert__(invariant, "`ccol_indices[..., 0] == 0` is not satisfied.");
+   }
+ }
+ 
+@@ -72,10 +72,10 @@ INVARIANT_CHECK_FUNC_API
+ _check_last_cidx_is_nnz(const index_t& cidx, const index_t& nnz) {
+   const bool invariant = cidx == nnz;
+   if (cdim_name == CDimName::CRow) {
+-    _assert(invariant, "`crow_indices[..., -1] == nnz` is not satisfied.");
++    __assert__(invariant, "`crow_indices[..., -1] == nnz` is not satisfied.");
+   }
+   else {
+-    _assert(invariant, "`ccol_indices[..., -1] == nnz` is not satisfied.");
++    __assert__(invariant, "`ccol_indices[..., -1] == nnz` is not satisfied.");
+   }
+ }
+ 
+@@ -91,11 +91,11 @@ _check_cidx_nondecreasing_locally_bounded_sequence(
+   const auto s_cidx = cidx_next - cidx;
+   const bool invariant = zero <= s_cidx && s_cidx <= dim;
+   if (cdim_name == CDimName::CRow) {
+-    _assert(invariant,
++    __assert__(invariant,
+         "`0 <= crow_indices[..., 1:] - crow_indices[..., :-1] <= ncols` is not satisfied.");
+   }
+   else {
+-    _assert(invariant,
++    __assert__(invariant,
+         "`0 <= ccol_indices[..., 1:] - ccol_indices[..., :-1] <= nrows` is not satisfied.");
+   }
+ }
+@@ -110,10 +110,10 @@ _check_idx_bounds(
+     const index_t& dim) {
+   const bool invariant = zero <= idx && idx < dim;
+   if (cdim_name == CDimName::CRow) {
+-    _assert(invariant, "`0 <= col_indices < ncols` is not satisfied.");
++    __assert__(invariant, "`0 <= col_indices < ncols` is not satisfied.");
+   }
+   else {
+-    _assert(invariant, "`0 <= row_indices < nrows` is not satisfied.");
++    __assert__(invariant, "`0 <= row_indices < nrows` is not satisfied.");
+   }
+ }
+ 
+@@ -133,13 +133,13 @@ _check_idx_sorted_distinct_vals_slices_with_cidx(
+   for (auto* RESTRICT curr = slice_begin + 1; curr < slice_end; ++curr) {
+     const auto invariant = *(curr - 1) < *curr;
+     if (cdim_name == CDimName::CRow) {
+-      _assert(invariant, "`col_indices[..., crow_indices[..., i - 1]:crow_indices[..., i]] "
++      __assert__(invariant, "`col_indices[..., crow_indices[..., i - 1]:crow_indices[..., i]] "
+                          "for all i = 1, ..., nrows "
+                          "are sorted and distinct along the last dimension values` "
+                          "is not satisfied.");
+     }
+     else {
+-      _assert(invariant, "`row_indices[..., ccol_indices[..., i - 1]:ccol_indices[..., i]] "
++      __assert__(invariant, "`row_indices[..., ccol_indices[..., i - 1]:ccol_indices[..., i]] "
+                          "for all i = 1, ..., ncols "
+                          "are sorted and distinct along the last dimension values` "
+                          "is not satisfied.");
diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp b/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp
new file mode 100644
index 000000000000..0f3383d2260a
--- /dev/null
+++ b/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp
@@ -0,0 +1,11 @@
+--- aten/src/ATen/native/transformers/attention.cpp.orig	2022-12-29 23:18:12 UTC
++++ aten/src/ATen/native/transformers/attention.cpp
+@@ -118,7 +118,7 @@ Tensor masked_softmax(
+     Tensor& attn_scores,
+     c10::optional<Tensor> attn_mask,
+     const Tensor& query,
+-    c10::optional<int64_t> mask_type = NULL) {
++    c10::optional<int64_t> mask_type = 0) {
+   if (query.is_nested() && !attn_mask) {
+     return at::_nested_tensor_softmax_with_shape(attn_scores, query);
+   }
diff --git a/misc/pytorch/files/patch-cmake_Dependencies.cmake b/misc/pytorch/files/patch-cmake_Dependencies.cmake
new file mode 100644
index 000000000000..165534d123bd
--- /dev/null
+++ b/misc/pytorch/files/patch-cmake_Dependencies.cmake
@@ -0,0 +1,11 @@
+--- cmake/Dependencies.cmake.orig	2022-12-16 00:23:46 UTC
++++ cmake/Dependencies.cmake
+@@ -339,7 +339,7 @@ if(USE_NNPACK OR USE_QNNPACK OR USE_PYTORCH_QNNPACK OR
+       set(DISABLE_NNPACK_AND_FAMILY ON)
+     endif()
+   else()
+-    if(NOT IOS AND NOT (CMAKE_SYSTEM_NAME MATCHES "^(Android|Linux|Darwin|Windows)$"))
++    if(NOT IOS AND NOT (CMAKE_SYSTEM_NAME MATCHES "^(Android|Linux|FreeBSD|Darwin|Windows)$"))
+       message(WARNING
+         "Target platform \"${CMAKE_SYSTEM_NAME}\" is not supported in {Q/X}NNPACK. "
+         "Supported platforms are Android, iOS, Linux, and macOS. "
diff --git a/misc/pytorch/files/patch-cmake_public_mkldnn.cmake b/misc/pytorch/files/patch-cmake_public_mkldnn.cmake
new file mode 100644
index 000000000000..77b3923f4e2b
--- /dev/null
+++ b/misc/pytorch/files/patch-cmake_public_mkldnn.cmake
@@ -0,0 +1,11 @@
+--- cmake/public/mkldnn.cmake.orig	2022-12-16 00:23:46 UTC
++++ cmake/public/mkldnn.cmake
+@@ -4,7 +4,7 @@ if(CPU_AARCH64)
+   include(${CMAKE_CURRENT_LIST_DIR}/ComputeLibrary.cmake)
+ endif()
+ 
+-find_package(MKLDNN QUIET)
++find_package(MKLDNN REQUIRED)
+ 
+ if(NOT TARGET caffe2::mkldnn)
+   add_library(caffe2::mkldnn INTERFACE IMPORTED)
diff --git a/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt b/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt
new file mode 100644
index 000000000000..755ebd06f98a
--- /dev/null
+++ b/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt
@@ -0,0 +1,11 @@
+--- third_party/cpuinfo/CMakeLists.txt.orig	2022-12-16 00:23:47 UTC
++++ third_party/cpuinfo/CMakeLists.txt
+@@ -77,7 +77,7 @@ IF(NOT CMAKE_SYSTEM_NAME)
+       "Target operating system is not specified. "
+       "cpuinfo will compile, but cpuinfo_initialize() will always fail.")
+   SET(CPUINFO_SUPPORTED_PLATFORM FALSE)
+-ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|CYGWIN|MSYS|Darwin|Linux|Android)$")
++ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|CYGWIN|MSYS|Darwin|Linux|FreeBSD|Android)$")
+   IF(${CMAKE_VERSION} VERSION_GREATER_EQUAL "3.14" AND NOT CMAKE_SYSTEM_NAME STREQUAL "iOS")
+     MESSAGE(WARNING
+       "Target operating system \"${CMAKE_SYSTEM_NAME}\" is not supported in cpuinfo. "
diff --git a/misc/pytorch/files/patch-third__party_fbgemm_third__party_asmjit_src_asmjit_core_virtmem.cpp b/misc/pytorch/files/patch-third__party_fbgemm_third__party_asmjit_src_asmjit_core_virtmem.cpp
new file mode 100644
index 000000000000..09a801db1dfc
--- /dev/null
+++ b/misc/pytorch/files/patch-third__party_fbgemm_third__party_asmjit_src_asmjit_core_virtmem.cpp
@@ -0,0 +1,10 @@
+--- third_party/fbgemm/third_party/asmjit/src/asmjit/core/virtmem.cpp.orig	2022-12-16 00:23:48 UTC
++++ third_party/fbgemm/third_party/asmjit/src/asmjit/core/virtmem.cpp
+@@ -45,6 +45,7 @@
+ #endif
+ 
+ #include <atomic>
++#include <sys/stat.h>
+ 
+ #if defined(__APPLE__) || defined(__BIONIC__)
+   #define ASMJIT_VM_SHM_DETECT 0
diff --git a/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp b/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp
new file mode 100644
index 000000000000..e6ec0eca3790
--- /dev/null
+++ b/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp
@@ -0,0 +1,11 @@
+--- third_party/kineto/libkineto/src/ThreadUtil.cpp.orig	2022-12-29 22:41:51 UTC
++++ third_party/kineto/libkineto/src/ThreadUtil.cpp
+@@ -49,7 +49,7 @@ int32_t systemThreadId() {
+ #elif defined _MSC_VER
+     _sysTid = (int32_t)GetCurrentThreadId();
+ #else
+-    _sysTid = (int32_t)syscall(SYS_gettid);
++    _sysTid = (int32_t)syscall(SYS_getpid);
+ #endif
+   }
+   return _sysTid;
diff --git a/misc/pytorch/pkg-descr b/misc/pytorch/pkg-descr
new file mode 100644
index 000000000000..6378f7a68ec8
--- /dev/null
+++ b/misc/pytorch/pkg-descr
@@ -0,0 +1,3 @@
+PyTorch is a Python package that provides two high-level features:
+* Tensor computation (like NumPy) with strong GPU acceleration
+* Deep neural networks built on a tape-based autograd system
diff --git a/misc/pytorch/pkg-plist b/misc/pytorch/pkg-plist
new file mode 100644
index 000000000000..9f32a8cb03f6
--- /dev/null
+++ b/misc/pytorch/pkg-plist
@@ -0,0 +1,8950 @@
+bin/torch_shm_manager
+include/ATen/ATen.h
+include/ATen/AccumulateType.h
+include/ATen/ArrayRef.h
+include/ATen/Backend.h
+include/ATen/Backtrace.h
+include/ATen/BatchedFallback.h
+include/ATen/BatchedTensorImpl.h
+include/ATen/CPUApplyUtils.h
+include/ATen/CPUFixedAllocator.h
+include/ATen/CPUFunctions.h
+include/ATen/CPUFunctions_inl.h
+include/ATen/CPUGeneratorImpl.h
+include/ATen/CUDAFunctions.h
+include/ATen/CUDAFunctions_inl.h
+include/ATen/CollapseDims.h
+include/ATen/CompositeExplicitAutogradFunctions.h
+include/ATen/CompositeExplicitAutogradFunctions_inl.h
+include/ATen/CompositeExplicitAutogradNonFunctionalFunctions.h
+include/ATen/CompositeExplicitAutogradNonFunctionalFunctions_inl.h
+include/ATen/CompositeImplicitAutogradFunctions.h
+include/ATen/CompositeImplicitAutogradFunctions_inl.h
+include/ATen/CompositeImplicitAutogradNestedTensorFunctions.h
+include/ATen/CompositeImplicitAutogradNestedTensorFunctions_inl.h
+include/ATen/Config.h
+include/ATen/Context.h
+include/ATen/DLConvertor.h
+include/ATen/Device.h
+include/ATen/DeviceGuard.h
+include/ATen/DimVector.h
+include/ATen/Dimname.h
+include/ATen/Dispatch.h
+include/ATen/DynamicLibrary.h
+include/ATen/EmptyTensor.h
+include/ATen/ExpandBase.h
+include/ATen/ExpandUtils.h
+include/ATen/Formatting.h
+include/ATen/FuncTorchTLS.h
+include/ATen/FunctionalStorageImpl.h
+include/ATen/FunctionalTensorWrapper.h
+include/ATen/Functions.h
+include/ATen/Generator.h
+include/ATen/InferSize.h
+include/ATen/InitialTensorOptions.h
+include/ATen/Layout.h
+include/ATen/LinalgBackend.h
+include/ATen/MapAllocator.h
+include/ATen/MatrixRef.h
+include/ATen/MemoryOverlap.h
+include/ATen/MetaFunctions.h
+include/ATen/MetaFunctions_inl.h
+include/ATen/MethodOperators.h
+include/ATen/NamedTensor.h
+include/ATen/NamedTensorUtils.h
+include/ATen/NativeFunctions.h
+include/ATen/NativeMetaFunctions.h
+include/ATen/NestedTensorImpl.h
+include/ATen/NumericUtils.h
+include/ATen/OpMathType.h
+include/ATen/OpaqueTensorImpl.h
+include/ATen/Operators.h
+include/ATen/PTThreadPool.h
+include/ATen/PadNd.h
+include/ATen/Parallel-inl.h
+include/ATen/Parallel.h
+include/ATen/ParallelFuture.h
+include/ATen/ParallelNative.h
+include/ATen/ParallelNativeTBB.h
+include/ATen/ParallelOpenMP.h
+include/ATen/PythonTorchFunctionTLS.h
+include/ATen/RedispatchFunctions.h
+include/ATen/RegistrationDeclarations.h
+include/ATen/SavedTensorHooks.h
+include/ATen/Scalar.h
+include/ATen/ScalarOps.h
+include/ATen/ScalarType.h
+include/ATen/SequenceNumber.h
+include/ATen/SmallVector.h
+include/ATen/SparseCsrTensorImpl.h
+include/ATen/SparseCsrTensorUtils.h
+include/ATen/SparseTensorImpl.h
+include/ATen/SparseTensorUtils.h
+include/ATen/Storage.h
+include/ATen/Tensor.h
+include/ATen/TensorAccessor.h
+include/ATen/TensorGeometry.h
+include/ATen/TensorIndexing.h
+include/ATen/TensorIterator.h
+include/ATen/TensorIteratorInternal.h
+include/ATen/TensorMeta.h
+include/ATen/TensorNames.h
+include/ATen/TensorOperators.h
+include/ATen/TensorOptions.h
+include/ATen/TensorSubclassLikeUtils.h
+include/ATen/TensorUtils.h
+include/ATen/ThreadLocalState.h
+include/ATen/TracerMode.h
+include/ATen/TypeDefault.h
+include/ATen/Utils.h
+include/ATen/Version.h
+include/ATen/VmapGeneratedPlumbing.h
+include/ATen/VmapMode.h
+include/ATen/VmapTransforms.h
+include/ATen/WrapDimUtils.h
+include/ATen/WrapDimUtilsMulti.h
+include/ATen/autocast_mode.h
+include/ATen/ceil_div.h
+include/ATen/code_template.h
+include/ATen/core/ATenGeneral.h
+include/ATen/core/ATenOpList.h
+include/ATen/core/ATen_fwd.h
+include/ATen/core/ATen_pch.h
+include/ATen/core/Array.h
+include/ATen/core/Backtrace.h
+include/ATen/core/CheckMemoryFormat.h
+include/ATen/core/DeprecatedTypeProperties.h
+include/ATen/core/DeprecatedTypePropertiesRegistry.h
+include/ATen/core/Dict.h
+include/ATen/core/Dict_inl.h
+include/ATen/core/DimVector.h
+include/ATen/core/Dimname.h
+include/ATen/core/DistributionsHelper.h
+include/ATen/core/Formatting.h
+include/ATen/core/Generator.h
+include/ATen/core/IListRef.h
+include/ATen/core/IListRef_inl.h
+include/ATen/core/LegacyTypeDispatch.h
+include/ATen/core/List.h
+include/ATen/core/List_inl.h
+include/ATen/core/MT19937RNGEngine.h
+include/ATen/core/NamedTensor.h
+include/ATen/core/PhiloxRNGEngine.h
+include/ATen/core/PythonFallbackKernel.h
+include/ATen/core/QuantizerBase.h
+include/ATen/core/Range.h
+include/ATen/core/Reduction.h
+include/ATen/core/Scalar.h
+include/ATen/core/ScalarType.h
+include/ATen/core/Tensor.h
+include/ATen/core/TensorAccessor.h
+include/ATen/core/TensorBase.h
+include/ATen/core/TensorBody.h
+include/ATen/core/TorchDispatchUtils.h
+include/ATen/core/TransformationHelper.h
+include/ATen/core/UndefinedTensorImpl.h
+include/ATen/core/UnsafeFromTH.h
+include/ATen/core/VariableHooksInterface.h
+include/ATen/core/Variadic.h
+include/ATen/core/Vitals.h
+include/ATen/core/alias_info.h
+include/ATen/core/aten_interned_strings.h
+include/ATen/core/blob.h
+include/ATen/core/boxing/BoxedKernel.h
+include/ATen/core/boxing/BoxedKernel_impl.h
+include/ATen/core/boxing/KernelFunction.h
+include/ATen/core/boxing/KernelFunction_impl.h
+include/ATen/core/boxing/OperatorKernel.h
+include/ATen/core/boxing/impl/WrapFunctionIntoFunctor.h
+include/ATen/core/boxing/impl/WrapFunctionIntoRuntimeFunctor.h
+include/ATen/core/boxing/impl/boxing.h
+include/ATen/core/boxing/impl/make_boxed_from_unboxed_functor.h
+include/ATen/core/boxing/impl/test_helpers.h
+include/ATen/core/builtin_function.h
+include/ATen/core/class_type.h
+include/ATen/core/custom_class.h
+include/ATen/core/dispatch/CppSignature.h
+include/ATen/core/dispatch/DispatchKeyExtractor.h
+include/ATen/core/dispatch/Dispatcher.h
+include/ATen/core/dispatch/ObservedOperators.h
+include/ATen/core/dispatch/OperatorEntry.h
+include/ATen/core/dispatch/OperatorOptions.h
+include/ATen/core/dispatch/RegistrationHandleRAII.h
+include/ATen/core/dynamic_type.h
+include/ATen/core/enum_tag.h
+include/ATen/core/enum_type.h
+include/ATen/core/function.h
+include/ATen/core/function_schema.h
+include/ATen/core/function_schema_inl.h
+include/ATen/core/functional.h
+include/ATen/core/grad_mode.h
+include/ATen/core/interned_strings.h
+include/ATen/core/interned_strings_class.h
+include/ATen/core/ivalue.h
+include/ATen/core/ivalue_inl.h
+include/ATen/core/ivalue_to.h
+include/ATen/core/jit_type.h
+include/ATen/core/jit_type_base.h
+include/ATen/core/op_registration/adaption.h
+include/ATen/core/op_registration/infer_schema.h
+include/ATen/core/op_registration/op_allowlist.h
+include/ATen/core/op_registration/op_registration.h
+include/ATen/core/operator_name.h
+include/ATen/core/qualified_name.h
+include/ATen/core/rref_interface.h
+include/ATen/core/stack.h
+include/ATen/core/symbol.h
+include/ATen/core/type_factory.h
+include/ATen/core/type_ptr.h
+include/ATen/core/typeid.h
+include/ATen/cpp_custom_type_hack.h
+include/ATen/cpu/FlushDenormal.h
+include/ATen/cpu/vec/functional.h
+include/ATen/cpu/vec/functional_base.h
+include/ATen/cpu/vec/functional_bfloat16.h
+include/ATen/cpu/vec/intrinsics.h
+include/ATen/cpu/vec/vec.h
+include/ATen/cpu/vec/vec256/missing_vld1_neon.h
+include/ATen/cpu/vec/vec256/missing_vst1_neon.h
+include/ATen/cpu/vec/vec256/vec256.h
+include/ATen/cpu/vec/vec256/vec256_bfloat16.h
+include/ATen/cpu/vec/vec256/vec256_complex_double.h
+include/ATen/cpu/vec/vec256/vec256_complex_float.h
+include/ATen/cpu/vec/vec256/vec256_double.h
+include/ATen/cpu/vec/vec256/vec256_float.h
+include/ATen/cpu/vec/vec256/vec256_float_neon.h
+include/ATen/cpu/vec/vec256/vec256_int.h
+include/ATen/cpu/vec/vec256/vec256_qint.h
+include/ATen/cpu/vec/vec512/vec512.h
+include/ATen/cpu/vec/vec512/vec512_bfloat16.h
+include/ATen/cpu/vec/vec512/vec512_complex_double.h
+include/ATen/cpu/vec/vec512/vec512_complex_float.h
+include/ATen/cpu/vec/vec512/vec512_double.h
+include/ATen/cpu/vec/vec512/vec512_float.h
+include/ATen/cpu/vec/vec512/vec512_int.h
+include/ATen/cpu/vec/vec512/vec512_qint.h
+include/ATen/cpu/vec/vec_base.h
+include/ATen/cpu/vml.h
+include/ATen/cuda/ATenCUDAGeneral.h
+include/ATen/cuda/ApplyGridUtils.cuh
+include/ATen/cuda/AsmUtils.cuh
+include/ATen/cuda/Atomic.cuh
+include/ATen/cuda/CUDAApplyUtils.cuh
+include/ATen/cuda/CUDABlas.h
+include/ATen/cuda/CUDAContext.h
+include/ATen/cuda/CUDADataType.h
+include/ATen/cuda/CUDADevice.h
+include/ATen/cuda/CUDAEvent.h
+include/ATen/cuda/CUDAGeneratorImpl.h
+include/ATen/cuda/CUDAGraph.h
+include/ATen/cuda/CUDAGraphsUtils.cuh
+include/ATen/cuda/CUDASparse.h
+include/ATen/cuda/CUDASparseBlas.h
+include/ATen/cuda/CUDASparseDescriptors.h
+include/ATen/cuda/CUDATensorMethods.cuh
+include/ATen/cuda/CUDAUtils.h
+include/ATen/cuda/CachingHostAllocator.h
+include/ATen/cuda/DeviceUtils.cuh
+include/ATen/cuda/EmptyTensor.h
+include/ATen/cuda/Exceptions.h
+include/ATen/cuda/NumericLimits.cuh
+include/ATen/cuda/PeerToPeerAccess.h
+include/ATen/cuda/PinnedMemoryAllocator.h
+include/ATen/cuda/ScanUtils.cuh
+include/ATen/cuda/Sleep.h
+include/ATen/cuda/ThrustAllocator.h
+include/ATen/cuda/cub.cuh
+include/ATen/cuda/cub.h
+include/ATen/cuda/cub_definitions.cuh
+include/ATen/cuda/detail/CUDAHooks.h
+include/ATen/cuda/detail/DeviceThreadHandles.h
+include/ATen/cuda/detail/IndexUtils.cuh
+include/ATen/cuda/detail/IntegerDivider.cuh
+include/ATen/cuda/detail/KernelUtils.h
+include/ATen/cuda/detail/LazyNVRTC.h
+include/ATen/cuda/detail/OffsetCalculator.cuh
+include/ATen/cuda/detail/PhiloxCudaStateRaw.cuh
+include/ATen/cuda/detail/TensorInfo.cuh
+include/ATen/cuda/detail/UnpackRaw.cuh
+include/ATen/cuda/jiterator.h
+include/ATen/cuda/jiterator_impl.h
+include/ATen/cuda/llvm_jit_strings.h
+include/ATen/cudnn/Descriptors.h
+include/ATen/cudnn/Exceptions.h
+include/ATen/cudnn/Handle.h
+include/ATen/cudnn/Handles.h
+include/ATen/cudnn/Types.h
+include/ATen/cudnn/Utils.h
+include/ATen/cudnn/cudnn-wrapper.h
+include/ATen/detail/CUDAHooksInterface.h
+include/ATen/detail/FunctionTraits.h
+include/ATen/detail/HIPHooksInterface.h
+include/ATen/detail/ORTHooksInterface.h
+include/ATen/div_rtn.h
+include/ATen/dlpack.h
+include/ATen/functorch/ADInterpreters.h
+include/ATen/functorch/BatchRulesHelper.h
+include/ATen/functorch/BatchedFallback.h
+include/ATen/functorch/BatchedTensorImpl.h
+include/ATen/functorch/BatchingMetaprogramming.h
+include/ATen/functorch/DynamicLayer.h
+include/ATen/functorch/FunctionalizeInterpreter.h
+include/ATen/functorch/Interpreter.h
+include/ATen/functorch/LegacyVmapTransforms.h
+include/ATen/functorch/Macros.h
+include/ATen/functorch/PlumbingHelper.h
+include/ATen/functorch/TensorWrapper.h
+include/ATen/functorch/VmapInterpreter.h
+include/ATen/hip/impl/HIPAllocatorMasqueradingAsCUDA.h
+include/ATen/hip/impl/HIPCachingAllocatorMasqueradingAsCUDA.h
+include/ATen/hip/impl/HIPGuardImplMasqueradingAsCUDA.h
+include/ATen/hip/impl/HIPStreamMasqueradingAsCUDA.h
+include/ATen/jit_macros.h
+include/ATen/jiterator_macros.h
+include/ATen/metal/Context.h
+include/ATen/miopen/Descriptors.h
+include/ATen/miopen/Exceptions.h
+include/ATen/miopen/Handle.h
+include/ATen/miopen/Types.h
+include/ATen/miopen/Utils.h
+include/ATen/miopen/miopen-wrapper.h
+include/ATen/native/Activation.h
+include/ATen/native/AdaptivePooling.h
+include/ATen/native/BatchLinearAlgebra.h
+include/ATen/native/BinaryOps.h
+include/ATen/native/BucketizationUtils.h
+include/ATen/native/CPUBlas.h
+include/ATen/native/CPUFallback.h
+include/ATen/native/CanUse32BitIndexMath.h
+include/ATen/native/ComplexHelper.h
+include/ATen/native/CompositeRandomAccessor.h
+include/ATen/native/CompositeRandomAccessorCommon.h
+include/ATen/native/ConvUtils.h
+include/ATen/native/ConvolutionMM3d.h
+include/ATen/native/Copy.h
+include/ATen/native/Cross.h
+include/ATen/native/DilatedConvolutionUtils.h
+include/ATen/native/DispatchStub.h
+include/ATen/native/Distance.h
+include/ATen/native/DistributionTemplates.h
+include/ATen/native/Distributions.h
+include/ATen/native/EmbeddingBag.h
+include/ATen/native/Fill.h
+include/ATen/native/ForeachUtils.h
+include/ATen/native/FunctionOfAMatrixUtils.h
+include/ATen/native/GridSampler.h
+include/ATen/native/GridSamplerUtils.h
+include/ATen/native/Histogram.h
+include/ATen/native/IndexKernel.h
+include/ATen/native/IndexingUtils.h
+include/ATen/native/Lerp.h
+include/ATen/native/LinearAlgebra.h
+include/ATen/native/LinearAlgebraUtils.h
+include/ATen/native/LossMulti.h
+include/ATen/native/Math.h
+include/ATen/native/MathBitFallThroughLists.h
+include/ATen/native/MathBitsFallback.h
+include/ATen/native/MaxPooling.h
+include/ATen/native/NonEmptyUtils.h
+include/ATen/native/NonSymbolicBC.h
+include/ATen/native/Normalization.h
+include/ATen/native/PointwiseOps.h
+include/ATen/native/Pool.h
+include/ATen/native/Pow.h
+include/ATen/native/RNN.h
+include/ATen/native/RangeFactories.h
+include/ATen/native/ReduceAllOps.h
+include/ATen/native/ReduceOps.h
+include/ATen/native/ReduceOpsUtils.h
+include/ATen/native/Repeat.h
+include/ATen/native/Resize.h
+include/ATen/native/ResizeCommon.h
+include/ATen/native/ScatterGatherChecks.h
+include/ATen/native/SegmentReduce.h
+include/ATen/native/SharedReduceOps.h
+include/ATen/native/SobolEngineOpsUtils.h
+include/ATen/native/Sorting.h
+include/ATen/native/SortingUtils.h
+include/ATen/native/SpectralOpsUtils.h
+include/ATen/native/StridedRandomAccessor.h
+include/ATen/native/TensorAdvancedIndexing.h
+include/ATen/native/TensorAdvancedIndexingUtils.h
+include/ATen/native/TensorCompare.h
+include/ATen/native/TensorConversions.h
+include/ATen/native/TensorDimApply.h
+include/ATen/native/TensorFactories.h
+include/ATen/native/TensorIterator.h
+include/ATen/native/TensorIteratorDynamicCasting.h
+include/ATen/native/TensorProperties.h
+include/ATen/native/TensorShape.h
+include/ATen/native/TensorTransformations.h
+include/ATen/native/TopKImpl.h
+include/ATen/native/TransposeType.h
+include/ATen/native/TriangularOpsUtils.h
+include/ATen/native/TypeProperties.h
+include/ATen/native/UnaryOps.h
+include/ATen/native/Unfold2d.h
+include/ATen/native/Unfold3d.h
+include/ATen/native/UnfoldBackward.h
+include/ATen/native/UpSample.h
+include/ATen/native/ao_sparse/quantized/cpu/fbgemm_utils.h
+include/ATen/native/ao_sparse/quantized/cpu/packed_params.h
+include/ATen/native/ao_sparse/quantized/cpu/qnnpack_utils.h
+include/ATen/native/batch_norm.h
+include/ATen/native/cpu/AtomicAddFloat.h
+include/ATen/native/cpu/CatKernel.h
+include/ATen/native/cpu/ChannelShuffleKernel.h
+include/ATen/native/cpu/CopyKernel.h
+include/ATen/native/cpu/DepthwiseConvKernel.h
+include/ATen/native/cpu/DistributionTemplates.h
+include/ATen/native/cpu/GridSamplerKernel.h
+include/ATen/native/cpu/IndexKernelUtils.h
+include/ATen/native/cpu/Intrinsics.h
+include/ATen/native/cpu/IsContiguous.h
+include/ATen/native/cpu/Loops.h
+include/ATen/native/cpu/MaxUnpoolKernel.h
+include/ATen/native/cpu/PixelShuffleKernel.h
+include/ATen/native/cpu/Reduce.h
+include/ATen/native/cpu/SerialStackImpl.h
+include/ATen/native/cpu/SoftmaxKernel.h
+include/ATen/native/cpu/StackKernel.h
+include/ATen/native/cpu/WeightNormKernel.h
+include/ATen/native/cpu/avx_mathfun.h
+include/ATen/native/cpu/mixed_data_type.h
+include/ATen/native/cpu/moments_utils.h
+include/ATen/native/cpu/utils.h
+include/ATen/native/cpu/zmath.h
+include/ATen/native/cuda/Activation.h
+include/ATen/native/cuda/BinaryInternal.h
+include/ATen/native/cuda/CUDAJitLoops.cuh
+include/ATen/native/cuda/CUDALoops.cuh
+include/ATen/native/cuda/CompositeRandomAccessor.h
+include/ATen/native/cuda/Copy.h
+include/ATen/native/cuda/CuFFTPlanCache.h
+include/ATen/native/cuda/CuFFTUtils.h
+include/ATen/native/cuda/DeviceSqrt.cuh
+include/ATen/native/cuda/DistributionTemplates.h
+include/ATen/native/cuda/Distributions.h
+include/ATen/native/cuda/EmbeddingBackwardKernel.cuh
+include/ATen/native/cuda/ForeachFunctors.cuh
+include/ATen/native/cuda/GridSampler.cuh
+include/ATen/native/cuda/GridSampler.h
+include/ATen/native/cuda/IndexKernel.h
+include/ATen/native/cuda/JitLoops.cuh
+include/ATen/native/cuda/KernelUtils.cuh
+include/ATen/native/cuda/LaunchUtils.h
+include/ATen/native/cuda/Loops.cuh
+include/ATen/native/cuda/Math.cuh
+include/ATen/native/cuda/MemoryAccess.cuh
+include/ATen/native/cuda/MiscUtils.h
+include/ATen/native/cuda/MultiTensorApply.cuh
+include/ATen/native/cuda/Normalization.cuh
+include/ATen/native/cuda/PersistentSoftmax.cuh
+include/ATen/native/cuda/Pow.cuh
+include/ATen/native/cuda/ROCmLoops.cuh
+include/ATen/native/cuda/Randperm.cuh
+include/ATen/native/cuda/Reduce.cuh
+include/ATen/native/cuda/ReduceOps.h
+include/ATen/native/cuda/Resize.h
+include/ATen/native/cuda/ScanKernels.h
+include/ATen/native/cuda/ScanUtils.cuh
+include/ATen/native/cuda/Sort.h
+include/ATen/native/cuda/SortStable.h
+include/ATen/native/cuda/SortUtils.cuh
+include/ATen/native/cuda/Sorting.h
+include/ATen/native/cuda/SortingCommon.cuh
+include/ATen/native/cuda/SortingRadixSelect.cuh
+include/ATen/native/cuda/TensorModeKernel.cuh
+include/ATen/native/cuda/TensorModeKernel.h
+include/ATen/native/cuda/TensorTopK.h
+include/ATen/native/cuda/UniqueCub.cuh
+include/ATen/native/cuda/UpSample.cuh
+include/ATen/native/cuda/block_reduce.cuh
+include/ATen/native/cuda/fused_adam_amsgrad_impl.cuh
+include/ATen/native/cuda/fused_adam_impl.cuh
+include/ATen/native/cuda/fused_adam_utils.cuh
+include/ATen/native/cuda/im2col.cuh
+include/ATen/native/cuda/jit_utils.h
+include/ATen/native/cuda/reduction_template.cuh
+include/ATen/native/cuda/thread_constants.h
+include/ATen/native/cuda/vol2col.cuh
+include/ATen/native/group_norm.h
+include/ATen/native/im2col.h
+include/ATen/native/im2col_shape_check.h
+include/ATen/native/layer_norm.h
+include/ATen/native/quantized/AffineQuantizer.h
+include/ATen/native/quantized/AffineQuantizerBase.h
+include/ATen/native/quantized/Copy.h
+include/ATen/native/quantized/FakeQuantAffine.h
+include/ATen/native/quantized/IndexKernel.h
+include/ATen/native/quantized/PackedParams.h
+include/ATen/native/quantized/cpu/BinaryOps.h
+include/ATen/native/quantized/cpu/EmbeddingPackedParams.h
+include/ATen/native/quantized/cpu/OnednnUtils.h
+include/ATen/native/quantized/cpu/QnnpackUtils.h
+include/ATen/native/quantized/cpu/QuantUtils.h
+include/ATen/native/quantized/cpu/QuantizedOps.h
+include/ATen/native/quantized/cpu/RuyUtils.h
+include/ATen/native/quantized/cpu/XnnpackUtils.h
+include/ATen/native/quantized/cpu/conv_serialization.h
+include/ATen/native/quantized/cpu/fbgemm_utils.h
+include/ATen/native/quantized/cpu/init_qnnpack.h
+include/ATen/native/quantized/cpu/qembeddingbag.h
+include/ATen/native/quantized/cpu/qembeddingbag_prepack.h
+include/ATen/native/quantized/cudnn/utils.h
+include/ATen/native/verbose_wrapper.h
+include/ATen/native/vol2col.h
+include/ATen/ops/_adaptive_avg_pool2d.h
+include/ATen/ops/_adaptive_avg_pool2d_backward.h
+include/ATen/ops/_adaptive_avg_pool2d_backward_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_backward_cpu_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_backward_cuda_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_backward_native.h
+include/ATen/ops/_adaptive_avg_pool2d_backward_ops.h
+include/ATen/ops/_adaptive_avg_pool2d_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_cpu_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_cuda_dispatch.h
+include/ATen/ops/_adaptive_avg_pool2d_native.h
+include/ATen/ops/_adaptive_avg_pool2d_ops.h
+include/ATen/ops/_adaptive_avg_pool3d.h
+include/ATen/ops/_adaptive_avg_pool3d_backward.h
+include/ATen/ops/_adaptive_avg_pool3d_backward_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_backward_cpu_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_backward_cuda_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_backward_native.h
+include/ATen/ops/_adaptive_avg_pool3d_backward_ops.h
+include/ATen/ops/_adaptive_avg_pool3d_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_cpu_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_cuda_dispatch.h
+include/ATen/ops/_adaptive_avg_pool3d_native.h
+include/ATen/ops/_adaptive_avg_pool3d_ops.h
+include/ATen/ops/_add_batch_dim.h
+include/ATen/ops/_add_batch_dim_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_add_batch_dim_native.h
+include/ATen/ops/_add_batch_dim_ops.h
+include/ATen/ops/_add_relu.h
+include/ATen/ops/_add_relu_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_add_relu_cpu_dispatch.h
+include/ATen/ops/_add_relu_meta_dispatch.h
+include/ATen/ops/_add_relu_native.h
+include/ATen/ops/_add_relu_ops.h
+include/ATen/ops/_addmm_activation.h
+include/ATen/ops/_addmm_activation_compositeexplicitautogradnonfunctional_dispatch.h
+include/ATen/ops/_addmm_activation_cpu_dispatch.h
+include/ATen/ops/_addmm_activation_cuda_dispatch.h
+include/ATen/ops/_addmm_activation_meta.h
+include/ATen/ops/_addmm_activation_meta_dispatch.h
+include/ATen/ops/_addmm_activation_native.h
+include/ATen/ops/_addmm_activation_ops.h
+include/ATen/ops/_aminmax.h
+include/ATen/ops/_aminmax_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_aminmax_cpu_dispatch.h
+include/ATen/ops/_aminmax_cuda_dispatch.h
+include/ATen/ops/_aminmax_native.h
+include/ATen/ops/_aminmax_ops.h
+include/ATen/ops/_amp_foreach_non_finite_check_and_unscale.h
+include/ATen/ops/_amp_foreach_non_finite_check_and_unscale_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_amp_foreach_non_finite_check_and_unscale_cuda_dispatch.h
+include/ATen/ops/_amp_foreach_non_finite_check_and_unscale_native.h
+include/ATen/ops/_amp_foreach_non_finite_check_and_unscale_ops.h
+include/ATen/ops/_amp_update_scale.h
+include/ATen/ops/_amp_update_scale_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_amp_update_scale_cuda_dispatch.h
+include/ATen/ops/_amp_update_scale_meta_dispatch.h
+include/ATen/ops/_amp_update_scale_native.h
+include/ATen/ops/_amp_update_scale_ops.h
+include/ATen/ops/_assert_async.h
+include/ATen/ops/_assert_async_cpu_dispatch.h
+include/ATen/ops/_assert_async_cuda_dispatch.h
+include/ATen/ops/_assert_async_native.h
+include/ATen/ops/_assert_async_ops.h
+include/ATen/ops/_assert_tensor_metadata.h
+include/ATen/ops/_assert_tensor_metadata_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_assert_tensor_metadata_native.h
+include/ATen/ops/_assert_tensor_metadata_ops.h
+include/ATen/ops/_autocast_to_full_precision.h
+include/ATen/ops/_autocast_to_full_precision_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_autocast_to_full_precision_native.h
+include/ATen/ops/_autocast_to_full_precision_ops.h
+include/ATen/ops/_autocast_to_reduced_precision.h
+include/ATen/ops/_autocast_to_reduced_precision_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_autocast_to_reduced_precision_native.h
+include/ATen/ops/_autocast_to_reduced_precision_ops.h
+include/ATen/ops/_backward.h
+include/ATen/ops/_backward_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_backward_native.h
+include/ATen/ops/_backward_ops.h
+include/ATen/ops/_batch_norm_impl_index.h
+include/ATen/ops/_batch_norm_impl_index_backward.h
+include/ATen/ops/_batch_norm_impl_index_backward_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_batch_norm_impl_index_backward_native.h
+include/ATen/ops/_batch_norm_impl_index_backward_ops.h
+include/ATen/ops/_batch_norm_impl_index_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_batch_norm_impl_index_native.h
+include/ATen/ops/_batch_norm_impl_index_ops.h
+include/ATen/ops/_cast_Byte.h
+include/ATen/ops/_cast_Byte_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Byte_native.h
+include/ATen/ops/_cast_Byte_ops.h
+include/ATen/ops/_cast_Char.h
+include/ATen/ops/_cast_Char_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Char_native.h
+include/ATen/ops/_cast_Char_ops.h
+include/ATen/ops/_cast_Double.h
+include/ATen/ops/_cast_Double_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Double_native.h
+include/ATen/ops/_cast_Double_ops.h
+include/ATen/ops/_cast_Float.h
+include/ATen/ops/_cast_Float_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Float_native.h
+include/ATen/ops/_cast_Float_ops.h
+include/ATen/ops/_cast_Half.h
+include/ATen/ops/_cast_Half_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Half_native.h
+include/ATen/ops/_cast_Half_ops.h
+include/ATen/ops/_cast_Int.h
+include/ATen/ops/_cast_Int_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Int_native.h
+include/ATen/ops/_cast_Int_ops.h
+include/ATen/ops/_cast_Long.h
+include/ATen/ops/_cast_Long_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Long_native.h
+include/ATen/ops/_cast_Long_ops.h
+include/ATen/ops/_cast_Short.h
+include/ATen/ops/_cast_Short_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_cast_Short_native.h
+include/ATen/ops/_cast_Short_ops.h
+include/ATen/ops/_cdist_backward.h
+include/ATen/ops/_cdist_backward_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_cdist_backward_cpu_dispatch.h
+include/ATen/ops/_cdist_backward_cuda_dispatch.h
+include/ATen/ops/_cdist_backward_native.h
+include/ATen/ops/_cdist_backward_ops.h
+include/ATen/ops/_cdist_forward.h
+include/ATen/ops/_cdist_forward_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_cdist_forward_cpu_dispatch.h
+include/ATen/ops/_cdist_forward_cuda_dispatch.h
+include/ATen/ops/_cdist_forward_native.h
+include/ATen/ops/_cdist_forward_ops.h
+include/ATen/ops/_cholesky_solve_helper.h
+include/ATen/ops/_cholesky_solve_helper_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_cholesky_solve_helper_cpu_dispatch.h
+include/ATen/ops/_cholesky_solve_helper_cuda_dispatch.h
+include/ATen/ops/_cholesky_solve_helper_native.h
+include/ATen/ops/_cholesky_solve_helper_ops.h
+include/ATen/ops/_choose_qparams_per_tensor.h
+include/ATen/ops/_choose_qparams_per_tensor_compositeimplicitautograd_dispatch.h
+include/ATen/ops/_choose_qparams_per_tensor_native.h
+include/ATen/ops/_choose_qparams_per_tensor_ops.h
+include/ATen/ops/_coalesce.h
+include/ATen/ops/_coalesce_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_coalesce_native.h
+include/ATen/ops/_coalesce_ops.h
+include/ATen/ops/_coalesced.h
+include/ATen/ops/_coalesced_compositeexplicitautograd_dispatch.h
+include/ATen/ops/_coalesced_meta_dispatch.h
+include/ATen/ops/_coalesced_native.h
+include/ATen/ops/_coalesced_ops.h
+include/ATen/ops/_compute_linear_combination.h
+include/ATen/ops/_compute_linear_combination_cpu_dispatch.h
+include/ATen/ops/_compute_linear_combination_cuda_dispatch.h
+include/ATen/ops/_compute_linear_combination_native.h
*** 8299 LINES SKIPPED ***