git: dbe851cc291b - main - misc/pytorch: Update to 2.1.0
- Go to: [ bottom of page ] [ top of archives ] [ this month ]
Date: Mon, 27 Nov 2023 10:45:03 UTC
The branch main has been updated by sunpoet: URL: https://cgit.FreeBSD.org/ports/commit/?id=dbe851cc291bde43def88e727615619c64c2117c commit dbe851cc291bde43def88e727615619c64c2117c Author: Po-Chuan Hsieh <sunpoet@FreeBSD.org> AuthorDate: 2023-11-27 10:09:26 +0000 Commit: Po-Chuan Hsieh <sunpoet@FreeBSD.org> CommitDate: 2023-11-27 10:30:09 +0000 misc/pytorch: Update to 2.1.0 - Add LICENSE_FILE - Remove PYTHON_EXECUTABLE which is set by USES=python now - Comment BROKEN_* temporarily to see if the new version builds Changes: https://github.com/pytorch/pytorch/releases PR: 274859 Approved by: maintainer (timeout, 25 days) --- misc/pytorch/Makefile | 19 +- misc/pytorch/distinfo | 6 +- .../files/patch-aten_src_ATen_native_SoftMax.cpp | 11 - ...native_sparse_ValidateCompressedIndicesCommon.h | 82 ++- ...aten_src_ATen_native_transformers_attention.cpp | 11 - misc/pytorch/files/patch-cmake_Dependencies.cmake | 17 +- .../patch-third__party_cpuinfo_CMakeLists.txt | 53 +- ...hird__party_kineto_libkineto_src_ThreadUtil.cpp | 4 +- misc/pytorch/pkg-plist | 784 ++++++++++++++------- 9 files changed, 637 insertions(+), 350 deletions(-) diff --git a/misc/pytorch/Makefile b/misc/pytorch/Makefile index fef8cca67935..841af8cd1dbd 100644 --- a/misc/pytorch/Makefile +++ b/misc/pytorch/Makefile @@ -1,9 +1,8 @@ PORTNAME= pytorch DISTVERSIONPREFIX= v -DISTVERSION= 1.13.1 -PORTREVISION= 1 +DISTVERSION= 2.1.0 CATEGORIES= misc # machine-learning -MASTER_SITES= https://github.com/pytorch/pytorch/releases/download/v1.13.1/ +MASTER_SITES= https://github.com/pytorch/pytorch/releases/download/v${DISTVERSION}/ DIST_SUBDIR= ${PORTNAME} MAINTAINER= yuri@FreeBSD.org @@ -11,21 +10,22 @@ COMMENT= Tensors and dynamic neural networks in Python (C++ library) WWW= https://pytorch.org/ LICENSE= BSD3CLAUSE +LICENSE_FILE= ${WRKSRC}/LICENSE -BROKEN_aarch64= configure fails: CMake Error at third_party/XNNPACK/CMakeLists.txt:94 (MESSAGE): Unrecognized CMAKE_SYSTEM_NAME = FreeBSD -BROKEN_i386= compilation fails: error: use of undeclared identifier 'AVX2' -BROKEN_FreeBSD_14= fails to compile calling a private constructor of class +#BROKEN_aarch64= configure fails: CMake Error at third_party/XNNPACK/CMakeLists.txt:94 (MESSAGE): Unrecognized CMAKE_SYSTEM_NAME = FreeBSD +#BROKEN_i386= compilation fails: error: use of undeclared identifier 'AVX2' +#BROKEN_FreeBSD_14= fails to compile calling a private constructor of class BUILD_DEPENDS= gmake:devel/gmake \ ${LOCALBASE}/include/fxdiv.h:devel/fxdiv LIB_DEPENDS= libopenblas.so:math/openblas \ libmpi.so:net/openmpi \ - libpthreadpool.so:devel/pthreadpool \ libonnx.so:misc/onnx \ + libpthreadpool.so:devel/pthreadpool \ libprotobuf.so:devel/protobuf \ libsleef.so:math/sleef -USES= compiler:c++14-lang cmake localbase:ldflags python # requires python even with PYTHON=off +USES= compiler:c++17-lang cmake localbase:ldflags python # requires python even with PYTHON=off CMAKE_OFF= BUILD_CUSTOM_PROTOBUF USE_CUDA USE_ROCM USE_NNPACK USE_QNNPACK USE_PYTORCH_QNNPACK \ USE_FBGEMM # workaround recommended by the upstream here: https://github.com/pytorch/pytorch/issues/28337 @@ -33,8 +33,7 @@ CMAKE_ON= USE_SYSTEM_PYBIND11 \ USE_SYSTEM_SLEEF \ USE_SYSTEM_ONNX # see other USE_SYSTEM_xx in CMakeLists.txt CMAKE_ARGS= -DPSIMD_SOURCE_DIR=${WRKSRC}/third_party/psimd \ - -DFREEBSD_PYTHON_VER=${PYTHON_VER} \ - -DPYTHON_EXECUTABLE:STRING=${PYTHON_CMD} + -DFREEBSD_PYTHON_VER=${PYTHON_VER} MAKE_ENV= USE_NINJA=no # ninja breaks for some reason LDFLAGS+= -lexecinfo diff --git a/misc/pytorch/distinfo b/misc/pytorch/distinfo index 2b0b01afc7df..654de6ea7ac3 100644 --- a/misc/pytorch/distinfo +++ b/misc/pytorch/distinfo @@ -1,3 +1,3 @@ -TIMESTAMP = 1672353185 -SHA256 (pytorch/pytorch-v1.13.1.tar.gz) = dbc229ee9750b02b514937d017744443a269ea0241ed3f32b9af0703589d25d4 -SIZE (pytorch/pytorch-v1.13.1.tar.gz) = 234057741 +TIMESTAMP = 1697035721 +SHA256 (pytorch/pytorch-v2.1.0.tar.gz) = 631c71f7f7d6174952f35b5ed4a45ec115720a4ef3eb619678de5893af54f403 +SIZE (pytorch/pytorch-v2.1.0.tar.gz) = 283041980 diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp b/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp deleted file mode 100644 index 6f66aece26dc..000000000000 --- a/misc/pytorch/files/patch-aten_src_ATen_native_SoftMax.cpp +++ /dev/null @@ -1,11 +0,0 @@ ---- aten/src/ATen/native/SoftMax.cpp.orig 2022-12-29 23:05:30 UTC -+++ aten/src/ATen/native/SoftMax.cpp -@@ -132,7 +132,7 @@ void host_softmax( - const Tensor& input, - const int64_t dim, - bool* mask = nullptr, -- const c10::optional<int64_t> mask_type_ = NULL) { -+ const c10::optional<int64_t> mask_type_ = 0) { - - if (MaskedSoftMax) { - TORCH_CHECK(mask_type_.has_value(), "Mask Type should be defined"); diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h b/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h index 3eba700c307c..70dc6fbd61e2 100644 --- a/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h +++ b/misc/pytorch/files/patch-aten_src_ATen_native_sparse_ValidateCompressedIndicesCommon.h @@ -1,80 +1,78 @@ ---- aten/src/ATen/native/sparse/ValidateCompressedIndicesCommon.h.orig 2022-12-29 23:09:42 UTC +--- aten/src/ATen/native/sparse/ValidateCompressedIndicesCommon.h.orig 2023-05-07 08:51:40 UTC +++ aten/src/ATen/native/sparse/ValidateCompressedIndicesCommon.h -@@ -38,7 +38,7 @@ namespace { - // respectively. +@@ -39,7 +39,7 @@ namespace { + // use `cidx/idx` to refer to `compressed_indices/plain_indices` respectively. INVARIANT_CHECK_FUNC_API -_assert(const bool cond, const char* const message) { -+__assert__(const bool cond, const char* const message) { ++__assert(const bool cond, const char* const message) { #ifdef GPUCC CUDA_KERNEL_ASSERT(cond && message); #else -@@ -58,10 +58,10 @@ INVARIANT_CHECK_FUNC_API - _check_first_cidx_is_zero(const index_t& cidx, const index_t& zero) { +@@ -57,9 +57,9 @@ INVARIANT_CHECK_FUNC_API _check_first_cidx_is_zero( + const index_t& zero) { const bool invariant = cidx == zero; if (cdim_name == CDimName::CRow) { - _assert(invariant, "`crow_indices[..., 0] == 0` is not satisfied."); -+ __assert__(invariant, "`crow_indices[..., 0] == 0` is not satisfied."); - } - else { ++ __assert(invariant, "`crow_indices[..., 0] == 0` is not satisfied."); + } else { - _assert(invariant, "`ccol_indices[..., 0] == 0` is not satisfied."); -+ __assert__(invariant, "`ccol_indices[..., 0] == 0` is not satisfied."); ++ __assert(invariant, "`ccol_indices[..., 0] == 0` is not satisfied."); } } -@@ -72,10 +72,10 @@ INVARIANT_CHECK_FUNC_API - _check_last_cidx_is_nnz(const index_t& cidx, const index_t& nnz) { +@@ -71,9 +71,9 @@ INVARIANT_CHECK_FUNC_API _check_last_cidx_is_nnz( + const index_t& nnz) { const bool invariant = cidx == nnz; if (cdim_name == CDimName::CRow) { - _assert(invariant, "`crow_indices[..., -1] == nnz` is not satisfied."); -+ __assert__(invariant, "`crow_indices[..., -1] == nnz` is not satisfied."); - } - else { ++ __assert(invariant, "`crow_indices[..., -1] == nnz` is not satisfied."); + } else { - _assert(invariant, "`ccol_indices[..., -1] == nnz` is not satisfied."); -+ __assert__(invariant, "`ccol_indices[..., -1] == nnz` is not satisfied."); ++ __assert(invariant, "`ccol_indices[..., -1] == nnz` is not satisfied."); } } -@@ -91,11 +91,11 @@ _check_cidx_nondecreasing_locally_bounded_sequence( +@@ -88,11 +88,11 @@ INVARIANT_CHECK_FUNC_API _check_cidx_nondecreasing_loc const auto s_cidx = cidx_next - cidx; const bool invariant = zero <= s_cidx && s_cidx <= dim; if (cdim_name == CDimName::CRow) { -- _assert(invariant, -+ __assert__(invariant, +- _assert( ++ __assert( + invariant, "`0 <= crow_indices[..., 1:] - crow_indices[..., :-1] <= ncols` is not satisfied."); - } - else { -- _assert(invariant, -+ __assert__(invariant, + } else { +- _assert( ++ __assert( + invariant, "`0 <= ccol_indices[..., 1:] - ccol_indices[..., :-1] <= nrows` is not satisfied."); } - } -@@ -110,10 +110,10 @@ _check_idx_bounds( +@@ -107,9 +107,9 @@ INVARIANT_CHECK_FUNC_API _check_idx_bounds( const index_t& dim) { const bool invariant = zero <= idx && idx < dim; if (cdim_name == CDimName::CRow) { - _assert(invariant, "`0 <= col_indices < ncols` is not satisfied."); -+ __assert__(invariant, "`0 <= col_indices < ncols` is not satisfied."); - } - else { ++ __assert(invariant, "`0 <= col_indices < ncols` is not satisfied."); + } else { - _assert(invariant, "`0 <= row_indices < nrows` is not satisfied."); -+ __assert__(invariant, "`0 <= row_indices < nrows` is not satisfied."); ++ __assert(invariant, "`0 <= row_indices < nrows` is not satisfied."); } } -@@ -133,13 +133,13 @@ _check_idx_sorted_distinct_vals_slices_with_cidx( +@@ -128,14 +128,14 @@ INVARIANT_CHECK_FUNC_API _check_idx_sorted_distinct_va for (auto* RESTRICT curr = slice_begin + 1; curr < slice_end; ++curr) { const auto invariant = *(curr - 1) < *curr; if (cdim_name == CDimName::CRow) { -- _assert(invariant, "`col_indices[..., crow_indices[..., i - 1]:crow_indices[..., i]] " -+ __assert__(invariant, "`col_indices[..., crow_indices[..., i - 1]:crow_indices[..., i]] " - "for all i = 1, ..., nrows " - "are sorted and distinct along the last dimension values` " - "is not satisfied."); - } - else { -- _assert(invariant, "`row_indices[..., ccol_indices[..., i - 1]:ccol_indices[..., i]] " -+ __assert__(invariant, "`row_indices[..., ccol_indices[..., i - 1]:ccol_indices[..., i]] " - "for all i = 1, ..., ncols " - "are sorted and distinct along the last dimension values` " - "is not satisfied."); +- _assert( ++ __assert( + invariant, + "`col_indices[..., crow_indices[..., i - 1]:crow_indices[..., i]] " + "for all i = 1, ..., nrows " + "are sorted and distinct along the last dimension values` " + "is not satisfied."); + } else { +- _assert( ++ __assert( + invariant, + "`row_indices[..., ccol_indices[..., i - 1]:ccol_indices[..., i]] " + "for all i = 1, ..., ncols " diff --git a/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp b/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp deleted file mode 100644 index 0f3383d2260a..000000000000 --- a/misc/pytorch/files/patch-aten_src_ATen_native_transformers_attention.cpp +++ /dev/null @@ -1,11 +0,0 @@ ---- aten/src/ATen/native/transformers/attention.cpp.orig 2022-12-29 23:18:12 UTC -+++ aten/src/ATen/native/transformers/attention.cpp -@@ -118,7 +118,7 @@ Tensor masked_softmax( - Tensor& attn_scores, - c10::optional<Tensor> attn_mask, - const Tensor& query, -- c10::optional<int64_t> mask_type = NULL) { -+ c10::optional<int64_t> mask_type = 0) { - if (query.is_nested() && !attn_mask) { - return at::_nested_tensor_softmax_with_shape(attn_scores, query); - } diff --git a/misc/pytorch/files/patch-cmake_Dependencies.cmake b/misc/pytorch/files/patch-cmake_Dependencies.cmake index 165534d123bd..0b1436e51889 100644 --- a/misc/pytorch/files/patch-cmake_Dependencies.cmake +++ b/misc/pytorch/files/patch-cmake_Dependencies.cmake @@ -1,11 +1,8 @@ ---- cmake/Dependencies.cmake.orig 2022-12-16 00:23:46 UTC +--- cmake/Dependencies.cmake.orig 2023-05-08 19:58:16 UTC +++ cmake/Dependencies.cmake -@@ -339,7 +339,7 @@ if(USE_NNPACK OR USE_QNNPACK OR USE_PYTORCH_QNNPACK OR - set(DISABLE_NNPACK_AND_FAMILY ON) - endif() - else() -- if(NOT IOS AND NOT (CMAKE_SYSTEM_NAME MATCHES "^(Android|Linux|Darwin|Windows)$")) -+ if(NOT IOS AND NOT (CMAKE_SYSTEM_NAME MATCHES "^(Android|Linux|FreeBSD|Darwin|Windows)$")) - message(WARNING - "Target platform \"${CMAKE_SYSTEM_NAME}\" is not supported in {Q/X}NNPACK. " - "Supported platforms are Android, iOS, Linux, and macOS. " +@@ -1,3 +1,5 @@ ++set(CMAKE_CXX_STANDARD 17) ++ + # RPATH stuff + # see https://cmake.org/Wiki/CMake_RPATH_handling + if(APPLE) diff --git a/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt b/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt index 755ebd06f98a..059eaaedadcf 100644 --- a/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt +++ b/misc/pytorch/files/patch-third__party_cpuinfo_CMakeLists.txt @@ -1,11 +1,56 @@ ---- third_party/cpuinfo/CMakeLists.txt.orig 2022-12-16 00:23:47 UTC +--- third_party/cpuinfo/CMakeLists.txt.orig 2023-10-16 12:32:17 UTC +++ third_party/cpuinfo/CMakeLists.txt -@@ -77,7 +77,7 @@ IF(NOT CMAKE_SYSTEM_NAME) +@@ -77,7 +77,7 @@ IF(NOT CMAKE_SYSTEM_PROCESSOR) + "cpuinfo will compile, but cpuinfo_initialize() will always fail.") + SET(CPUINFO_SUPPORTED_PLATFORM FALSE) + ENDIF() +-ELSEIF(NOT CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|AMD64|x86(_64)?|armv[5-8].*|aarch64|arm64|ARM64)$") ++ELSEIF(NOT CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|amd64|x86(_64)?|armv[5-8].*|aarch64|arm64|ARM64)$") + MESSAGE(WARNING + "Target processor architecture \"${CPUINFO_TARGET_PROCESSOR}\" is not supported in cpuinfo. " + "cpuinfo will compile, but cpuinfo_initialize() will always fail.") +@@ -89,7 +89,7 @@ IF(NOT CMAKE_SYSTEM_NAME) "Target operating system is not specified. " "cpuinfo will compile, but cpuinfo_initialize() will always fail.") SET(CPUINFO_SUPPORTED_PLATFORM FALSE) --ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|CYGWIN|MSYS|Darwin|Linux|Android)$") -+ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|CYGWIN|MSYS|Darwin|Linux|FreeBSD|Android)$") +-ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|WindowsStore|CYGWIN|MSYS|Darwin|Linux|Android)$") ++ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Windows|WindowsStore|CYGWIN|MSYS|Darwin|Linux|FreeBSD|Android)$") IF(${CMAKE_VERSION} VERSION_GREATER_EQUAL "3.14" AND NOT CMAKE_SYSTEM_NAME STREQUAL "iOS") MESSAGE(WARNING "Target operating system \"${CMAKE_SYSTEM_NAME}\" is not supported in cpuinfo. " +@@ -135,7 +135,7 @@ IF(CPUINFO_SUPPORTED_PLATFORM) + src/cache.c) + + IF(CPUINFO_SUPPORTED_PLATFORM) +- IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten" AND (CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|AMD64|x86(_64)?)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")) ++ IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten" AND (CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|amd64|x86(_64)?)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")) + LIST(APPEND CPUINFO_SRCS + src/x86/init.c + src/x86/info.c +@@ -341,7 +341,7 @@ IF(CPUINFO_SUPPORTED_PLATFORM AND CPUINFO_BUILD_MOCK_T + # ---[ cpuinfo mock library and mock tests + IF(CPUINFO_SUPPORTED_PLATFORM AND CPUINFO_BUILD_MOCK_TESTS) + SET(CPUINFO_MOCK_SRCS "${CPUINFO_SRCS}") +- IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|AMD64|x86(_64)?)$") ++ IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|amd64|x86(_64)?)$") + LIST(APPEND CPUINFO_MOCK_SRCS src/x86/mockcpuid.c) + ENDIF() + IF(CMAKE_SYSTEM_NAME STREQUAL "Linux" OR CMAKE_SYSTEM_NAME STREQUAL "Android") +@@ -785,7 +785,7 @@ IF(CPUINFO_SUPPORTED_PLATFORM AND CPUINFO_BUILD_UNIT_T + ADD_TEST(NAME get-current-test COMMAND get-current-test) + ENDIF() + +- IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|AMD64|x86(_64)?)$") ++ IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|amd64|x86(_64)?)$") + ADD_EXECUTABLE(brand-string-test test/name/brand-string.cc) + CPUINFO_TARGET_ENABLE_CXX11(brand-string-test) + CPUINFO_TARGET_RUNTIME_LIBRARY(brand-string-test) +@@ -852,7 +852,7 @@ IF(CPUINFO_SUPPORTED_PLATFORM AND CPUINFO_BUILD_TOOLS) + CPUINFO_TARGET_RUNTIME_LIBRARY(cpuinfo-dump) + ENDIF() + +- IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|AMD64|x86(_64)?)$") ++ IF(CPUINFO_TARGET_PROCESSOR MATCHES "^(i[3-6]86|amd64|x86(_64)?)$") + ADD_EXECUTABLE(cpuid-dump tools/cpuid-dump.c) + CPUINFO_TARGET_ENABLE_C99(cpuid-dump) + CPUINFO_TARGET_RUNTIME_LIBRARY(cpuid-dump) diff --git a/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp b/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp index e6ec0eca3790..f014a26e4f20 100644 --- a/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp +++ b/misc/pytorch/files/patch-third__party_kineto_libkineto_src_ThreadUtil.cpp @@ -1,6 +1,6 @@ ---- third_party/kineto/libkineto/src/ThreadUtil.cpp.orig 2022-12-29 22:41:51 UTC +--- third_party/kineto/libkineto/src/ThreadUtil.cpp.orig 2023-04-03 19:46:02 UTC +++ third_party/kineto/libkineto/src/ThreadUtil.cpp -@@ -49,7 +49,7 @@ int32_t systemThreadId() { +@@ -57,7 +57,7 @@ int32_t systemThreadId() { #elif defined _MSC_VER _sysTid = (int32_t)GetCurrentThreadId(); #else diff --git a/misc/pytorch/pkg-plist b/misc/pytorch/pkg-plist index 95479410cab7..ea3ba93c4270 100644 --- a/misc/pytorch/pkg-plist +++ b/misc/pytorch/pkg-plist @@ -4,8 +4,6 @@ include/ATen/AccumulateType.h include/ATen/ArrayRef.h include/ATen/Backend.h include/ATen/Backtrace.h -include/ATen/BatchedFallback.h -include/ATen/BatchedTensorImpl.h include/ATen/CPUApplyUtils.h include/ATen/CPUFixedAllocator.h include/ATen/CPUFunctions.h @@ -13,6 +11,7 @@ include/ATen/CPUFunctions_inl.h include/ATen/CPUGeneratorImpl.h include/ATen/CUDAFunctions.h include/ATen/CUDAFunctions_inl.h +include/ATen/CachedTensorUtils.h include/ATen/CollapseDims.h include/ATen/CompositeExplicitAutogradFunctions.h include/ATen/CompositeExplicitAutogradFunctions_inl.h @@ -43,6 +42,10 @@ include/ATen/Generator.h include/ATen/InferSize.h include/ATen/InitialTensorOptions.h include/ATen/Layout.h +include/ATen/LegacyBatchedFallback.h +include/ATen/LegacyBatchedTensorImpl.h +include/ATen/LegacyVmapMode.h +include/ATen/LegacyVmapTransforms.h include/ATen/LinalgBackend.h include/ATen/MapAllocator.h include/ATen/MatrixRef.h @@ -79,8 +82,8 @@ include/ATen/SmallVector.h include/ATen/SparseCsrTensorImpl.h include/ATen/SparseCsrTensorUtils.h include/ATen/SparseTensorImpl.h -include/ATen/SparseTensorUtils.h include/ATen/Storage.h +include/ATen/StorageUtils.h include/ATen/Tensor.h include/ATen/TensorAccessor.h include/ATen/TensorGeometry.h @@ -93,14 +96,13 @@ include/ATen/TensorOperators.h include/ATen/TensorOptions.h include/ATen/TensorSubclassLikeUtils.h include/ATen/TensorUtils.h +include/ATen/ThreadLocalPythonObjects.h include/ATen/ThreadLocalState.h include/ATen/TracerMode.h include/ATen/TypeDefault.h include/ATen/Utils.h include/ATen/Version.h include/ATen/VmapGeneratedPlumbing.h -include/ATen/VmapMode.h -include/ATen/VmapTransforms.h include/ATen/WrapDimUtils.h include/ATen/WrapDimUtilsMulti.h include/ATen/autocast_mode.h @@ -122,6 +124,7 @@ include/ATen/core/Dimname.h include/ATen/core/DistributionsHelper.h include/ATen/core/Formatting.h include/ATen/core/Generator.h +include/ATen/core/GeneratorForPrivateuseone.h include/ATen/core/IListRef.h include/ATen/core/IListRef_inl.h include/ATen/core/LegacyTypeDispatch.h @@ -131,6 +134,7 @@ include/ATen/core/MT19937RNGEngine.h include/ATen/core/NamedTensor.h include/ATen/core/PhiloxRNGEngine.h include/ATen/core/PythonFallbackKernel.h +include/ATen/core/PythonOpRegistrationTrampoline.h include/ATen/core/QuantizerBase.h include/ATen/core/Range.h include/ATen/core/Reduction.h @@ -199,6 +203,7 @@ include/ATen/core/type_ptr.h include/ATen/core/typeid.h include/ATen/cpp_custom_type_hack.h include/ATen/cpu/FlushDenormal.h +include/ATen/cpu/Utils.h include/ATen/cpu/vec/functional.h include/ATen/cpu/vec/functional_base.h include/ATen/cpu/vec/functional_bfloat16.h @@ -215,6 +220,19 @@ include/ATen/cpu/vec/vec256/vec256_float.h include/ATen/cpu/vec/vec256/vec256_float_neon.h include/ATen/cpu/vec/vec256/vec256_int.h include/ATen/cpu/vec/vec256/vec256_qint.h +include/ATen/cpu/vec/vec256/vsx/vec256_bfloat16_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_common_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_complex_double_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_complex_float_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_double_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_float_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_int16_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_int32_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_int64_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_qint32_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_qint8_vsx.h +include/ATen/cpu/vec/vec256/vsx/vec256_quint8_vsx.h +include/ATen/cpu/vec/vec256/vsx/vsx_helpers.h include/ATen/cpu/vec/vec512/vec512.h include/ATen/cpu/vec/vec512/vec512_bfloat16.h include/ATen/cpu/vec/vec512/vec512_complex_double.h @@ -279,7 +297,11 @@ include/ATen/cudnn/cudnn-wrapper.h include/ATen/detail/CUDAHooksInterface.h include/ATen/detail/FunctionTraits.h include/ATen/detail/HIPHooksInterface.h +include/ATen/detail/MPSHooksInterface.h +include/ATen/detail/MTIAHooksInterface.h include/ATen/detail/ORTHooksInterface.h +include/ATen/detail/PrivateUse1HooksInterface.h +include/ATen/detail/XPUHooksInterface.h include/ATen/div_rtn.h include/ATen/dlpack.h include/ATen/functorch/ADInterpreters.h @@ -308,6 +330,17 @@ include/ATen/miopen/Handle.h include/ATen/miopen/Types.h include/ATen/miopen/Utils.h include/ATen/miopen/miopen-wrapper.h +include/ATen/mps/EmptyTensor.h +include/ATen/mps/IndexKernels.h +include/ATen/mps/MPSAllocator.h +include/ATen/mps/MPSAllocatorInterface.h +include/ATen/mps/MPSDevice.h +include/ATen/mps/MPSEvent.h +include/ATen/mps/MPSGeneratorImpl.h +include/ATen/mps/MPSGuardImpl.h +include/ATen/mps/MPSHooks.h +include/ATen/mps/MPSProfiler.h +include/ATen/mps/MPSStream.h include/ATen/native/Activation.h include/ATen/native/AdaptivePooling.h include/ATen/native/BatchLinearAlgebra.h @@ -331,6 +364,7 @@ include/ATen/native/Distributions.h include/ATen/native/EmbeddingBag.h include/ATen/native/Fill.h include/ATen/native/ForeachUtils.h +include/ATen/native/FractionalMaxPooling.h include/ATen/native/FunctionOfAMatrixUtils.h include/ATen/native/GridSampler.h include/ATen/native/GridSamplerUtils.h @@ -348,6 +382,7 @@ include/ATen/native/MaxPooling.h include/ATen/native/NonEmptyUtils.h include/ATen/native/NonSymbolicBC.h include/ATen/native/Normalization.h +include/ATen/native/Padding.h include/ATen/native/PointwiseOps.h include/ATen/native/Pool.h include/ATen/native/Pow.h @@ -356,6 +391,7 @@ include/ATen/native/RangeFactories.h include/ATen/native/ReduceAllOps.h include/ATen/native/ReduceOps.h include/ATen/native/ReduceOpsUtils.h +include/ATen/native/ReductionType.h include/ATen/native/Repeat.h include/ATen/native/Resize.h include/ATen/native/ResizeCommon.h @@ -365,6 +401,7 @@ include/ATen/native/SharedReduceOps.h include/ATen/native/SobolEngineOpsUtils.h include/ATen/native/Sorting.h include/ATen/native/SortingUtils.h +include/ATen/native/SparseTensorUtils.h include/ATen/native/SpectralOpsUtils.h include/ATen/native/StridedRandomAccessor.h include/ATen/native/TensorAdvancedIndexing.h @@ -401,13 +438,18 @@ include/ATen/native/cpu/GridSamplerKernel.h include/ATen/native/cpu/IndexKernelUtils.h include/ATen/native/cpu/Intrinsics.h include/ATen/native/cpu/IsContiguous.h +include/ATen/native/cpu/LogAddExp.h include/ATen/native/cpu/Loops.h include/ATen/native/cpu/MaxUnpoolKernel.h include/ATen/native/cpu/PixelShuffleKernel.h include/ATen/native/cpu/Reduce.h +include/ATen/native/cpu/ReduceUtils.h +include/ATen/native/cpu/SampledAddmmKernel.h include/ATen/native/cpu/SerialStackImpl.h include/ATen/native/cpu/SoftmaxKernel.h +include/ATen/native/cpu/SpmmReduceKernel.h include/ATen/native/cpu/StackKernel.h +include/ATen/native/cpu/UpSampleKernelAVXAntialias.h include/ATen/native/cpu/WeightNormKernel.h include/ATen/native/cpu/avx_mathfun.h include/ATen/native/cpu/mixed_data_type.h @@ -427,6 +469,7 @@ include/ATen/native/cuda/DistributionTemplates.h include/ATen/native/cuda/Distributions.h include/ATen/native/cuda/EmbeddingBackwardKernel.cuh include/ATen/native/cuda/ForeachFunctors.cuh +include/ATen/native/cuda/ForeachMinMaxFunctors.cuh include/ATen/native/cuda/GridSampler.cuh include/ATen/native/cuda/GridSampler.h include/ATen/native/cuda/IndexKernel.h @@ -463,6 +506,8 @@ include/ATen/native/cuda/block_reduce.cuh include/ATen/native/cuda/fused_adam_amsgrad_impl.cuh include/ATen/native/cuda/fused_adam_impl.cuh include/ATen/native/cuda/fused_adam_utils.cuh +include/ATen/native/cuda/fused_adamw_amsgrad_impl.cuh +include/ATen/native/cuda/fused_adamw_impl.cuh include/ATen/native/cuda/im2col.cuh include/ATen/native/cuda/jit_utils.h include/ATen/native/cuda/reduction_template.cuh @@ -472,8 +517,15 @@ include/ATen/native/group_norm.h include/ATen/native/im2col.h include/ATen/native/im2col_shape_check.h include/ATen/native/layer_norm.h +include/ATen/native/mps/Copy.h +include/ATen/native/mps/MPSGraphVenturaOps.h +include/ATen/native/mps/OperationUtils.h +include/ATen/native/mps/TensorFactory.h +include/ATen/native/mps/UnaryConstants.h +include/ATen/native/mps/operations/Indexing.h include/ATen/native/quantized/AffineQuantizer.h include/ATen/native/quantized/AffineQuantizerBase.h +include/ATen/native/quantized/ConvUtils.h include/ATen/native/quantized/Copy.h include/ATen/native/quantized/FakeQuantAffine.h include/ATen/native/quantized/IndexKernel.h @@ -492,6 +544,9 @@ include/ATen/native/quantized/cpu/init_qnnpack.h include/ATen/native/quantized/cpu/qembeddingbag.h include/ATen/native/quantized/cpu/qembeddingbag_prepack.h include/ATen/native/quantized/cudnn/utils.h +include/ATen/native/utils/Factory.h +include/ATen/native/utils/ParamUtils.h +include/ATen/native/utils/ParamsHash.h include/ATen/native/verbose_wrapper.h include/ATen/native/vol2col.h include/ATen/ops/_adaptive_avg_pool2d.h @@ -704,6 +759,14 @@ include/ATen/ops/_copy_from_and_resize_ops.h include/ATen/ops/_copy_from_compositeexplicitautograd_dispatch.h include/ATen/ops/_copy_from_native.h include/ATen/ops/_copy_from_ops.h +include/ATen/ops/_cslt_compress.h +include/ATen/ops/_cslt_compress_cuda_dispatch.h +include/ATen/ops/_cslt_compress_native.h +include/ATen/ops/_cslt_compress_ops.h +include/ATen/ops/_cslt_sparse_mm.h +include/ATen/ops/_cslt_sparse_mm_cuda_dispatch.h +include/ATen/ops/_cslt_sparse_mm_native.h +include/ATen/ops/_cslt_sparse_mm_ops.h include/ATen/ops/_ctc_loss.h include/ATen/ops/_ctc_loss_backward.h include/ATen/ops/_ctc_loss_backward_compositeexplicitautograd_dispatch.h @@ -787,10 +850,19 @@ include/ATen/ops/_dirichlet_grad_cpu_dispatch.h include/ATen/ops/_dirichlet_grad_cuda_dispatch.h include/ATen/ops/_dirichlet_grad_native.h include/ATen/ops/_dirichlet_grad_ops.h +include/ATen/ops/_efficient_attention_backward.h +include/ATen/ops/_efficient_attention_backward_cuda_dispatch.h +include/ATen/ops/_efficient_attention_backward_native.h +include/ATen/ops/_efficient_attention_backward_ops.h +include/ATen/ops/_efficient_attention_forward.h +include/ATen/ops/_efficient_attention_forward_cuda_dispatch.h +include/ATen/ops/_efficient_attention_forward_native.h +include/ATen/ops/_efficient_attention_forward_ops.h include/ATen/ops/_efficientzerotensor.h include/ATen/ops/_efficientzerotensor_compositeexplicitautograd_dispatch.h include/ATen/ops/_efficientzerotensor_cpu_dispatch.h include/ATen/ops/_efficientzerotensor_cuda_dispatch.h +include/ATen/ops/_efficientzerotensor_meta_dispatch.h include/ATen/ops/_efficientzerotensor_native.h include/ATen/ops/_efficientzerotensor_ops.h include/ATen/ops/_embedding_bag.h @@ -882,10 +954,19 @@ include/ATen/ops/_fft_r2c_cpu_dispatch.h include/ATen/ops/_fft_r2c_cuda_dispatch.h include/ATen/ops/_fft_r2c_native.h include/ATen/ops/_fft_r2c_ops.h -include/ATen/ops/_flash_scaled_dot_product_attention.h -include/ATen/ops/_flash_scaled_dot_product_attention_cuda_dispatch.h -include/ATen/ops/_flash_scaled_dot_product_attention_native.h -include/ATen/ops/_flash_scaled_dot_product_attention_ops.h +include/ATen/ops/_fill_mem_eff_dropout_mask.h +include/ATen/ops/_fill_mem_eff_dropout_mask_cuda_dispatch.h +include/ATen/ops/_fill_mem_eff_dropout_mask_meta_dispatch.h +include/ATen/ops/_fill_mem_eff_dropout_mask_native.h +include/ATen/ops/_fill_mem_eff_dropout_mask_ops.h +include/ATen/ops/_flash_attention_backward.h +include/ATen/ops/_flash_attention_backward_cuda_dispatch.h +include/ATen/ops/_flash_attention_backward_native.h +include/ATen/ops/_flash_attention_backward_ops.h +include/ATen/ops/_flash_attention_forward.h +include/ATen/ops/_flash_attention_forward_cuda_dispatch.h +include/ATen/ops/_flash_attention_forward_native.h +include/ATen/ops/_flash_attention_forward_ops.h include/ATen/ops/_foobar.h include/ATen/ops/_foobar_compositeexplicitautograd_dispatch.h include/ATen/ops/_foobar_cpu_dispatch.h @@ -939,6 +1020,24 @@ include/ATen/ops/_foreach_ceil_cpu_dispatch.h include/ATen/ops/_foreach_ceil_cuda_dispatch.h include/ATen/ops/_foreach_ceil_native.h include/ATen/ops/_foreach_ceil_ops.h +include/ATen/ops/_foreach_clamp_max.h +include/ATen/ops/_foreach_clamp_max_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_clamp_max_cpu_dispatch.h +include/ATen/ops/_foreach_clamp_max_cuda_dispatch.h +include/ATen/ops/_foreach_clamp_max_native.h +include/ATen/ops/_foreach_clamp_max_ops.h +include/ATen/ops/_foreach_clamp_min.h +include/ATen/ops/_foreach_clamp_min_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_clamp_min_cpu_dispatch.h +include/ATen/ops/_foreach_clamp_min_cuda_dispatch.h +include/ATen/ops/_foreach_clamp_min_native.h +include/ATen/ops/_foreach_clamp_min_ops.h +include/ATen/ops/_foreach_copy.h +include/ATen/ops/_foreach_copy_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_copy_cpu_dispatch.h +include/ATen/ops/_foreach_copy_cuda_dispatch.h +include/ATen/ops/_foreach_copy_native.h +include/ATen/ops/_foreach_copy_ops.h include/ATen/ops/_foreach_cos.h include/ATen/ops/_foreach_cos_compositeexplicitautograd_dispatch.h include/ATen/ops/_foreach_cos_cpu_dispatch.h @@ -993,6 +1092,12 @@ include/ATen/ops/_foreach_frac_cpu_dispatch.h include/ATen/ops/_foreach_frac_cuda_dispatch.h include/ATen/ops/_foreach_frac_native.h include/ATen/ops/_foreach_frac_ops.h +include/ATen/ops/_foreach_lerp.h +include/ATen/ops/_foreach_lerp_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_lerp_cpu_dispatch.h +include/ATen/ops/_foreach_lerp_cuda_dispatch.h +include/ATen/ops/_foreach_lerp_native.h +include/ATen/ops/_foreach_lerp_ops.h include/ATen/ops/_foreach_lgamma.h include/ATen/ops/_foreach_lgamma_compositeexplicitautograd_dispatch.h include/ATen/ops/_foreach_lgamma_cpu_dispatch.h @@ -1053,6 +1158,12 @@ include/ATen/ops/_foreach_norm_cpu_dispatch.h include/ATen/ops/_foreach_norm_cuda_dispatch.h include/ATen/ops/_foreach_norm_native.h include/ATen/ops/_foreach_norm_ops.h +include/ATen/ops/_foreach_pow.h +include/ATen/ops/_foreach_pow_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_pow_cpu_dispatch.h +include/ATen/ops/_foreach_pow_cuda_dispatch.h +include/ATen/ops/_foreach_pow_native.h +include/ATen/ops/_foreach_pow_ops.h include/ATen/ops/_foreach_reciprocal.h include/ATen/ops/_foreach_reciprocal_compositeexplicitautograd_dispatch.h include/ATen/ops/_foreach_reciprocal_cpu_dispatch.h @@ -1071,6 +1182,12 @@ include/ATen/ops/_foreach_sigmoid_cpu_dispatch.h include/ATen/ops/_foreach_sigmoid_cuda_dispatch.h include/ATen/ops/_foreach_sigmoid_native.h include/ATen/ops/_foreach_sigmoid_ops.h +include/ATen/ops/_foreach_sign.h +include/ATen/ops/_foreach_sign_compositeexplicitautograd_dispatch.h +include/ATen/ops/_foreach_sign_cpu_dispatch.h +include/ATen/ops/_foreach_sign_cuda_dispatch.h +include/ATen/ops/_foreach_sign_native.h +include/ATen/ops/_foreach_sign_ops.h include/ATen/ops/_foreach_sin.h include/ATen/ops/_foreach_sin_compositeexplicitautograd_dispatch.h include/ATen/ops/_foreach_sin_cpu_dispatch.h @@ -1119,11 +1236,28 @@ include/ATen/ops/_foreach_zero_cpu_dispatch.h include/ATen/ops/_foreach_zero_cuda_dispatch.h include/ATen/ops/_foreach_zero_native.h include/ATen/ops/_foreach_zero_ops.h +include/ATen/ops/_functional_assert_async.h +include/ATen/ops/_functional_assert_async_cpu_dispatch.h +include/ATen/ops/_functional_assert_async_native.h +include/ATen/ops/_functional_assert_async_ops.h +include/ATen/ops/_functional_sym_constrain_range.h +include/ATen/ops/_functional_sym_constrain_range_compositeexplicitautograd_dispatch.h +include/ATen/ops/_functional_sym_constrain_range_for_size.h +include/ATen/ops/_functional_sym_constrain_range_for_size_compositeexplicitautograd_dispatch.h +include/ATen/ops/_functional_sym_constrain_range_for_size_native.h +include/ATen/ops/_functional_sym_constrain_range_for_size_ops.h +include/ATen/ops/_functional_sym_constrain_range_native.h +include/ATen/ops/_functional_sym_constrain_range_ops.h include/ATen/ops/_fused_adam.h include/ATen/ops/_fused_adam_compositeexplicitautograd_dispatch.h include/ATen/ops/_fused_adam_cuda_dispatch.h include/ATen/ops/_fused_adam_native.h include/ATen/ops/_fused_adam_ops.h +include/ATen/ops/_fused_adamw.h +include/ATen/ops/_fused_adamw_compositeexplicitautograd_dispatch.h +include/ATen/ops/_fused_adamw_cuda_dispatch.h +include/ATen/ops/_fused_adamw_native.h +include/ATen/ops/_fused_adamw_ops.h include/ATen/ops/_fused_dropout.h include/ATen/ops/_fused_dropout_compositeexplicitautograd_dispatch.h include/ATen/ops/_fused_dropout_cuda_dispatch.h @@ -1135,6 +1269,12 @@ include/ATen/ops/_fused_moving_avg_obs_fq_helper_cpu_dispatch.h include/ATen/ops/_fused_moving_avg_obs_fq_helper_cuda_dispatch.h include/ATen/ops/_fused_moving_avg_obs_fq_helper_native.h include/ATen/ops/_fused_moving_avg_obs_fq_helper_ops.h +include/ATen/ops/_fused_sdp_choice.h +include/ATen/ops/_fused_sdp_choice_cpu_dispatch.h +include/ATen/ops/_fused_sdp_choice_cuda_dispatch.h +include/ATen/ops/_fused_sdp_choice_meta_dispatch.h +include/ATen/ops/_fused_sdp_choice_native.h +include/ATen/ops/_fused_sdp_choice_ops.h include/ATen/ops/_fw_primal.h include/ATen/ops/_fw_primal_compositeexplicitautograd_dispatch.h include/ATen/ops/_fw_primal_copy.h @@ -1194,6 +1334,18 @@ include/ATen/ops/_indices_copy_native.h include/ATen/ops/_indices_copy_ops.h include/ATen/ops/_indices_native.h include/ATen/ops/_indices_ops.h +include/ATen/ops/_int_mm.h +include/ATen/ops/_int_mm_cuda_dispatch.h +include/ATen/ops/_int_mm_native.h +include/ATen/ops/_int_mm_ops.h +include/ATen/ops/_is_all_true.h +include/ATen/ops/_is_all_true_compositeexplicitautograd_dispatch.h +include/ATen/ops/_is_all_true_native.h +include/ATen/ops/_is_all_true_ops.h +include/ATen/ops/_is_any_true.h +include/ATen/ops/_is_any_true_compositeexplicitautograd_dispatch.h +include/ATen/ops/_is_any_true_native.h +include/ATen/ops/_is_any_true_ops.h include/ATen/ops/_is_zerotensor.h include/ATen/ops/_is_zerotensor_compositeimplicitautograd_dispatch.h include/ATen/ops/_is_zerotensor_native.h @@ -1276,6 +1428,10 @@ include/ATen/ops/_lu_with_info.h include/ATen/ops/_lu_with_info_compositeimplicitautograd_dispatch.h include/ATen/ops/_lu_with_info_native.h include/ATen/ops/_lu_with_info_ops.h +include/ATen/ops/_make_dep_token.h +include/ATen/ops/_make_dep_token_cpu_dispatch.h +include/ATen/ops/_make_dep_token_native.h +include/ATen/ops/_make_dep_token_ops.h include/ATen/ops/_make_dual.h include/ATen/ops/_make_dual_compositeexplicitautograd_dispatch.h include/ATen/ops/_make_dual_copy.h @@ -1331,16 +1487,16 @@ include/ATen/ops/_mps_convolution_transpose.h include/ATen/ops/_mps_convolution_transpose_compositeexplicitautograd_dispatch.h include/ATen/ops/_mps_convolution_transpose_native.h include/ATen/ops/_mps_convolution_transpose_ops.h -include/ATen/ops/_mps_max_pool2d.h -include/ATen/ops/_mps_max_pool2d_compositeexplicitautograd_dispatch.h -include/ATen/ops/_mps_max_pool2d_native.h -include/ATen/ops/_mps_max_pool2d_ops.h -include/ATen/ops/_native_decoder_only_multi_head_attention.h -include/ATen/ops/_native_decoder_only_multi_head_attention_compositeexplicitautograd_dispatch.h -include/ATen/ops/_native_decoder_only_multi_head_attention_cpu_dispatch.h -include/ATen/ops/_native_decoder_only_multi_head_attention_cuda_dispatch.h -include/ATen/ops/_native_decoder_only_multi_head_attention_native.h -include/ATen/ops/_native_decoder_only_multi_head_attention_ops.h +include/ATen/ops/_native_batch_norm_legit.h +include/ATen/ops/_native_batch_norm_legit_compositeexplicitautograd_dispatch.h +include/ATen/ops/_native_batch_norm_legit_cpu_dispatch.h +include/ATen/ops/_native_batch_norm_legit_cuda_dispatch.h +include/ATen/ops/_native_batch_norm_legit_native.h +include/ATen/ops/_native_batch_norm_legit_no_training.h +include/ATen/ops/_native_batch_norm_legit_no_training_compositeexplicitautograd_dispatch.h +include/ATen/ops/_native_batch_norm_legit_no_training_native.h +include/ATen/ops/_native_batch_norm_legit_no_training_ops.h +include/ATen/ops/_native_batch_norm_legit_ops.h include/ATen/ops/_native_multi_head_attention.h include/ATen/ops/_native_multi_head_attention_compositeexplicitautograd_dispatch.h include/ATen/ops/_native_multi_head_attention_cpu_dispatch.h @@ -1387,13 +1543,6 @@ include/ATen/ops/_nested_tensor_from_tensor_list.h include/ATen/ops/_nested_tensor_from_tensor_list_compositeexplicitautograd_dispatch.h include/ATen/ops/_nested_tensor_from_tensor_list_native.h include/ATen/ops/_nested_tensor_from_tensor_list_ops.h -include/ATen/ops/_nested_tensor_layer_norm.h -include/ATen/ops/_nested_tensor_layer_norm_compositeexplicitautograd_dispatch.h -include/ATen/ops/_nested_tensor_layer_norm_native.h -include/ATen/ops/_nested_tensor_layer_norm_ops.h -include/ATen/ops/_nested_tensor_offsets.h -include/ATen/ops/_nested_tensor_offsets_native.h -include/ATen/ops/_nested_tensor_offsets_ops.h include/ATen/ops/_nested_tensor_size.h include/ATen/ops/_nested_tensor_size_compositeexplicitautograd_dispatch.h include/ATen/ops/_nested_tensor_size_native.h @@ -1401,6 +1550,10 @@ include/ATen/ops/_nested_tensor_size_ops.h include/ATen/ops/_nested_tensor_softmax_with_shape.h include/ATen/ops/_nested_tensor_softmax_with_shape_native.h include/ATen/ops/_nested_tensor_softmax_with_shape_ops.h +include/ATen/ops/_nested_tensor_storage_offsets.h +include/ATen/ops/_nested_tensor_storage_offsets_compositeexplicitautograd_dispatch.h +include/ATen/ops/_nested_tensor_storage_offsets_native.h +include/ATen/ops/_nested_tensor_storage_offsets_ops.h include/ATen/ops/_nested_tensor_strides.h include/ATen/ops/_nested_tensor_strides_compositeexplicitautograd_dispatch.h include/ATen/ops/_nested_tensor_strides_native.h @@ -1467,6 +1620,20 @@ include/ATen/ops/_pin_memory_compositeexplicitautograd_dispatch.h include/ATen/ops/_pin_memory_cuda_dispatch.h include/ATen/ops/_pin_memory_native.h include/ATen/ops/_pin_memory_ops.h +include/ATen/ops/_prelu_kernel.h +include/ATen/ops/_prelu_kernel_backward.h +include/ATen/ops/_prelu_kernel_backward_cpu_dispatch.h +include/ATen/ops/_prelu_kernel_backward_cuda_dispatch.h +include/ATen/ops/_prelu_kernel_backward_native.h +include/ATen/ops/_prelu_kernel_backward_ops.h +include/ATen/ops/_prelu_kernel_cpu_dispatch.h +include/ATen/ops/_prelu_kernel_cuda_dispatch.h +include/ATen/ops/_prelu_kernel_native.h +include/ATen/ops/_prelu_kernel_ops.h +include/ATen/ops/_propagate_xla_data.h +include/ATen/ops/_propagate_xla_data_compositeimplicitautograd_dispatch.h +include/ATen/ops/_propagate_xla_data_native.h +include/ATen/ops/_propagate_xla_data_ops.h include/ATen/ops/_remove_batch_dim.h include/ATen/ops/_remove_batch_dim_compositeimplicitautograd_dispatch.h include/ATen/ops/_remove_batch_dim_native.h @@ -1482,6 +1649,10 @@ include/ATen/ops/_reshape_alias_cuda_dispatch.h include/ATen/ops/_reshape_alias_meta_dispatch.h include/ATen/ops/_reshape_alias_native.h include/ATen/ops/_reshape_alias_ops.h +include/ATen/ops/_reshape_copy.h +include/ATen/ops/_reshape_copy_compositeexplicitautograd_dispatch.h +include/ATen/ops/_reshape_copy_native.h +include/ATen/ops/_reshape_copy_ops.h include/ATen/ops/_reshape_from_tensor.h include/ATen/ops/_reshape_from_tensor_compositeimplicitautograd_dispatch.h include/ATen/ops/_reshape_from_tensor_native.h @@ -1505,20 +1676,32 @@ include/ATen/ops/_saturate_weight_to_fp16.h include/ATen/ops/_saturate_weight_to_fp16_compositeimplicitautograd_dispatch.h include/ATen/ops/_saturate_weight_to_fp16_native.h include/ATen/ops/_saturate_weight_to_fp16_ops.h -include/ATen/ops/_scaled_dot_product_attention.h -include/ATen/ops/_scaled_dot_product_attention_compositeimplicitautograd_dispatch.h -include/ATen/ops/_scaled_dot_product_attention_forward.h -include/ATen/ops/_scaled_dot_product_attention_forward_cpu_dispatch.h -include/ATen/ops/_scaled_dot_product_attention_forward_cuda_dispatch.h -include/ATen/ops/_scaled_dot_product_attention_forward_meta_dispatch.h -include/ATen/ops/_scaled_dot_product_attention_forward_native.h -include/ATen/ops/_scaled_dot_product_attention_forward_ops.h include/ATen/ops/_scaled_dot_product_attention_math.h include/ATen/ops/_scaled_dot_product_attention_math_compositeimplicitautograd_dispatch.h include/ATen/ops/_scaled_dot_product_attention_math_native.h include/ATen/ops/_scaled_dot_product_attention_math_ops.h -include/ATen/ops/_scaled_dot_product_attention_native.h -include/ATen/ops/_scaled_dot_product_attention_ops.h +include/ATen/ops/_scaled_dot_product_efficient_attention.h +include/ATen/ops/_scaled_dot_product_efficient_attention_backward.h +include/ATen/ops/_scaled_dot_product_efficient_attention_backward_cuda_dispatch.h +include/ATen/ops/_scaled_dot_product_efficient_attention_backward_native.h +include/ATen/ops/_scaled_dot_product_efficient_attention_backward_ops.h +include/ATen/ops/_scaled_dot_product_efficient_attention_cuda_dispatch.h +include/ATen/ops/_scaled_dot_product_efficient_attention_native.h +include/ATen/ops/_scaled_dot_product_efficient_attention_ops.h +include/ATen/ops/_scaled_dot_product_flash_attention.h +include/ATen/ops/_scaled_dot_product_flash_attention_backward.h +include/ATen/ops/_scaled_dot_product_flash_attention_backward_cpu_dispatch.h +include/ATen/ops/_scaled_dot_product_flash_attention_backward_cuda_dispatch.h +include/ATen/ops/_scaled_dot_product_flash_attention_backward_native.h +include/ATen/ops/_scaled_dot_product_flash_attention_backward_ops.h +include/ATen/ops/_scaled_dot_product_flash_attention_cpu_dispatch.h +include/ATen/ops/_scaled_dot_product_flash_attention_cuda_dispatch.h +include/ATen/ops/_scaled_dot_product_flash_attention_native.h +include/ATen/ops/_scaled_dot_product_flash_attention_ops.h +include/ATen/ops/_scaled_mm.h +include/ATen/ops/_scaled_mm_cuda_dispatch.h +include/ATen/ops/_scaled_mm_native.h +include/ATen/ops/_scaled_mm_ops.h include/ATen/ops/_segment_reduce_backward.h include/ATen/ops/_segment_reduce_backward_compositeexplicitautograd_dispatch.h include/ATen/ops/_segment_reduce_backward_cpu_dispatch.h @@ -1635,14 +1818,24 @@ include/ATen/ops/_sparse_log_softmax_compositeexplicitautograd_dispatch.h include/ATen/ops/_sparse_log_softmax_compositeimplicitautograd_dispatch.h include/ATen/ops/_sparse_log_softmax_native.h include/ATen/ops/_sparse_log_softmax_ops.h -include/ATen/ops/_sparse_mask_helper.h -include/ATen/ops/_sparse_mask_helper_compositeexplicitautograd_dispatch.h -include/ATen/ops/_sparse_mask_helper_native.h -include/ATen/ops/_sparse_mask_helper_ops.h +include/ATen/ops/_sparse_mask_projection.h +include/ATen/ops/_sparse_mask_projection_compositeexplicitautograd_dispatch.h +include/ATen/ops/_sparse_mask_projection_native.h +include/ATen/ops/_sparse_mask_projection_ops.h include/ATen/ops/_sparse_mm.h include/ATen/ops/_sparse_mm_compositeimplicitautograd_dispatch.h include/ATen/ops/_sparse_mm_native.h include/ATen/ops/_sparse_mm_ops.h +include/ATen/ops/_sparse_mm_reduce_impl.h +include/ATen/ops/_sparse_mm_reduce_impl_backward.h +include/ATen/ops/_sparse_mm_reduce_impl_backward_native.h +include/ATen/ops/_sparse_mm_reduce_impl_backward_ops.h +include/ATen/ops/_sparse_mm_reduce_impl_native.h +include/ATen/ops/_sparse_mm_reduce_impl_ops.h +include/ATen/ops/_sparse_semi_structured_linear.h +include/ATen/ops/_sparse_semi_structured_linear_cuda_dispatch.h +include/ATen/ops/_sparse_semi_structured_linear_native.h +include/ATen/ops/_sparse_semi_structured_linear_ops.h include/ATen/ops/_sparse_softmax.h include/ATen/ops/_sparse_softmax_backward_data.h include/ATen/ops/_sparse_softmax_backward_data_compositeexplicitautograd_dispatch.h @@ -1687,12 +1880,6 @@ include/ATen/ops/_standard_gamma_grad_native.h include/ATen/ops/_standard_gamma_grad_ops.h include/ATen/ops/_standard_gamma_native.h include/ATen/ops/_standard_gamma_ops.h -include/ATen/ops/_symeig_helper.h -include/ATen/ops/_symeig_helper_compositeexplicitautograd_dispatch.h -include/ATen/ops/_symeig_helper_cpu_dispatch.h -include/ATen/ops/_symeig_helper_cuda_dispatch.h -include/ATen/ops/_symeig_helper_native.h -include/ATen/ops/_symeig_helper_ops.h include/ATen/ops/_test_ambiguous_defaults.h include/ATen/ops/_test_ambiguous_defaults_compositeimplicitautograd_dispatch.h include/ATen/ops/_test_ambiguous_defaults_native.h @@ -1711,6 +1898,15 @@ include/ATen/ops/_test_autograd_multiple_dispatch_view_copy_native.h include/ATen/ops/_test_autograd_multiple_dispatch_view_copy_ops.h include/ATen/ops/_test_autograd_multiple_dispatch_view_native.h include/ATen/ops/_test_autograd_multiple_dispatch_view_ops.h +include/ATen/ops/_test_check_tensor.h +include/ATen/ops/_test_check_tensor_compositeimplicitautograd_dispatch.h +include/ATen/ops/_test_check_tensor_native.h +include/ATen/ops/_test_check_tensor_ops.h +include/ATen/ops/_test_functorch_fallback.h +include/ATen/ops/_test_functorch_fallback_compositeexplicitautograd_dispatch.h +include/ATen/ops/_test_functorch_fallback_cpu_dispatch.h +include/ATen/ops/_test_functorch_fallback_native.h +include/ATen/ops/_test_functorch_fallback_ops.h include/ATen/ops/_test_optional_filled_intlist.h include/ATen/ops/_test_optional_filled_intlist_compositeexplicitautograd_dispatch.h include/ATen/ops/_test_optional_filled_intlist_cpu_dispatch.h @@ -1782,23 +1978,46 @@ include/ATen/ops/_to_dense.h include/ATen/ops/_to_dense_compositeexplicitautograd_dispatch.h include/ATen/ops/_to_dense_native.h include/ATen/ops/_to_dense_ops.h -include/ATen/ops/_torch_cuda_cu_linker_symbol_op.h -include/ATen/ops/_torch_cuda_cu_linker_symbol_op_compositeexplicitautograd_dispatch.h -include/ATen/ops/_torch_cuda_cu_linker_symbol_op_cuda_dispatch.h -include/ATen/ops/_torch_cuda_cu_linker_symbol_op_native.h -include/ATen/ops/_torch_cuda_cu_linker_symbol_op_ops.h +include/ATen/ops/_to_sparse.h +include/ATen/ops/_to_sparse_bsc.h +include/ATen/ops/_to_sparse_bsc_compositeexplicitautograd_dispatch.h +include/ATen/ops/_to_sparse_bsc_cpu_dispatch.h +include/ATen/ops/_to_sparse_bsc_cuda_dispatch.h +include/ATen/ops/_to_sparse_bsc_native.h +include/ATen/ops/_to_sparse_bsc_ops.h +include/ATen/ops/_to_sparse_bsr.h +include/ATen/ops/_to_sparse_bsr_compositeexplicitautograd_dispatch.h +include/ATen/ops/_to_sparse_bsr_cpu_dispatch.h +include/ATen/ops/_to_sparse_bsr_cuda_dispatch.h +include/ATen/ops/_to_sparse_bsr_native.h +include/ATen/ops/_to_sparse_bsr_ops.h +include/ATen/ops/_to_sparse_compositeexplicitautograd_dispatch.h +include/ATen/ops/_to_sparse_cpu_dispatch.h +include/ATen/ops/_to_sparse_csc.h *** 1237 LINES SKIPPED ***