Skip to content

Commit cc50515

Browse files
rwgk and kkraus14 authored
Support CUDA 13.3 (#2139)
* run_cybind_cython_gen 13.3.0 ../ctk-next (NO MANUAL CHANGES)
* run_cybind_native 13.3.0 ../ctk-next (NO MANUAL CHANGES)
* git apply --index /home/rgrossekunst/stash/squash_merge_into_public_main_preview_2026-05-26+0012_non_gen_transfer.patch (NO MANUAL CHANGES)
* Update ci/versions.yml: build with 13.3.0
* Guard NVLink 6 mapping for older bindings
* Add cuda-pathfinder 1.5.5 release notes
* Consolidate cuda-bindings 13.3.0 release notes
* Add CUDA Python 13.3.0 release notes
* Add 12.9.7 release notes
* Enable security scans on ctk-next
  Run Bandit and CodeQL on ctk-next pushes and grant the scanner jobs the read permissions needed to checkout private repository contents and inspect workflow runs.
* Xfail MCDM mempool OOM with older bindings
  Keep cuda-core tests using published older cuda-bindings wheels from failing when the shared mempool xfail helper is unavailable.

---------

Co-authored-by: Keith Kraus <keith.j.kraus@gmail.com>
1 parent 6959cb9 commit cc50515

67 files changed

Lines changed: 5178 additions & 621 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

.github/workflows/bandit.yml

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
1+
# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
22
#
33
# SPDX-License-Identifier: Apache-2.0
44

@@ -8,6 +8,7 @@ on:
88
push:
99
branches:
1010
- "pull-request/[0-9]+"
11+
- "ctk-next"
1112
- "main"
1213
concurrency:
1314
group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
@@ -17,6 +18,8 @@ jobs:
1718
analyze:
1819
runs-on: ubuntu-latest
1920
permissions:
21+
actions: read
22+
contents: read
2023
security-events: write
2124
steps:
2225
- name: Checkout

.github/workflows/codeql.yml

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
1+
# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
22
#
33
# SPDX-License-Identifier: Apache-2.0
44

@@ -8,6 +8,7 @@ on:
88
push:
99
branches:
1010
- "pull-request/[0-9]+"
11+
- "ctk-next"
1112
- "main"
1213
concurrency:
1314
group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
@@ -18,6 +19,8 @@ jobs:
1819
name: Analyze (${{ matrix.language }})
1920
runs-on: ubuntu-latest
2021
permissions:
22+
actions: read
23+
contents: read
2124
security-events: write
2225

2326
strategy:

ci/versions.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,6 +5,6 @@ backport_branch: "12.9.x" # keep in sync with target-branch in .github/dependab
55

66
cuda:
77
build:
8-
version: "13.2.1"
8+
version: "13.3.0"
99
prev_build:
1010
version: "12.9.1"

cuda_bindings/cuda/bindings/_bindings/cydriver.pxd.in

Lines changed: 71 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
# SPDX-FileCopyrightText: Copyright (c) 2021-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
22
# SPDX-License-Identifier: LicenseRef-NVIDIA-SOFTWARE-LICENSE
33

4-
# This code was automatically generated with version 13.2.0, generator version 0.3.1.dev1422+gf4812259e.d20260318. Do not modify it directly.
4+
# This code was automatically generated with version 13.3.0, generator version 0.3.1.dev1719+g565f73f4e. Do not modify it directly.
55
from cuda.bindings.cydriver cimport *
66

77
{{if 'cuGetErrorString' in found_functions}}
@@ -1024,6 +1024,66 @@ cdef CUresult _cuMulticastUnbind(CUmemGenericAllocationHandle mcHandle, CUdevice
10241024
cdef CUresult _cuMulticastGetGranularity(size_t* granularity, const CUmulticastObjectProp* prop, CUmulticastGranularity_flags option) except ?CUDA_ERROR_NOT_FOUND nogil
10251025
{{endif}}
10261026

1027+
{{if 'cuLogicalEndpointIdReserve' in found_functions}}
1028+
1029+
cdef CUresult _cuLogicalEndpointIdReserve(CUlogicalEndpointId* baseLeId, cuuint32_t count) except ?CUDA_ERROR_NOT_FOUND nogil
1030+
{{endif}}
1031+
1032+
{{if 'cuLogicalEndpointIdRelease' in found_functions}}
1033+
1034+
cdef CUresult _cuLogicalEndpointIdRelease(CUlogicalEndpointId baseLeId, cuuint32_t count) except ?CUDA_ERROR_NOT_FOUND nogil
1035+
{{endif}}
1036+
1037+
{{if 'cuLogicalEndpointCreate' in found_functions}}
1038+
1039+
cdef CUresult _cuLogicalEndpointCreate(CUlogicalEndpointId leId, const CUlogicalEndpointProp* prop) except ?CUDA_ERROR_NOT_FOUND nogil
1040+
{{endif}}
1041+
1042+
{{if 'cuLogicalEndpointAddDevice' in found_functions}}
1043+
1044+
cdef CUresult _cuLogicalEndpointAddDevice(CUlogicalEndpointId leId, CUdevice dev) except ?CUDA_ERROR_NOT_FOUND nogil
1045+
{{endif}}
1046+
1047+
{{if 'cuLogicalEndpointDestroy' in found_functions}}
1048+
1049+
cdef CUresult _cuLogicalEndpointDestroy(CUlogicalEndpointId leId) except ?CUDA_ERROR_NOT_FOUND nogil
1050+
{{endif}}
1051+
1052+
{{if 'cuLogicalEndpointBindAddr' in found_functions}}
1053+
1054+
cdef CUresult _cuLogicalEndpointBindAddr(CUlogicalEndpointId leId, CUdevice dev, cuuint64_t offset, void* ptr, cuuint64_t size, unsigned long long flags) except ?CUDA_ERROR_NOT_FOUND nogil
1055+
{{endif}}
1056+
1057+
{{if 'cuLogicalEndpointBindMem' in found_functions}}
1058+
1059+
cdef CUresult _cuLogicalEndpointBindMem(CUlogicalEndpointId leId, CUdevice dev, cuuint64_t offset, CUmemGenericAllocationHandle memHandle, cuuint64_t memOffset, cuuint64_t size, unsigned long long flags) except ?CUDA_ERROR_NOT_FOUND nogil
1060+
{{endif}}
1061+
1062+
{{if 'cuLogicalEndpointUnbind' in found_functions}}
1063+
1064+
cdef CUresult _cuLogicalEndpointUnbind(CUlogicalEndpointId leId, CUdevice dev, cuuint64_t offset, cuuint64_t size) except ?CUDA_ERROR_NOT_FOUND nogil
1065+
{{endif}}
1066+
1067+
{{if 'cuLogicalEndpointExport' in found_functions}}
1068+
1069+
cdef CUresult _cuLogicalEndpointExport(void* handle, CUlogicalEndpointId leId, CUlogicalEndpointIpcHandleType handleType) except ?CUDA_ERROR_NOT_FOUND nogil
1070+
{{endif}}
1071+
1072+
{{if 'cuLogicalEndpointImport' in found_functions}}
1073+
1074+
cdef CUresult _cuLogicalEndpointImport(CUlogicalEndpointId leId, const void* handle, CUlogicalEndpointIpcHandleType handleType) except ?CUDA_ERROR_NOT_FOUND nogil
1075+
{{endif}}
1076+
1077+
{{if 'cuLogicalEndpointGetLimits' in found_functions}}
1078+
1079+
cdef CUresult _cuLogicalEndpointGetLimits(cuuint64_t* bindAlignment, cuuint64_t* maxSize, const CUlogicalEndpointProp* prop) except ?CUDA_ERROR_NOT_FOUND nogil
1080+
{{endif}}
1081+
1082+
{{if 'cuLogicalEndpointQuery' in found_functions}}
1083+
1084+
cdef CUresult _cuLogicalEndpointQuery(CUlogicalEndpointId leId, cuuint32_t count, int* queryStatus) except ?CUDA_ERROR_NOT_FOUND nogil
1085+
{{endif}}
1086+
10271087
{{if 'cuPointerGetAttribute' in found_functions}}
10281088

10291089
cdef CUresult _cuPointerGetAttribute(void* data, CUpointer_attribute attribute, CUdeviceptr ptr) except ?CUDA_ERROR_NOT_FOUND nogil
@@ -1139,6 +1199,11 @@ cdef CUresult _cuStreamAddCallback(CUstream hStream, CUstreamCallback callback,
11391199
cdef CUresult _cuStreamBeginCapture_v2(CUstream hStream, CUstreamCaptureMode mode) except ?CUDA_ERROR_NOT_FOUND nogil
11401200
{{endif}}
11411201

1202+
{{if 'cuStreamBeginRecaptureToGraph' in found_functions}}
1203+
1204+
cdef CUresult _cuStreamBeginRecaptureToGraph(CUstream hStream, CUstreamCaptureMode mode, CUgraph hGraph, CUgraphRecaptureCallback callbackFunc, void* userData) except ?CUDA_ERROR_NOT_FOUND nogil
1205+
{{endif}}
1206+
11421207
{{if 'cuStreamBeginCaptureToGraph' in found_functions}}
11431208

11441209
cdef CUresult _cuStreamBeginCaptureToGraph(CUstream hStream, CUgraph hGraph, const CUgraphNode* dependencies, const CUgraphEdgeData* dependencyData, size_t numDependencies, CUstreamCaptureMode mode) except ?CUDA_ERROR_NOT_FOUND nogil
@@ -1364,11 +1429,6 @@ cdef CUresult _cuLaunchKernelEx(const CUlaunchConfig* config, CUfunction f, void
13641429
cdef CUresult _cuLaunchCooperativeKernel(CUfunction f, unsigned int gridDimX, unsigned int gridDimY, unsigned int gridDimZ, unsigned int blockDimX, unsigned int blockDimY, unsigned int blockDimZ, unsigned int sharedMemBytes, CUstream hStream, void** kernelParams) except ?CUDA_ERROR_NOT_FOUND nogil
13651430
{{endif}}
13661431

1367-
{{if 'cuLaunchCooperativeKernelMultiDevice' in found_functions}}
1368-
1369-
cdef CUresult _cuLaunchCooperativeKernelMultiDevice(CUDA_LAUNCH_PARAMS* launchParamsList, unsigned int numDevices, unsigned int flags) except ?CUDA_ERROR_NOT_FOUND nogil
1370-
{{endif}}
1371-
13721432
{{if 'cuLaunchHostFunc' in found_functions}}
13731433

13741434
cdef CUresult _cuLaunchHostFunc(CUstream hStream, CUhostFn fn, void* userData) except ?CUDA_ERROR_NOT_FOUND nogil
@@ -1424,6 +1484,11 @@ cdef CUresult _cuLaunchGrid(CUfunction f, int grid_width, int grid_height) excep
14241484
cdef CUresult _cuLaunchGridAsync(CUfunction f, int grid_width, int grid_height, CUstream hStream) except ?CUDA_ERROR_NOT_FOUND nogil
14251485
{{endif}}
14261486

1487+
{{if 'cuLaunchCooperativeKernelMultiDevice' in found_functions}}
1488+
1489+
cdef CUresult _cuLaunchCooperativeKernelMultiDevice(CUDA_LAUNCH_PARAMS* launchParamsList, unsigned int numDevices, unsigned int flags) except ?CUDA_ERROR_NOT_FOUND nogil
1490+
{{endif}}
1491+
14271492
{{if 'cuParamSetTexRef' in found_functions}}
14281493

14291494
cdef CUresult _cuParamSetTexRef(CUfunction hfunc, int texunit, CUtexref hTexRef) except ?CUDA_ERROR_NOT_FOUND nogil

0 commit comments

Comments
 (0)