Skip to content

Commit d7fe30a

Browse files
author
Katharine Hyatt
committed
Get AMDGPU tensor ops working
1 parent f10e81a commit d7fe30a

2 files changed

Lines changed: 5 additions & 2 deletions

File tree

Project.toml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -85,3 +85,6 @@ cuTENSOR = "011b41b2-24ef-40a8-b3eb-fa098493e9e1"
 
 [targets]
 test = ["Test", "Random", "DynamicPolynomials", "ChainRulesTestUtils", "ChainRulesCore", "cuRAND", "CUDACore", "cuTENSOR", "Aqua", "Logging", "Bumper", "Mooncake", "Enzyme", "EnzymeTestUtils", "Adapt", "JLArrays", "AMDGPU"]
+
+[sources]
+Strided = {url = "https://github.com/QuantumKitHub/Strided.jl/", rev = "ksh/gemm"}

ext/TensorOperationsAMDGPUExt.jl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ using TensorOperations: TensorOperations as TO
 # Allocator
 #-------------------------------------------------------------------------------------------
 
-TO.tensoradd_type(TC, A::AnyRocArray, pA::Index2Tuple, conjA::Bool) =
+TO.tensoradd_type(TC, A::AnyROCArray, pA::Index2Tuple, conjA::Bool) =
 ROCArray{TC, TO.numind(pA)}
 
 function TO.tensoralloc_add(
@@ -37,7 +37,7 @@ end
 function TO.tensoralloc(
 ::Type{<:ROCArray{T, N}}, structure,
 ::Val{istemp}, allocator::TO.AMDAllocator
-) where {T, N}
+) where {T, N, istemp}
 return ROCArray{T, N}(undef, structure)
 end
 
0 commit comments

Comments
 (0)