Skip to content

Commit 180674d

Browse files
Merge pull request #918 from InfiniTensor/issue/867
issue/867 fix cpu malloc
2 parents 422a4e1 + ef867cc commit 180674d

File tree

3 files changed

+6
-9
lines changed

3 files changed

+6
-9
lines changed

src/infinicore/context/context_impl.cc

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -126,6 +126,7 @@ std::shared_ptr<Memory> allocateMemory(size_t size) {
126126
}
127127

128128
std::shared_ptr<Memory> allocateHostMemory(size_t size) {
129+
setDevice(Device::cpu());
129130
return ContextImpl::singleton().getCpuRuntime()->allocateMemory(size);
130131
}
131132

src/infiniop/ops/rearrange/nvidia/rearrange_nvidia.cu

Lines changed: 4 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -345,12 +345,10 @@ infiniStatus_t launchKernel(
345345
const_cast<void *>(static_cast<const void *>(params.dst_grid_stride.data())),
346346
const_cast<void *>(static_cast<const void *>(constraints_data))};
347347

348-
CHECK_OR_RETURN(cudaLaunchKernel(
349-
kernel_func,
350-
static_cast<unsigned int>(grid_size), static_cast<unsigned int>(BLOCK_SIZE),
351-
args, 0, stream)
352-
== cudaSuccess,
353-
INFINI_STATUS_INTERNAL_ERROR);
348+
CHECK_CUDA(cudaLaunchKernel(
349+
kernel_func,
350+
static_cast<unsigned int>(grid_size), static_cast<unsigned int>(BLOCK_SIZE),
351+
args, 0, stream));
354352

355353
return INFINI_STATUS_SUCCESS;
356354
}

xmake/test.lua

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -88,8 +88,6 @@ target("infinicore-test")
8888
add_files(os.projectdir().."/src/infinicore/ops/*/*.cc")
8989
add_files(os.projectdir().."/src/infinicore/nn/*.cc")
9090

91-
add_files(os.projectdir().."/src/infinicore-test/*.cc")
92-
add_files(os.projectdir().."/src/infinicore-test/*/*.cc")
93-
91+
add_files(os.projectdir().."/src/infinicore-test/**.cc")
9492
set_installdir(INFINI_ROOT)
9593
target_end()

0 commit comments

Comments
 (0)