|
1 | | - |
2 | 1 | /** |
3 | | - * Copyright (c) 2019-2021 The University of Tennessee and The University |
| 2 | + * Copyright (c) 2019-2024 The University of Tennessee and The University |
4 | 3 | * of Tennessee Research Foundation. All rights |
5 | 4 | * reserved. |
6 | 5 | * Copyright (c) 2024 NVIDIA Corporation. All rights reserved. |
@@ -104,10 +103,7 @@ parsec_taskpool_t* testing_nvlink_New( parsec_context_t *ctx, int depth, int mb |
104 | 103 |
|
105 | 104 | /** Find all CUDA devices */ |
106 | 105 | nb = parsec_context_query(ctx, PARSEC_CONTEXT_QUERY_DEVICES, PARSEC_DEV_CUDA); |
107 | | - if(nb <= 0) { |
108 | | - parsec_warning("ABORTED: This test requires at least one CUDA device per node (query returned %d)\n", nb); |
109 | | - return NULL; |
110 | | - } |
| 106 | + assert(nb >= 0); |
111 | 107 | dev_index = (int*)malloc(nb * sizeof(int)); |
112 | 108 | nb = 0; |
113 | 109 | for(dev = 0; dev < (int)parsec_nb_devices; dev++) { |
@@ -147,7 +143,7 @@ parsec_taskpool_t* testing_nvlink_New( parsec_context_t *ctx, int depth, int mb |
147 | 143 |
|
148 | 144 | /* GEMM1 tasks will create one data copy per GPU, and work on those. |
149 | 145 | * (see the MAKE_C tasks in nvlink.jdf) */ |
150 | | - |
| 146 | + |
151 | 147 | /* userM is a user-managed matrix: the user creates the data copies |
152 | 148 | * only on the GPU they want the GEMM2 to run. To simplify the code, |
153 | 149 | * we use parsec_matrix_block_cyclic, which also requires having a CPU data |
@@ -199,14 +195,14 @@ parsec_taskpool_t* testing_nvlink_New( parsec_context_t *ctx, int depth, int mb |
199 | 195 | g++; |
200 | 196 | } |
201 | 197 | } |
202 | | - |
| 198 | + |
203 | 199 | testing_handle = parsec_nvlink_new(dcA, userM, ctx->nb_nodes, CuHI, nb, dev_index); |
204 | 200 |
|
205 | 201 | parsec_add2arena( &testing_handle->arenas_datatypes[PARSEC_nvlink_DEFAULT_ADT_IDX], |
206 | 202 | parsec_datatype_double_complex_t, |
207 | 203 | PARSEC_MATRIX_FULL, 1, mb, mb, mb, |
208 | 204 | PARSEC_ARENA_ALIGNMENT_SSE, -1 ); |
209 | | - |
| 205 | + |
210 | 206 | return &testing_handle->super; |
211 | 207 | } |
212 | 208 |
|
0 commit comments