|
| 1 | +// SPDX-License-Identifier: MIT |
| 2 | +// Copyright (c), Advanced Micro Devices, Inc. All rights reserved. |
| 3 | + |
| 4 | +#pragma once |
| 5 | + |
| 6 | +template <typename ADataType, typename BDataType, typename AccDataType, typename CDataType> |
| 7 | +auto calculate_rtol_atol(const ck_tile::index_t K, |
| 8 | + const ck_tile::index_t kbatch, |
| 9 | + const float max_accumulated_value) |
| 10 | +{ |
| 11 | + using ComputeType = |
| 12 | + std::conditional_t<sizeof(ADataType) < sizeof(BDataType), ADataType, BDataType>; |
| 13 | + // Calculate thresholds |
| 14 | + const auto rtol = ck_tile::get_relative_threshold<ComputeType, CDataType, AccDataType>( |
| 15 | + ck_tile::integer_divide_ceil(K, kbatch)); |
| 16 | + const auto atol = ck_tile::get_absolute_threshold<ComputeType, CDataType, AccDataType>( |
| 17 | + max_accumulated_value / kbatch, ck_tile::integer_divide_ceil(K, kbatch)); |
| 18 | + // Calculate error due to split_k accumulation |
| 19 | + const auto rtol_split_k = |
| 20 | + ck_tile::get_relative_threshold<CDataType, CDataType, CDataType>(kbatch); |
| 21 | + const auto atol_split_k = ck_tile::get_absolute_threshold<CDataType, CDataType, CDataType>( |
| 22 | + max_accumulated_value, kbatch); |
| 23 | + // Use higher threshold |
| 24 | + return ck_tile::make_tuple(std::max(rtol, rtol_split_k), std::max(atol, atol_split_k)); |
| 25 | +} |
| 26 | + |
| 27 | +/// @brief Function to compare the results of the device and host computations |
| 28 | +bool compare(std::string instanceName, |
| 29 | + ck_tile::index_t K, |
| 30 | + ck_tile::index_t kbatch, |
| 31 | + ck_tile::HostTensor<CDataType>& c_m_n_dev_result, |
| 32 | + ck_tile::HostTensor<CDataType>& c_m_n_host_result) |
| 33 | +{ |
| 34 | + const float max_accumulated_value = |
| 35 | + *std::max_element(c_m_n_host_result.mData.begin(), c_m_n_host_result.mData.end()); |
| 36 | + const auto rtol_atol = calculate_rtol_atol<ADataType, BDataType, AccDataType, CDataType>( |
| 37 | + K, kbatch, max_accumulated_value); |
| 38 | + bool pass = ck_tile::check_err(c_m_n_dev_result, |
| 39 | + c_m_n_host_result, |
| 40 | + "Error: Incorrect results!", |
| 41 | + rtol_atol.at(ck_tile::number<0>{}), |
| 42 | + rtol_atol.at(ck_tile::number<1>{})); |
| 43 | + |
| 44 | + std::cout << "For " << instanceName << " Relative error threshold is " |
| 45 | + << rtol_atol.at(ck_tile::number<0>{}) << " Absolute error threshold is " |
| 46 | + << rtol_atol.at(ck_tile::number<1>{}) << std::endl; |
| 47 | + std::cout << "The verification result is:" << (pass ? "correct" : "fail") << std::endl; |
| 48 | + |
| 49 | + return pass; |
| 50 | +} |
0 commit comments