Skip to content

Commit 9637997

Browse files
q10, meta-codesync[bot]
authored and committed
[fbgemm_gpu] Fix aarch64 build issues caused by D99968947 (pytorch#5655)
Summary: Pull Request resolved: pytorch#5655 - Fix aarch64 build issues caused by D99968947 Reviewed By: Nicoshev, ZhijianJiang Differential Revision: D101387235 fbshipit-source-id: 1cb3c11f4224571e0706226a7617a58ac304d8ac
1 parent a6de255 commit 9637997

2 files changed

Lines changed: 9 additions & 1 deletion

File tree

include/fbgemm/FbgemmConvert.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -118,11 +118,11 @@ FBGEMM_API void FloatToFloat16_simd(
118118
FBGEMM_API void
119119
Float16ToFloat_simd(const float16* src, float* dst, size_t size);
120120

121+
#if !defined(__aarch64__)
121122
/**
122123
* @brief AVX2 implementation to convert fp32 numbers to fp16 numbers.
123124
*
124125
*/
125-
#if !defined(__aarch64__)
126126
FBGEMM_API void FloatToFloat16_avx2(
127127
const float* src,
128128
float16* dst,

src/QuantUtilsAvx2.cc

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1626,7 +1626,11 @@ void FloatOrHalfToFusedNBitRowwiseQuantizedSBHalfAvx2(
16261626
maximum_element = min_max_row_float[1];
16271627

16281628
if constexpr (std::is_same_v<InputType, float16>) {
1629+
#if !defined(__aarch64__)
16291630
Float16ToFloat_avx2(input_row, input_row_float_for_fp16, input_columns);
1631+
#else
1632+
Float16ToFloat_ref(input_row, input_row_float_for_fp16, input_columns);
1633+
#endif
16301634
}
16311635
} else {
16321636
__m256 min_v = _mm256_set1_ps(minimum_element);
@@ -1847,7 +1851,11 @@ void FloatOrHalfToFused8BitRowwiseQuantizedSBFloatAvx2(
18471851
maximum_element = min_max_row_float[1];
18481852

18491853
if constexpr (std::is_same_v<InputType, float16>) {
1854+
#if !defined(__aarch64__)
18501855
Float16ToFloat_avx2(input_row, input_row_float_for_fp16, input_columns);
1856+
#else
1857+
Float16ToFloat_ref(input_row, input_row_float_for_fp16, input_columns);
1858+
#endif
18511859
}
18521860
} else {
18531861
__m256 min_v = _mm256_set1_ps(minimum_element);

0 commit comments

Comments
 (0)