Skip to content

Commit c4bc4f4

Browse files
authored
change AVX512 macro name (#131)
1 parent e15172d commit c4bc4f4

File tree

6 files changed

+6
-6
lines changed

6 files changed

+6
-6
lines changed

cmake/CPU.cmake

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -82,7 +82,7 @@ set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-error=redundant-decls")
8282
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-error=old-style-cast")
8383
IF (C_AVX512_FOUND OR CXX_AVX512_FOUND)
8484
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DCPU_CAPABILITY_AVX2")
85-
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DAVX512")
85+
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DCPU_AVX512")
8686
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mavx512f")
8787
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mavx512bw")
8888
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mavx512vl")

torch_ipex/csrc/cpu/bf16/Converter.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@
44
#include <ATen/Parallel.h>
55
#include <torch/extension.h>
66

7-
#if defined(AVX512)
7+
#if defined(CPU_AVX512)
88
#define BF16_2_FP32(dst, src, len) cvt_bf16_to_fp32(dst, src, len)
99
#define FP32_2_BF16(dst, src, len) cvt_fp32_to_bf16(dst, src, len)
1010
#else

torch_ipex/csrc/cpu/bf16/vec/vec_type_cvt.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
#include <ATen/ATen.h>
2-
#if defined(AVX512)
2+
#if defined(CPU_AVX512)
33
#include <immintrin.h>
44
// Conversion from BF16 to FP32
55
inline __m512 cvt_bf16_to_fp32(const __m256i src) {

torch_ipex/csrc/cpu/kernel/RnntEmbedding.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
#include <torch/csrc/autograd/variable.h>
88
#include <torch/script.h>
99

10-
#if defined(AVX512)
10+
#if defined(CPU_AVX512)
1111
#include "vec/vec512/rnnt_embedding.h"
1212
#else
1313
#warning "IPEX RNN-T custom kernel requires AVX512"

torch_ipex/csrc/cpu/kernel/UpdateBatch.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
#include <torch/csrc/autograd/variable.h>
88
#include <torch/script.h>
99

10-
#if defined(AVX512)
10+
#if defined(CPU_AVX512)
1111
#include "vec/vec512/update_batch.h"
1212
#else
1313
#warning "IPEX RNN-T custom kernel requires AVX512"

torch_ipex/csrc/cpu/nms.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,7 @@ at::Tensor nms_cpu_kernel(const at::Tensor& dets,
8989
return at::nonzero(suppressed_t == 0).squeeze(1);
9090
}
9191

92-
#ifdef AVX512
92+
#ifdef CPU_AVX512
9393
// Optimized nms_cpu_kernel specialized for data type: float32 and sorted_score
9494
template <>
9595
at::Tensor nms_cpu_kernel</*scalar_t*/float, /*sorted*/true>(const at::Tensor& dets,

0 commit comments

Comments
 (0)