1 # Copyright (c) 2018 Cisco and/or its affiliates.
2 # Licensed under the Apache License, Version 2.0 (the "License");
3 # you may not use this file except in compliance with the License.
4 # You may obtain a copy of the License at:
6 # http://www.apache.org/licenses/LICENSE-2.0
8 # Unless required by applicable law or agreed to in writing, software
9 # distributed under the License is distributed on an "AS IS" BASIS,
10 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
11 # See the License for the specific language governing permissions and
12 # limitations under the License.
# set_log2_cacheline_size(<var> <n>)
#   var - name of the variable that receives the result (callers in this file
#         read it back right after the call)
#   n   - cache line size to convert
# Only the failure path is visible in this excerpt: a size the macro does not
# handle stops configuration with FATAL_ERROR.
# NOTE(review): judging by the macro name, the branches omitted here
# presumably store log2(n) in <var> - confirm against the full file.
14 macro(set_log2_cacheline_size var n)
# Abort the configure step and report the rejected size.
20 message(FATAL_ERROR "Cacheline size ${n} not supported")
24 ##############################################################################
26 ##############################################################################
# Select VPP_CACHE_LINE_SIZE. A value that is already defined is left
# untouched; otherwise the value is chosen from the target processor.
27 if(DEFINED VPP_CACHE_LINE_SIZE)
28 # Cache line size assigned via cmake args
# AArch64 targets get a 128-byte cache line.
29 elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(aarch64.*|AARCH64.*)")
30 set(VPP_CACHE_LINE_SIZE 128)
# NOTE(review): the branch header guarding this assignment is not visible in
# this excerpt; presumably it is the fallback for all other processors -
# confirm.
32 set(VPP_CACHE_LINE_SIZE 64)
# Record the selected value as a STRING cache entry. No FORCE is used, so an
# existing cache value is not overwritten.
35 set(VPP_CACHE_LINE_SIZE ${VPP_CACHE_LINE_SIZE}
36 CACHE STRING "Target CPU cache line size")
# Derive VPP_LOG2_CACHE_LINE_SIZE from the selected size; an unsupported size
# ends the configure step inside set_log2_cacheline_size.
38 set_log2_cacheline_size(VPP_LOG2_CACHE_LINE_SIZE ${VPP_CACHE_LINE_SIZE})
40 ##############################################################################
41 # Gnu Assembler AVX-512 bug detection
42 # - see: https://sourceware.org/bugzilla/show_bug.cgi?id=23465
43 ##############################################################################
# Configure-time probe for the assembler bug referenced in the banner above.
# It only runs for x86-64 targets when the C compiler identifies as GNU, and
# sets GNU_ASSEMBLER_AVX512_BUG to 1 when the probe does not see the expected
# encoding.
44 if(CMAKE_SYSTEM_PROCESSOR MATCHES "amd64.*|x86_64.*|AMD64.*")
45 if (CMAKE_C_COMPILER_ID STREQUAL "GNU")
# Path stem (no extension) for the probe files inside the build tree.
46 set(pfx ${CMAKE_CURRENT_BINARY_DIR}${CMAKE_FILES_DIRECTORY}/gas_avx512_bug_test)
# Assembly source consisting of a single instruction that targets %zmm0.
47 file(WRITE ${pfx}.s "vmovaps 0x40(,%rax), %zmm0\n")
# Assemble the probe through the C compiler driver, then dump the resulting
# object file into _output.
# NOTE(review): neither exit status is checked and `objdump` is resolved from
# PATH. If either step fails, _output will most likely lack the expected
# bytes, so the check below reports the bug. Confirm that this fail-closed
# behaviour is intended.
48 execute_process(COMMAND ${CMAKE_C_COMPILER} -c ${pfx}.s -o ${pfx}.o)
49 execute_process(COMMAND objdump -s ${pfx}.o OUTPUT_VARIABLE _output)
# Anything other than this byte sequence in the dump is treated as the bug.
50 if (NOT _output MATCHES "62f17c48 28040540 000000")
51 set(GNU_ASSEMBLER_AVX512_BUG 1)
56 ##############################################################################
57 # CPU optimizations and multiarch support
58 ##############################################################################
# add_vpp_march_variant(<v> ...)
#   v - short variant name; it is upper-cased to form the option name
#       VPP_MARCH_VARIANT_<V>.
# Keyword arguments are parsed with the prefix ARG; the visible code reads
# ARG_FLAGS, ARG_N_PREFETCHES and ARG_CACHE_PREFETCH_BYTES.
# The macro builds a space-separated flag string `fs` and appends the pair
# "<v>;<fs>" to MARCH_VARIANTS when VPP_MARCH_VARIANT_<V> is true; the same
# pair is appended to MARCH_VARIANTS_DISABLED on a line whose guard is not
# visible here.
# NOTE(review): several lines of this macro are missing from this excerpt
# (the remaining cmake_parse_arguments keyword lists, the handling of rejected
# flags, the choice between the two option() defaults, and all closers), so
# the comments below describe only what is visible.
59 macro(add_vpp_march_variant v)
60 cmake_parse_arguments(ARG
62 "N_PREFETCHES;CACHE_PREFETCH_BYTES"
# Append every requested flag to `fs` and probe it with the C compiler.
70 foreach(f ${ARG_FLAGS})
71 string(APPEND fs " ${f}")
# Build a variable-name suffix from the flag: '-', '=' and '+' become '_'.
72 string(REGEX REPLACE "[-=+]" "_" sfx ${f})
# Probe each distinct flag only once; the result lives in compiler_flag<sfx>.
73 if(NOT DEFINED compiler_flag${sfx})
74 check_c_compiler_flag(${f} compiler_flag${sfx})
# Flag rejected by the compiler.
# NOTE(review): the body of this branch is not visible here.
76 if(NOT compiler_flag${sfx})
# Pass the prefetch count to the sources as a preprocessor definition.
# NOTE(review): the guard around this line is not visible here.
81 string(APPEND fs " -DCLIB_N_PREFETCHES=${ARG_N_PREFETCHES}")
# When CACHE_PREFETCH_BYTES was supplied, convert it with
# set_log2_cacheline_size and pass the result as a definition.
83 if(ARG_CACHE_PREFETCH_BYTES)
84 set_log2_cacheline_size(log2 ${ARG_CACHE_PREFETCH_BYTES})
85 string(APPEND fs " -DCLIB_LOG2_CACHE_PREFETCH_BYTES=${log2}")
# Upper-case variant name used in the user-facing option.
88 string(TOUPPER ${v} uv)
# The same option is declared with two different defaults.
# NOTE(review): the condition that selects between them is not visible here.
90 option(VPP_MARCH_VARIANT_${uv} "Build ${v} multiarch variant." OFF)
92 option(VPP_MARCH_VARIANT_${uv} "Build ${v} multiarch variant." ON)
# Register the variant as a "name;flags" pair. The escaped semicolon keeps the
# pair together as a single element of the outer list.
94 if (VPP_MARCH_VARIANT_${uv})
95 list(APPEND MARCH_VARIANTS "${v}\;${fs}")
97 list(APPEND MARCH_VARIANTS_DISABLED "${v}\;${fs}")
# Per-architecture setup: set VPP_DEFAULT_MARCH_FLAGS and register the
# multiarch variants through add_vpp_march_variant.
# NOTE(review): every add_vpp_march_variant(...) call below is truncated in
# this excerpt (remaining arguments and the closing parenthesis are not
# visible).
103 if(CMAKE_SYSTEM_PROCESSOR MATCHES "amd64.*|x86_64.*|AMD64.*")
104 set(VPP_DEFAULT_MARCH_FLAGS -march=corei7 -mtune=corei7-avx)
106 add_vpp_march_variant(hsw
107 FLAGS -march=haswell -mtune=haswell
110 add_vpp_march_variant(trm
111 FLAGS -march=tremont -mtune=tremont
# Warn when the assembler probe set GNU_ASSEMBLER_AVX512_BUG.
# NOTE(review): the skx/icl registrations below presumably sit in the else
# branch of this check - the branch keyword is not visible here; confirm.
115 if (GNU_ASSEMBLER_AVX512_BUG)
116 message(WARNING "AVX-512 multiarch variant(s) disabled due to GNU Assembler bug")
118 add_vpp_march_variant(skx
119 FLAGS -march=skylake-avx512 -mtune=skylake-avx512 -mprefer-vector-width=256
122 add_vpp_march_variant(icl
123 FLAGS -march=icelake-client -mtune=icelake-client -mprefer-vector-width=512
# AArch64 targets: default flags plus the variants listed below. Where a
# CACHE_PREFETCH_BYTES argument is visible, its value is 64.
126 elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(aarch64.*|AARCH64.*)")
127 set(VPP_DEFAULT_MARCH_FLAGS -march=armv8-a+crc)
129 add_vpp_march_variant(qdf24xx
130 FLAGS -march=armv8-a+crc+crypto -mtune=qdf24xx
132 CACHE_PREFETCH_BYTES 64
136 add_vpp_march_variant(octeontx2
137 FLAGS -march=armv8.2-a+crc+crypto+lse
141 add_vpp_march_variant(thunderx2t99
142 FLAGS -march=armv8.1-a+crc+crypto -mtune=thunderx2t99
144 CACHE_PREFETCH_BYTES 64
147 add_vpp_march_variant(cortexa72
148 FLAGS -march=armv8-a+crc+crypto -mtune=cortex-a72
150 CACHE_PREFETCH_BYTES 64
153 add_vpp_march_variant(neoversen1
154 FLAGS -march=armv8.2-a+crc+crypto -mtune=neoverse-n1
156 CACHE_PREFETCH_BYTES 64
# vpp_library_set_multiarch_sources(<lib> ...)
#   lib - existing target that receives the per-variant object files.
# Keyword arguments are parsed with the prefix ARG; the keywords visible here
# are SOURCES, DEPENDS and FORCE_ON.
# For each selected variant the macro creates an OBJECT library named
# <lib>_<variant> from ARG_SOURCES, compiles it with the variant's flags and
# CLIB_MARCH_VARIANT=<variant>, and adds its objects to <lib>.
# NOTE(review): parts of this macro (the remaining cmake_parse_arguments
# arguments, guards and all closers) are not visible in this excerpt.
160 macro(vpp_library_set_multiarch_sources lib)
161 cmake_parse_arguments(ARG
164 "SOURCES;DEPENDS;FORCE_ON"
# Start from the variants that are enabled.
168 set(VARIANTS "${MARCH_VARIANTS}")
# Re-add any disabled variant whose name is listed in FORCE_ON.
171 foreach(F ${ARG_FORCE_ON})
172 foreach(V ${MARCH_VARIANTS_DISABLED})
# Each entry is a "name;flags" pair: element 0 is the name, element 1 the
# flag string.
173 list(GET V 0 VARIANT)
174 if (VARIANT STREQUAL F)
175 list(GET V 1 VARIANT_FLAGS)
176 list(APPEND VARIANTS "${VARIANT}\;${VARIANT_FLAGS}")
# Create one OBJECT library per selected variant.
182 foreach(V ${VARIANTS})
183 list(GET V 0 VARIANT)
184 list(GET V 1 VARIANT_FLAGS)
185 set(l ${lib}_${VARIANT})
186 add_library(${l} OBJECT ${ARG_SOURCES})
# NOTE(review): any guard for an empty DEPENDS list is not visible in this
# excerpt - confirm one exists.
188 add_dependencies(${l} ${ARG_DEPENDS})
190 set_target_properties(${l} PROPERTIES POSITION_INDEPENDENT_CODE ON)
191 target_compile_definitions(${l} PUBLIC CLIB_MARCH_VARIANT=${VARIANT})
# The flags are stored as one space-separated string; split them into a list
# before passing them on as compile options.
192 separate_arguments(VARIANT_FLAGS)
193 target_compile_options(${l} PUBLIC ${VARIANT_FLAGS})
# Add the variant's object files to <lib> as private sources.
194 target_sources(${lib} PRIVATE $<TARGET_OBJECTS:${l}>)