# Copyright (c) 2018 Cisco and/or its affiliates.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at:
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

##############################################################################
# Cache line size detection
##############################################################################
# Determines VPP_LOG2_CACHE_LINE_SIZE (log2 of the cache line size in bytes)
# and publishes it as a cache entry. Order of precedence:
#   1. a value that is already defined (e.g. -DVPP_LOG2_CACHE_LINE_SIZE=7)
#      is kept as is, including when cross-compiling;
#   2. when cross-compiling, the build host cannot be probed, so 6 is used;
#   3. on AArch64, the value is derived from the "CPU implementer" and
#      "CPU part" fields of /proc/cpuinfo;
#   4. everything else gets 6.
# Side effects: sets CPU_IMPLEMENTER / CPU_PART (when found in /proc/cpuinfo)
# and VPP_CACHE_LINE_SIZE (AArch64 branch only).
if(DEFINED VPP_LOG2_CACHE_LINE_SIZE)
  # Cache line size assigned via cmake args
elseif(CMAKE_CROSSCOMPILING)
  message(STATUS "Cross-compiling - cache line size detection disabled")
  set(VPP_LOG2_CACHE_LINE_SIZE 6)
elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(aarch64.*|AARCH64.*)")
  # file(READ) is a fatal error on a missing file, so probe for it first.
  if(EXISTS "/proc/cpuinfo")
    file(READ "/proc/cpuinfo" cpuinfo)
    string(REPLACE "\n" ";" cpuinfo "${cpuinfo}")
    # Only the two fields of interest are matched; lines without a colon or
    # without a value are simply ignored. When a field appears several times
    # (one entry per core), the last occurrence wins.
    foreach(l ${cpuinfo})
      if(l MATCHES "^CPU implementer[ \t]*:[ \t]*([^ \t]+)")
        set(CPU_IMPLEMENTER "${CMAKE_MATCH_1}")
      elseif(l MATCHES "^CPU part[ \t]*:[ \t]*([^ \t]+)")
        set(CPU_PART "${CMAKE_MATCH_1}")
      endif()
    endforeach()
  endif()
  # Implementer 0x43 - Cavium
  # Part 0x0af - ThunderX2 is 64B, rest all are 128B
  # The expansions are quoted so that a field missing from /proc/cpuinfo
  # compares as an empty string instead of breaking the if() syntax.
  if("${CPU_IMPLEMENTER}" STREQUAL "0x43")
    if("${CPU_PART}" STREQUAL "0x0af")
      set(VPP_LOG2_CACHE_LINE_SIZE 6)
    else()
      set(VPP_LOG2_CACHE_LINE_SIZE 7)
    endif()
  else()
    set(VPP_LOG2_CACHE_LINE_SIZE 6)
  endif()
  math(EXPR VPP_CACHE_LINE_SIZE "1 << ${VPP_LOG2_CACHE_LINE_SIZE}")
  message(STATUS "ARM AArch64 CPU implementer ${CPU_IMPLEMENTER} part ${CPU_PART} cacheline size ${VPP_CACHE_LINE_SIZE}")
else()
  set(VPP_LOG2_CACHE_LINE_SIZE 6)
endif()

set(VPP_LOG2_CACHE_LINE_SIZE ${VPP_LOG2_CACHE_LINE_SIZE}
    CACHE STRING "Target CPU cache line size (power of 2)")

##############################################################################
# Gnu Assembler AVX-512 bug detection
#  - see: https://sourceware.org/bugzilla/show_bug.cgi?id=23465
##############################################################################
# Assembles a single AVX-512 instruction with the C compiler driver and looks
# for the expected encoding in the "objdump -s" output. GNU_ASSEMBLER_AVX512_BUG
# is set to 1 when the expected bytes are not found, which includes the cases
# where the test object could not be produced or dumped.
if(CMAKE_SYSTEM_PROCESSOR MATCHES "amd64.*|x86_64.*|AMD64.*")
  if(CMAKE_C_COMPILER_ID STREQUAL "GNU")
    set(pfx "${CMAKE_CURRENT_BINARY_DIR}${CMAKE_FILES_DIRECTORY}/gas_avx512_bug_test")

    # Prefer the objdump that belongs to the selected toolchain; fall back to
    # whatever "objdump" is found in PATH.
    if(CMAKE_OBJDUMP)
      set(gas_avx512_objdump "${CMAKE_OBJDUMP}")
    else()
      set(gas_avx512_objdump objdump)
    endif()

    file(WRITE "${pfx}.s" "vmovaps 0x40(,%rax), %zmm0\n")
    # Drop any object left over from a previous configure run so that a failed
    # assembly cannot be masked by a stale file.
    file(REMOVE "${pfx}.o")

    set(_output "")
    execute_process(
      COMMAND "${CMAKE_C_COMPILER}" -c "${pfx}.s" -o "${pfx}.o"
      RESULT_VARIABLE gas_avx512_result)
    # RESULT_VARIABLE holds the exit code, or an error string when the
    # process could not be started; only a literal 0 means success.
    if("${gas_avx512_result}" STREQUAL "0")
      execute_process(
        COMMAND "${gas_avx512_objdump}" -s "${pfx}.o"
        OUTPUT_VARIABLE _output)
    endif()

    if(NOT _output MATCHES "62f17c48 28040540 000000")
      set(GNU_ASSEMBLER_AVX512_BUG 1)
    endif()
  endif()
endif()

##############################################################################
# CPU optimizations and multiarch support
##############################################################################
# Prepends the baseline -march flags to CMAKE_C_FLAGS and fills MARCH_VARIANTS.
# Every MARCH_VARIANTS element has the form "<variant name>;<compile flags>";
# the semicolon is escaped on append so the pair stays a single list element.
# A variant is only registered when the compiler accepts its probe flags.
if(CMAKE_SYSTEM_PROCESSOR MATCHES "amd64.*|x86_64.*|AMD64.*")
  set(CMAKE_C_FLAGS "-march=corei7 -mtune=corei7-avx ${CMAKE_C_FLAGS}")

  # Haswell
  check_c_compiler_flag(
    "-march=haswell"
    compiler_flag_march_haswell)
  if(compiler_flag_march_haswell)
    list(APPEND MARCH_VARIANTS
      "hsw\;-march=haswell -mtune=haswell")
  endif()

  # Tremont
  check_c_compiler_flag(
    "-march=tremont"
    compiler_flag_march_tremont)
  if(compiler_flag_march_tremont)
    list(APPEND MARCH_VARIANTS
      "trm\;-march=tremont -mtune=tremont")
  endif()

  # AVX-512 capable variants are skipped when the assembler is known-bad.
  if(NOT GNU_ASSEMBLER_AVX512_BUG)
    check_c_compiler_flag(
      "-mprefer-vector-width=256"
      compiler_flag_mprefer_vector_width)
    check_c_compiler_flag(
      "-march=skylake-avx512"
      compiler_flag_march_skylake_avx512)
    check_c_compiler_flag(
      "-march=icelake-client"
      compiler_flag_march_icelake_client)

    if(compiler_flag_march_skylake_avx512 AND compiler_flag_mprefer_vector_width)
      list(APPEND MARCH_VARIANTS
        "skx\;-march=skylake-avx512 -mtune=skylake-avx512 -mprefer-vector-width=256")
    endif()
    if(compiler_flag_march_icelake_client AND compiler_flag_mprefer_vector_width)
      list(APPEND MARCH_VARIANTS
        "icl\;-march=icelake-client -mtune=icelake-client -mprefer-vector-width=512")
    endif()
  else()
    message(WARNING "AVX-512 multiarch variant(s) disabled due to GNU Assembler bug")
  endif()
elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(aarch64.*|AARCH64.*)")
  set(CMAKE_C_FLAGS "-march=armv8-a+crc ${CMAKE_C_FLAGS}")

  # qdf24xx: probed with -mtune=qdf24xx, registered without it.
  check_c_compiler_flag(
    "-march=armv8-a+crc+crypto -mtune=qdf24xx"
    compiler_flag_march_core_qdf24xx)
  if(compiler_flag_march_core_qdf24xx)
    list(APPEND MARCH_VARIANTS
      "qdf24xx\;-march=armv8-a+crc+crypto -DCLIB_N_PREFETCHES=8")
  endif()

  # octeontx2
  check_c_compiler_flag(
    "-march=armv8.2-a+crc+crypto+lse"
    compiler_flag_march_core_octeontx2)
  if(compiler_flag_march_core_octeontx2)
    list(APPEND MARCH_VARIANTS
      "octeontx2\;-march=armv8.2-a+crc+crypto+lse -DCLIB_N_PREFETCHES=8")
  endif()

  # thunderx2t99: -mtune=thunderx2t99 is only kept for GCC 8.3 and newer.
  check_c_compiler_flag(
    "-march=armv8.1-a+crc+crypto -mtune=thunderx2t99"
    compiler_flag_march_thunderx2t99)
  if(compiler_flag_march_thunderx2t99)
    if(NOT CMAKE_C_COMPILER_ID STREQUAL "GNU" OR CMAKE_C_COMPILER_VERSION VERSION_LESS 8.3)
      list(APPEND MARCH_VARIANTS
        "thunderx2t99\;-march=armv8.1-a+crc+crypto -DCLIB_N_PREFETCHES=8")
    else()
      list(APPEND MARCH_VARIANTS
        "thunderx2t99\;-march=armv8.1-a+crc+crypto -mtune=thunderx2t99 -DCLIB_N_PREFETCHES=8")
    endif()
  endif()

  # cortex-a72
  check_c_compiler_flag(
    "-march=armv8-a+crc+crypto -mtune=cortex-a72"
    compiler_flag_march_cortexa72)
  if(compiler_flag_march_cortexa72)
    list(APPEND MARCH_VARIANTS
      "cortexa72\;-march=armv8-a+crc+crypto -mtune=cortex-a72 -DCLIB_N_PREFETCHES=6")
  endif()

  # neoverse-n1
  check_c_compiler_flag(
    "-march=armv8.2-a+crc+crypto -mtune=neoverse-n1"
    compiler_flag_march_neoversen1)
  if(compiler_flag_march_neoversen1)
    list(APPEND MARCH_VARIANTS
      "neoversen1\;-march=armv8.2-a+crc+crypto -mtune=neoverse-n1 -DCLIB_N_PREFETCHES=6")
  endif()
endif()

# vpp_library_set_multiarch_sources(<lib> <deps> <source>...)
#
# For every entry of MARCH_VARIANTS, builds the given sources as an OBJECT
# library named <lib>_<variant> with that variant's compile flags and
# -DCLIB_MARCH_VARIANT=<variant>, then adds the resulting objects to <lib>.
#
#   lib     - existing target that receives the per-variant objects
#   deps    - targets each variant library must depend on; pass "" for none
#   ARGN    - source files to compile once per variant
#
# This is a macro, so V, VARIANT, VARIANT_FLAGS and l are left set in the
# caller's scope.
macro(vpp_library_set_multiarch_sources lib deps)
  foreach(V ${MARCH_VARIANTS})
    # V is "<variant>;<flags>": element 0 is the name, element 1 the flags.
    list(GET V 0 VARIANT)
    list(GET V 1 VARIANT_FLAGS)
    set(l ${lib}_${VARIANT})
    add_library(${l} OBJECT ${ARGN})
    # Explicit emptiness test: a bare if("<target names>") treats the text as
    # a boolean constant / variable name and is false for ordinary target
    # names, which would silently skip the dependencies.
    if(NOT "${deps}" STREQUAL "")
      add_dependencies(${l} ${deps})
    endif()
    set_target_properties(${l} PROPERTIES POSITION_INDEPENDENT_CODE ON)
    target_compile_options(${l} PUBLIC "-DCLIB_MARCH_VARIANT=${VARIANT}")
    # Turn the space-separated flag string into a proper argument list.
    separate_arguments(VARIANT_FLAGS)
    target_compile_options(${l} PUBLIC ${VARIANT_FLAGS})
    target_sources(${lib} PRIVATE $<TARGET_OBJECTS:${l}>)
  endforeach()
endmacro()
