at master 9.8 kB view raw
1/* SPDX-License-Identifier: GPL-2.0+ OR BSD-3-Clause */ 2/* 3 * Copyright (c) Meta Platforms, Inc. and affiliates. 4 * All rights reserved. 5 * 6 * This source code is licensed under both the BSD-style license (found in the 7 * LICENSE file in the root directory of this source tree) and the GPLv2 (found 8 * in the COPYING file in the root directory of this source tree). 9 * You may select, at your option, one of the above-listed licenses. 10 */ 11 12#ifndef ZSTD_COMPILER_H 13#define ZSTD_COMPILER_H 14 15#include <linux/types.h> 16 17#include "portability_macros.h" 18 19/*-******************************************************* 20* Compiler specifics 21*********************************************************/ 22/* force inlining */ 23 24#if !defined(ZSTD_NO_INLINE) 25#if (defined(__GNUC__) && !defined(__STRICT_ANSI__)) || defined(__cplusplus) || defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L /* C99 */ 26# define INLINE_KEYWORD inline 27#else 28# define INLINE_KEYWORD 29#endif 30 31#define FORCE_INLINE_ATTR __attribute__((always_inline)) 32 33#else 34 35#define INLINE_KEYWORD 36#define FORCE_INLINE_ATTR 37 38#endif 39 40/* 41 On MSVC qsort requires that functions passed into it use the __cdecl calling conversion(CC). 42 This explicitly marks such functions as __cdecl so that the code will still compile 43 if a CC other than __cdecl has been made the default. 44*/ 45#define WIN_CDECL 46 47/* UNUSED_ATTR tells the compiler it is okay if the function is unused. */ 48#define UNUSED_ATTR __attribute__((unused)) 49 50/* 51 * FORCE_INLINE_TEMPLATE is used to define C "templates", which take constant 52 * parameters. They must be inlined for the compiler to eliminate the constant 53 * branches. 54 */ 55#define FORCE_INLINE_TEMPLATE static INLINE_KEYWORD FORCE_INLINE_ATTR UNUSED_ATTR 56/* 57 * HINT_INLINE is used to help the compiler generate better code. It is *not* 58 * used for "templates", so it can be tweaked based on the compilers 59 * performance. 60 * 61 * gcc-4.8 and gcc-4.9 have been shown to benefit from leaving off the 62 * always_inline attribute. 63 * 64 * clang up to 5.0.0 (trunk) benefit tremendously from the always_inline 65 * attribute. 66 */ 67#if !defined(__clang__) && defined(__GNUC__) && __GNUC__ >= 4 && __GNUC_MINOR__ >= 8 && __GNUC__ < 5 68# define HINT_INLINE static INLINE_KEYWORD 69#else 70# define HINT_INLINE FORCE_INLINE_TEMPLATE 71#endif 72 73/* "soft" inline : 74 * The compiler is free to select if it's a good idea to inline or not. 75 * The main objective is to silence compiler warnings 76 * when a defined function in included but not used. 77 * 78 * Note : this macro is prefixed `MEM_` because it used to be provided by `mem.h` unit. 79 * Updating the prefix is probably preferable, but requires a fairly large codemod, 80 * since this name is used everywhere. 81 */ 82#ifndef MEM_STATIC /* already defined in Linux Kernel mem.h */ 83#define MEM_STATIC static __inline UNUSED_ATTR 84#endif 85 86/* force no inlining */ 87#define FORCE_NOINLINE static __attribute__((__noinline__)) 88 89 90/* target attribute */ 91#define TARGET_ATTRIBUTE(target) __attribute__((__target__(target))) 92 93/* Target attribute for BMI2 dynamic dispatch. 94 * Enable lzcnt, bmi, and bmi2. 95 * We test for bmi1 & bmi2. lzcnt is included in bmi1. 96 */ 97#define BMI2_TARGET_ATTRIBUTE TARGET_ATTRIBUTE("lzcnt,bmi,bmi2") 98 99/* prefetch 100 * can be disabled, by declaring NO_PREFETCH build macro */ 101#if ( (__GNUC__ >= 4) || ( (__GNUC__ == 3) && (__GNUC_MINOR__ >= 1) ) ) 102# define PREFETCH_L1(ptr) __builtin_prefetch((ptr), 0 /* rw==read */, 3 /* locality */) 103# define PREFETCH_L2(ptr) __builtin_prefetch((ptr), 0 /* rw==read */, 2 /* locality */) 104#elif defined(__aarch64__) 105# define PREFETCH_L1(ptr) do { __asm__ __volatile__("prfm pldl1keep, %0" ::"Q"(*(ptr))); } while (0) 106# define PREFETCH_L2(ptr) do { __asm__ __volatile__("prfm pldl2keep, %0" ::"Q"(*(ptr))); } while (0) 107#else 108# define PREFETCH_L1(ptr) do { (void)(ptr); } while (0) /* disabled */ 109# define PREFETCH_L2(ptr) do { (void)(ptr); } while (0) /* disabled */ 110#endif /* NO_PREFETCH */ 111 112#define CACHELINE_SIZE 64 113 114#define PREFETCH_AREA(p, s) \ 115 do { \ 116 const char* const _ptr = (const char*)(p); \ 117 size_t const _size = (size_t)(s); \ 118 size_t _pos; \ 119 for (_pos=0; _pos<_size; _pos+=CACHELINE_SIZE) { \ 120 PREFETCH_L2(_ptr + _pos); \ 121 } \ 122 } while (0) 123 124/* vectorization 125 * older GCC (pre gcc-4.3 picked as the cutoff) uses a different syntax, 126 * and some compilers, like Intel ICC and MCST LCC, do not support it at all. */ 127#if !defined(__INTEL_COMPILER) && !defined(__clang__) && defined(__GNUC__) && !defined(__LCC__) 128# if (__GNUC__ == 4 && __GNUC_MINOR__ > 3) || (__GNUC__ >= 5) 129# define DONT_VECTORIZE __attribute__((optimize("no-tree-vectorize"))) 130# else 131# define DONT_VECTORIZE _Pragma("GCC optimize(\"no-tree-vectorize\")") 132# endif 133#else 134# define DONT_VECTORIZE 135#endif 136 137/* Tell the compiler that a branch is likely or unlikely. 138 * Only use these macros if it causes the compiler to generate better code. 139 * If you can remove a LIKELY/UNLIKELY annotation without speed changes in gcc 140 * and clang, please do. 141 */ 142#define LIKELY(x) (__builtin_expect((x), 1)) 143#define UNLIKELY(x) (__builtin_expect((x), 0)) 144 145#if __has_builtin(__builtin_unreachable) || (defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 5))) 146# define ZSTD_UNREACHABLE do { assert(0), __builtin_unreachable(); } while (0) 147#else 148# define ZSTD_UNREACHABLE do { assert(0); } while (0) 149#endif 150 151/* disable warnings */ 152 153/* compile time determination of SIMD support */ 154 155/* C-language Attributes are added in C23. */ 156#if defined(__STDC_VERSION__) && (__STDC_VERSION__ > 201710L) && defined(__has_c_attribute) 157# define ZSTD_HAS_C_ATTRIBUTE(x) __has_c_attribute(x) 158#else 159# define ZSTD_HAS_C_ATTRIBUTE(x) 0 160#endif 161 162/* Only use C++ attributes in C++. Some compilers report support for C++ 163 * attributes when compiling with C. 164 */ 165#define ZSTD_HAS_CPP_ATTRIBUTE(x) 0 166 167/* Define ZSTD_FALLTHROUGH macro for annotating switch case with the 'fallthrough' attribute. 168 * - C23: https://en.cppreference.com/w/c/language/attributes/fallthrough 169 * - CPP17: https://en.cppreference.com/w/cpp/language/attributes/fallthrough 170 * - Else: __attribute__((__fallthrough__)) 171 */ 172#define ZSTD_FALLTHROUGH fallthrough 173 174/*-************************************************************** 175* Alignment 176*****************************************************************/ 177 178/* @return 1 if @u is a 2^n value, 0 otherwise 179 * useful to check a value is valid for alignment restrictions */ 180MEM_STATIC int ZSTD_isPower2(size_t u) { 181 return (u & (u-1)) == 0; 182} 183 184/* this test was initially positioned in mem.h, 185 * but this file is removed (or replaced) for linux kernel 186 * so it's now hosted in compiler.h, 187 * which remains valid for both user & kernel spaces. 188 */ 189 190#ifndef ZSTD_ALIGNOF 191/* covers gcc, clang & MSVC */ 192/* note : this section must come first, before C11, 193 * due to a limitation in the kernel source generator */ 194# define ZSTD_ALIGNOF(T) __alignof(T) 195 196#endif /* ZSTD_ALIGNOF */ 197 198#ifndef ZSTD_ALIGNED 199/* C90-compatible alignment macro (GCC/Clang). Adjust for other compilers if needed. */ 200#define ZSTD_ALIGNED(a) __attribute__((aligned(a))) 201#endif /* ZSTD_ALIGNED */ 202 203 204/*-************************************************************** 205* Sanitizer 206*****************************************************************/ 207 208/* 209 * Zstd relies on pointer overflow in its decompressor. 210 * We add this attribute to functions that rely on pointer overflow. 211 */ 212#ifndef ZSTD_ALLOW_POINTER_OVERFLOW_ATTR 213# if __has_attribute(no_sanitize) 214# if !defined(__clang__) && defined(__GNUC__) && __GNUC__ < 8 215 /* gcc < 8 only has signed-integer-overlow which triggers on pointer overflow */ 216# define ZSTD_ALLOW_POINTER_OVERFLOW_ATTR __attribute__((no_sanitize("signed-integer-overflow"))) 217# else 218 /* older versions of clang [3.7, 5.0) will warn that pointer-overflow is ignored. */ 219# define ZSTD_ALLOW_POINTER_OVERFLOW_ATTR __attribute__((no_sanitize("pointer-overflow"))) 220# endif 221# else 222# define ZSTD_ALLOW_POINTER_OVERFLOW_ATTR 223# endif 224#endif 225 226/* 227 * Helper function to perform a wrapped pointer difference without triggering 228 * UBSAN. 229 * 230 * @returns lhs - rhs with wrapping 231 */ 232MEM_STATIC 233ZSTD_ALLOW_POINTER_OVERFLOW_ATTR 234ptrdiff_t ZSTD_wrappedPtrDiff(unsigned char const* lhs, unsigned char const* rhs) 235{ 236 return lhs - rhs; 237} 238 239/* 240 * Helper function to perform a wrapped pointer add without triggering UBSAN. 241 * 242 * @return ptr + add with wrapping 243 */ 244MEM_STATIC 245ZSTD_ALLOW_POINTER_OVERFLOW_ATTR 246unsigned char const* ZSTD_wrappedPtrAdd(unsigned char const* ptr, ptrdiff_t add) 247{ 248 return ptr + add; 249} 250 251/* 252 * Helper function to perform a wrapped pointer subtraction without triggering 253 * UBSAN. 254 * 255 * @return ptr - sub with wrapping 256 */ 257MEM_STATIC 258ZSTD_ALLOW_POINTER_OVERFLOW_ATTR 259unsigned char const* ZSTD_wrappedPtrSub(unsigned char const* ptr, ptrdiff_t sub) 260{ 261 return ptr - sub; 262} 263 264/* 265 * Helper function to add to a pointer that works around C's undefined behavior 266 * of adding 0 to NULL. 267 * 268 * @returns `ptr + add` except it defines `NULL + 0 == NULL`. 269 */ 270MEM_STATIC 271unsigned char* ZSTD_maybeNullPtrAdd(unsigned char* ptr, ptrdiff_t add) 272{ 273 return add > 0 ? ptr + add : ptr; 274} 275 276/* Issue #3240 reports an ASAN failure on an llvm-mingw build. Out of an 277 * abundance of caution, disable our custom poisoning on mingw. */ 278#ifdef __MINGW32__ 279#ifndef ZSTD_ASAN_DONT_POISON_WORKSPACE 280#define ZSTD_ASAN_DONT_POISON_WORKSPACE 1 281#endif 282#ifndef ZSTD_MSAN_DONT_POISON_WORKSPACE 283#define ZSTD_MSAN_DONT_POISON_WORKSPACE 1 284#endif 285#endif 286 287 288 289#endif /* ZSTD_COMPILER_H */