at master 3.1 kB view raw
1/* SPDX-License-Identifier: GPL-2.0 */ 2 3/* 4 * Copyright (C) 2023 Google LLC. 5 */ 6 7#ifndef __UNROLL_H 8#define __UNROLL_H 9 10#include <linux/args.h> 11 12#ifdef CONFIG_CC_IS_CLANG 13#define __pick_unrolled(x, y) _Pragma(#x) 14#else 15#define __pick_unrolled(x, y) _Pragma(#y) 16#endif 17 18/** 19 * unrolled - loop attributes to ask the compiler to unroll it 20 * 21 * Usage: 22 * 23 * #define BATCH 8 24 * 25 * unrolled_count(BATCH) 26 * for (u32 i = 0; i < BATCH; i++) 27 * // loop body without cross-iteration dependencies 28 * 29 * This is only a hint and the compiler is free to disable unrolling if it 30 * thinks the count is suboptimal and may hurt performance and/or hugely 31 * increase object code size. 32 * Not having any cross-iteration dependencies (i.e. when iter x + 1 depends 33 * on what iter x will do with variables) is not a strict requirement, but 34 * provides best performance and object code size. 35 * Available only on Clang and GCC 8.x onwards. 36 */ 37 38/* Ask the compiler to pick an optimal unroll count, Clang only */ 39#define unrolled \ 40 __pick_unrolled(clang loop unroll(enable), /* nothing */) 41 42/* Unroll each @n iterations of the loop */ 43#define unrolled_count(n) \ 44 __pick_unrolled(clang loop unroll_count(n), GCC unroll n) 45 46/* Unroll the whole loop */ 47#define unrolled_full \ 48 __pick_unrolled(clang loop unroll(full), GCC unroll 65534) 49 50/* Never unroll the loop */ 51#define unrolled_none \ 52 __pick_unrolled(clang loop unroll(disable), GCC unroll 1) 53 54#define UNROLL(N, MACRO, args...) CONCATENATE(__UNROLL_, N)(MACRO, args) 55 56#define __UNROLL_0(MACRO, args...) 57#define __UNROLL_1(MACRO, args...) __UNROLL_0(MACRO, args) MACRO(0, args) 58#define __UNROLL_2(MACRO, args...) __UNROLL_1(MACRO, args) MACRO(1, args) 59#define __UNROLL_3(MACRO, args...) __UNROLL_2(MACRO, args) MACRO(2, args) 60#define __UNROLL_4(MACRO, args...) __UNROLL_3(MACRO, args) MACRO(3, args) 61#define __UNROLL_5(MACRO, args...) __UNROLL_4(MACRO, args) MACRO(4, args) 62#define __UNROLL_6(MACRO, args...) __UNROLL_5(MACRO, args) MACRO(5, args) 63#define __UNROLL_7(MACRO, args...) __UNROLL_6(MACRO, args) MACRO(6, args) 64#define __UNROLL_8(MACRO, args...) __UNROLL_7(MACRO, args) MACRO(7, args) 65#define __UNROLL_9(MACRO, args...) __UNROLL_8(MACRO, args) MACRO(8, args) 66#define __UNROLL_10(MACRO, args...) __UNROLL_9(MACRO, args) MACRO(9, args) 67#define __UNROLL_11(MACRO, args...) __UNROLL_10(MACRO, args) MACRO(10, args) 68#define __UNROLL_12(MACRO, args...) __UNROLL_11(MACRO, args) MACRO(11, args) 69#define __UNROLL_13(MACRO, args...) __UNROLL_12(MACRO, args) MACRO(12, args) 70#define __UNROLL_14(MACRO, args...) __UNROLL_13(MACRO, args) MACRO(13, args) 71#define __UNROLL_15(MACRO, args...) __UNROLL_14(MACRO, args) MACRO(14, args) 72#define __UNROLL_16(MACRO, args...) __UNROLL_15(MACRO, args) MACRO(15, args) 73#define __UNROLL_17(MACRO, args...) __UNROLL_16(MACRO, args) MACRO(16, args) 74#define __UNROLL_18(MACRO, args...) __UNROLL_17(MACRO, args) MACRO(17, args) 75#define __UNROLL_19(MACRO, args...) __UNROLL_18(MACRO, args) MACRO(18, args) 76#define __UNROLL_20(MACRO, args...) __UNROLL_19(MACRO, args) MACRO(19, args) 77 78#endif /* __UNROLL_H */