1/* SPDX-License-Identifier: GPL-2.0 */
2
3/*
4 * Copyright (C) 2023 Google LLC.
5 */
6
7#ifndef __UNROLL_H
8#define __UNROLL_H
9
10#include <linux/args.h>
11
12#ifdef CONFIG_CC_IS_CLANG
13#define __pick_unrolled(x, y) _Pragma(#x)
14#else
15#define __pick_unrolled(x, y) _Pragma(#y)
16#endif
17
18/**
19 * unrolled - loop attributes to ask the compiler to unroll it
20 *
21 * Usage:
22 *
23 * #define BATCH 8
24 *
25 * unrolled_count(BATCH)
26 * for (u32 i = 0; i < BATCH; i++)
27 * // loop body without cross-iteration dependencies
28 *
29 * This is only a hint and the compiler is free to disable unrolling if it
30 * thinks the count is suboptimal and may hurt performance and/or hugely
31 * increase object code size.
32 * Not having any cross-iteration dependencies (i.e. when iter x + 1 depends
33 * on what iter x will do with variables) is not a strict requirement, but
34 * provides best performance and object code size.
35 * Available only on Clang and GCC 8.x onwards.
36 */
37
38/* Ask the compiler to pick an optimal unroll count, Clang only */
39#define unrolled \
40 __pick_unrolled(clang loop unroll(enable), /* nothing */)
41
42/* Unroll each @n iterations of the loop */
43#define unrolled_count(n) \
44 __pick_unrolled(clang loop unroll_count(n), GCC unroll n)
45
46/* Unroll the whole loop */
47#define unrolled_full \
48 __pick_unrolled(clang loop unroll(full), GCC unroll 65534)
49
50/* Never unroll the loop */
51#define unrolled_none \
52 __pick_unrolled(clang loop unroll(disable), GCC unroll 1)
53
54#define UNROLL(N, MACRO, args...) CONCATENATE(__UNROLL_, N)(MACRO, args)
55
56#define __UNROLL_0(MACRO, args...)
57#define __UNROLL_1(MACRO, args...) __UNROLL_0(MACRO, args) MACRO(0, args)
58#define __UNROLL_2(MACRO, args...) __UNROLL_1(MACRO, args) MACRO(1, args)
59#define __UNROLL_3(MACRO, args...) __UNROLL_2(MACRO, args) MACRO(2, args)
60#define __UNROLL_4(MACRO, args...) __UNROLL_3(MACRO, args) MACRO(3, args)
61#define __UNROLL_5(MACRO, args...) __UNROLL_4(MACRO, args) MACRO(4, args)
62#define __UNROLL_6(MACRO, args...) __UNROLL_5(MACRO, args) MACRO(5, args)
63#define __UNROLL_7(MACRO, args...) __UNROLL_6(MACRO, args) MACRO(6, args)
64#define __UNROLL_8(MACRO, args...) __UNROLL_7(MACRO, args) MACRO(7, args)
65#define __UNROLL_9(MACRO, args...) __UNROLL_8(MACRO, args) MACRO(8, args)
66#define __UNROLL_10(MACRO, args...) __UNROLL_9(MACRO, args) MACRO(9, args)
67#define __UNROLL_11(MACRO, args...) __UNROLL_10(MACRO, args) MACRO(10, args)
68#define __UNROLL_12(MACRO, args...) __UNROLL_11(MACRO, args) MACRO(11, args)
69#define __UNROLL_13(MACRO, args...) __UNROLL_12(MACRO, args) MACRO(12, args)
70#define __UNROLL_14(MACRO, args...) __UNROLL_13(MACRO, args) MACRO(13, args)
71#define __UNROLL_15(MACRO, args...) __UNROLL_14(MACRO, args) MACRO(14, args)
72#define __UNROLL_16(MACRO, args...) __UNROLL_15(MACRO, args) MACRO(15, args)
73#define __UNROLL_17(MACRO, args...) __UNROLL_16(MACRO, args) MACRO(16, args)
74#define __UNROLL_18(MACRO, args...) __UNROLL_17(MACRO, args) MACRO(17, args)
75#define __UNROLL_19(MACRO, args...) __UNROLL_18(MACRO, args) MACRO(18, args)
76#define __UNROLL_20(MACRO, args...) __UNROLL_19(MACRO, args) MACRO(19, args)
77
78#endif /* __UNROLL_H */
79