summaryrefslogtreecommitdiff
path: root/arch/mips/include/asm/unroll.h
blob: 6f4ac854b12d28911e409ee2df9c8c17a293e958 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
/* SPDX-License-Identifier: GPL-2.0-only */
#ifndef __ASM_UNROLL_H__
#define __ASM_UNROLL_H__

/*
 * Explicitly unroll a loop, for use in cases where doing so is performance
 * critical.
 *
 * Ideally we'd rely upon the compiler to provide this but there's no commonly
 * available means to do so. For example GCC's "#pragma GCC unroll"
 * functionality would be ideal but is only available from GCC 8 onwards. Using
 * -funroll-loops is an option but GCC tends to make poor choices when
 * compiling our string functions. -funroll-all-loops leads to massive code
 * bloat, even if only applied to the string functions.
 */
#define unroll(times, fn, ...) do {				\
	extern void bad_unroll(void)				\
		__compiletime_error("Unsupported unroll");	\
								\
	/*							\
	 * We can't unroll if the number of iterations isn't	\
	 * compile-time constant. Unfortunately clang versions	\
	 * up until 8.0 tend to miss obvious constants & cause	\
	 * this check to fail, even though they go on to	\
	 * generate reasonable code for the switch statement,	\
	 * so we skip the sanity check for those compilers.	\
	 */							\
	BUILD_BUG_ON(!__builtin_constant_p(times));		\
								\
	switch (times) {					\
	case 32: fn(__VA_ARGS__); fallthrough;			\
	case 31: fn(__VA_ARGS__); fallthrough;			\
	case 30: fn(__VA_ARGS__); fallthrough;			\
	case 29: fn(__VA_ARGS__); fallthrough;			\
	case 28: fn(__VA_ARGS__); fallthrough;			\
	case 27: fn(__VA_ARGS__); fallthrough;			\
	case 26: fn(__VA_ARGS__); fallthrough;			\
	case 25: fn(__VA_ARGS__); fallthrough;			\
	case 24: fn(__VA_ARGS__); fallthrough;			\
	case 23: fn(__VA_ARGS__); fallthrough;			\
	case 22: fn(__VA_ARGS__); fallthrough;			\
	case 21: fn(__VA_ARGS__); fallthrough;			\
	case 20: fn(__VA_ARGS__); fallthrough;			\
	case 19: fn(__VA_ARGS__); fallthrough;			\
	case 18: fn(__VA_ARGS__); fallthrough;			\
	case 17: fn(__VA_ARGS__); fallthrough;			\
	case 16: fn(__VA_ARGS__); fallthrough;			\
	case 15: fn(__VA_ARGS__); fallthrough;			\
	case 14: fn(__VA_ARGS__); fallthrough;			\
	case 13: fn(__VA_ARGS__); fallthrough;			\
	case 12: fn(__VA_ARGS__); fallthrough;			\
	case 11: fn(__VA_ARGS__); fallthrough;			\
	case 10: fn(__VA_ARGS__); fallthrough;			\
	case 9: fn(__VA_ARGS__); fallthrough;			\
	case 8: fn(__VA_ARGS__); fallthrough;			\
	case 7: fn(__VA_ARGS__); fallthrough;			\
	case 6: fn(__VA_ARGS__); fallthrough;			\
	case 5: fn(__VA_ARGS__); fallthrough;			\
	case 4: fn(__VA_ARGS__); fallthrough;			\
	case 3: fn(__VA_ARGS__); fallthrough;			\
	case 2: fn(__VA_ARGS__); fallthrough;			\
	case 1: fn(__VA_ARGS__); fallthrough;			\
	case 0: break;						\
								\
	default:						\
		/*						\
		 * Either the iteration count is unreasonable	\
		 * or we need to add more cases above.		\
		 */						\
		bad_unroll();					\
		break;						\
	}							\
} while (0)

#endif /* __ASM_UNROLL_H__ */