alternative.h 12.0 KB
Newer Older
1
/* SPDX-License-Identifier: GPL-2.0 */
H
H. Peter Anvin 已提交
2 3
#ifndef _ASM_X86_ALTERNATIVE_H
#define _ASM_X86_ALTERNATIVE_H
4 5

#include <linux/types.h>
M
Mathieu Desnoyers 已提交
6
#include <linux/stringify.h>
7 8
#include <asm/asm.h>

9 10 11 12
#ifndef __ASSEMBLY__

#include <linux/stddef.h>

13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34
/*
 * Alternative inline assembly for SMP.
 *
 * The LOCK_PREFIX macro defined here replaces the LOCK and
 * LOCK_PREFIX macros used everywhere in the source tree.
 *
 * SMP alternatives use the same data structures as the other
 * alternatives and the X86_FEATURE_UP flag to indicate the case of a
 * UP system running a SMP kernel.  The existing apply_alternatives()
 * works fine for patching a SMP kernel for UP.
 *
 * The SMP alternative tables can be kept after boot and contain both
 * UP and SMP versions of the instructions to allow switching back to
 * SMP at runtime, when hotplugging in a new CPU, which is especially
 * useful in virtualized environments.
 *
 * The very common lock prefix is handled as special case in a
 * separate table which is a pure address list without replacement ptr
 * and size information.  That keeps the table sizes small.
 */

#ifdef CONFIG_SMP
/*
 * LOCK_PREFIX_HERE records the current position in the instruction stream:
 * it emits a 4-byte-aligned ".long" into the .smp_locks section holding the
 * offset from that table entry to local label 671, and then places label 671
 * at the current position.
 */
#define LOCK_PREFIX_HERE \
		".pushsection .smp_locks,\"a\"\n"	\
		".balign 4\n"				\
		".long 671f - .\n" /* offset */		\
		".popsection\n"				\
		"671:"

/* LOCK_PREFIX records the position and then emits the "lock" prefix itself. */
#define LOCK_PREFIX LOCK_PREFIX_HERE "\n\tlock; "

#else /* ! CONFIG_SMP */
/* Without CONFIG_SMP both macros expand to the empty string. */
#define LOCK_PREFIX_HERE ""
#define LOCK_PREFIX ""
#endif

49 50 51 52 53 54 55 56 57 58
/*
 * objtool annotation to ignore the alternatives and only consider the original
 * instruction(s).
 *
 * Places local label 999 at the current position and emits a ".long" into the
 * .discard.ignore_alts section holding the offset from that entry back to the
 * label.
 */
#define ANNOTATE_IGNORE_ALTERNATIVE				\
	"999:\n\t"						\
	".pushsection .discard.ignore_alts\n\t"			\
	".long 999b - .\n\t"					\
	".popsection\n\t"

59
struct alt_instr {
60 61
	s32 instr_offset;	/* original instruction */
	s32 repl_offset;	/* offset to replacement instruction */
62
	u16 cpuid;		/* cpuid bit set for replacement */
63
	u8  instrlen;		/* length of original instruction */
64 65 66
	u8  replacementlen;	/* length of new instruction */
	u8  padlen;		/* length of build-time padding */
} __packed;
67

68 69 70 71 72 73
/*
 * Debug flag that can be tested to see whether alternative
 * instructions were patched in already:
 */
extern int alternatives_patched;

/*
 * NOTE(review): defined outside this header; presumably the entry point that
 * applies all alternatives at boot -- confirm against the implementation.
 */
extern void alternative_instructions(void);

/*
 * Process the struct alt_instr records between @start and @end, replacing
 * the original instructions with their replacements where the recorded
 * feature is present.
 */
extern void apply_alternatives(struct alt_instr *start, struct alt_instr *end);

/* Forward declaration; only pointers to struct module are used below. */
struct module;

#ifdef CONFIG_SMP
/* SMP builds: the implementations live outside this header. */
extern void alternatives_smp_module_add(struct module *mod, char *name,
					void *locks, void *locks_end,
					void *text, void *text_end);
extern void alternatives_smp_module_del(struct module *mod);
extern void alternatives_enable_smp(void);
extern int alternatives_text_reserved(void *start, void *end);
extern bool skip_smp_alternatives;
#else
/* !SMP builds: empty stubs, so callers need no #ifdef of their own. */
static inline void alternatives_smp_module_add(struct module *mod, char *name,
					       void *locks, void *locks_end,
					       void *text, void *text_end) {}
static inline void alternatives_smp_module_del(struct module *mod) {}
static inline void alternatives_enable_smp(void) {}
/* Always returns 0 on !SMP builds. */
static inline int alternatives_text_reserved(void *start, void *end)
{
	return 0;
}
#endif	/* CONFIG_SMP */

99 100
/*
 * String fragments for the local-label arithmetic used by the macros below.
 *
 * Labels, as placed by OLDINSTR* and ALTINSTR_REPLACEMENT:
 *   661        start of the original instruction(s)
 *   662        end of the original instruction(s)
 *   663        end of the build-time padding (alt_end_marker)
 *   664<num>   start of replacement <num>
 *   665<num>   end of replacement <num>
 */
#define b_replacement(num)	"664"#num
#define e_replacement(num)	"665"#num

#define alt_end_marker		"663"
/* Length of the original instruction(s), without padding. */
#define alt_slen		"662b-661b"
/* Length of the padding that follows the original instruction(s). */
#define alt_pad_len		alt_end_marker"b-662b"
/* Length of the original instruction(s) plus padding. */
#define alt_total_slen		alt_end_marker"b-661b"
/* Length of replacement <num>. */
#define alt_rlen(num)		e_replacement(num)"f-"b_replacement(num)"f"
107

108 109
/*
 * Emit the original instruction(s) between labels 661 and 662, followed by
 * padding up to the end marker label.
 *
 * The ".skip" count is (rlen - slen) when replacement @num is longer than the
 * original and 0 otherwise: gas evaluates a true comparison to -1, so the
 * negated comparison is a 0/1 multiplier. Padding bytes are 0x90.
 */
#define OLDINSTR(oldinstr, num)						\
	"# ALT: oldinstr\n"						\
	"661:\n\t" oldinstr "\n662:\n"					\
	"# ALT: padding\n"						\
	".skip -(((" alt_rlen(num) ")-(" alt_slen ")) > 0) * "		\
		"((" alt_rlen(num) ")-(" alt_slen ")),0x90\n"		\
	alt_end_marker ":\n"

116
/*
 * gas compatible max based on the idea from:
 * http://graphics.stanford.edu/~seander/bithacks.html#IntegerMinOrMax
 *
 * The additional "-" is needed because gas uses a "true" value of -1.
 *
 * Both arguments are string fragments. The result is a string containing the
 * expression for gas to evaluate, with each argument pasted in several times.
 */
#define alt_max_short(a, b)	"((" a ") ^ (((" a ") ^ (" b ")) & -(-((" a ") < (" b ")))))"
123

124 125 126 127
/*
 * Pad the second replacement alternative with additional NOPs if it is
 * additionally longer than the first replacement alternative.
 *
 * Same layout as OLDINSTR, but the padding is sized against the longer of
 * replacements @num1 and @num2 (via alt_max_short).
 */
#define OLDINSTR_2(oldinstr, num1, num2) \
	"# ALT: oldinstr2\n"									\
	"661:\n\t" oldinstr "\n662:\n"								\
	"# ALT: padding2\n"									\
	".skip -((" alt_max_short(alt_rlen(num1), alt_rlen(num2)) " - (" alt_slen ")) > 0) * "	\
		"(" alt_max_short(alt_rlen(num1), alt_rlen(num2)) " - (" alt_slen ")), 0x90\n"	\
	alt_end_marker ":\n"

136 137 138 139 140 141 142 143 144 145
/*
 * Three-replacement variant of OLDINSTR: the original instruction(s) sit
 * between labels 661 and 662, and the 0x90 padding up to the end marker is
 * sized against the longest of replacements @n1, @n2 and @n3 (nested
 * alt_max_short).
 */
#define OLDINSTR_3(oldinsn, n1, n2, n3)								\
	"# ALT: oldinstr3\n"									\
	"661:\n\t" oldinsn "\n662:\n"								\
	"# ALT: padding3\n"									\
	".skip -((" alt_max_short(alt_max_short(alt_rlen(n1), alt_rlen(n2)), alt_rlen(n3))	\
		" - (" alt_slen ")) > 0) * "							\
		"(" alt_max_short(alt_max_short(alt_rlen(n1), alt_rlen(n2)), alt_rlen(n3))	\
		" - (" alt_slen ")), 0x90\n"							\
	alt_end_marker ":\n"

146
/*
 * Emit one struct alt_instr record for replacement @num. Both .long values
 * are offsets relative to the position of the field itself ("- .").
 */
#define ALTINSTR_ENTRY(feature, num)					      \
	" .long 661b - .\n"				/* label           */ \
	" .long " b_replacement(num)"f - .\n"		/* new instruction */ \
	" .word " __stringify(feature) "\n"		/* feature bit     */ \
	" .byte " alt_total_slen "\n"			/* source len      */ \
	" .byte " alt_rlen(num) "\n"			/* replacement len */ \
	" .byte " alt_pad_len "\n"			/* pad len */
153

154
/*
 * Emit replacement @num: @newinstr bracketed by the begin/end labels that
 * alt_rlen(num) and ALTINSTR_ENTRY refer to.
 */
#define ALTINSTR_REPLACEMENT(newinstr, num)		/* replacement */	\
	"# ALT: replacement " #num "\n"						\
	b_replacement(num)":\n\t" newinstr "\n" e_replacement(num) ":\n"
157

M
Mathieu Desnoyers 已提交
158 159
/*
 * alternative assembly primitive:
 *
 * Emits the (padded) original instruction in place, one table record in
 * .altinstructions and the replacement body in .altinstr_replacement.
 */
#define ALTERNATIVE(oldinstr, newinstr, feature)			\
	OLDINSTR(oldinstr, 1)						\
	".pushsection .altinstructions,\"a\"\n"				\
	ALTINSTR_ENTRY(feature, 1)					\
	".popsection\n"							\
	".pushsection .altinstr_replacement, \"ax\"\n"			\
	ALTINSTR_REPLACEMENT(newinstr, 1)				\
	".popsection\n"
167 168

/*
 * Two-replacement form of ALTERNATIVE: one padded original, two table
 * records (feature1 first, then feature2) and two replacement bodies.
 */
#define ALTERNATIVE_2(oldinstr, newinstr1, feature1, newinstr2, feature2)\
	OLDINSTR_2(oldinstr, 1, 2)					\
	".pushsection .altinstructions,\"a\"\n"				\
	ALTINSTR_ENTRY(feature1, 1)					\
	ALTINSTR_ENTRY(feature2, 2)					\
	".popsection\n"							\
	".pushsection .altinstr_replacement, \"ax\"\n"			\
	ALTINSTR_REPLACEMENT(newinstr1, 1)				\
	ALTINSTR_REPLACEMENT(newinstr2, 2)				\
	".popsection\n"
M
Mathieu Desnoyers 已提交
178

179 180 181 182 183 184 185 186
/*
 * Three-replacement form of ALTERNATIVE: one padded original, three table
 * records (feat1, feat2, feat3 in that order) and three replacement bodies.
 */
#define ALTERNATIVE_3(oldinsn, newinsn1, feat1, newinsn2, feat2, newinsn3, feat3) \
	OLDINSTR_3(oldinsn, 1, 2, 3)						\
	".pushsection .altinstructions,\"a\"\n"					\
	ALTINSTR_ENTRY(feat1, 1)						\
	ALTINSTR_ENTRY(feat2, 2)						\
	ALTINSTR_ENTRY(feat3, 3)						\
	".popsection\n"								\
	".pushsection .altinstr_replacement, \"ax\"\n"				\
	ALTINSTR_REPLACEMENT(newinsn1, 1)					\
	ALTINSTR_REPLACEMENT(newinsn2, 2)					\
	ALTINSTR_REPLACEMENT(newinsn3, 3)					\
	".popsection\n"

192 193 194 195 196 197 198 199 200 201 202 203 204
/*
 * Alternative instructions for different CPU types or capabilities.
 *
 * This allows the use of optimized instructions even on generic binary
 * kernels.
 *
 * The area reserved for oldinstr must be at least as long as newinstr;
 * OLDINSTR pads it with NOP bytes (0x90) at build time when newinstr is
 * longer.
 *
 * For non barrier like inlines please define new variants
 * without volatile and memory clobber.
 */
#define alternative(oldinstr, newinstr, feature)			\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature) : : : "memory")
206

207
/*
 * Like alternative(), but with two replacement/feature pairs; expands
 * ALTERNATIVE_2 with a "memory" clobber and no operands.
 */
#define alternative_2(oldinstr, newinstr1, feature1, newinstr2, feature2) \
	asm_inline volatile(ALTERNATIVE_2(oldinstr, newinstr1, feature1, newinstr2, feature2) ::: "memory")
209

210 211 212
/*
 * Alternative inline assembly with input.
 *
 * Peculiarities:
 * No memory clobber here.
 * Argument numbers start with 1.
 * Best is to use constraints that are fixed size (like (%1) ... "r")
 * If you use variable sized constraints like "m" or "g" in the
 * replacement make sure to pad to the worst case length.
 * Leaving an unused argument 0 to keep API compatibility
 * (that is the dummy "i" (0) operand below).
 */
#define alternative_input(oldinstr, newinstr, feature, input...)	\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature)	\
		: : "i" (0), ## input)
224

225 226 227 228 229 230 231 232 233 234
/*
 * This is similar to alternative_input. But it has two features and
 * respective instructions.
 *
 * If CPU has feature2, newinstr2 is used.
 * Otherwise, if CPU has feature1, newinstr1 is used.
 * Otherwise, oldinstr is used.
 *
 * As in alternative_input, operand 0 is the dummy "i" (0) and there is no
 * memory clobber.
 */
#define alternative_input_2(oldinstr, newinstr1, feature1, newinstr2,	     \
			   feature2, input...)				     \
	asm_inline volatile(ALTERNATIVE_2(oldinstr, newinstr1, feature1,     \
		newinstr2, feature2)					     \
		: : "i" (0), ## input)

239 240
/*
 * Like alternative_input, but with a single output argument.
 *
 * @output is placed in the output operand list; the dummy "i" (0) is the
 * first input operand. Use ASM_OUTPUT2() to pass more than one output.
 */
#define alternative_io(oldinstr, newinstr, feature, output, input...)	\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature)	\
		: output : "i" (0), ## input)
243

244 245
/*
 * Like alternative_io, but for replacing a direct call with another one.
 *
 * @oldfunc and @newfunc are passed as the named "i" operands [old] and [new]
 * and referenced as %P[old] / %P[new] in the call instructions.
 *
 * NOTE(review): unlike alternative_call_2(), this variant does not append
 * ASM_CALL_CONSTRAINT to the outputs -- confirm whether that is intentional.
 */
#define alternative_call(oldfunc, newfunc, feature, output, input...)	\
	asm_inline volatile (ALTERNATIVE("call %P[old]", "call %P[new]", feature) \
		: output : [old] "i" (oldfunc), [new] "i" (newfunc), ## input)

249 250 251 252 253 254 255 256
/*
 * Like alternative_call, but there are two features and respective functions.
 * If CPU has feature2, function2 is used.
 * Otherwise, if CPU has feature1, function1 is used.
 * Otherwise, old function is used.
 *
 * ASM_CALL_CONSTRAINT is appended after @output, so @output must not be
 * empty.
 */
#define alternative_call_2(oldfunc, newfunc1, feature1, newfunc2, feature2,   \
			   output, input...)				      \
	asm_inline volatile (ALTERNATIVE_2("call %P[old]", "call %P[new1]", feature1,\
		"call %P[new2]", feature2)				      \
		: output, ASM_CALL_CONSTRAINT				      \
		: [old] "i" (oldfunc), [new1] "i" (newfunc1),		      \
		  [new2] "i" (newfunc2), ## input)
262

263 264 265 266
/*
 * Use this macro if you need more than one output parameter
 * in alternative_io.
 *
 * It expands to its arguments unchanged, which lets a comma-separated
 * operand list travel through a single macro parameter.
 */
#define ASM_OUTPUT2(a...) a
268

269 270 271 272 273 274
/*
 * use this macro if you need clobbers but no inputs in
 * alternative_{input,io,call}()
 *
 * It supplies a dummy "i" (0) operand as the only input and then opens the
 * clobber list with @clbr.
 */
#define ASM_NO_INPUT_CLOBBER(clbr...) "i" (0) : clbr

275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379
#else /* __ASSEMBLY__ */

#ifdef CONFIG_SMP
/*
 * Emit a "lock" prefix at local label 672 and record its location: a
 * 4-byte-aligned ".long" holding the offset from the table entry back to the
 * label is added to the .smp_locks section.
 */
	.macro LOCK_PREFIX
672:	lock
	.pushsection .smp_locks,"a"
	.balign 4
	.long 672b - .
	.popsection
	.endm
#else
/* Without CONFIG_SMP the macro expands to nothing. */
	.macro LOCK_PREFIX
	.endm
#endif

/*
 * objtool annotation to ignore the alternatives and only consider the original
 * instruction(s).
 *
 * Places a label at the current position and emits a ".long" into the
 * .discard.ignore_alts section holding the offset from that entry back to the
 * label. The \@ suffix (gas's per-expansion macro counter) keeps the label
 * name unique across expansions.
 */
.macro ANNOTATE_IGNORE_ALTERNATIVE
	.Lannotate_\@:
	.pushsection .discard.ignore_alts
	.long .Lannotate_\@ - .
	.popsection
.endm

/*
 * Issue one struct alt_instr descriptor entry (need to put it into
 * the section .altinstructions, see below). This entry contains
 * enough information for the alternatives patching code to patch an
 * instruction. See apply_alternatives().
 *
 * @orig:     label of the original instruction; stored as an offset
 *            relative to the field ("- .")
 * @alt:      label of the replacement; stored as an offset relative to the
 *            field ("- .")
 * @feature:  feature value, emitted as a .word
 * @orig_len: length of the original instruction area, emitted as a .byte
 * @alt_len:  length of the replacement, emitted as a .byte
 * @pad_len:  length of the padding, emitted as a .byte
 */
.macro altinstruction_entry orig alt feature orig_len alt_len pad_len
	.long \orig - .
	.long \alt - .
	.word \feature
	.byte \orig_len
	.byte \alt_len
	.byte \pad_len
.endm

/*
 * Define an alternative between two instructions. If @feature is
 * present, early code in apply_alternatives() replaces @oldinstr with
 * @newinstr. ".skip" directive takes care of proper instruction padding
 * in case @newinstr is longer than @oldinstr.
 *
 * Local labels:
 *   140  start of @oldinstr
 *   141  end of @oldinstr
 *   142  end of the 0x90 padding
 *   143  start of @newinstr (in .altinstr_replacement)
 *   144  end of @newinstr
 */
.macro ALTERNATIVE oldinstr, newinstr, feature
140:
	\oldinstr
141:
	.skip -(((144f-143f)-(141b-140b)) > 0) * ((144f-143f)-(141b-140b)),0x90
142:

	.pushsection .altinstructions,"a"
	altinstruction_entry 140b,143f,\feature,142b-140b,144f-143f,142b-141b
	.popsection

	.pushsection .altinstr_replacement,"ax"
143:
	\newinstr
144:
	.popsection
.endm

/*
 * Length expressions used by ALTERNATIVE_2, written in terms of its local
 * labels: 140/141 bracket the original instruction, 143/144 the first
 * replacement and 144/145 the second.
 */
#define old_len			141b-140b
#define new_len1		144f-143f
#define new_len2		145f-144f

/*
 * gas compatible max based on the idea from:
 * http://graphics.stanford.edu/~seander/bithacks.html#IntegerMinOrMax
 *
 * The additional "-" is needed because gas uses a "true" value of -1.
 */
#define alt_max_short(a, b)	((a) ^ (((a) ^ (b)) & -(-((a) < (b)))))


/*
 * Same as ALTERNATIVE macro above but for two alternatives. If CPU
 * has @feature1, it replaces @oldinstr with @newinstr1. If CPU has
 * @feature2, it replaces @oldinstr with @newinstr2.
 *
 * The padding after @oldinstr is sized against the longer of the two
 * replacements. Labels 143/144 bracket @newinstr1 and 144/145 bracket
 * @newinstr2.
 */
.macro ALTERNATIVE_2 oldinstr, newinstr1, feature1, newinstr2, feature2
140:
	\oldinstr
141:
	.skip -((alt_max_short(new_len1, new_len2) - (old_len)) > 0) * \
		(alt_max_short(new_len1, new_len2) - (old_len)),0x90
142:

	.pushsection .altinstructions,"a"
	altinstruction_entry 140b,143f,\feature1,142b-140b,144f-143f,142b-141b
	altinstruction_entry 140b,144f,\feature2,142b-140b,145f-144f,142b-141b
	.popsection

	.pushsection .altinstr_replacement,"ax"
143:
	\newinstr1
144:
	\newinstr2
145:
	.popsection
.endm

380 381
#endif /* __ASSEMBLY__ */

H
H. Peter Anvin 已提交
382
#endif /* _ASM_X86_ALTERNATIVE_H */