alternative.h 12.7 KB
Newer Older
1
/* SPDX-License-Identifier: GPL-2.0 */
H
H. Peter Anvin 已提交
2 3
#ifndef _ASM_X86_ALTERNATIVE_H
#define _ASM_X86_ALTERNATIVE_H
4 5

#include <linux/types.h>
M
Mathieu Desnoyers 已提交
6
#include <linux/stringify.h>
7 8
#include <asm/asm.h>

9 10 11
/*
 * ALTINSTR_FLAG_INV is bit 15, the top bit of a 16-bit feature word.
 * ALT_NOT() ORs it into a feature number.
 * NOTE(review): presumably a set bit means "patch when the feature is NOT
 * present" -- confirm against the patching code.
 */
#define ALTINSTR_FLAG_INV	(1 << 15)
#define ALT_NOT(feat)		((feat) | ALTINSTR_FLAG_INV)

12 13 14 15
#ifndef __ASSEMBLY__

#include <linux/stddef.h>

16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37
/*
 * Alternative inline assembly for SMP.
 *
 * The LOCK_PREFIX macro defined here replaces the LOCK and
 * LOCK_PREFIX macros used everywhere in the source tree.
 *
 * SMP alternatives use the same data structures as the other
 * alternatives and the X86_FEATURE_UP flag to indicate the case of a
 * UP system running a SMP kernel.  The existing apply_alternatives()
 * works fine for patching a SMP kernel for UP.
 *
 * The SMP alternative tables can be kept after boot and contain both
 * UP and SMP versions of the instructions to allow switching back to
 * SMP at runtime, when hotplugging in a new CPU, which is especially
 * useful in virtualized environments.
 *
 * The very common lock prefix is handled as special case in a
 * separate table which is a pure address list without replacement ptr
 * and size information.  That keeps the table sizes small.
 */

#ifdef CONFIG_SMP
/*
 * LOCK_PREFIX_HERE places local label 671 at the point of use and stores
 * that label's PC-relative offset as a 4-byte-aligned .long in the
 * .smp_locks section.
 */
#define LOCK_PREFIX_HERE \
		".pushsection .smp_locks,\"a\"\n"	\
		".balign 4\n"				\
		".long 671f - .\n" /* offset */		\
		".popsection\n"				\
		"671:"

/* Record the site as above, then emit the "lock" prefix itself. */
#define LOCK_PREFIX LOCK_PREFIX_HERE "\n\tlock; "

#else /* ! CONFIG_SMP */
/* UP build: both macros expand to an empty string. */
#define LOCK_PREFIX_HERE ""
#define LOCK_PREFIX ""
#endif

52 53 54 55 56 57 58 59 60 61
/*
 * objtool annotation to ignore the alternatives and only consider the original
 * instruction(s).
 *
 * Places local label 999 at the point of use and stores that label's
 * PC-relative offset as a .long in the .discard.ignore_alts section.
 */
#define ANNOTATE_IGNORE_ALTERNATIVE				\
	"999:\n\t"						\
	".pushsection .discard.ignore_alts\n\t"			\
	".long 999b - .\n\t"					\
	".popsection\n\t"

62
struct alt_instr {
63 64
	s32 instr_offset;	/* original instruction */
	s32 repl_offset;	/* offset to replacement instruction */
65
	u16 cpuid;		/* cpuid bit set for replacement */
66
	u8  instrlen;		/* length of original instruction */
67 68 69
	u8  replacementlen;	/* length of new instruction */
	u8  padlen;		/* length of build-time padding */
} __packed;
70

71 72 73 74 75 76
/*
 * Debug flag that can be tested to see whether alternative
 * instructions were patched in already:
 */
extern int alternatives_patched;

77 78 79 80 81 82 83 84 85 86
extern void alternative_instructions(void);
extern void apply_alternatives(struct alt_instr *start, struct alt_instr *end);

struct module;

#ifdef CONFIG_SMP
extern void alternatives_smp_module_add(struct module *mod, char *name,
					void *locks, void *locks_end,
					void *text, void *text_end);
extern void alternatives_smp_module_del(struct module *mod);
87
extern void alternatives_enable_smp(void);
88
extern int alternatives_text_reserved(void *start, void *end);
89
extern bool skip_smp_alternatives;
90 91
#else
/* !CONFIG_SMP stubs: the module add/del and enable hooks do nothing. */
static inline void alternatives_smp_module_add(struct module *mod, char *name,
					       void *locks, void *locks_end,
					       void *text, void *text_end) {}
static inline void alternatives_smp_module_del(struct module *mod) {}
static inline void alternatives_enable_smp(void) {}

/* !CONFIG_SMP stub: always returns 0. */
static inline int alternatives_text_reserved(void *start, void *end)
{
	return 0;
}
100 101
#endif	/* CONFIG_SMP */

102 103
/*
 * Numeric local labels used by the inline-asm alternative macros, and the
 * length expressions (as strings for the assembler) built from them:
 *
 *   661 .. 662			original instruction(s)
 *   662 .. 663			build-time padding
 *   664<num> .. 665<num>	replacement number <num>
 */
#define b_replacement(num)	"664"#num
#define e_replacement(num)	"665"#num

#define alt_end_marker		"663"
#define alt_slen		"662b-661b"
#define alt_pad_len		alt_end_marker"b-662b"
#define alt_total_slen		alt_end_marker"b-661b"
#define alt_rlen(num)		e_replacement(num)"f-"b_replacement(num)"f"
110

111 112
/*
 * Emit @oldinstr between labels 661 and 662, then pad with 0x90 bytes up
 * to the length of replacement @num when that replacement is longer.
 * The alt_end_marker label closes the padded site.
 *
 * gas uses -1 for a true comparison, hence the leading "-": the ".skip"
 * count becomes either 0 or the (positive) length difference.
 */
#define OLDINSTR(oldinstr, num)						\
	"# ALT: oldinstr\n"						\
	"661:\n\t" oldinstr "\n662:\n"					\
	"# ALT: padding\n"						\
	".skip -(((" alt_rlen(num) ")-(" alt_slen ")) > 0) * "		\
		"((" alt_rlen(num) ")-(" alt_slen ")),0x90\n"		\
	alt_end_marker ":\n"

119
/*
 * gas compatible max based on the idea from:
 * http://graphics.stanford.edu/~seander/bithacks.html#IntegerMinOrMax
 *
 * The additional "-" is needed because gas uses a "true" value of -1.
 *
 * @a and @b are string literals; the macro yields the expression text,
 * which is evaluated by the assembler rather than by the C compiler.
 */
#define alt_max_short(a, b)	"((" a ") ^ (((" a ") ^ (" b ")) & -(-((" a ") < (" b ")))))"
126

127 128 129 130
/*
 * Like OLDINSTR(), but for two replacements: the original instruction is
 * padded with 0x90 bytes up to the longer of replacements @num1 and @num2,
 * so the second replacement also fits when it is longer than the first.
 */
#define OLDINSTR_2(oldinstr, num1, num2) \
	"# ALT: oldinstr2\n"									\
	"661:\n\t" oldinstr "\n662:\n"								\
	"# ALT: padding2\n"									\
	".skip -((" alt_max_short(alt_rlen(num1), alt_rlen(num2)) " - (" alt_slen ")) > 0) * "	\
		"(" alt_max_short(alt_rlen(num1), alt_rlen(num2)) " - (" alt_slen ")), 0x90\n"	\
	alt_end_marker ":\n"

139 140 141 142 143 144 145 146 147 148
/*
 * Three-replacement variant: emit @oldinsn between labels 661 and 662 and
 * pad it with 0x90 bytes up to the longest of replacements @n1, @n2 and
 * @n3 (nested alt_max_short()), then place the alt_end_marker label.
 */
#define OLDINSTR_3(oldinsn, n1, n2, n3)								\
	"# ALT: oldinstr3\n"									\
	"661:\n\t" oldinsn "\n662:\n"								\
	"# ALT: padding3\n"									\
	".skip -((" alt_max_short(alt_max_short(alt_rlen(n1), alt_rlen(n2)), alt_rlen(n3))	\
		" - (" alt_slen ")) > 0) * "							\
		"(" alt_max_short(alt_max_short(alt_rlen(n1), alt_rlen(n2)), alt_rlen(n3))	\
		" - (" alt_slen ")), 0x90\n"							\
	alt_end_marker ":\n"

149
/*
 * Emit one table record for replacement @num of the current 661/662/663
 * site: two PC-relative .long offsets, the stringified @feature as a
 * .word, and three length bytes. The ALTERNATIVE*() macros expand this
 * inside the .altinstructions section.
 */
#define ALTINSTR_ENTRY(feature, num)					      \
	" .long 661b - .\n"				/* label           */ \
	" .long " b_replacement(num)"f - .\n"		/* new instruction */ \
	" .word " __stringify(feature) "\n"		/* feature bit     */ \
	" .byte " alt_total_slen "\n"			/* source len      */ \
	" .byte " alt_rlen(num) "\n"			/* replacement len */ \
	" .byte " alt_pad_len "\n"			/* pad len */
156

157
/*
 * Emit replacement number @num: @newinstr bracketed by the
 * b_replacement(num) and e_replacement(num) labels that alt_rlen() and
 * ALTINSTR_ENTRY() refer to.
 */
#define ALTINSTR_REPLACEMENT(newinstr, num)		/* replacement */	\
	"# ALT: replacement " #num "\n"						\
	b_replacement(num)":\n\t" newinstr "\n" e_replacement(num) ":\n"
160

M
Mathieu Desnoyers 已提交
161 162
/*
 * alternative assembly primitive:
 *
 * Emits the (padded) original instruction in place, one record in
 * .altinstructions, and the replacement bytes in .altinstr_replacement.
 */
#define ALTERNATIVE(oldinstr, newinstr, feature)			\
	OLDINSTR(oldinstr, 1)						\
	".pushsection .altinstructions,\"a\"\n"				\
	ALTINSTR_ENTRY(feature, 1)					\
	".popsection\n"							\
	".pushsection .altinstr_replacement, \"ax\"\n"			\
	ALTINSTR_REPLACEMENT(newinstr, 1)				\
	".popsection\n"
170 171

/*
 * Two-replacement variant of ALTERNATIVE(): the site is padded to the
 * longer replacement, and one table record is emitted per replacement,
 * @feature1 first and @feature2 second.
 */
#define ALTERNATIVE_2(oldinstr, newinstr1, feature1, newinstr2, feature2)\
	OLDINSTR_2(oldinstr, 1, 2)					\
	".pushsection .altinstructions,\"a\"\n"				\
	ALTINSTR_ENTRY(feature1, 1)					\
	ALTINSTR_ENTRY(feature2, 2)					\
	".popsection\n"							\
	".pushsection .altinstr_replacement, \"ax\"\n"			\
	ALTINSTR_REPLACEMENT(newinstr1, 1)				\
	ALTINSTR_REPLACEMENT(newinstr2, 2)				\
	".popsection\n"
M
Mathieu Desnoyers 已提交
181

182 183 184 185 186
/*
 * If @feature is set, patch in @newinstr_yes, otherwise @newinstr_no.
 *
 * Built on ALTERNATIVE_2(): @newinstr_no is registered first under
 * X86_FEATURE_ALWAYS and @newinstr_yes second under @feature.
 */
#define ALTERNATIVE_TERNARY(oldinstr, feature, newinstr_yes, newinstr_no) \
	ALTERNATIVE_2(oldinstr, newinstr_no, X86_FEATURE_ALWAYS,	\
		      newinstr_yes, feature)

187 188 189 190 191 192 193 194
/*
 * Three-replacement variant of ALTERNATIVE(): the site is padded to the
 * longest replacement, and one table record is emitted per replacement
 * in argument order (@feat1, @feat2, @feat3).
 */
#define ALTERNATIVE_3(oldinsn, newinsn1, feat1, newinsn2, feat2, newinsn3, feat3) \
	OLDINSTR_3(oldinsn, 1, 2, 3)						\
	".pushsection .altinstructions,\"a\"\n"					\
	ALTINSTR_ENTRY(feat1, 1)						\
	ALTINSTR_ENTRY(feat2, 2)						\
	ALTINSTR_ENTRY(feat3, 3)						\
	".popsection\n"								\
	".pushsection .altinstr_replacement, \"ax\"\n"				\
	ALTINSTR_REPLACEMENT(newinsn1, 1)					\
	ALTINSTR_REPLACEMENT(newinsn2, 2)					\
	ALTINSTR_REPLACEMENT(newinsn3, 3)					\
	".popsection\n"

200 201 202 203 204 205 206 207 208 209 210 211 212
/*
 * Alternative instructions for different CPU types or capabilities.
 *
 * This allows the use of optimized instructions even on generic binary
 * kernels.
 *
 * The patch site must be at least as long as newinstr; OLDINSTR() pads
 * oldinstr with 0x90 (NOP) bytes at build time when it is shorter.
 *
 * For non-barrier-like inlines, please define new variants
 * without volatile and memory clobber.
 */
#define alternative(oldinstr, newinstr, feature)			\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature) : : : "memory")
214

215
/*
 * Statement form of ALTERNATIVE_2(): no operands, "memory" clobber.
 */
#define alternative_2(oldinstr, newinstr1, feature1, newinstr2, feature2) \
	asm_inline volatile(ALTERNATIVE_2(oldinstr, newinstr1, feature1, newinstr2, feature2) ::: "memory")
217

218 219 220
/*
 * Statement form of ALTERNATIVE_TERNARY(): no operands, "memory" clobber.
 */
#define alternative_ternary(oldinstr, feature, newinstr_yes, newinstr_no) \
	asm_inline volatile(ALTERNATIVE_TERNARY(oldinstr, feature, newinstr_yes, newinstr_no) ::: "memory")

221 222 223
/*
 * Alternative inline assembly with input.
 *
 * Peculiarities:
 * No memory clobber here.
 * Argument numbers start with 1.
 * Best is to use constraints that are fixed size (like (%1) ... "r")
 * If you use variable sized constraints like "m" or "g" in the
 * replacement make sure to pad to the worst case length.
 * Leaving an unused argument 0 to keep API compatibility.
 */
#define alternative_input(oldinstr, newinstr, feature, input...)	\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature)	\
		: : "i" (0), ## input)
235

236 237 238 239 240 241 242 243 244 245
/*
 * This is similar to alternative_input. But it has two features and
 * respective instructions.
 *
 * If CPU has feature2, newinstr2 is used.
 * Otherwise, if CPU has feature1, newinstr1 is used.
 * Otherwise, oldinstr is used.
 *
 * As with alternative_input, operand 0 is an unused "i" (0) placeholder.
 */
#define alternative_input_2(oldinstr, newinstr1, feature1, newinstr2,	     \
			   feature2, input...)				     \
	asm_inline volatile(ALTERNATIVE_2(oldinstr, newinstr1, feature1,     \
		newinstr2, feature2)					     \
		: : "i" (0), ## input)

250 251
/*
 * Like alternative_input, but with a single output argument.
 * The first input operand is still the unused "i" (0) placeholder.
 */
#define alternative_io(oldinstr, newinstr, feature, output, input...)	\
	asm_inline volatile (ALTERNATIVE(oldinstr, newinstr, feature)	\
		: output : "i" (0), ## input)
254

255 256
/*
 * Like alternative_io, but for replacing a direct call with another one.
 *
 * @oldfunc and @newfunc are passed as the named "i" operands [old] and
 * [new]; there is no dummy operand 0 here.
 * NOTE(review): unlike alternative_call_2(), the output list does not
 * include ASM_CALL_CONSTRAINT -- confirm that this is intentional.
 */
#define alternative_call(oldfunc, newfunc, feature, output, input...)	\
	asm_inline volatile (ALTERNATIVE("call %P[old]", "call %P[new]", feature) \
		: output : [old] "i" (oldfunc), [new] "i" (newfunc), ## input)

260 261 262 263 264 265 266 267
/*
 * Like alternative_call, but there are two features and respective functions.
 * If CPU has feature2, function2 is used.
 * Otherwise, if CPU has feature1, function1 is used.
 * Otherwise, old function is used.
 *
 * ASM_CALL_CONSTRAINT is appended after @output, so @output must supply at
 * least one output operand for the list to be well-formed.
 */
#define alternative_call_2(oldfunc, newfunc1, feature1, newfunc2, feature2,   \
			   output, input...)				      \
	asm_inline volatile (ALTERNATIVE_2("call %P[old]", "call %P[new1]", feature1,\
		"call %P[new2]", feature2)				      \
		: output, ASM_CALL_CONSTRAINT				      \
		: [old] "i" (oldfunc), [new1] "i" (newfunc1),		      \
		  [new2] "i" (newfunc2), ## input)
273

274 275 276 277
/*
 * Use this macro if you need more than one output parameter
 * in alternative_io(): it forwards its comma-separated arguments
 * unchanged, so they travel as a single macro argument.
 */
#define ASM_OUTPUT2(a...) a
279

280 281 282 283 284 285
/*
 * use this macro if you need clobbers but no inputs in
 * alternative_{input,io,call}()
 *
 * Expands to a dummy "i" (0) input followed by ':' and the clobber list,
 * so it is meant to be passed in the position of the input arguments.
 */
#define ASM_NO_INPUT_CLOBBER(clbr...) "i" (0) : clbr

286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390
#else /* __ASSEMBLY__ */

#ifdef CONFIG_SMP
/*
 * Emit a "lock" prefix at local label 672 and store that label's
 * PC-relative offset as a 4-byte-aligned .long in .smp_locks.
 */
	.macro LOCK_PREFIX
672:	lock
	.pushsection .smp_locks,"a"
	.balign 4
	.long 672b - .
	.popsection
	.endm
#else
/* UP build: LOCK_PREFIX expands to nothing. */
	.macro LOCK_PREFIX
	.endm
#endif

/*
 * objtool annotation to ignore the alternatives and only consider the original
 * instruction(s).
 *
 * Defines a per-expansion label (.Lannotate_\@) at the point of use and
 * stores its PC-relative offset as a .long in .discard.ignore_alts.
 */
.macro ANNOTATE_IGNORE_ALTERNATIVE
	.Lannotate_\@:
	.pushsection .discard.ignore_alts
	.long .Lannotate_\@ - .
	.popsection
.endm

/*
 * Issue one struct alt_instr descriptor entry (need to put it into
 * the section .altinstructions, see below). This entry contains
 * enough information for the alternatives patching code to patch an
 * instruction. See apply_alternatives().
 *
 * @orig and @alt are emitted as PC-relative .long offsets, @feature as a
 * .word, and @orig_len, @alt_len and @pad_len as one byte each.
 */
.macro altinstruction_entry orig alt feature orig_len alt_len pad_len
	.long \orig - .
	.long \alt - .
	.word \feature
	.byte \orig_len
	.byte \alt_len
	.byte \pad_len
.endm

/*
 * Define an alternative between two instructions. If @feature is
 * present, early code in apply_alternatives() replaces @oldinstr with
 * @newinstr. ".skip" directive takes care of proper instruction padding
 * in case @newinstr is longer than @oldinstr.
 *
 * Local labels: 140..141 is @oldinstr, 141..142 the 0x90 padding and
 * 143..144 @newinstr (placed in .altinstr_replacement).
 */
.macro ALTERNATIVE oldinstr, newinstr, feature
140:
	\oldinstr
141:
	.skip -(((144f-143f)-(141b-140b)) > 0) * ((144f-143f)-(141b-140b)),0x90
142:

	.pushsection .altinstructions,"a"
	altinstruction_entry 140b,143f,\feature,142b-140b,144f-143f,142b-141b
	.popsection

	.pushsection .altinstr_replacement,"ax"
143:
	\newinstr
144:
	.popsection
.endm

/*
 * Length expressions over the numeric local labels 140/141 and
 * 143/144/145; they are only meaningful where those labels are defined.
 */
#define old_len			141b-140b
#define new_len1		144f-143f
#define new_len2		145f-144f

/*
 * gas compatible max based on the idea from:
 * http://graphics.stanford.edu/~seander/bithacks.html#IntegerMinOrMax
 *
 * The additional "-" is needed because gas uses a "true" value of -1.
 */
#define alt_max_short(a, b)	((a) ^ (((a) ^ (b)) & -(-((a) < (b)))))


/*
 * Same as ALTERNATIVE macro above but for two alternatives. If CPU
 * has @feature1, it replaces @oldinstr with @newinstr1. If CPU has
 * @feature2, it replaces @oldinstr with @newinstr2.
 *
 * The original instruction is padded with 0x90 up to the longer of the
 * two replacements; 143..144 is @newinstr1 and 144..145 is @newinstr2.
 */
.macro ALTERNATIVE_2 oldinstr, newinstr1, feature1, newinstr2, feature2
140:
	\oldinstr
141:
	.skip -((alt_max_short(new_len1, new_len2) - (old_len)) > 0) * \
		(alt_max_short(new_len1, new_len2) - (old_len)),0x90
142:

	.pushsection .altinstructions,"a"
	altinstruction_entry 140b,143f,\feature1,142b-140b,144f-143f,142b-141b
	altinstruction_entry 140b,144f,\feature2,142b-140b,145f-144f,142b-141b
	.popsection

	.pushsection .altinstr_replacement,"ax"
143:
	\newinstr1
144:
	\newinstr2
145:
	.popsection
.endm

391 392 393 394 395
/*
 * If @feature is set, patch in @newinstr_yes, otherwise @newinstr_no.
 *
 * Expands to an ALTERNATIVE_2 invocation with @newinstr_no registered
 * under X86_FEATURE_ALWAYS and @newinstr_yes under @feature.
 */
#define ALTERNATIVE_TERNARY(oldinstr, feature, newinstr_yes, newinstr_no) \
	ALTERNATIVE_2 oldinstr, newinstr_no, X86_FEATURE_ALWAYS,	\
	newinstr_yes, feature

396 397
#endif /* __ASSEMBLY__ */

H
H. Peter Anvin 已提交
398
#endif /* _ASM_X86_ALTERNATIVE_H */