// SPDX-License-Identifier: GPL-2.0
#include <linux/static_call.h>
#include <linux/memory.h>
#include <linux/bug.h>
#include <asm/text-patching.h>

enum insn_type {
	CALL = 0, /* site call */
	NOP = 1,  /* site cond-call */
	JMP = 2,  /* tramp / site tail-call */
	RET = 3,  /* tramp / site cond-tail-call */
	JCC = 4,
};
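
/*
 * A "site" is an inline patched call site (CONFIG_HAVE_STATIC_CALL_INLINE);
 * a "tramp" is the out-of-line trampoline that every static_call has. Both
 * get patched with the instruction sequences generated below.
 */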

/*
 * ud1 %esp, %ecx - a 3 byte #UD that is unique to trampolines, chosen such
 * that there is no false-positive trampoline identification while also being a
 * speculation stop.
 */
static const u8 tramp_ud[] = { 0x0f, 0xb9, 0xcc };
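
/*
 * A trampoline thus looks roughly like (see the
 * ARCH_DEFINE_STATIC_CALL_TRAMP() family in <asm/static_call.h> for the
 * authoritative layout):
 *
 *	tramp+0: e9 xx xx xx xx		jmp.d32 func
 *	tramp+5: 0f b9 cc		ud1 %esp, %ecx	<- signature
 *
 * which is why __static_call_validate() and __static_call_fixup() below
 * compare the 3 bytes at tramp+5 against tramp_ud[].
 */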

/*
 * cs cs cs xorl %eax, %eax - a single 5 byte instruction that clears %[er]ax
 */
static const u8 xor5rax[] = { 0x2e, 0x2e, 0x2e, 0x31, 0xc0 };
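
/*
 * The three %cs prefixes pad the 2 byte xorl out to CALL_INSN_SIZE (5)
 * bytes, so that a "call __static_call_return0" site can be replaced by a
 * same-size instruction which leaves 0 in %[er]ax directly.
 */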

static const u8 retinsn[] = { RET_INSN_OPCODE, 0xcc, 0xcc, 0xcc, 0xcc };
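
/*
 * __is_Jcc() recognises the 2 byte 0x0f escape of a Jcc.d32; e.g. for
 * "je.d32 target" (0f 84 <rel32>) it returns 0x84, and 0 (which is not a
 * valid Jcc opcode byte) for anything else.
 */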
static u8 __is_Jcc(u8 *insn) /* Jcc.d32 */
{
	u8 ret = 0;

	if (insn[0] == 0x0f) {
		u8 tmp = insn[1];
		if ((tmp & 0xf0) == 0x80)
			ret = tmp;
	}

	return ret;
}

extern void __static_call_return(void);

asm (".global __static_call_return\n\t"
     ".type __static_call_return, @function\n\t"
     "__static_call_return:\n\t"
     ANNOTATE_NOENDBR
     ANNOTATE_RETPOLINE_SAFE
     "ret; int3\n\t"
     ".size __static_call_return, . - __static_call_return\n\t");

static void __ref __static_call_transform(void *insn, enum insn_type type,
					  void *func, bool modinit)
{
	const void *emulate = NULL;
	int size = CALL_INSN_SIZE;
	const void *code;
	u8 op, buf[6];

	if ((type == JMP || type == RET) && (op = __is_Jcc(insn)))
		type = JCC;

	switch (type) {
	case CALL:
		code = text_gen_insn(CALL_INSN_OPCODE, insn, func);
		if (func == &__static_call_return0) {
			emulate = code;
			code = &xor5rax;
		}
		break;

	case NOP:
		code = x86_nops[5];
		break;

	case JMP:
		code = text_gen_insn(JMP32_INSN_OPCODE, insn, func);
		break;

	case RET:
		if (cpu_feature_enabled(X86_FEATURE_RETHUNK))
			code = text_gen_insn(JMP32_INSN_OPCODE, insn, &__x86_return_thunk);
		else
			code = &retinsn;
		break;

	case JCC:
		if (!func) {
			func = __static_call_return;
			if (cpu_feature_enabled(X86_FEATURE_RETHUNK))
				func = __x86_return_thunk;
		}

		buf[0] = 0x0f;
		__text_gen_insn(buf+1, op, insn+1, func, 5);
		code = buf;
		size = 6;
		break;
	}

	if (memcmp(insn, code, size) == 0)
		return;

	if (system_state == SYSTEM_BOOTING || modinit)
		return text_poke_early(insn, code, size);

	text_poke_bp(insn, code, size, emulate);
}
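
/*
 * For example, re-enabling a previously NULL trampoline turns:
 *
 *	ret; int3; int3; int3; int3	(retinsn)
 *
 * back into a "jmp.d32 func". Once the system is live this goes through
 * text_poke_bp(), which patches behind an INT3 so concurrent callers stay
 * safe; emulate covers the xor5rax case, where the bytes written differ
 * from the call they must emulate while being patched.
 */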

static void __static_call_validate(u8 *insn, bool tail, bool tramp)
{
	u8 opcode = insn[0];

	if (tramp && memcmp(insn+5, tramp_ud, 3)) {
		pr_err("trampoline signature fail\n");
		BUG();
	}

	if (tail) {
		if (opcode == JMP32_INSN_OPCODE ||
		    opcode == RET_INSN_OPCODE ||
		    __is_Jcc(insn))
			return;
	} else {
		if (opcode == CALL_INSN_OPCODE ||
		    !memcmp(insn, x86_nops[5], 5) ||
		    !memcmp(insn, xor5rax, 5))
			return;
	}

	/*
	 * If we ever trigger this, our text is corrupt, we'll probably not live long.
	 */
	pr_err("unexpected static_call insn opcode 0x%x at %pS\n", opcode, insn);
	BUG();
}

static inline enum insn_type __sc_insn(bool null, bool tail)
{
	/*
	 * Encode the following table without branches:
	 *
	 *	tail	null	insn
	 *	-----+-------+------
	 *	  0  |   0   |  CALL
	 *	  0  |   1   |  NOP
	 *	  1  |   0   |  JMP
	 *	  1  |   1   |  RET
	 */
	return 2*tail + null;
}
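
/*
 * E.g. a live tail-call (tail=1, null=0) yields 2*1 + 0 == 2 == JMP,
 * matching the enum insn_type values above.
 */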

void arch_static_call_transform(void *site, void *tramp, void *func, bool tail)
{
	mutex_lock(&text_mutex);

	if (tramp) {
		__static_call_validate(tramp, true, true);
		__static_call_transform(tramp, __sc_insn(!func, true), func, false);
	}

	if (IS_ENABLED(CONFIG_HAVE_STATIC_CALL_INLINE) && site) {
		__static_call_validate(site, tail, false);
		__static_call_transform(site, __sc_insn(!func, tail), func, false);
	}

	mutex_unlock(&text_mutex);
}
EXPORT_SYMBOL_GPL(arch_static_call_transform);
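
/*
 * The usual path into the above (a sketch; see static_call_update() and
 * __static_call_update() in the generic static_call code):
 *
 *	static_call_update(name, func)
 *	  -> __static_call_update(&STATIC_CALL_KEY(name),
 *				  STATIC_CALL_TRAMP_ADDR(name), func)
 *	    -> arch_static_call_transform(site, tramp, func, tail)
 *
 * where site is only non-NULL on CONFIG_HAVE_STATIC_CALL_INLINE kernels.
 */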

#ifdef CONFIG_RETHUNK
/*
 * This is called by apply_returns() to fix up static call trampolines,
 * specifically ARCH_DEFINE_STATIC_CALL_NULL_TRAMP which is recorded as
 * having a return trampoline.
 *
 * The problem is that static_call() is available before determining
 * X86_FEATURE_RETHUNK and, by implication, running alternatives.
 *
 * This means that __static_call_transform() above can have overwritten the
 * return trampoline and we now need to fix things up to be consistent.
 */
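/*
 * Roughly (a sketch of the problematic ordering):
 *
 *	1) early boot patches a trampoline with retinsn ("ret; int3 x 4")
 *	   because X86_FEATURE_RETHUNK is not yet established;
 *	2) apply_returns() then walks .return_sites, recognises the
 *	   trampoline by its ud1 signature and lands here, so the RET can
 *	   be redone consistently with the final rethunk setting.
 */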
bool __static_call_fixup(void *tramp, u8 op, void *dest)
{
	unsigned long addr = (unsigned long)tramp;
	/*
	 * Not all .return_sites are a static_call trampoline (most are not).
	 * Check if the 3 bytes after the return are still kernel text; if not,
	 * then this definitely is not a trampoline and we need not worry
	 * further.
	 *
	 * This avoids the memcmp() below tripping over page faults etc.
	 */
	if (((addr >> PAGE_SHIFT) != ((addr + 7) >> PAGE_SHIFT)) &&
	    !kernel_text_address(addr + 7))
		return false;

	if (memcmp(tramp+5, tramp_ud, 3)) {
		/* Not a trampoline site, not our problem. */
		return false;
	}

	mutex_lock(&text_mutex);
	if (op == RET_INSN_OPCODE || dest == &__x86_return_thunk)
		__static_call_transform(tramp, RET, NULL, true);
	mutex_unlock(&text_mutex);

	return true;
}
#endif