x86/its: Align RETs in BHB clear sequence to avoid thunking

author Pawan Gupta <pawan.kumar.gupta@linux.intel.com>

Fri, 2 May 2025 13:25:19 +0000 (06:25 -0700)

committer Dave Hansen <dave.hansen@linux.intel.com>

Fri, 9 May 2025 20:22:05 +0000 (13:22 -0700)
author Pawan Gupta <pawan.kumar.gupta@linux.intel.com>
Fri, 2 May 2025 13:25:19 +0000 (06:25 -0700)
committer Dave Hansen <dave.hansen@linux.intel.com>
Fri, 9 May 2025 20:22:05 +0000 (13:22 -0700)
diff --git a/arch/x86/entry/entry_64.S b/arch/x86/entry/entry_64.S

index f40bdf97d390a7396315d33c720d2d52d65b0238..ed04a968cc7d0095ab0185b2e3b5beffb7680afd 100644 (file)
--- a/arch/x86/entry/entry_64.S
+++ b/arch/x86/entry/entry_64.S
@@ -1525,7 +1525,9 @@ SYM_CODE_END(rewind_stack_and_make_dead)
   * ORC to unwind properly.
   *
   * The alignment is for performance and not for safety, and may be safely
- * refactored in the future if needed.
+ * refactored in the future if needed. The .skips are for safety, to ensure
+ * that all RETs are in the second half of a cacheline to mitigate Indirect
+ * Target Selection, rather than taking the slowpath via its_return_thunk.
   */
  SYM_FUNC_START(clear_bhb_loop)
         ANNOTATE_NOENDBR
@@ -1536,10 +1538,22 @@ SYM_FUNC_START(clear_bhb_loop)
         call    1f
         jmp     5f
         .align 64, 0xcc
+       /*
+        * Shift instructions so that the RET is in the upper half of the
+        * cacheline and doesn't take the slowpath to its_return_thunk.
+        */
+       .skip 32 - (.Lret1 - 1f), 0xcc
         ANNOTATE_INTRA_FUNCTION_CALL
  1:     call    2f
-       RET
+.Lret1:        RET
         .align 64, 0xcc
+       /*
+        * As above, shift instructions for RET at .Lret2 as well.
+        *
+        * This should ideally be: .skip 32 - (.Lret2 - 2f), 0xcc
+        * but some Clang versions (e.g. 18) don't like this.
+        */
+       .skip 32 - 18, 0xcc
  2:     movl    $5, %eax
  3:     jmp     4f
         nop
@@ -1547,7 +1561,7 @@ SYM_FUNC_START(clear_bhb_loop)
         jnz     3b
         sub     $1, %ecx
         jnz     1b
-       RET
+.Lret2:        RET
  5:     lfence
         pop     %rbp
         RET
author	Pawan Gupta <pawan.kumar.gupta@linux.intel.com>
	Fri, 2 May 2025 13:25:19 +0000 (06:25 -0700)
committer	Dave Hansen <dave.hansen@linux.intel.com>
	Fri, 9 May 2025 20:22:05 +0000 (13:22 -0700)