@@ -2,6 +2,48 @@
#ifndef _ASM_X86_ASM_H
#define _ASM_X86_ASM_H
+/*
+ * PIC modules require an indirection through the GOT for
+ * external symbols. For internal functions, _ASM_CALL/_ASM_JMP
+ * are optimized by replacing the indirect call with a direct
+ * one followed by a 1-byte NOP padding at each call site.
+ * Similarly, _ASM_LEA, which loads a symbol address on x86-64,
+ * is optimized by replacing the MOV with a LEA.
+ * If RETPOLINE is enabled, use PLT stubs instead to avoid
+ * the overhead of indirect calls to local functions.
+ */
+#if defined(MODULE) && defined(CONFIG_X86_PIC)
+# ifdef __ASSEMBLY__
+# define _ASM_LEA(v,r,a) movq v##@GOTPCREL(##r##), a
+# ifdef CONFIG_RETPOLINE
+# define _ASM_CALL(f) call f##@PLT
+# define _ASM_JMP(f) jmp f##@PLT
+# else
+# define _ASM_CALL(f) call *##f##@GOTPCREL(%rip)
+# define _ASM_JMP(f) jmp *##f##@GOTPCREL(%rip)
+# endif
+# else
+# define _ASM_LEA(v,r,a) "movq " #v "@GOTPCREL(" #r "), " #a
+# ifdef CONFIG_RETPOLINE
+# define _ASM_CALL(f) "call " #f "@PLT"
+# define _ASM_JMP(f) "jmp " #f "@PLT"
+# else
+# define _ASM_CALL(f) "call *" #f "@GOTPCREL(%%rip)"
+# define _ASM_JMP(f) "jmp *" #f "@GOTPCREL(%%rip)"
+# endif
+# endif
+#else
+# ifdef __ASSEMBLY__
+# define _ASM_CALL(f) call f
+# define _ASM_JMP(f) jmp f
+# define _ASM_LEA(v,r,a) leaq v##(##r##), a
+# else
+# define _ASM_CALL(f) "call " #f
+# define _ASM_JMP(f) "jmp " #f
+# define _ASM_LEA(v,r,a) "leaq " #v "(" #r "), " #a
+# endif
+#endif
+
#ifdef __ASSEMBLY__
# define __ASM_FORM(x) x
# define __ASM_FORM_RAW(x) x
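
(Illustration, not part of the patch: a minimal sketch of how the
C-side macros are meant to be used, assuming a hypothetical extern
helper my_helper(). In a PIC module the call is indirected through
the GOT, or through a PLT stub under CONFIG_RETPOLINE; any other
build gets a plain direct call.)

	extern void my_helper(void);

	static inline void example(void)
	{
		/*
		 * Expands to "call my_helper", or in PIC modules to
		 * "call *my_helper@GOTPCREL(%rip)" / "call my_helper@PLT".
		 * Sketch only: a real call site must clobber all
		 * caller-saved registers, not just %rax.
		 */
		asm volatile (_ASM_CALL(my_helper) ::: "rax", "memory");
	}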
@@ -118,6 +160,25 @@
# define CC_OUT(c) [_cc_ ## c] "=qm"
#endif
+/*
+ * PLT relocations in x86-64 PIC modules are already relative.
+ * However, GNU binutils handles them inconsistently on other
+ * targets (e.g., i386), so avoid PLT relocations in all other
+ * cases (binutils bug 23997).
+ */
+#if defined(MODULE) && defined(CONFIG_X86_PIC)
+# ifdef __ASSEMBLY__
+# define _ASM_HANDLER(x) x##@PLT
+# else
+# define _ASM_HANDLER(x) x "@PLT"
+# endif
+#else
+# ifdef __ASSEMBLY__
+# define _ASM_HANDLER(x) (x) - .
+# else
+# define _ASM_HANDLER(x) "(" x ") - ."
+# endif
+#endif
+
/* Exception table entry */
#ifdef __ASSEMBLY__
# define _ASM_EXTABLE_HANDLE(from, to, handler) \
@@ -125,7 +186,7 @@
.balign 4 ; \
.long (from) - . ; \
.long (to) - . ; \
- .long (handler) - . ; \
+ .long _ASM_HANDLER(handler) ; \
.popsection
# define _ASM_EXTABLE(from, to) \
@@ -174,13 +235,13 @@
.endm
#else
-# define _EXPAND_EXTABLE_HANDLE(x) #x
+# define _EXPAND_EXTABLE_HANDLE(x) _ASM_HANDLER(#x)
# define _ASM_EXTABLE_HANDLE(from, to, handler) \
" .pushsection \"__ex_table\",\"a\"\n" \
" .balign 4\n" \
" .long (" #from ") - .\n" \
" .long (" #to ") - .\n" \
- " .long (" _EXPAND_EXTABLE_HANDLE(handler) ") - .\n" \
+ " .long " _EXPAND_EXTABLE_HANDLE(handler) "\n" \
" .popsection\n"
# define _ASM_EXTABLE(from, to) \
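
(Illustration, not part of the patch: what the C-side chain now
emits. With handler = ex_handler_default and illustrative local
labels 1b/2b, a PIC module gets

	.pushsection "__ex_table","a"
	.balign 4
	.long (1b) - .
	.long (2b) - .
	.long ex_handler_default@PLT
	.popsection

while every other build keeps the place-relative
".long (ex_handler_default) - ." form, per _ASM_HANDLER above.)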
@@ -826,10 +826,12 @@ asm(
".global __raw_callee_save___kvm_vcpu_is_preempted;"
".type __raw_callee_save___kvm_vcpu_is_preempted, @function;"
"__raw_callee_save___kvm_vcpu_is_preempted:"
-"leaq __per_cpu_offset(%rip), %rax;"
+"pushq %rdi;"
+_ASM_LEA(__per_cpu_offset, %rip, %rax) ";"
"movq (%rax,%rdi,8), %rax;"
-"addq " __stringify(KVM_STEAL_TIME_preempted) "+steal_time(%rip), %rax;"
-"cmpb $0, (%rax);"
+"leaq " __stringify(KVM_STEAL_TIME_preempted) "+steal_time(%rip), %rdi;"
+"cmpb $0, (%rax,%rdi,1);"
+"popq %rdi;"
"setne %al;"
"ret;"
".popsection");
@@ -0,0 +1,2 @@
+// SPDX-License-Identifier: BSD-2-Clause OR GPL-2.0
+#include "entropy_common.c"
@@ -0,0 +1,2 @@
+// SPDX-License-Identifier: BSD-2-Clause OR GPL-2.0
+#include "fse_decompress.c"
@@ -6,4 +6,4 @@ ccflags-y += -O3
zstd_compress-y := fse_compress.o huf_compress.o compress.o \
entropy_common.o fse_decompress.o zstd_common.o
zstd_decompress-y := huf_decompress.o decompress.o \
- entropy_common.o fse_decompress.o zstd_common.o
+ entropy_common_dec.o fse_decompress_dec.o zstd_common_dec.o
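
Note, for illustration: the new two-line *_dec.c files above and
below let the zstd_compress and zstd_decompress modules stop sharing
object files, since an object file linked into multiple modules
draws a modpost warning; each shared source is now compiled once per
module. A hedged sketch of the same pattern, with made-up names:

	obj-m += foo.o bar.o
	foo-y := shared.o
	bar-y := shared_bar.o	# shared_bar.c is just: #include "shared.c"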
@@ -0,0 +1,2 @@
+// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
+#include "zstd_common.c"