From: Jussi Kivilinna Subject: Re: GPF in aesni_xts_crypt8 (3.10-rc5) Date: Tue, 11 Jun 2013 22:01:01 +0300 Message-ID: <51B773ED.9080308@iki.fi> References: <20130611172624.GA20496@redhat.com> Mime-Version: 1.0 Content-Type: multipart/mixed; boundary="------------010303060502000304030708" To: Dave Jones , Linux Kernel , herbert@gondor.apana.org.au, "linux-crypto@vger.kernel.org" Return-path: Received: from saarni.dnainternet.net ([83.102.40.136]:56004 "EHLO saarni.dnainternet.net" rhost-flags-OK-OK-OK-OK) by vger.kernel.org with ESMTP id S1755248Ab3FKTBJ (ORCPT ); Tue, 11 Jun 2013 15:01:09 -0400 In-Reply-To: <20130611172624.GA20496@redhat.com> Sender: linux-crypto-owner@vger.kernel.org List-ID: This is a multi-part message in MIME format. --------------010303060502000304030708 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 7bit Hello, Does attached patch help? -Jussi On 11.06.2013 20:26, Dave Jones wrote: > Just found that 3.10-rc doesn't boot on my laptop with encrypted disk. > > > general protection fault: 0000 [#1] PREEMPT SMP DEBUG_PAGEALLOC > Modules linked in: xfs libcrc32c dm_crypt crc32c_intel ghash_clmulni_intel aesni_intel glue_helper ablk_helper i915 i2c_algo_bit drm_kms_helper drm i2c_core video > CPU: 1 PID: 53 Comm: kworker/1:1 Not tainted 3.10.0-rc5+ #5 > Hardware name: LENOVO 2356JK8/2356JK8, BIOS G7ET94WW (2.54 ) 04/30/2013 > Workqueue: kcryptd kcryptd_crypt [dm_crypt] > task: ffff880135c58000 ti: ffff880135c54000 task.ti: ffff880135c54000 > RIP: 0010:[] [] aesni_xts_crypt8+0x42/0x1e0 [aesni_intel] > RSP: 0018:ffff880135c55b68 EFLAGS: 00010282 > RAX: ffffffffa0142eb8 RBX: 0000000000000080 RCX: 00000000000000f0 > RDX: ffff8801316eeaa8 RSI: ffff8801316eeaa8 RDI: ffff88012fd84440 > RBP: ffff880135c55b70 R08: ffff8801304fe118 R09: 0000000000000020 > R10: 00000000000000f0 R11: ffffffffa0142eb8 R12: ffff8801316eeb28 > R13: 0000000000000080 R14: ffff8801316eeb28 R15: 0000000000000180 > FS: 0000000000000000(0000) GS:ffff880139400000(0000) knlGS:0000000000000000 > CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 > CR2: 00000039e88bc720 CR3: 0000000001c0b000 CR4: 00000000001407e0 > Stack: > ffffffffa0143683 ffff880135c55c40 ffffffffa00602fb ffff880135c55c70 > ffffffffa0146060 0000000001ad0190 ffffffffa0146060 ffffea0004c5bb80 > ffff8801316eeaa8 ffffea0004c5bb80 ffff8801316eeaa8 ffff8801304fe0c0 > Call Trace: > [] ? aesni_xts_dec8+0x13/0x20 [aesni_intel] > [] glue_xts_crypt_128bit+0x10b/0x1c0 [glue_helper] > [] xts_decrypt+0x4b/0x50 [aesni_intel] > [] ablk_decrypt+0x4f/0xd0 [ablk_helper] > [] crypt_convert+0x352/0x3b0 [dm_crypt] > [] kcryptd_crypt+0x355/0x4e0 [dm_crypt] > [] ? process_one_work+0x1a5/0x700 > [] process_one_work+0x211/0x700 > [] ? process_one_work+0x1a5/0x700 > [] worker_thread+0x11b/0x3a0 > [] ? process_one_work+0x700/0x700 > [] kthread+0xed/0x100 > [] ? insert_kthread_work+0x80/0x80 > [] ret_from_fork+0x7c/0xb0 > [] ? insert_kthread_work+0x80/0x80 > Code: 8d 04 25 b8 2e 14 a0 41 0f 44 ca 4c 0f 44 d8 66 44 0f 6f 14 25 00 70 14 a0 41 0f 10 18 44 8b 8f e0 01 00 00 48 01 cf 66 0f 6f c3 <66> 0f ef 02 f3 0f 7f 1e 66 44 0f 70 db 13 66 0f d4 db 66 41 0f > RIP [] aesni_xts_crypt8+0x42/0x1e0 [aesni_intel] > RSP > > 0: 8d 04 25 b8 2e 14 a0 lea 0xffffffffa0142eb8,%eax > 7: 41 0f 44 ca cmove %r10d,%ecx > b: 4c 0f 44 d8 cmove %rax,%r11 > f: 66 44 0f 6f 14 25 00 movdqa 0xffffffffa0147000,%xmm10 > 16: 70 14 a0 > 19: 41 0f 10 18 movups (%r8),%xmm3 > 1d: 44 8b 8f e0 01 00 00 mov 0x1e0(%rdi),%r9d > 24: 48 01 cf add %rcx,%rdi > 27: 66 0f 6f c3 movdqa %xmm3,%xmm0 > 2b:* 66 0f ef 02 pxor (%rdx),%xmm0 <-- trapping instruction > 2f: f3 0f 7f 1e movdqu %xmm3,(%rsi) > 33: 66 44 0f 70 db 13 pshufd $0x13,%xmm3,%xmm11 > 39: 66 0f d4 db paddq %xmm3,%xmm3 > 3d: 66 data16 > 3e: 41 rex.B > 3f: > > --------------010303060502000304030708 Content-Type: text/x-patch; name="05-aesni_intel-xts-fix-unaligned-mem-access.patch" Content-Transfer-Encoding: 7bit Content-Disposition: attachment; filename="05-aesni_intel-xts-fix-unaligned-mem-access.patch" crypto: aesni_intel - fix accessing of unaligned memory From: Jussi Kivilinna The new XTS code for aesni_intel uses input buffers directly as memory operands for pxor instructions, which causes crash if those buffers are not aligned to 16 bytes. Patch change XTS code to handle unaligned memory correctly, by loading memory with movdqu instead. Reported-by: Dave Jones Signed-off-by: Jussi Kivilinna --- arch/x86/crypto/aesni-intel_asm.S | 48 +++++++++++++++++++++++++------------ 1 file changed, 32 insertions(+), 16 deletions(-) diff --git a/arch/x86/crypto/aesni-intel_asm.S b/arch/x86/crypto/aesni-intel_asm.S index 62fe22c..477e9d7 100644 --- a/arch/x86/crypto/aesni-intel_asm.S +++ b/arch/x86/crypto/aesni-intel_asm.S @@ -2681,56 +2681,68 @@ ENTRY(aesni_xts_crypt8) addq %rcx, KEYP movdqa IV, STATE1 - pxor 0x00(INP), STATE1 + movdqu 0x00(INP), INC + pxor INC, STATE1 movdqu IV, 0x00(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE2 - pxor 0x10(INP), STATE2 + movdqu 0x10(INP), INC + pxor INC, STATE2 movdqu IV, 0x10(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE3 - pxor 0x20(INP), STATE3 + movdqu 0x20(INP), INC + pxor INC, STATE3 movdqu IV, 0x20(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE4 - pxor 0x30(INP), STATE4 + movdqu 0x30(INP), INC + pxor INC, STATE4 movdqu IV, 0x30(OUTP) call *%r11 - pxor 0x00(OUTP), STATE1 + movdqu 0x00(OUTP), INC + pxor INC, STATE1 movdqu STATE1, 0x00(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE1 - pxor 0x40(INP), STATE1 + movdqu 0x40(INP), INC + pxor INC, STATE1 movdqu IV, 0x40(OUTP) - pxor 0x10(OUTP), STATE2 + movdqu 0x10(OUTP), INC + pxor INC, STATE2 movdqu STATE2, 0x10(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE2 - pxor 0x50(INP), STATE2 + movdqu 0x50(INP), INC + pxor INC, STATE2 movdqu IV, 0x50(OUTP) - pxor 0x20(OUTP), STATE3 + movdqu 0x20(OUTP), INC + pxor INC, STATE3 movdqu STATE3, 0x20(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE3 - pxor 0x60(INP), STATE3 + movdqu 0x60(INP), INC + pxor INC, STATE3 movdqu IV, 0x60(OUTP) - pxor 0x30(OUTP), STATE4 + movdqu 0x30(OUTP), INC + pxor INC, STATE4 movdqu STATE4, 0x30(OUTP) _aesni_gf128mul_x_ble() movdqa IV, STATE4 - pxor 0x70(INP), STATE4 + movdqu 0x70(INP), INC + pxor INC, STATE4 movdqu IV, 0x70(OUTP) _aesni_gf128mul_x_ble() @@ -2738,16 +2750,20 @@ ENTRY(aesni_xts_crypt8) call *%r11 - pxor 0x40(OUTP), STATE1 + movdqu 0x40(OUTP), INC + pxor INC, STATE1 movdqu STATE1, 0x40(OUTP) - pxor 0x50(OUTP), STATE2 + movdqu 0x50(OUTP), INC + pxor INC, STATE2 movdqu STATE2, 0x50(OUTP) - pxor 0x60(OUTP), STATE3 + movdqu 0x60(OUTP), INC + pxor INC, STATE3 movdqu STATE3, 0x60(OUTP) - pxor 0x70(OUTP), STATE4 + movdqu 0x70(OUTP), INC + pxor INC, STATE4 movdqu STATE4, 0x70(OUTP) ret --------------010303060502000304030708--