Commit ac3f75f4, authored by Robert Love and committed by Linus Torvalds

[PATCH] make raid5 checksums preempt-safe, take two

The raid5 xor checksums use MMX/SSE state and are not preempt-safe.

Attached patch disables preemption in FPU_SAVE and XMMS_SAVE and
restores it in FPU_RESTORE and XMMS_RESTORE - preventing preemption
while in fp mode.
parent c9247f49
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#define FPU_SAVE \ #define FPU_SAVE \
do { \ do { \
preempt_disable(); \
if (!test_thread_flag(TIF_USEDFPU)) \ if (!test_thread_flag(TIF_USEDFPU)) \
__asm__ __volatile__ (" clts;\n"); \ __asm__ __volatile__ (" clts;\n"); \
__asm__ __volatile__ ("fsave %0; fwait": "=m"(fpu_save[0])); \ __asm__ __volatile__ ("fsave %0; fwait": "=m"(fpu_save[0])); \
...@@ -30,6 +31,7 @@ ...@@ -30,6 +31,7 @@
__asm__ __volatile__ ("frstor %0": : "m"(fpu_save[0])); \ __asm__ __volatile__ ("frstor %0": : "m"(fpu_save[0])); \
if (!test_thread_flag(TIF_USEDFPU)) \ if (!test_thread_flag(TIF_USEDFPU)) \
stts(); \ stts(); \
preempt_enable(); \
} while (0) } while (0)
#define LD(x,y) " movq 8*("#x")(%1), %%mm"#y" ;\n" #define LD(x,y) " movq 8*("#x")(%1), %%mm"#y" ;\n"
...@@ -542,7 +544,8 @@ static struct xor_block_template xor_block_p5_mmx = { ...@@ -542,7 +544,8 @@ static struct xor_block_template xor_block_p5_mmx = {
* Copyright (C) 1999 Zach Brown (with obvious credit due Ingo) * Copyright (C) 1999 Zach Brown (with obvious credit due Ingo)
*/ */
#define XMMS_SAVE \ #define XMMS_SAVE do { \
preempt_disable(); \
__asm__ __volatile__ ( \ __asm__ __volatile__ ( \
"movl %%cr0,%0 ;\n\t" \ "movl %%cr0,%0 ;\n\t" \
"clts ;\n\t" \ "clts ;\n\t" \
...@@ -552,9 +555,10 @@ static struct xor_block_template xor_block_p5_mmx = { ...@@ -552,9 +555,10 @@ static struct xor_block_template xor_block_p5_mmx = {
"movups %%xmm3,0x30(%1) ;\n\t" \ "movups %%xmm3,0x30(%1) ;\n\t" \
: "=&r" (cr0) \ : "=&r" (cr0) \
: "r" (xmm_save) \ : "r" (xmm_save) \
: "memory") : "memory"); \
} while(0)
#define XMMS_RESTORE \ #define XMMS_RESTORE do { \
__asm__ __volatile__ ( \ __asm__ __volatile__ ( \
"sfence ;\n\t" \ "sfence ;\n\t" \
"movups (%1),%%xmm0 ;\n\t" \ "movups (%1),%%xmm0 ;\n\t" \
...@@ -564,7 +568,9 @@ static struct xor_block_template xor_block_p5_mmx = { ...@@ -564,7 +568,9 @@ static struct xor_block_template xor_block_p5_mmx = {
"movl %0,%%cr0 ;\n\t" \ "movl %0,%%cr0 ;\n\t" \
: \ : \
: "r" (cr0), "r" (xmm_save) \ : "r" (cr0), "r" (xmm_save) \
: "memory") : "memory"); \
preempt_enable(); \
} while(0)
#define ALIGN16 __attribute__((aligned(16))) #define ALIGN16 __attribute__((aligned(16)))
......
...@@ -37,7 +37,8 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t; ...@@ -37,7 +37,8 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t;
/* Doesn't use gcc to save the XMM registers, because there is no easy way to /* Doesn't use gcc to save the XMM registers, because there is no easy way to
tell it to do a clts before the register saving. */ tell it to do a clts before the register saving. */
#define XMMS_SAVE \ #define XMMS_SAVE do { \
preempt_disable(); \
asm volatile ( \ asm volatile ( \
"movq %%cr0,%0 ;\n\t" \ "movq %%cr0,%0 ;\n\t" \
"clts ;\n\t" \ "clts ;\n\t" \
...@@ -47,7 +48,8 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t; ...@@ -47,7 +48,8 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t;
"movups %%xmm3,0x30(%1) ;\n\t" \ "movups %%xmm3,0x30(%1) ;\n\t" \
: "=r" (cr0) \ : "=r" (cr0) \
: "r" (xmm_save) \ : "r" (xmm_save) \
: "memory") : "memory"); \
} while(0)
#define XMMS_RESTORE \ #define XMMS_RESTORE \
asm volatile ( \ asm volatile ( \
...@@ -59,7 +61,9 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t; ...@@ -59,7 +61,9 @@ typedef struct { unsigned long a,b; } __attribute__((aligned(16))) xmm_store_t;
"movq %0,%%cr0 ;\n\t" \ "movq %0,%%cr0 ;\n\t" \
: \ : \
: "r" (cr0), "r" (xmm_save) \ : "r" (cr0), "r" (xmm_save) \
: "memory") : "memory"); \
preempt_enable(); \
} while(0)
#define OFFS(x) "16*("#x")" #define OFFS(x) "16*("#x")"
#define PF_OFFS(x) "256+16*("#x")" #define PF_OFFS(x) "256+16*("#x")"
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment