Commit a62bc073, authored by Michael Holzheu, committed by Martin Schwidefsky

s390/kdump: add support for vector extension

With this patch for kdump the s390 vector registers are stored into the
prepared save areas in the old kernel and into the REGSET_VX_LOW and
REGSET_VX_HIGH ELF notes for /proc/vmcore in the new kernel.

The NT_S390_VXRS_LOW note contains the lower halves of the first 16 vector
registers 0-15. The higher halves are stored in the floating point register
ELF note.  The NT_S390_VXRS_HIGH contains the full vector registers 16-31.

The kernel provides a save area for storing vector registers in case of
machine checks. A pointer to this save area is stored in the CPU lowcore
at offset 0x11b0. This save area is also used to save the registers for
kdump. In case of a dumped crashed kdump those areas are used to extract
the registers of the production system.

The vector registers for remote CPUs are stored using the "store additional
status at address" SIGP. For the dump CPU the vector registers are stored
with the VSTM instruction.

With this patch also zfcpdump stores the vector registers.
Reviewed-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
parent 3585cb02
...@@ -226,6 +226,6 @@ int arch_setup_additional_pages(struct linux_binprm *, int); ...@@ -226,6 +226,6 @@ int arch_setup_additional_pages(struct linux_binprm *, int);
extern unsigned long arch_randomize_brk(struct mm_struct *mm); extern unsigned long arch_randomize_brk(struct mm_struct *mm);
#define arch_randomize_brk arch_randomize_brk #define arch_randomize_brk arch_randomize_brk
void *fill_cpu_elf_notes(void *ptr, struct save_area *sa); void *fill_cpu_elf_notes(void *ptr, struct save_area *sa, __vector128 *vxrs);
#endif #endif
...@@ -89,12 +89,12 @@ extern u32 ipl_flags; ...@@ -89,12 +89,12 @@ extern u32 ipl_flags;
extern u32 dump_prefix_page; extern u32 dump_prefix_page;
struct dump_save_areas { struct dump_save_areas {
struct save_area **areas; struct save_area_ext **areas;
int count; int count;
}; };
extern struct dump_save_areas dump_save_areas; extern struct dump_save_areas dump_save_areas;
struct save_area *dump_save_area_create(int cpu); struct save_area_ext *dump_save_area_create(int cpu);
extern void do_reipl(void); extern void do_reipl(void);
extern void do_halt(void); extern void do_halt(void);
......
...@@ -11,6 +11,7 @@ ...@@ -11,6 +11,7 @@
#include <linux/types.h> #include <linux/types.h>
#include <asm/ptrace.h> #include <asm/ptrace.h>
#include <asm/cpu.h> #include <asm/cpu.h>
#include <asm/types.h>
#ifdef CONFIG_32BIT #ifdef CONFIG_32BIT
...@@ -31,6 +32,11 @@ struct save_area { ...@@ -31,6 +32,11 @@ struct save_area {
u32 ctrl_regs[16]; u32 ctrl_regs[16];
} __packed; } __packed;
/*
 * Extended per-CPU save area: the regular register save area followed by
 * room for 32 vector registers of type __vector128.
 * NOTE(review): this copy follows the save_area variant with u32 ctrl_regs,
 * presumably the CONFIG_32BIT layout - confirm against the full header.
 */
struct save_area_ext {
struct save_area sa;
__vector128 vx_regs[32];
};
struct _lowcore { struct _lowcore {
psw_t restart_psw; /* 0x0000 */ psw_t restart_psw; /* 0x0000 */
psw_t restart_old_psw; /* 0x0008 */ psw_t restart_old_psw; /* 0x0008 */
...@@ -183,6 +189,11 @@ struct save_area { ...@@ -183,6 +189,11 @@ struct save_area {
u64 ctrl_regs[16]; u64 ctrl_regs[16];
} __packed; } __packed;
/*
 * Extended per-CPU save area: the regular register save area followed by
 * room for 32 vector registers of type __vector128.
 * NOTE(review): this copy follows the save_area variant with u64 ctrl_regs,
 * presumably the 64 bit layout - confirm against the full header.
 */
struct save_area_ext {
struct save_area sa;
__vector128 vx_regs[32];
};
struct _lowcore { struct _lowcore {
__u8 pad_0x0000[0x0014-0x0000]; /* 0x0000 */ __u8 pad_0x0000[0x0014-0x0000]; /* 0x0000 */
__u32 ipl_parmblock_ptr; /* 0x0014 */ __u32 ipl_parmblock_ptr; /* 0x0014 */
......
...@@ -15,6 +15,7 @@ ...@@ -15,6 +15,7 @@
#define SIGP_SET_ARCHITECTURE 18 #define SIGP_SET_ARCHITECTURE 18
#define SIGP_COND_EMERGENCY_SIGNAL 19 #define SIGP_COND_EMERGENCY_SIGNAL 19
#define SIGP_SENSE_RUNNING 21 #define SIGP_SENSE_RUNNING 21
#define SIGP_STORE_ADDITIONAL_STATUS 23
/* SIGP condition codes */ /* SIGP condition codes */
#define SIGP_CC_ORDER_CODE_ACCEPTED 0 #define SIGP_CC_ORDER_CODE_ACCEPTED 0
...@@ -33,9 +34,10 @@ ...@@ -33,9 +34,10 @@
#ifndef __ASSEMBLY__ #ifndef __ASSEMBLY__
static inline int __pcpu_sigp(u16 addr, u8 order, u32 parm, u32 *status) static inline int __pcpu_sigp(u16 addr, u8 order, unsigned long parm,
u32 *status)
{ {
register unsigned int reg1 asm ("1") = parm; register unsigned long reg1 asm ("1") = parm;
int cc; int cc;
asm volatile( asm volatile(
......
...@@ -114,6 +114,19 @@ static inline void save_vx_regs(__vector128 *vxrs) ...@@ -114,6 +114,19 @@ static inline void save_vx_regs(__vector128 *vxrs)
: "=Q" (*(addrtype *) vxrs) : : "1"); : "=Q" (*(addrtype *) vxrs) : : "1");
} }
/*
 * Store the vector registers to @vxrs via save_vx_regs().
 *
 * The call is bracketed by arch_local_irq_save()/arch_local_irq_restore()
 * and runs with bits 17 and 18 of control register 0 set; the previous
 * control register 0 contents are loaded back afterwards.
 */
static inline void save_vx_regs_safe(__vector128 *vxrs)
{
unsigned long cr0, flags;
flags = arch_local_irq_save();
/* Remember the current control register 0 so it can be put back below */
__ctl_store(cr0, 0, 0);
/* NOTE(review): bits 17/18 presumably enable AFP-register and vector use - confirm */
__ctl_set_bit(0, 17);
__ctl_set_bit(0, 18);
save_vx_regs(vxrs);
/* Undo the temporary control register 0 changes */
__ctl_load(cr0, 0, 0);
arch_local_irq_restore(flags);
}
static inline void restore_vx_regs(__vector128 *vxrs) static inline void restore_vx_regs(__vector128 *vxrs)
{ {
typedef struct { __vector128 _[__NUM_VXRS]; } addrtype; typedef struct { __vector128 _[__NUM_VXRS]; } addrtype;
......
...@@ -46,9 +46,9 @@ struct dump_save_areas dump_save_areas; ...@@ -46,9 +46,9 @@ struct dump_save_areas dump_save_areas;
/* /*
* Allocate and add a save area for a CPU * Allocate and add a save area for a CPU
*/ */
struct save_area *dump_save_area_create(int cpu) struct save_area_ext *dump_save_area_create(int cpu)
{ {
struct save_area **save_areas, *save_area; struct save_area_ext **save_areas, *save_area;
save_area = kmalloc(sizeof(*save_area), GFP_KERNEL); save_area = kmalloc(sizeof(*save_area), GFP_KERNEL);
if (!save_area) if (!save_area)
...@@ -385,10 +385,46 @@ static void *nt_s390_prefix(void *ptr, struct save_area *sa) ...@@ -385,10 +385,46 @@ static void *nt_s390_prefix(void *ptr, struct save_area *sa)
sizeof(sa->pref_reg), KEXEC_CORE_NOTE_NAME); sizeof(sa->pref_reg), KEXEC_CORE_NOTE_NAME);
} }
/*
 * Emit the NT_S390_VXRS_HIGH note: the complete 128 bit contents of
 * VX registers 16-31, taken from vx_regs[16] onwards.
 *
 * Returns whatever nt_init() returns for the written note.
 */
static void *nt_s390_vx_high(void *ptr, __vector128 *vx_regs)
{
	__vector128 *high_regs = vx_regs + 16;

	return nt_init(ptr, NT_S390_VXRS_HIGH, high_regs,
		       16 * sizeof(*high_regs), KEXEC_CORE_NOTE_NAME);
}
/*
 * Initialize vxrs low note (lower halves of VX registers 0-15)
 *
 * Writes an NT_S390_VXRS_LOW ELF note at @ptr: the note header, the
 * KEXEC_CORE_NOTE_NAME string padded to a 4 byte boundary, and a
 * 16 * 8 byte descriptor holding one 64 bit half per register.
 * @vx_regs must point to at least 16 vector registers.
 *
 * Returns the address directly behind the written descriptor.
 */
static void *nt_s390_vx_low(void *ptr, __vector128 *vx_regs)
{
	Elf64_Nhdr *note;
	u64 len;
	int i;

	note = (Elf64_Nhdr *)ptr;
	note->n_namesz = strlen(KEXEC_CORE_NOTE_NAME) + 1;
	note->n_descsz = 16 * 8;
	note->n_type = NT_S390_VXRS_LOW;
	len = sizeof(Elf64_Nhdr);

	memcpy(ptr + len, KEXEC_CORE_NOTE_NAME, note->n_namesz);
	len = roundup(len + note->n_namesz, 4);

	ptr += len;
	/*
	 * Copy lower halves of SIMD registers 0-15.
	 * s390 is big-endian, so the lower 64 bits of a 128 bit register
	 * are bytes 8-15 of its in-memory image. Bytes 0-7 are the upper
	 * half, which is already covered by the floating point note and
	 * must not be duplicated here.
	 */
	for (i = 0; i < 16; i++) {
		memcpy(ptr, (char *)&vx_regs[i] + 8, 8);
		ptr += 8;
	}
	return ptr;
}
/* /*
* Fill ELF notes for one CPU with save area registers * Fill ELF notes for one CPU with save area registers
*/ */
void *fill_cpu_elf_notes(void *ptr, struct save_area *sa) void *fill_cpu_elf_notes(void *ptr, struct save_area *sa, __vector128 *vx_regs)
{ {
ptr = nt_prstatus(ptr, sa); ptr = nt_prstatus(ptr, sa);
ptr = nt_fpregset(ptr, sa); ptr = nt_fpregset(ptr, sa);
...@@ -397,6 +433,10 @@ void *fill_cpu_elf_notes(void *ptr, struct save_area *sa) ...@@ -397,6 +433,10 @@ void *fill_cpu_elf_notes(void *ptr, struct save_area *sa)
ptr = nt_s390_tod_preg(ptr, sa); ptr = nt_s390_tod_preg(ptr, sa);
ptr = nt_s390_ctrs(ptr, sa); ptr = nt_s390_ctrs(ptr, sa);
ptr = nt_s390_prefix(ptr, sa); ptr = nt_s390_prefix(ptr, sa);
if (MACHINE_HAS_VX && vx_regs) {
ptr = nt_s390_vx_low(ptr, vx_regs);
ptr = nt_s390_vx_high(ptr, vx_regs);
}
return ptr; return ptr;
} }
...@@ -484,7 +524,7 @@ static int get_cpu_cnt(void) ...@@ -484,7 +524,7 @@ static int get_cpu_cnt(void)
int i, cpus = 0; int i, cpus = 0;
for (i = 0; i < dump_save_areas.count; i++) { for (i = 0; i < dump_save_areas.count; i++) {
if (dump_save_areas.areas[i]->pref_reg == 0) if (dump_save_areas.areas[i]->sa.pref_reg == 0)
continue; continue;
cpus++; cpus++;
} }
...@@ -530,17 +570,17 @@ static void loads_init(Elf64_Phdr *phdr, u64 loads_offset) ...@@ -530,17 +570,17 @@ static void loads_init(Elf64_Phdr *phdr, u64 loads_offset)
*/ */
static void *notes_init(Elf64_Phdr *phdr, void *ptr, u64 notes_offset) static void *notes_init(Elf64_Phdr *phdr, void *ptr, u64 notes_offset)
{ {
struct save_area *sa; struct save_area_ext *sa_ext;
void *ptr_start = ptr; void *ptr_start = ptr;
int i; int i;
ptr = nt_prpsinfo(ptr); ptr = nt_prpsinfo(ptr);
for (i = 0; i < dump_save_areas.count; i++) { for (i = 0; i < dump_save_areas.count; i++) {
sa = dump_save_areas.areas[i]; sa_ext = dump_save_areas.areas[i];
if (sa->pref_reg == 0) if (sa_ext->sa.pref_reg == 0)
continue; continue;
ptr = fill_cpu_elf_notes(ptr, sa); ptr = fill_cpu_elf_notes(ptr, &sa_ext->sa, sa_ext->vx_regs);
} }
ptr = nt_vmcoreinfo(ptr); ptr = nt_vmcoreinfo(ptr);
memset(phdr, 0, sizeof(*phdr)); memset(phdr, 0, sizeof(*phdr));
...@@ -581,7 +621,7 @@ int elfcorehdr_alloc(unsigned long long *addr, unsigned long long *size) ...@@ -581,7 +621,7 @@ int elfcorehdr_alloc(unsigned long long *addr, unsigned long long *size)
mem_chunk_cnt = get_mem_chunk_cnt(); mem_chunk_cnt = get_mem_chunk_cnt();
alloc_size = 0x1000 + get_cpu_cnt() * 0x300 + alloc_size = 0x1000 + get_cpu_cnt() * 0x4a0 +
mem_chunk_cnt * sizeof(Elf64_Phdr); mem_chunk_cnt * sizeof(Elf64_Phdr);
hdr = kzalloc_panic(alloc_size); hdr = kzalloc_panic(alloc_size);
/* Init elf header */ /* Init elf header */
......
...@@ -25,6 +25,7 @@ ...@@ -25,6 +25,7 @@
#include <asm/elf.h> #include <asm/elf.h>
#include <asm/asm-offsets.h> #include <asm/asm-offsets.h>
#include <asm/os_info.h> #include <asm/os_info.h>
#include <asm/switch_to.h>
typedef void (*relocate_kernel_t)(kimage_entry_t *, unsigned long); typedef void (*relocate_kernel_t)(kimage_entry_t *, unsigned long);
...@@ -43,7 +44,7 @@ static void add_elf_notes(int cpu) ...@@ -43,7 +44,7 @@ static void add_elf_notes(int cpu)
memcpy((void *) (4608UL + sa->pref_reg), sa, sizeof(*sa)); memcpy((void *) (4608UL + sa->pref_reg), sa, sizeof(*sa));
ptr = (u64 *) per_cpu_ptr(crash_notes, cpu); ptr = (u64 *) per_cpu_ptr(crash_notes, cpu);
ptr = fill_cpu_elf_notes(ptr, sa); ptr = fill_cpu_elf_notes(ptr, sa, NULL);
memset(ptr, 0, sizeof(struct elf_note)); memset(ptr, 0, sizeof(struct elf_note));
} }
...@@ -53,8 +54,11 @@ static void add_elf_notes(int cpu) ...@@ -53,8 +54,11 @@ static void add_elf_notes(int cpu)
static void setup_regs(void) static void setup_regs(void)
{ {
unsigned long sa = S390_lowcore.prefixreg_save_area + SAVE_AREA_BASE; unsigned long sa = S390_lowcore.prefixreg_save_area + SAVE_AREA_BASE;
struct _lowcore *lc;
int cpu, this_cpu; int cpu, this_cpu;
/* Get lowcore pointer from store status of this CPU (absolute zero) */
lc = (struct _lowcore *)(unsigned long)S390_lowcore.prefixreg_save_area;
this_cpu = smp_find_processor_id(stap()); this_cpu = smp_find_processor_id(stap());
add_elf_notes(this_cpu); add_elf_notes(this_cpu);
for_each_online_cpu(cpu) { for_each_online_cpu(cpu) {
...@@ -64,6 +68,8 @@ static void setup_regs(void) ...@@ -64,6 +68,8 @@ static void setup_regs(void)
continue; continue;
add_elf_notes(cpu); add_elf_notes(cpu);
} }
if (MACHINE_HAS_VX)
save_vx_regs_safe((void *) lc->vector_save_area_addr);
/* Copy dump CPU store status info to absolute zero */ /* Copy dump CPU store status info to absolute zero */
memcpy((void *) SAVE_AREA_BASE, (void *) sa, sizeof(struct save_area)); memcpy((void *) SAVE_AREA_BASE, (void *) sa, sizeof(struct save_area));
} }
......
...@@ -83,7 +83,8 @@ DEFINE_MUTEX(smp_cpu_state_mutex); ...@@ -83,7 +83,8 @@ DEFINE_MUTEX(smp_cpu_state_mutex);
/* /*
* Signal processor helper functions. * Signal processor helper functions.
*/ */
static inline int __pcpu_sigp_relax(u16 addr, u8 order, u32 parm, u32 *status) static inline int __pcpu_sigp_relax(u16 addr, u8 order, unsigned long parm,
u32 *status)
{ {
int cc; int cc;
...@@ -515,35 +516,53 @@ EXPORT_SYMBOL(smp_ctl_clear_bit); ...@@ -515,35 +516,53 @@ EXPORT_SYMBOL(smp_ctl_clear_bit);
static void __init smp_get_save_area(int cpu, u16 address) static void __init smp_get_save_area(int cpu, u16 address)
{ {
void *lc = pcpu_devices[0].lowcore; void *lc = pcpu_devices[0].lowcore;
struct save_area *save_area; struct save_area_ext *sa_ext;
unsigned long vx_sa;
if (is_kdump_kernel()) if (is_kdump_kernel())
return; return;
if (!OLDMEM_BASE && (address == boot_cpu_address || if (!OLDMEM_BASE && (address == boot_cpu_address ||
ipl_info.type != IPL_TYPE_FCP_DUMP)) ipl_info.type != IPL_TYPE_FCP_DUMP))
return; return;
save_area = dump_save_area_create(cpu); sa_ext = dump_save_area_create(cpu);
if (!save_area) if (!sa_ext)
panic("could not allocate memory for save area\n"); panic("could not allocate memory for save area\n");
if (address == boot_cpu_address) { if (address == boot_cpu_address) {
/* Copy the registers of the boot cpu. */ /* Copy the registers of the boot cpu. */
copy_oldmem_page(1, (void *) save_area, sizeof(*save_area), copy_oldmem_page(1, (void *) &sa_ext->sa, sizeof(sa_ext->sa),
SAVE_AREA_BASE - PAGE_SIZE, 0); SAVE_AREA_BASE - PAGE_SIZE, 0);
if (MACHINE_HAS_VX)
save_vx_regs_safe(sa_ext->vx_regs);
return; return;
} }
/* Get the registers of a non-boot cpu. */ /* Get the registers of a non-boot cpu. */
__pcpu_sigp_relax(address, SIGP_STOP_AND_STORE_STATUS, 0, NULL); __pcpu_sigp_relax(address, SIGP_STOP_AND_STORE_STATUS, 0, NULL);
memcpy_real(save_area, lc + SAVE_AREA_BASE, sizeof(*save_area)); memcpy_real(&sa_ext->sa, lc + SAVE_AREA_BASE, sizeof(sa_ext->sa));
if (!MACHINE_HAS_VX)
return;
/* Get the VX registers */
vx_sa = __get_free_page(GFP_KERNEL);
if (!vx_sa)
panic("could not allocate memory for VX save area\n");
__pcpu_sigp_relax(address, SIGP_STORE_ADDITIONAL_STATUS, vx_sa, NULL);
memcpy(sa_ext->vx_regs, (void *) vx_sa, sizeof(sa_ext->vx_regs));
free_page(vx_sa);
} }
int smp_store_status(int cpu) int smp_store_status(int cpu)
{ {
unsigned long vx_sa;
struct pcpu *pcpu; struct pcpu *pcpu;
pcpu = pcpu_devices + cpu; pcpu = pcpu_devices + cpu;
if (__pcpu_sigp_relax(pcpu->address, SIGP_STOP_AND_STORE_STATUS, if (__pcpu_sigp_relax(pcpu->address, SIGP_STOP_AND_STORE_STATUS,
0, NULL) != SIGP_CC_ORDER_CODE_ACCEPTED) 0, NULL) != SIGP_CC_ORDER_CODE_ACCEPTED)
return -EIO; return -EIO;
if (!MACHINE_HAS_VX)
return 0;
vx_sa = __pa(pcpu->lowcore->vector_save_area_addr);
__pcpu_sigp_relax(pcpu->address, SIGP_STORE_ADDITIONAL_STATUS,
vx_sa, NULL);
return 0; return 0;
} }
......
...@@ -28,6 +28,7 @@ ...@@ -28,6 +28,7 @@
#include <asm/processor.h> #include <asm/processor.h>
#include <asm/irqflags.h> #include <asm/irqflags.h>
#include <asm/checksum.h> #include <asm/checksum.h>
#include <asm/switch_to.h>
#include "sclp.h" #include "sclp.h"
#define TRACE(x...) debug_sprintf_event(zcore_dbf, 1, x) #define TRACE(x...) debug_sprintf_event(zcore_dbf, 1, x)
...@@ -149,18 +150,21 @@ static int memcpy_hsa_kernel(void *dest, unsigned long src, size_t count) ...@@ -149,18 +150,21 @@ static int memcpy_hsa_kernel(void *dest, unsigned long src, size_t count)
static int __init init_cpu_info(enum arch_id arch) static int __init init_cpu_info(enum arch_id arch)
{ {
struct save_area *sa; struct save_area_ext *sa_ext;
/* get info for boot cpu from lowcore, stored in the HSA */ /* get info for boot cpu from lowcore, stored in the HSA */
sa = dump_save_area_create(0); sa_ext = dump_save_area_create(0);
if (!sa) if (!sa_ext)
return -ENOMEM; return -ENOMEM;
if (memcpy_hsa_kernel(sa, sys_info.sa_base, sys_info.sa_size) < 0) { if (memcpy_hsa_kernel(&sa_ext->sa, sys_info.sa_base,
sys_info.sa_size) < 0) {
TRACE("could not copy from HSA\n"); TRACE("could not copy from HSA\n");
kfree(sa); kfree(sa_ext);
return -EIO; return -EIO;
} }
if (MACHINE_HAS_VX)
save_vx_regs_safe(sa_ext->vx_regs);
return 0; return 0;
} }
...@@ -258,7 +262,7 @@ static int zcore_add_lc(char __user *buf, unsigned long start, size_t count) ...@@ -258,7 +262,7 @@ static int zcore_add_lc(char __user *buf, unsigned long start, size_t count)
unsigned long sa_start, sa_end; /* save area range */ unsigned long sa_start, sa_end; /* save area range */
unsigned long prefix; unsigned long prefix;
unsigned long sa_off, len, buf_off; unsigned long sa_off, len, buf_off;
struct save_area *save_area = dump_save_areas.areas[i]; struct save_area *save_area = &dump_save_areas.areas[i]->sa;
prefix = save_area->pref_reg; prefix = save_area->pref_reg;
sa_start = prefix + sys_info.sa_base; sa_start = prefix + sys_info.sa_base;
...@@ -612,7 +616,7 @@ static void __init zcore_header_init(int arch, struct zcore_header *hdr, ...@@ -612,7 +616,7 @@ static void __init zcore_header_init(int arch, struct zcore_header *hdr,
hdr->tod = get_tod_clock(); hdr->tod = get_tod_clock();
get_cpu_id(&hdr->cpu_id); get_cpu_id(&hdr->cpu_id);
for (i = 0; i < dump_save_areas.count; i++) { for (i = 0; i < dump_save_areas.count; i++) {
prefix = dump_save_areas.areas[i]->pref_reg; prefix = dump_save_areas.areas[i]->sa.pref_reg;
hdr->real_cpu_cnt++; hdr->real_cpu_cnt++;
if (!prefix) if (!prefix)
continue; continue;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment