mirror of
https://git.proxmox.com/git/mirror_ubuntu-kernels.git
synced 2025-12-07 23:45:36 +00:00
Improve the save and restore behavior of FPU register contents to use the vector extension within the kernel. The kernel does not use floating-point or vector registers and, therefore, saving and restoring the FPU register contents are performed for handling signals or switching processes only. To prepare for using vector instructions and vector registers within the kernel, enhance the save behavior and implement a lazy restore at return to user space from a system call or interrupt. To implement the lazy restore, the save_fpu_regs() sets a CPU information flag, CIF_FPU, to indicate that the FPU registers must be restored. Saving and setting CIF_FPU is performed in an atomic fashion to be interrupt-safe. When the kernel wants to use the vector extension or wants to change the FPU register state for a task during signal handling, the save_fpu_regs() must be called first. The CIF_FPU flag is also set at process switch. At return to user space, the FPU state is restored. In particular, the FPU state includes the floating-point or vector register contents, as well as, vector-enablement and floating-point control. The FPU state restore and clearing CIF_FPU is also performed in an atomic fashion. For KVM, the restore of the FPU register state is performed when restoring the general-purpose guest registers before the SIE instructions is started. Because the path towards the SIE instruction is interruptible, the CIF_FPU flag must be checked again right before going into SIE. If set, the guest registers must be reloaded again by re-entering the outer SIE loop. This is the same behavior as if the SIE critical section is interrupted. Signed-off-by: Hendrik Brueckner <brueckner@linux.vnet.ibm.com> Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
344 lines
9.1 KiB
C
344 lines
9.1 KiB
C
/*
|
|
* S390 version
|
|
* Copyright IBM Corp. 1999
|
|
* Author(s): Hartmut Penner (hp@de.ibm.com),
|
|
* Martin Schwidefsky (schwidefsky@de.ibm.com)
|
|
*
|
|
* Derived from "include/asm-i386/processor.h"
|
|
* Copyright (C) 1994, Linus Torvalds
|
|
*/
|
|
|
|
#ifndef __ASM_S390_PROCESSOR_H
|
|
#define __ASM_S390_PROCESSOR_H
|
|
|
|
#define CIF_MCCK_PENDING 0 /* machine check handling is pending */
|
|
#define CIF_ASCE 1 /* user asce needs fixup / uaccess */
|
|
#define CIF_NOHZ_DELAY 2 /* delay HZ disable for a tick */
|
|
#define CIF_FPU 3 /* restore vector registers */
|
|
|
|
#define _CIF_MCCK_PENDING (1<<CIF_MCCK_PENDING)
|
|
#define _CIF_ASCE (1<<CIF_ASCE)
|
|
#define _CIF_NOHZ_DELAY (1<<CIF_NOHZ_DELAY)
|
|
#define _CIF_FPU (1<<CIF_FPU)
|
|
|
|
#ifndef __ASSEMBLY__
|
|
|
|
#include <linux/linkage.h>
|
|
#include <linux/irqflags.h>
|
|
#include <asm/cpu.h>
|
|
#include <asm/page.h>
|
|
#include <asm/ptrace.h>
|
|
#include <asm/setup.h>
|
|
#include <asm/runtime_instr.h>
|
|
#include <asm/fpu-internal.h>
|
|
|
|
static inline void set_cpu_flag(int flag)
|
|
{
|
|
S390_lowcore.cpu_flags |= (1U << flag);
|
|
}
|
|
|
|
static inline void clear_cpu_flag(int flag)
|
|
{
|
|
S390_lowcore.cpu_flags &= ~(1U << flag);
|
|
}
|
|
|
|
static inline int test_cpu_flag(int flag)
|
|
{
|
|
return !!(S390_lowcore.cpu_flags & (1U << flag));
|
|
}
|
|
|
|
#define arch_needs_cpu() test_cpu_flag(CIF_NOHZ_DELAY)
|
|
|
|
/*
|
|
* Default implementation of macro that returns current
|
|
* instruction pointer ("program counter").
|
|
*/
|
|
#define current_text_addr() ({ void *pc; asm("basr %0,0" : "=a" (pc)); pc; })
|
|
|
|
static inline void get_cpu_id(struct cpuid *ptr)
|
|
{
|
|
asm volatile("stidp %0" : "=Q" (*ptr));
|
|
}
|
|
|
|
extern void s390_adjust_jiffies(void);
|
|
extern const struct seq_operations cpuinfo_op;
|
|
extern int sysctl_ieee_emulation_warnings;
|
|
extern void execve_tail(void);
|
|
|
|
/*
|
|
* User space process size: 2GB for 31 bit, 4TB or 8PT for 64 bit.
|
|
*/
|
|
|
|
#define TASK_SIZE_OF(tsk) ((tsk)->mm->context.asce_limit)
|
|
#define TASK_UNMAPPED_BASE (test_thread_flag(TIF_31BIT) ? \
|
|
(1UL << 30) : (1UL << 41))
|
|
#define TASK_SIZE TASK_SIZE_OF(current)
|
|
#define TASK_MAX_SIZE (1UL << 53)
|
|
|
|
#define STACK_TOP (1UL << (test_thread_flag(TIF_31BIT) ? 31:42))
|
|
#define STACK_TOP_MAX (1UL << 42)
|
|
|
|
#define HAVE_ARCH_PICK_MMAP_LAYOUT
|
|
|
|
typedef struct {
|
|
__u32 ar4;
|
|
} mm_segment_t;
|
|
|
|
/*
|
|
* Thread structure
|
|
*/
|
|
struct thread_struct {
|
|
struct fpu fpu; /* FP and VX register save area */
|
|
unsigned int acrs[NUM_ACRS];
|
|
unsigned long ksp; /* kernel stack pointer */
|
|
mm_segment_t mm_segment;
|
|
unsigned long gmap_addr; /* address of last gmap fault. */
|
|
unsigned int gmap_pfault; /* signal of a pending guest pfault */
|
|
struct per_regs per_user; /* User specified PER registers */
|
|
struct per_event per_event; /* Cause of the last PER trap */
|
|
unsigned long per_flags; /* Flags to control debug behavior */
|
|
/* pfault_wait is used to block the process on a pfault event */
|
|
unsigned long pfault_wait;
|
|
struct list_head list;
|
|
/* cpu runtime instrumentation */
|
|
struct runtime_instr_cb *ri_cb;
|
|
int ri_signum;
|
|
unsigned char trap_tdb[256]; /* Transaction abort diagnose block */
|
|
};
|
|
|
|
/* Flag to disable transactions. */
|
|
#define PER_FLAG_NO_TE 1UL
|
|
/* Flag to enable random transaction aborts. */
|
|
#define PER_FLAG_TE_ABORT_RAND 2UL
|
|
/* Flag to specify random transaction abort mode:
|
|
* - abort each transaction at a random instruction before TEND if set.
|
|
* - abort random transactions at a random instruction if cleared.
|
|
*/
|
|
#define PER_FLAG_TE_ABORT_RAND_TEND 4UL
|
|
|
|
typedef struct thread_struct thread_struct;
|
|
|
|
/*
|
|
* Stack layout of a C stack frame.
|
|
*/
|
|
#ifndef __PACK_STACK
|
|
struct stack_frame {
|
|
unsigned long back_chain;
|
|
unsigned long empty1[5];
|
|
unsigned long gprs[10];
|
|
unsigned int empty2[8];
|
|
};
|
|
#else
|
|
struct stack_frame {
|
|
unsigned long empty1[5];
|
|
unsigned int empty2[8];
|
|
unsigned long gprs[10];
|
|
unsigned long back_chain;
|
|
};
|
|
#endif
|
|
|
|
#define ARCH_MIN_TASKALIGN 8
|
|
|
|
#define INIT_THREAD { \
|
|
.ksp = sizeof(init_stack) + (unsigned long) &init_stack, \
|
|
}
|
|
|
|
/*
|
|
* Do necessary setup to start up a new thread.
|
|
*/
|
|
#define start_thread(regs, new_psw, new_stackp) do { \
|
|
regs->psw.mask = PSW_USER_BITS | PSW_MASK_EA | PSW_MASK_BA; \
|
|
regs->psw.addr = new_psw | PSW_ADDR_AMODE; \
|
|
regs->gprs[15] = new_stackp; \
|
|
execve_tail(); \
|
|
} while (0)
|
|
|
|
#define start_thread31(regs, new_psw, new_stackp) do { \
|
|
regs->psw.mask = PSW_USER_BITS | PSW_MASK_BA; \
|
|
regs->psw.addr = new_psw | PSW_ADDR_AMODE; \
|
|
regs->gprs[15] = new_stackp; \
|
|
crst_table_downgrade(current->mm, 1UL << 31); \
|
|
execve_tail(); \
|
|
} while (0)
|
|
|
|
/* Forward declaration, a strange C thing */
|
|
struct task_struct;
|
|
struct mm_struct;
|
|
struct seq_file;
|
|
|
|
void show_cacheinfo(struct seq_file *m);
|
|
|
|
/* Free all resources held by a thread. */
|
|
extern void release_thread(struct task_struct *);
|
|
|
|
/*
|
|
* Return saved PC of a blocked thread.
|
|
*/
|
|
extern unsigned long thread_saved_pc(struct task_struct *t);
|
|
|
|
unsigned long get_wchan(struct task_struct *p);
|
|
#define task_pt_regs(tsk) ((struct pt_regs *) \
|
|
(task_stack_page(tsk) + THREAD_SIZE) - 1)
|
|
#define KSTK_EIP(tsk) (task_pt_regs(tsk)->psw.addr)
|
|
#define KSTK_ESP(tsk) (task_pt_regs(tsk)->gprs[15])
|
|
|
|
/* Has task runtime instrumentation enabled ? */
|
|
#define is_ri_task(tsk) (!!(tsk)->thread.ri_cb)
|
|
|
|
static inline unsigned short stap(void)
|
|
{
|
|
unsigned short cpu_address;
|
|
|
|
asm volatile("stap %0" : "=m" (cpu_address));
|
|
return cpu_address;
|
|
}
|
|
|
|
/*
|
|
* Give up the time slice of the virtual PU.
|
|
*/
|
|
void cpu_relax(void);
|
|
|
|
#define cpu_relax_lowlatency() barrier()
|
|
|
|
static inline void psw_set_key(unsigned int key)
|
|
{
|
|
asm volatile("spka 0(%0)" : : "d" (key));
|
|
}
|
|
|
|
/*
|
|
* Set PSW to specified value.
|
|
*/
|
|
static inline void __load_psw(psw_t psw)
|
|
{
|
|
asm volatile("lpswe %0" : : "Q" (psw) : "cc");
|
|
}
|
|
|
|
/*
|
|
* Set PSW mask to specified value, while leaving the
|
|
* PSW addr pointing to the next instruction.
|
|
*/
|
|
static inline void __load_psw_mask (unsigned long mask)
|
|
{
|
|
unsigned long addr;
|
|
psw_t psw;
|
|
|
|
psw.mask = mask;
|
|
|
|
asm volatile(
|
|
" larl %0,1f\n"
|
|
" stg %0,%O1+8(%R1)\n"
|
|
" lpswe %1\n"
|
|
"1:"
|
|
: "=&d" (addr), "=Q" (psw) : "Q" (psw) : "memory", "cc");
|
|
}
|
|
|
|
/*
|
|
* Rewind PSW instruction address by specified number of bytes.
|
|
*/
|
|
static inline unsigned long __rewind_psw(psw_t psw, unsigned long ilc)
|
|
{
|
|
unsigned long mask;
|
|
|
|
mask = (psw.mask & PSW_MASK_EA) ? -1UL :
|
|
(psw.mask & PSW_MASK_BA) ? (1UL << 31) - 1 :
|
|
(1UL << 24) - 1;
|
|
return (psw.addr - ilc) & mask;
|
|
}
|
|
|
|
/*
|
|
* Function to stop a processor until the next interrupt occurs
|
|
*/
|
|
void enabled_wait(void);
|
|
|
|
/*
|
|
* Function to drop a processor into disabled wait state
|
|
*/
|
|
static inline void __noreturn disabled_wait(unsigned long code)
|
|
{
|
|
unsigned long ctl_buf;
|
|
psw_t dw_psw;
|
|
|
|
dw_psw.mask = PSW_MASK_BASE | PSW_MASK_WAIT | PSW_MASK_BA | PSW_MASK_EA;
|
|
dw_psw.addr = code;
|
|
/*
|
|
* Store status and then load disabled wait psw,
|
|
* the processor is dead afterwards
|
|
*/
|
|
asm volatile(
|
|
" stctg 0,0,0(%2)\n"
|
|
" ni 4(%2),0xef\n" /* switch off protection */
|
|
" lctlg 0,0,0(%2)\n"
|
|
" lghi 1,0x1000\n"
|
|
" stpt 0x328(1)\n" /* store timer */
|
|
" stckc 0x330(1)\n" /* store clock comparator */
|
|
" stpx 0x318(1)\n" /* store prefix register */
|
|
" stam 0,15,0x340(1)\n"/* store access registers */
|
|
" stfpc 0x31c(1)\n" /* store fpu control */
|
|
" std 0,0x200(1)\n" /* store f0 */
|
|
" std 1,0x208(1)\n" /* store f1 */
|
|
" std 2,0x210(1)\n" /* store f2 */
|
|
" std 3,0x218(1)\n" /* store f3 */
|
|
" std 4,0x220(1)\n" /* store f4 */
|
|
" std 5,0x228(1)\n" /* store f5 */
|
|
" std 6,0x230(1)\n" /* store f6 */
|
|
" std 7,0x238(1)\n" /* store f7 */
|
|
" std 8,0x240(1)\n" /* store f8 */
|
|
" std 9,0x248(1)\n" /* store f9 */
|
|
" std 10,0x250(1)\n" /* store f10 */
|
|
" std 11,0x258(1)\n" /* store f11 */
|
|
" std 12,0x260(1)\n" /* store f12 */
|
|
" std 13,0x268(1)\n" /* store f13 */
|
|
" std 14,0x270(1)\n" /* store f14 */
|
|
" std 15,0x278(1)\n" /* store f15 */
|
|
" stmg 0,15,0x280(1)\n"/* store general registers */
|
|
" stctg 0,15,0x380(1)\n"/* store control registers */
|
|
" oi 0x384(1),0x10\n"/* fake protection bit */
|
|
" lpswe 0(%1)"
|
|
: "=m" (ctl_buf)
|
|
: "a" (&dw_psw), "a" (&ctl_buf), "m" (dw_psw) : "cc", "0", "1");
|
|
while (1);
|
|
}
|
|
|
|
/*
|
|
* Use to set psw mask except for the first byte which
|
|
* won't be changed by this function.
|
|
*/
|
|
static inline void
|
|
__set_psw_mask(unsigned long mask)
|
|
{
|
|
__load_psw_mask(mask | (arch_local_save_flags() & ~(-1UL >> 8)));
|
|
}
|
|
|
|
#define local_mcck_enable() \
|
|
__set_psw_mask(PSW_KERNEL_BITS | PSW_MASK_DAT | PSW_MASK_MCHECK)
|
|
#define local_mcck_disable() \
|
|
__set_psw_mask(PSW_KERNEL_BITS | PSW_MASK_DAT)
|
|
|
|
/*
|
|
* Basic Machine Check/Program Check Handler.
|
|
*/
|
|
|
|
extern void s390_base_mcck_handler(void);
|
|
extern void s390_base_pgm_handler(void);
|
|
extern void s390_base_ext_handler(void);
|
|
|
|
extern void (*s390_base_mcck_handler_fn)(void);
|
|
extern void (*s390_base_pgm_handler_fn)(void);
|
|
extern void (*s390_base_ext_handler_fn)(void);
|
|
|
|
#define ARCH_LOW_ADDRESS_LIMIT 0x7fffffffUL
|
|
|
|
extern int memcpy_real(void *, void *, size_t);
|
|
extern void memcpy_absolute(void *, void *, size_t);
|
|
|
|
#define mem_assign_absolute(dest, val) { \
|
|
__typeof__(dest) __tmp = (val); \
|
|
\
|
|
BUILD_BUG_ON(sizeof(__tmp) != sizeof(val)); \
|
|
memcpy_absolute(&(dest), &__tmp, sizeof(__tmp)); \
|
|
}
|
|
|
|
#endif /* __ASSEMBLY__ */
|
|
|
|
#endif /* __ASM_S390_PROCESSOR_H */
|