2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* S390 low-level entry points.
|
|
|
|
*
|
2012-07-20 17:15:04 +08:00
|
|
|
* Copyright IBM Corp. 1999, 2012
|
2005-04-17 06:20:36 +08:00
|
|
|
* Author(s): Martin Schwidefsky (schwidefsky@de.ibm.com),
|
2006-09-28 22:56:37 +08:00
|
|
|
* Hartmut Penner (hp@de.ibm.com),
|
|
|
|
* Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
|
2005-06-26 05:55:30 +08:00
|
|
|
* Heiko Carstens <heiko.carstens@de.ibm.com>
|
2005-04-17 06:20:36 +08:00
|
|
|
*/
|
|
|
|
|
2008-02-05 23:50:40 +08:00
|
|
|
#include <linux/init.h>
|
2011-07-24 16:48:19 +08:00
|
|
|
#include <linux/linkage.h>
|
2012-09-05 19:26:11 +08:00
|
|
|
#include <asm/processor.h>
|
2005-04-17 06:20:36 +08:00
|
|
|
#include <asm/cache.h>
|
|
|
|
#include <asm/errno.h>
|
|
|
|
#include <asm/ptrace.h>
|
|
|
|
#include <asm/thread_info.h>
|
2005-09-10 02:57:26 +08:00
|
|
|
#include <asm/asm-offsets.h>
|
2005-04-17 06:20:36 +08:00
|
|
|
#include <asm/unistd.h>
|
|
|
|
#include <asm/page.h>
|
2012-06-04 21:05:43 +08:00
|
|
|
#include <asm/sigp.h>
|
2013-06-27 15:01:09 +08:00
|
|
|
#include <asm/irq.h>
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * Offsets of the saved general purpose registers %r0-%r15 inside pt_regs.
 * Each slot is 8 bytes wide, so register n lives at __PT_GPRS + 8 * n.
 */
__PT_R0 = __PT_GPRS
|
|
|
|
__PT_R1 = __PT_GPRS + 8
|
|
|
|
__PT_R2 = __PT_GPRS + 16
|
|
|
|
__PT_R3 = __PT_GPRS + 24
|
|
|
|
__PT_R4 = __PT_GPRS + 32
|
|
|
|
__PT_R5 = __PT_GPRS + 40
|
|
|
|
__PT_R6 = __PT_GPRS + 48
|
|
|
|
__PT_R7 = __PT_GPRS + 56
|
|
|
|
__PT_R8 = __PT_GPRS + 64
|
|
|
|
__PT_R9 = __PT_GPRS + 72
|
|
|
|
__PT_R10 = __PT_GPRS + 80
|
|
|
|
__PT_R11 = __PT_GPRS + 88
|
|
|
|
__PT_R12 = __PT_GPRS + 96
|
|
|
|
__PT_R13 = __PT_GPRS + 104
|
|
|
|
__PT_R14 = __PT_GPRS + 112
|
|
|
|
__PT_R15 = __PT_GPRS + 120
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
 * Kernel stack geometry.
 * STACK_SIZE is 1 << (PAGE_SHIFT + THREAD_ORDER) bytes.
 * STACK_INIT is the offset that leaves room for one stack frame
 * (STACK_FRAME_OVERHEAD) plus one pt_regs (__PT_SIZE) below the top.
 */
STACK_SHIFT = PAGE_SHIFT + THREAD_ORDER
|
|
|
|
STACK_SIZE = 1 << STACK_SHIFT
|
2013-04-24 16:20:43 +08:00
|
|
|
STACK_INIT = STACK_SIZE - STACK_FRAME_OVERHEAD - __PT_SIZE
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2014-04-15 18:55:07 +08:00
|
|
|
/*
 * Flag masks tested by the system call path in this file:
 *   _TIF_WORK, _CIF_WORK, _PIF_WORK - any bit set diverts the return to
 *                                     user space through sysc_work.
 *   _TIF_TRACE - any bit set routes the call through sysc_tracesys and
 *                the exit through do_syscall_trace_exit.
 */
_TIF_WORK = (_TIF_SIGPENDING | _TIF_NOTIFY_RESUME | _TIF_NEED_RESCHED)
|
|
|
|
_TIF_TRACE = (_TIF_SYSCALL_TRACE | _TIF_SYSCALL_AUDIT | _TIF_SECCOMP | \
|
|
|
|
_TIF_SYSCALL_TRACEPOINT)
|
|
|
|
_CIF_WORK = (_CIF_MCCK_PENDING | _CIF_ASCE)
|
|
|
|
_PIF_WORK = (_PIF_PER_TRAP)
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
 * BASED(name) addresses "name" as a displacement from system_call with
 * %r13 as base register, so %r13 must hold the address of system_call
 * (e.g. loaded with "larl %r13,system_call") wherever it is used.
 */
#define BASED(name) name-system_call(%r13)
|
|
|
|
|
2006-07-03 15:24:46 +08:00
|
|
|
/*
 * TRACE_IRQS_ON - call trace_hardirqs_on_caller with a code address from
 * the expansion site in %r2.
 * Expands to nothing unless CONFIG_TRACE_IRQFLAGS is defined.
 * Clobbers %r2 and %r14 in addition to whatever the callee changes.
 */
.macro TRACE_IRQS_ON
|
2011-12-27 18:27:15 +08:00
|
|
|
#ifdef CONFIG_TRACE_IRQFLAGS
|
2010-05-17 16:00:02 +08:00
|
|
|
basr %r2,%r0 # r2 = address of next instruction, no branch
|
|
|
|
brasl %r14,trace_hardirqs_on_caller
|
2011-12-27 18:27:15 +08:00
|
|
|
#endif
|
2006-07-03 15:24:46 +08:00
|
|
|
.endm
|
|
|
|
|
|
|
|
/*
 * TRACE_IRQS_OFF - call trace_hardirqs_off_caller with a code address from
 * the expansion site in %r2.
 * Expands to nothing unless CONFIG_TRACE_IRQFLAGS is defined.
 * Clobbers %r2 and %r14 in addition to whatever the callee changes.
 */
.macro TRACE_IRQS_OFF
|
2011-12-27 18:27:15 +08:00
|
|
|
#ifdef CONFIG_TRACE_IRQFLAGS
|
2010-05-17 16:00:02 +08:00
|
|
|
basr %r2,%r0 # r2 = address of next instruction, no branch
|
|
|
|
brasl %r14,trace_hardirqs_off_caller
|
2007-11-20 18:13:32 +08:00
|
|
|
#endif
|
2011-12-27 18:27:15 +08:00
|
|
|
.endm
|
2007-11-20 18:13:32 +08:00
|
|
|
|
|
|
|
/*
 * LOCKDEP_SYS_EXIT - call lockdep_sys_exit, but only when the PSW saved in
 * pt_regs has the problem state bit set (return to user space).
 * Expands to nothing unless CONFIG_LOCKDEP is defined.
 * Expects %r11 to point to pt_regs; clobbers %r14 and the condition code.
 */
.macro LOCKDEP_SYS_EXIT
|
2011-12-27 18:27:15 +08:00
|
|
|
#ifdef CONFIG_LOCKDEP
|
|
|
|
tm __PT_PSW+1(%r11),0x01 # returning to user ?
|
|
|
|
jz .+10 # no: skip the 6 byte brasl below
|
2007-11-20 18:13:32 +08:00
|
|
|
brasl %r14,lockdep_sys_exit
|
2006-07-03 15:24:46 +08:00
|
|
|
#endif
|
2005-04-17 06:20:36 +08:00
|
|
|
.endm
|
|
|
|
|
2013-02-12 01:11:09 +08:00
|
|
|
/*
 * LPP newpp - issue the S-format instruction with opcode 0xb280 on the
 * memory operand newpp, but only if the 0x20 bit (MACHINE_FLAG_LPP) in
 * byte 6 of __LC_MACHINE_FLAGS is set.
 * Expands to nothing unless KVM is enabled. Clobbers the condition code.
 * NOTE(review): 0xb280 is presumably "load program parameter" - confirm
 * against the architecture manual.
 */
.macro LPP newpp
|
2013-11-01 17:08:20 +08:00
|
|
|
#if IS_ENABLED(CONFIG_KVM)
|
2013-02-12 01:11:09 +08:00
|
|
|
tm __LC_MACHINE_FLAGS+6,0x20 # MACHINE_FLAG_LPP
|
2011-12-27 18:27:15 +08:00
|
|
|
jz .+8 # flag clear: skip the 4 byte .insn below
|
|
|
|
.insn s,0xb2800000,\newpp
|
|
|
|
#endif
|
|
|
|
.endm
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2013-05-17 20:41:37 +08:00
|
|
|
/*
 * HANDLE_SIE_INTERCEPT scratch,reason
 *
 * If the interrupted code ran in supervisor state inside the range
 * described by .Lsie_critical / .Lsie_critical_length, undo the SIE setup
 * and redirect the return address in %r9 to sie_exit.
 *
 * scratch - register used for the range check
 * reason  - byte stored at __SF_EMPTY+31(%r15) as exit reason; with
 *           reason==1 an offset equal to the length still counts as
 *           inside the range (jh instead of jhe)
 *
 * Expects %r8/%r9 to hold the old PSW, %r13 the address of system_call
 * (for BASED) and %r15 the stack pointer of the interrupted code.
 * Clobbers scratch, %r14 and the condition code; %r9 on the SIE path.
 * The .+62 / .+42 branch targets are byte distances to the end of the
 * macro and must be recomputed whenever the code in between changes size.
 * Expands to nothing unless KVM is enabled.
 */
.macro HANDLE_SIE_INTERCEPT scratch,reason
|
2013-11-01 17:08:20 +08:00
|
|
|
#if IS_ENABLED(CONFIG_KVM)
|
2012-05-09 22:27:36 +08:00
|
|
|
tmhh %r8,0x0001 # interrupting from user ?
|
2013-05-17 20:41:37 +08:00
|
|
|
jnz .+62 # yes: skip to the end of the macro
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr \scratch,%r9
|
2013-05-17 20:41:37 +08:00
|
|
|
slg \scratch,BASED(.Lsie_critical)
|
|
|
|
clg \scratch,BASED(.Lsie_critical_length)
|
|
|
|
.if \reason==1
|
2012-11-15 16:35:16 +08:00
|
|
|
# Some program interrupts are suppressing (e.g. protection).
|
|
|
|
# We must also check the instruction after SIE in that case.
|
|
|
|
# do_protection_exception will rewind to rewind_pad
|
2013-05-17 20:41:37 +08:00
|
|
|
jh .+42 # outside the range: skip to the end
|
2012-11-15 16:35:16 +08:00
|
|
|
.else
|
2013-05-17 20:41:37 +08:00
|
|
|
jhe .+42 # outside the range: skip to the end
|
2012-11-15 16:35:16 +08:00
|
|
|
.endif
|
2013-05-17 20:41:37 +08:00
|
|
|
lg %r14,__SF_EMPTY(%r15) # get control block pointer
|
|
|
|
LPP __SF_EMPTY+16(%r15) # set host id
|
2013-05-17 20:41:34 +08:00
|
|
|
ni __SIE_PROG0C+3(%r14),0xfe # no longer in SIE
|
2013-05-17 20:41:37 +08:00
|
|
|
lctlg %c1,%c1,__LC_USER_ASCE # load primary asce
|
|
|
|
larl %r9,sie_exit # skip forward to sie_exit
|
|
|
|
mvi __SF_EMPTY+31(%r15),\reason # set exit reason
|
2011-12-27 18:27:15 +08:00
|
|
|
#endif
|
2007-07-10 17:24:18 +08:00
|
|
|
.endm
|
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * CHECK_STACK stacksize,savearea
 *
 * Branch to stack_overflow if all bits of %r15 selected by the mask
 * (stacksize - CONFIG_STACK_GUARD) are zero. %r14 is loaded with savearea
 * on both paths. Expands to nothing unless CONFIG_CHECK_STACK is defined.
 * Clobbers %r14 and the condition code.
 */
.macro CHECK_STACK stacksize,savearea
|
2006-06-29 20:58:05 +08:00
|
|
|
#ifdef CONFIG_CHECK_STACK
|
2011-12-27 18:27:15 +08:00
|
|
|
tml %r15,\stacksize - CONFIG_STACK_GUARD
|
|
|
|
lghi %r14,\savearea # lghi leaves the condition code of tml intact
|
|
|
|
jz stack_overflow
|
2006-06-29 20:58:05 +08:00
|
|
|
#endif
|
|
|
|
.endm
|
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * SWITCH_ASYNC savearea,stack,shift
 *
 * Select the stack for an interrupt handler and point %r11 at the
 * pt_regs area on it.
 *
 * savearea - passed in %r11 to cleanup_critical and in %r14 to
 *            stack_overflow (through CHECK_STACK)
 * stack    - memory operand holding the target stack pointer
 * shift    - log2 of the target stack size (CHECK_STACK gets 1<<shift)
 *
 * Interrupted in user mode: %r15 is loaded from stack.
 * Interrupted in kernel mode: if the old PSW address in %r9 lies inside
 * the range .Lcritical_start / .Lcritical_length, cleanup_critical is
 * called first. Then, if (stack - %r15) >> shift is zero, the current
 * stack is kept and STACK_FRAME_OVERHEAD + __PT_SIZE bytes are allocated
 * below %r15; otherwise %r15 is loaded from stack.
 *
 * Expects %r8/%r9 to hold the old PSW and %r13 the address of
 * system_call (for BASED). Clobbers %r11, %r14, %r15 and the condition
 * code. Uses the numeric local labels 0, 1 and 2.
 */
.macro SWITCH_ASYNC savearea,stack,shift
|
|
|
|
tmhh %r8,0x0001 # interrupting from user ?
|
|
|
|
jnz 1f
|
|
|
|
lgr %r14,%r9
|
|
|
|
slg %r14,BASED(.Lcritical_start)
|
|
|
|
clg %r14,BASED(.Lcritical_length)
|
2005-04-17 06:20:36 +08:00
|
|
|
jhe 0f
|
2011-12-27 18:27:15 +08:00
|
|
|
lghi %r11,\savearea # inside critical section, do cleanup
|
2005-04-17 06:20:36 +08:00
|
|
|
brasl %r14,cleanup_critical
|
2011-12-27 18:27:15 +08:00
|
|
|
tmhh %r8,0x0001 # retest problem state after cleanup
|
2005-04-17 06:20:36 +08:00
|
|
|
jnz 1f
|
2011-12-27 18:27:15 +08:00
|
|
|
0: lg %r14,\stack # are we already on the target stack?
|
2005-04-17 06:20:36 +08:00
|
|
|
slgr %r14,%r15
|
2011-12-27 18:27:15 +08:00
|
|
|
srag %r14,%r14,\shift
|
2010-05-17 16:00:05 +08:00
|
|
|
jnz 1f
|
2011-12-27 18:27:15 +08:00
|
|
|
CHECK_STACK 1<<\shift,\savearea
|
2013-04-24 16:20:43 +08:00
|
|
|
aghi %r15,-(STACK_FRAME_OVERHEAD + __PT_SIZE)
|
2011-12-27 18:27:15 +08:00
|
|
|
j 2f
|
|
|
|
1: lg %r15,\stack # load target stack
|
2013-04-24 16:20:43 +08:00
|
|
|
2: la %r11,STACK_FRAME_OVERHEAD(%r15)
|
2006-09-28 22:56:37 +08:00
|
|
|
.endm
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * UPDATE_VTIME scratch,enter_timer
 *
 * Update the lowcore CPU time accumulators:
 *   __LC_USER_TIMER   += __LC_EXIT_TIMER - enter_timer
 *   __LC_SYSTEM_TIMER += __LC_LAST_UPDATE_TIMER - __LC_EXIT_TIMER
 *   __LC_LAST_UPDATE_TIMER = enter_timer
 *
 * scratch     - register used for the arithmetic (clobbered)
 * enter_timer - 8 byte memory operand with the timer value at entry
 * The condition code is clobbered as well.
 */
.macro UPDATE_VTIME scratch,enter_timer
|
|
|
|
lg \scratch,__LC_EXIT_TIMER
|
|
|
|
slg \scratch,\enter_timer
|
|
|
|
alg \scratch,__LC_USER_TIMER
|
|
|
|
stg \scratch,__LC_USER_TIMER
|
|
|
|
lg \scratch,__LC_LAST_UPDATE_TIMER
|
|
|
|
slg \scratch,__LC_EXIT_TIMER
|
|
|
|
alg \scratch,__LC_SYSTEM_TIMER
|
|
|
|
stg \scratch,__LC_SYSTEM_TIMER
|
|
|
|
mvc __LC_LAST_UPDATE_TIMER(8),\enter_timer
|
2005-04-17 06:20:36 +08:00
|
|
|
.endm
|
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * LAST_BREAK scratch
 *
 * Store %r10 to __TI_last_break(%r12) unless %r10 shifted right by 23
 * bits is zero. The callers in this file load %r10 from __LC_LAST_BREAK
 * and %r12 from __LC_THREAD_INFO beforehand.
 * Clobbers scratch and the condition code.
 */
.macro LAST_BREAK scratch
|
|
|
|
srag \scratch,%r10,23
|
|
|
|
jz .+10 # zero: skip the 6 byte stg below
|
|
|
|
stg %r10,__TI_last_break(%r12)
|
2010-05-17 16:00:05 +08:00
|
|
|
.endm
|
|
|
|
|
2010-10-25 22:10:37 +08:00
|
|
|
/*
 * REENABLE_IRQS - load the system mask from the first byte of the old PSW
 * held in %r8, with the 0x40 bit cleared (the bit pgm_check_handler tests
 * as the PER bit with "tmhh %r8,0x4000").
 * Uses __LC_RETURN_PSW as scratch storage; clobbers the condition code.
 */
.macro REENABLE_IRQS
|
2011-12-27 18:27:15 +08:00
|
|
|
stg %r8,__LC_RETURN_PSW
|
|
|
|
ni __LC_RETURN_PSW,0xbf
|
|
|
|
ssm __LC_RETURN_PSW
|
2010-10-25 22:10:37 +08:00
|
|
|
.endm
|
|
|
|
|
2012-05-09 22:27:39 +08:00
|
|
|
/*
 * STCK savearea - store the clock at the memory operand savearea.
 * Emits opcode 0xb27c ("store clock fast") when
 * CONFIG_HAVE_MARCH_Z9_109_FEATURES is defined, otherwise opcode 0xb205
 * ("store clock"). Both are encoded with .insn in S format.
 */
.macro STCK savearea
|
2012-05-14 16:35:22 +08:00
|
|
|
#ifdef CONFIG_HAVE_MARCH_Z9_109_FEATURES
|
2012-05-09 22:27:39 +08:00
|
|
|
.insn s,0xb27c0000,\savearea # store clock fast
|
|
|
|
#else
|
|
|
|
.insn s,0xb2050000,\savearea # store clock
|
|
|
|
#endif
|
|
|
|
.endm
|
|
|
|
|
2011-01-05 19:47:25 +08:00
|
|
|
.section .kprobes.text, "ax"
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* Scheduler resume function, called by switch_to
|
|
|
|
* gpr2 = (task_struct *) prev
|
|
|
|
* gpr3 = (task_struct *) next
|
|
|
|
* Returns:
|
|
|
|
* gpr2 = prev
|
|
|
|
*/
|
2011-07-24 16:48:19 +08:00
|
|
|
/*
 * Register use: %r2 = prev, %r3 = next, %r5 = thread_info of next.
 * %r2 is never written here, which is how prev is handed back.
 * %r6-%r15 of prev are saved in its stack frame and %r6-%r15 of next are
 * reloaded from the frame at its saved kernel stack pointer, so the final
 * "br %r14" returns through the %r14 of next.
 * NOTE(review): %r4 is loaded with the thread_info of prev but is not read
 * again in this routine - looks like a leftover, confirm before removing.
 */
ENTRY(__switch_to)
|
2012-05-15 15:20:06 +08:00
|
|
|
stmg %r6,%r15,__SF_GPRS(%r15) # store gprs of prev task
|
|
|
|
stg %r15,__THREAD_ksp(%r2) # store kernel stack of prev
|
2011-01-05 19:48:10 +08:00
|
|
|
lg %r4,__THREAD_info(%r2) # get thread_info of prev
|
|
|
|
lg %r5,__THREAD_info(%r3) # get thread_info of next
|
2012-05-15 15:20:06 +08:00
|
|
|
lgr %r15,%r5 # r15 = thread_info of next
|
2013-04-24 16:20:43 +08:00
|
|
|
aghi %r15,STACK_INIT # end of kernel stack of next
|
2012-05-15 15:20:06 +08:00
|
|
|
stg %r3,__LC_CURRENT # store task struct of next
|
|
|
|
stg %r5,__LC_THREAD_INFO # store thread info of next
|
|
|
|
stg %r15,__LC_KERNEL_STACK # store end of kernel stack
|
|
|
|
lctl %c4,%c4,__TASK_pid(%r3) # load pid to control reg. 4
|
|
|
|
mvc __LC_CURRENT_PID+4(4,%r0),__TASK_pid(%r3) # store pid of next
|
|
|
|
lg %r15,__THREAD_ksp(%r3) # load kernel stack of next
|
2014-04-15 18:55:07 +08:00
|
|
|
lmg %r6,%r15,__SF_GPRS(%r15) # load gprs of next task
|
2005-04-17 06:20:36 +08:00
|
|
|
br %r14
|
|
|
|
|
|
|
|
__critical_start:
|
|
|
|
/*
|
|
|
|
* SVC interrupt handler routine. System calls are synchronous events and
|
|
|
|
* are executed with interrupts enabled.
|
|
|
|
*/
|
|
|
|
|
2011-07-24 16:48:19 +08:00
|
|
|
/*
 * system_call - entry point; falls through into sysc_do_svc.
 *
 * Saves %r8-%r15 in __LC_SAVE_AREA_SYNC, switches to the stack taken from
 * __LC_KERNEL_STACK and fills pt_regs at %r11 with the registers, the SVC
 * old PSW, the interruption code and the initial flags.
 *
 * Registers set up here: %r10 = __LC_LAST_BREAK, %r11 = pt_regs,
 * %r12 = thread_info, %r14 = _PIF_SYSCALL (stored to __PT_FLAGS),
 * %r15 = kernel stack. %r13 is only used as scratch.
 * sysc_stmg, sysc_per and sysc_vtime are extra labels inside this
 * sequence; their users are not visible in this part of the file.
 */
ENTRY(system_call)
|
2008-12-25 20:39:25 +08:00
|
|
|
stpt __LC_SYNC_ENTER_TIMER
|
2011-12-27 18:27:15 +08:00
|
|
|
sysc_stmg:
|
|
|
|
stmg %r8,%r15,__LC_SAVE_AREA_SYNC
|
|
|
|
lg %r10,__LC_LAST_BREAK
|
|
|
|
lg %r12,__LC_THREAD_INFO
|
2014-04-15 18:55:07 +08:00
|
|
|
lghi %r14,_PIF_SYSCALL
|
2011-12-27 18:27:15 +08:00
|
|
|
sysc_per:
|
|
|
|
lg %r15,__LC_KERNEL_STACK
|
|
|
|
la %r11,STACK_FRAME_OVERHEAD(%r15) # pointer to pt_regs
|
2005-04-17 06:20:36 +08:00
|
|
|
sysc_vtime:
|
2011-12-27 18:27:15 +08:00
|
|
|
UPDATE_VTIME %r13,__LC_SYNC_ENTER_TIMER
|
|
|
|
LAST_BREAK %r13
|
|
|
|
stmg %r0,%r7,__PT_R0(%r11)
|
|
|
|
mvc __PT_R8(64,%r11),__LC_SAVE_AREA_SYNC
|
|
|
|
mvc __PT_PSW(16,%r11),__LC_SVC_OLD_PSW
|
2011-12-27 18:27:18 +08:00
|
|
|
mvc __PT_INT_CODE(4,%r11),__LC_SVC_ILC
|
2014-04-15 18:55:07 +08:00
|
|
|
stg %r14,__PT_FLAGS(%r11)
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
 * sysc_do_svc - compute the system call table offset in %r8.
 *
 * %r10 is loaded with the table address from thread_info. The number comes
 * from the halfword at __PT_INT_CODE+2, multiplied by 4. If that number is
 * zero, the number is taken from the low word of %r1 instead: when it is
 * below NR_syscalls it is written back to __PT_INT_CODE+2 and used,
 * otherwise %r8 stays 0. Falls through into sysc_nr_ok.
 */
sysc_do_svc:
|
2013-04-24 18:58:39 +08:00
|
|
|
lg %r10,__TI_sysc_table(%r12) # address of system call table
|
2011-12-27 18:27:18 +08:00
|
|
|
llgh %r8,__PT_INT_CODE+2(%r11)
|
2011-12-27 18:27:15 +08:00
|
|
|
slag %r8,%r8,2 # shift and test for svc 0
|
2005-04-17 06:20:36 +08:00
|
|
|
jnz sysc_nr_ok
|
|
|
|
# svc 0: system call number in %r1
|
2011-12-27 18:27:15 +08:00
|
|
|
llgfr %r1,%r1 # clear high word in r1
|
2010-05-17 16:00:05 +08:00
|
|
|
cghi %r1,NR_syscalls
|
2005-04-17 06:20:36 +08:00
|
|
|
jnl sysc_nr_ok
|
2011-12-27 18:27:18 +08:00
|
|
|
sth %r1,__PT_INT_CODE+2(%r11)
|
2011-12-27 18:27:15 +08:00
|
|
|
slag %r8,%r1,2
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
 * sysc_nr_ok - dispatch the system call.
 *
 * On entry %r8 is the byte offset into the table at %r10 and %r2-%r7 hold
 * the arguments. Clears the backchain slot, saves %r2 in __PT_ORIG_GPR2,
 * loads the 32 bit table entry into %r9 and calls it, unless a _TIF_TRACE
 * bit is set, in which case control goes to sysc_tracesys. The return
 * value is stored in the %r2 slot of pt_regs; falls through to
 * sysc_return.
 */
sysc_nr_ok:
|
2011-12-27 18:27:15 +08:00
|
|
|
xc __SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
|
|
|
|
stg %r2,__PT_ORIG_GPR2(%r11)
|
|
|
|
stg %r7,STACK_FRAME_OVERHEAD(%r15) # presumably the stack slot of a 6th argument - confirm
|
|
|
|
lgf %r9,0(%r8,%r10) # get system call address
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_TRACE
|
2006-09-28 22:56:37 +08:00
|
|
|
jnz sysc_tracesys
|
2011-12-27 18:27:15 +08:00
|
|
|
basr %r14,%r9 # call sys_xxxx
|
|
|
|
stg %r2,__PT_R2(%r11) # store return value
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
 * sysc_return / sysc_tif - common exit path.
 *
 * If the PSW saved in pt_regs does not have the problem state bit set,
 * go straight to sysc_restore. Otherwise branch to sysc_work when any bit
 * of _PIF_WORK (pt_regs flags), _TIF_WORK (thread_info flags) or
 * _CIF_WORK (lowcore cpu flags) is set. Falls through into sysc_restore
 * when nothing is pending.
 * Expects %r11 = pt_regs and %r12 = thread_info.
 */
sysc_return:
|
2010-05-17 16:00:02 +08:00
|
|
|
LOCKDEP_SYS_EXIT
|
|
|
|
sysc_tif:
|
2011-12-27 18:27:15 +08:00
|
|
|
tm __PT_PSW+1(%r11),0x01 # returning to user ?
|
2011-10-30 22:16:49 +08:00
|
|
|
jno sysc_restore # no: skip the work checks
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __PT_FLAGS+7(%r11),_PIF_WORK
|
|
|
|
jnz sysc_work
|
|
|
|
tm __TI_flags+7(%r12),_TIF_WORK
|
2011-12-27 18:27:15 +08:00
|
|
|
jnz sysc_work # check for work
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_WORK
|
|
|
|
jnz sysc_work
|
2007-11-20 18:13:32 +08:00
|
|
|
/*
 * sysc_restore - reload all registers from pt_regs and resume the saved
 * PSW with lpswe.
 *
 * The CPU timer is stored to __LC_EXIT_TIMER and 16 bytes starting there
 * are copied to __VDSO_ECTG_BASE in the area __LC_VDSO_PER_CPU points to.
 * sysc_done labels the first address after the lpswe.
 */
sysc_restore:
|
2011-12-27 18:27:15 +08:00
|
|
|
lg %r14,__LC_VDSO_PER_CPU
|
|
|
|
lmg %r0,%r10,__PT_R0(%r11)
|
|
|
|
mvc __LC_RETURN_PSW(16),__PT_PSW(%r11)
|
|
|
|
stpt __LC_EXIT_TIMER
|
|
|
|
mvc __VDSO_ECTG_BASE(16,%r14),__LC_EXIT_TIMER
|
|
|
|
lmg %r11,%r15,__PT_R11(%r11) # r11 is the base register too, so this is the last pt_regs access
|
|
|
|
lpswe __LC_RETURN_PSW
|
2007-11-20 18:13:32 +08:00
|
|
|
sysc_done:
|
|
|
|
|
2010-05-17 16:00:01 +08:00
|
|
|
#
|
|
|
|
# One of the work bits is on. Find out which one.
|
|
|
|
#
|
2011-10-30 22:16:49 +08:00
|
|
|
/*
 * sysc_work - dispatch one pending work item. The bits are checked in
 * this order: _CIF_MCCK_PENDING, _TIF_NEED_RESCHED, _PIF_PER_TRAP,
 * _TIF_SIGPENDING, _TIF_NOTIFY_RESUME, _CIF_ASCE. Each test uses a single
 * bit mask, so "jo" branches when that bit is set.
 * The handlers visible in this file come back through sysc_return (or
 * restart the system call in the case of sysc_sigpending), which checks
 * the work bits again.
 * Expects %r11 = pt_regs and %r12 = thread_info.
 */
sysc_work:
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_MCCK_PENDING
|
2005-06-26 05:55:30 +08:00
|
|
|
jo sysc_mcck_pending
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_NEED_RESCHED
|
2005-04-17 06:20:36 +08:00
|
|
|
jo sysc_reschedule
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __PT_FLAGS+7(%r11),_PIF_PER_TRAP
|
2012-11-21 23:36:27 +08:00
|
|
|
jo sysc_singlestep
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_SIGPENDING
|
2010-05-17 16:00:01 +08:00
|
|
|
jo sysc_sigpending
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_NOTIFY_RESUME
|
2010-05-17 16:00:01 +08:00
|
|
|
jo sysc_notify_resume
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_ASCE
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
jo sysc_uaccess
|
2010-05-17 16:00:01 +08:00
|
|
|
j sysc_return # beware of critical section cleanup
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
#
|
|
|
|
# _TIF_NEED_RESCHED is set, call schedule
|
2006-09-28 22:56:37 +08:00
|
|
|
#
|
|
|
|
sysc_reschedule:
|
2010-05-17 16:00:02 +08:00
|
|
|
larl %r14,sysc_return # schedule returns to sysc_return
|
2011-12-27 18:27:15 +08:00
|
|
|
jg schedule # jump, not call: return address is already in r14
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2005-06-26 05:55:30 +08:00
|
|
|
#
|
2014-04-15 18:55:07 +08:00
|
|
|
# _CIF_MCCK_PENDING is set, call handler
|
2005-06-26 05:55:30 +08:00
|
|
|
#
|
|
|
|
sysc_mcck_pending:
|
2010-05-17 16:00:02 +08:00
|
|
|
larl %r14,sysc_return # handler returns to sysc_return
|
2006-09-28 22:56:37 +08:00
|
|
|
jg s390_handle_mcck # CIF bit will be cleared by handler
|
2005-06-26 05:55:30 +08:00
|
|
|
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
#
|
2014-04-15 18:55:07 +08:00
|
|
|
# _CIF_ASCE is set, load user space asce
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
#
|
|
|
|
/*
 * sysc_uaccess - clear _CIF_ASCE in the lowcore cpu flags, load control
 * register 1 from __LC_USER_ASCE and go back to sysc_return.
 */
sysc_uaccess:
|
2014-04-15 18:55:07 +08:00
|
|
|
ni __LC_CPU_FLAGS+7,255-_CIF_ASCE # clear the work bit first
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
lctlg %c1,%c1,__LC_USER_ASCE # load primary asce
|
|
|
|
j sysc_return
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
2008-04-30 15:53:08 +08:00
|
|
|
# _TIF_SIGPENDING is set, call do_signal
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
2006-09-28 22:56:37 +08:00
|
|
|
/*
 * sysc_sigpending - call do_signal with the pt_regs pointer.
 *
 * If _PIF_SYSCALL is not set in the pt_regs flags afterwards, continue at
 * sysc_return. Otherwise the system call is restarted: %r2-%r7 are
 * reloaded from pt_regs, %r10 gets the table address again and %r8 the
 * table offset for the number found at __PT_INT_CODE+2. A number that is
 * not below NR_syscalls leaves %r8 at 0. Control then re-enters
 * sysc_nr_ok.
 */
sysc_sigpending:
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
brasl %r14,do_signal
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __PT_FLAGS+7(%r11),_PIF_SYSCALL
|
2011-10-30 22:16:49 +08:00
|
|
|
jno sysc_return
|
2011-12-27 18:27:15 +08:00
|
|
|
lmg %r2,%r7,__PT_R2(%r11) # load svc arguments
|
2013-09-27 21:24:38 +08:00
|
|
|
lg %r10,__TI_sysc_table(%r12) # address of system call table
|
2011-12-27 18:27:15 +08:00
|
|
|
lghi %r8,0 # svc 0 returns -ENOSYS
|
2012-10-09 19:33:53 +08:00
|
|
|
llgh %r1,__PT_INT_CODE+2(%r11) # load new svc number
|
2011-10-30 22:16:49 +08:00
|
|
|
cghi %r1,NR_syscalls
|
|
|
|
jnl sysc_nr_ok # invalid svc number -> do svc 0
|
2011-12-27 18:27:15 +08:00
|
|
|
slag %r8,%r1,2
|
2011-10-30 22:16:49 +08:00
|
|
|
j sysc_nr_ok # restart svc
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2008-10-11 03:33:20 +08:00
|
|
|
#
|
|
|
|
# _TIF_NOTIFY_RESUME is set, call do_notify_resume
|
|
|
|
#
|
|
|
|
sysc_notify_resume:
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
2010-05-17 16:00:02 +08:00
|
|
|
larl %r14,sysc_return # handler returns to sysc_return
|
2011-12-27 18:27:15 +08:00
|
|
|
jg do_notify_resume # jump, not call: return address is already in r14
|
2008-10-11 03:33:20 +08:00
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
2014-04-15 18:55:07 +08:00
|
|
|
# _PIF_PER_TRAP is set, call do_per_trap
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
|
|
|
sysc_singlestep:
|
2014-04-15 18:55:07 +08:00
|
|
|
ni __PT_FLAGS+7(%r11),255-_PIF_PER_TRAP # clear the work bit before calling the handler
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
larl %r14,sysc_return # handler returns to sysc_return
|
2011-01-05 19:48:10 +08:00
|
|
|
jg do_per_trap
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
#
|
2008-10-11 03:33:20 +08:00
|
|
|
# call tracehook_report_syscall_entry/tracehook_report_syscall_exit before
|
|
|
|
# and after the system call
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
|
|
|
/*
 * sysc_tracesys - traced system call entry, reached from sysc_nr_ok when
 * a _TIF_TRACE bit is set.
 *
 * Stores the number from __PT_INT_CODE+2 in the %r2 slot of pt_regs and
 * calls do_syscall_trace_enter with %r2 = pt_regs and %r3 = 0. The value
 * returned in %r2 is used as the system call number: if NR_syscalls is
 * not higher than it (unsigned compare) the call is skipped via
 * sysc_tracenogo, otherwise %r9 is reloaded from the table at %r10 and
 * control falls through into sysc_tracego.
 */
sysc_tracesys:
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
2005-04-17 06:20:36 +08:00
|
|
|
la %r3,0
|
2011-12-27 18:27:18 +08:00
|
|
|
llgh %r0,__PT_INT_CODE+2(%r11)
|
2011-12-27 18:27:15 +08:00
|
|
|
stg %r0,__PT_R2(%r11)
|
2008-10-11 03:33:20 +08:00
|
|
|
brasl %r14,do_syscall_trace_enter
|
2005-04-17 06:20:36 +08:00
|
|
|
lghi %r0,NR_syscalls
|
2008-10-11 03:33:20 +08:00
|
|
|
clgr %r0,%r2
|
2005-04-17 06:20:36 +08:00
|
|
|
jnh sysc_tracenogo
|
2011-12-27 18:27:15 +08:00
|
|
|
sllg %r8,%r2,2 # table offset = number * 4
|
|
|
|
lgf %r9,0(%r8,%r10)
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
 * sysc_tracego - reload the arguments from pt_regs (%r3-%r7 from their
 * slots, %r2 from __PT_ORIG_GPR2), call the handler in %r9 and store its
 * result in the %r2 slot. Falls through into sysc_tracenogo.
 */
sysc_tracego:
|
2011-12-27 18:27:15 +08:00
|
|
|
lmg %r3,%r7,__PT_R3(%r11)
|
|
|
|
stg %r7,STACK_FRAME_OVERHEAD(%r15)
|
|
|
|
lg %r2,__PT_ORIG_GPR2(%r11)
|
|
|
|
basr %r14,%r9 # call sys_xxx
|
|
|
|
stg %r2,__PT_R2(%r11) # store return value
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
 * sysc_tracenogo - exit side of a traced system call. If no _TIF_TRACE
 * bit is set, continue at sysc_return; otherwise jump to
 * do_syscall_trace_exit with %r2 = pt_regs and sysc_return as return
 * address. Also used by ret_from_fork and kernel_thread_starter.
 */
sysc_tracenogo:
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_TRACE
|
2006-09-28 22:56:37 +08:00
|
|
|
jz sysc_return
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
larl %r14,sysc_return
|
2008-10-11 03:33:20 +08:00
|
|
|
jg do_syscall_trace_exit
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
#
|
|
|
|
# a new process exits the kernel with ret_from_fork
|
|
|
|
#
|
2011-07-24 16:48:19 +08:00
|
|
|
/*
 * ret_from_fork - sets %r11 = pt_regs and %r12 = thread_info, calls
 * schedule_tail and loads the system mask from __LC_SVC_NEW_PSW.
 * If the saved PSW has the problem state bit set, leave through
 * sysc_tracenogo. Otherwise load %r9/%r10 from pt_regs and fall through
 * into kernel_thread_starter.
 */
ENTRY(ret_from_fork)
|
2011-12-27 18:27:15 +08:00
|
|
|
la %r11,STACK_FRAME_OVERHEAD(%r15)
|
|
|
|
lg %r12,__LC_THREAD_INFO
|
2012-09-11 06:03:41 +08:00
|
|
|
brasl %r14,schedule_tail
|
|
|
|
TRACE_IRQS_ON
|
|
|
|
ssm __LC_SVC_NEW_PSW # reenable interrupts
|
2012-10-12 03:30:14 +08:00
|
|
|
tm __PT_PSW+1(%r11),0x01 # forking a kernel thread ?
|
|
|
|
jne sysc_tracenogo # no: problem state bit is set
|
|
|
|
# it's a kernel thread
|
|
|
|
lmg %r9,%r10,__PT_R9(%r11) # load gprs
|
2012-09-11 06:03:41 +08:00
|
|
|
/*
 * kernel_thread_starter - call the function whose address is in %r9 with
 * the value of %r10 in %r2, then leave through sysc_tracenogo.
 */
ENTRY(kernel_thread_starter)
|
|
|
|
la %r2,0(%r10)
|
|
|
|
basr %r14,%r9
|
2012-10-12 03:30:14 +08:00
|
|
|
j sysc_tracenogo
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Program check handler routine
|
|
|
|
*/
|
|
|
|
|
2011-07-24 16:48:19 +08:00
|
|
|
# pgm_check_handler: program check interrupt entry.
# Stores the CPU timer, saves %r8-%r15 to __LC_SAVE_AREA_SYNC and loads
# %r8/%r9 with the program-check old PSW, %r10 with __LC_LAST_BREAK and
# %r12 with the thread_info pointer.
#  - old PSW in problem state (label 1): switch to __LC_KERNEL_STACK and,
#    when the transaction-abort bit is set, copy 256 bytes from
#    __LC_PGM_TDB into the task (%r14 = task pointer).
#  - old PSW in supervisor state (first label 0): stay on the current stack
#    and reserve a stack frame plus pt_regs on it.  A PER event reported
#    while the PER bit of the old PSW is off is routed to pgm_svcper
#    instead.
# From label 2 on pt_regs (%r11) is filled in; PER events from supervisor
# state go to pgm_kprobe, PER events from problem state are recorded in the
# task.  Finally the handler is fetched from pgm_check_table, indexed by the
# low 7 bits of the interruption code times 4, and called with
# %r2 = pt_regs.  Both interruption code 0 and the return from the handler
# continue at sysc_return.
# NOTE(review): HANDLE_SIE_INTERCEPT, CHECK_STACK, UPDATE_VTIME, LAST_BREAK
# and REENABLE_IRQS are macros defined elsewhere in this file; their
# register usage is not visible here.
ENTRY(pgm_check_handler)
|
2008-12-25 20:39:25 +08:00
|
|
|
stpt __LC_SYNC_ENTER_TIMER
|
2011-12-27 18:27:15 +08:00
|
|
|
stmg %r8,%r15,__LC_SAVE_AREA_SYNC
|
|
|
|
lg %r10,__LC_LAST_BREAK
|
|
|
|
lg %r12,__LC_THREAD_INFO
|
|
|
|
larl %r13,system_call
|
|
|
|
lmg %r8,%r9,__LC_PGM_OLD_PSW
|
2012-11-15 16:35:16 +08:00
|
|
|
HANDLE_SIE_INTERCEPT %r14,1
|
2011-12-27 18:27:15 +08:00
|
|
|
tmhh %r8,0x0001 # test problem state bit
|
|
|
|
jnz 1f # -> fault in user space
|
|
|
|
tmhh %r8,0x4000 # PER bit set in old PSW ?
|
|
|
|
jnz 0f # -> enabled, can't be a double fault
|
|
|
|
tm __LC_PGM_ILC+3,0x80 # check for per exception
|
|
|
|
jnz pgm_svcper # -> single stepped svc
|
|
|
|
# supervisor-state fault: keep the current stack, reserve frame + pt_regs
0: CHECK_STACK STACK_SIZE,__LC_SAVE_AREA_SYNC
|
2013-04-24 16:20:43 +08:00
|
|
|
aghi %r15,-(STACK_FRAME_OVERHEAD + __PT_SIZE)
|
2011-12-27 18:27:15 +08:00
|
|
|
j 2f
|
|
|
|
# problem-state fault: switch to the kernel stack
1: UPDATE_VTIME %r14,__LC_SYNC_ENTER_TIMER
|
|
|
|
LAST_BREAK %r14
|
|
|
|
lg %r15,__LC_KERNEL_STACK
|
2012-07-31 17:03:04 +08:00
|
|
|
lg %r14,__TI_task(%r12)
|
|
|
|
lghi %r13,__LC_PGM_TDB
|
|
|
|
tm __LC_PGM_ILC+2,0x02 # check for transaction abort
|
|
|
|
jz 2f
|
|
|
|
mvc __THREAD_trap_tdb(256,%r14),0(%r13)
|
2013-04-24 16:20:43 +08:00
|
|
|
# common path: pt_regs lives STACK_FRAME_OVERHEAD above the stack pointer
2: la %r11,STACK_FRAME_OVERHEAD(%r15)
|
2011-12-27 18:27:15 +08:00
|
|
|
stmg %r0,%r7,__PT_R0(%r11)
|
|
|
|
# %r8-%r15 of the interrupted context come from the save area
mvc __PT_R8(64,%r11),__LC_SAVE_AREA_SYNC
|
|
|
|
stmg %r8,%r9,__PT_PSW(%r11)
|
2011-12-27 18:27:18 +08:00
|
|
|
mvc __PT_INT_CODE(4,%r11),__LC_PGM_ILC
|
|
|
|
mvc __PT_INT_PARM_LONG(8,%r11),__LC_TRANS_EXC_CODE
|
2014-04-15 18:55:07 +08:00
|
|
|
# clear the 8-byte pt_regs flags field
xc __PT_FLAGS(8,%r11),__PT_FLAGS(%r11)
|
2011-12-27 18:27:15 +08:00
|
|
|
# last-break value loaded at entry goes into the args slot of pt_regs
stg %r10,__PT_ARGS(%r11)
|
|
|
|
tm __LC_PGM_ILC+3,0x80 # check for per exception
|
|
|
|
jz 0f
|
|
|
|
tmhh %r8,0x0001 # kernel per event ?
|
|
|
|
jz pgm_kprobe
|
2014-04-15 18:55:07 +08:00
|
|
|
# user-space PER event: flag it in pt_regs and copy the PER data to the
# task (%r14 was loaded from __TI_task on the problem-state path)
oi __PT_FLAGS+7(%r11),_PIF_PER_TRAP
|
2012-07-31 17:03:04 +08:00
|
|
|
mvc __THREAD_per_address(8,%r14),__LC_PER_ADDRESS
|
2014-02-26 23:32:46 +08:00
|
|
|
mvc __THREAD_per_cause(2,%r14),__LC_PER_CODE
|
|
|
|
mvc __THREAD_per_paid(1,%r14),__LC_PER_ACCESS_ID
|
2011-12-27 18:27:18 +08:00
|
|
|
0: REENABLE_IRQS
|
2011-12-27 18:27:15 +08:00
|
|
|
# zero the backchain slot of the current stack frame
xc __SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
|
2010-07-28 01:29:37 +08:00
|
|
|
larl %r1,pgm_check_table
|
2011-12-27 18:27:18 +08:00
|
|
|
llgh %r10,__PT_INT_CODE+2(%r11)
|
|
|
|
nill %r10,0x007f
|
2012-10-19 00:10:06 +08:00
|
|
|
# table entries are 4 bytes wide
sll %r10,2
|
2011-12-27 18:27:18 +08:00
|
|
|
# the condition code tested here still comes from nill (sll does not
# change it): interruption code 0 has no handler
je sysc_return
|
2012-10-19 00:10:06 +08:00
|
|
|
lgf %r1,0(%r10,%r1) # load address of handler routine
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
2010-07-28 01:29:37 +08:00
|
|
|
basr %r14,%r1 # branch to interrupt-handler
|
|
|
|
j sysc_return
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
#
|
2011-12-27 18:27:15 +08:00
|
|
|
# PER event in supervisor state, must be kprobes
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
2011-12-27 18:27:15 +08:00
|
|
|
# pgm_kprobe: branched to from pgm_check_handler for a PER event whose old
# PSW is in supervisor state.  Zeroes the backchain slot of the current
# frame, calls do_per_trap with %r2 = pt_regs and continues at sysc_return.
pgm_kprobe:
|
|
|
|
REENABLE_IRQS
|
|
|
|
xc __SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
|
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
brasl %r14,do_per_trap
|
|
|
|
j sysc_return
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2006-09-20 21:58:39 +08:00
|
|
|
#
|
2011-12-27 18:27:15 +08:00
|
|
|
# single stepped system call
|
2006-09-20 21:58:39 +08:00
|
|
|
#
|
2011-12-27 18:27:15 +08:00
|
|
|
# pgm_svcper: branched to from pgm_check_handler before any stack or
# pt_regs setup has been done.  Builds a return PSW in lowcore from the
# first 8 bytes of the SVC new PSW and the address of sysc_per, loads %r14
# with _PIF_SYSCALL | _PIF_PER_TRAP and resumes at sysc_per via lpswe.
# NOTE(review): sysc_per is outside this section; presumably it consumes
# the flag value left in %r14 -- confirm there.
pgm_svcper:
|
|
|
|
mvc __LC_RETURN_PSW(8),__LC_SVC_NEW_PSW
|
|
|
|
larl %r14,sysc_per
|
|
|
|
# second half of the return PSW = instruction address
stg %r14,__LC_RETURN_PSW+8
|
2014-04-15 18:55:07 +08:00
|
|
|
lghi %r14,_PIF_SYSCALL | _PIF_PER_TRAP
|
2011-12-27 18:27:15 +08:00
|
|
|
lpswe __LC_RETURN_PSW # branch to sysc_per and enable irqs
|
2006-09-20 21:58:39 +08:00
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* IO interrupt handler routine
|
|
|
|
*/
|
2011-07-24 16:48:19 +08:00
|
|
|
# io_int_handler: I/O interrupt entry.
# Stores clock and CPU timer, saves %r8-%r15 to __LC_SAVE_AREA_ASYNC and
# loads %r8/%r9 = I/O old PSW, %r10 = __LC_LAST_BREAK, %r12 = thread_info,
# %r13 = address of system_call.  %r11 is used as the pt_regs pointer from
# io_skip on.
# NOTE(review): %r11 and %r15 are presumably set up by SWITCH_ASYNC, a macro
# defined elsewhere in this file -- confirm there.
#  io_skip    - fill in pt_regs (registers, old PSW, 12 bytes of interruption
#               information starting at __LC_SUBCHANNEL_ID, cleared flags).
#  io_loop    - call do_IRQ(pt_regs, IO_INTERRUPT) or, when bit 0x80 of the
#               byte at __PT_INT_CODE+8 is set, do_IRQ(pt_regs,
#               THIN_INTERRUPT).  When the machine-flags bit tested below is
#               set, tpi 0 is issued afterwards and a non-zero condition
#               code starts another round with freshly copied interruption
#               information.
#  io_return  - common interrupt exit, also used by ext_int_handler and the
#               io_* work routines.
#  io_tif     - any _TIF_WORK or _CIF_WORK bit set -> io_work.
#  io_restore - reload the registers from pt_regs, store the exit timer,
#               copy 16 bytes starting at __LC_EXIT_TIMER to
#               __VDSO_ECTG_BASE(%r14) and resume through
#               lpswe __LC_RETURN_PSW.
# io_tif, io_restore and io_done are listed in cleanup_table, so code must
# not be moved across these labels without checking cleanup_critical.
ENTRY(io_int_handler)
|
2012-05-09 22:27:39 +08:00
|
|
|
STCK __LC_INT_CLOCK
|
2008-12-31 22:11:41 +08:00
|
|
|
stpt __LC_ASYNC_ENTER_TIMER
|
2011-12-27 18:27:15 +08:00
|
|
|
stmg %r8,%r15,__LC_SAVE_AREA_ASYNC
|
|
|
|
lg %r10,__LC_LAST_BREAK
|
|
|
|
lg %r12,__LC_THREAD_INFO
|
|
|
|
larl %r13,system_call
|
|
|
|
lmg %r8,%r9,__LC_IO_OLD_PSW
|
2013-05-17 20:41:37 +08:00
|
|
|
HANDLE_SIE_INTERCEPT %r14,2
|
2011-12-27 18:27:15 +08:00
|
|
|
SWITCH_ASYNC __LC_SAVE_AREA_ASYNC,__LC_ASYNC_STACK,STACK_SHIFT
|
|
|
|
tmhh %r8,0x0001 # interrupting from user?
|
|
|
|
jz io_skip
|
|
|
|
UPDATE_VTIME %r14,__LC_ASYNC_ENTER_TIMER
|
|
|
|
LAST_BREAK %r14
|
|
|
|
io_skip:
|
|
|
|
stmg %r0,%r7,__PT_R0(%r11)
|
|
|
|
# %r8-%r15 of the interrupted context come from the save area
mvc __PT_R8(64,%r11),__LC_SAVE_AREA_ASYNC
|
|
|
|
stmg %r8,%r9,__PT_PSW(%r11)
|
2013-06-17 20:54:02 +08:00
|
|
|
mvc __PT_INT_CODE(12,%r11),__LC_SUBCHANNEL_ID
|
2014-04-15 18:55:07 +08:00
|
|
|
# clear the 8-byte pt_regs flags field
xc __PT_FLAGS(8,%r11),__PT_FLAGS(%r11)
|
2006-07-03 15:24:46 +08:00
|
|
|
TRACE_IRQS_OFF
|
2011-12-27 18:27:15 +08:00
|
|
|
# zero the backchain slot of the current stack frame
xc __SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
|
2013-06-17 20:54:02 +08:00
|
|
|
io_loop:
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
2013-06-27 15:01:09 +08:00
|
|
|
# second argument of do_IRQ: interrupt class
lghi %r3,IO_INTERRUPT
|
|
|
|
tm __PT_INT_CODE+8(%r11),0x80 # adapter interrupt ?
|
|
|
|
jz io_call
|
|
|
|
lghi %r3,THIN_INTERRUPT
|
|
|
|
io_call:
|
2011-12-27 18:27:15 +08:00
|
|
|
brasl %r14,do_IRQ
|
2013-06-17 20:54:02 +08:00
|
|
|
tm __LC_MACHINE_FLAGS+6,0x10 # MACHINE_FLAG_LPAR
|
|
|
|
jz io_return
|
|
|
|
# condition code 0 from tpi -> nothing more to handle
tpi 0
|
|
|
|
jz io_return
|
|
|
|
mvc __PT_INT_CODE(12,%r11),__LC_SUBCHANNEL_ID
|
|
|
|
j io_loop
|
2005-04-17 06:20:36 +08:00
|
|
|
io_return:
|
2010-05-17 16:00:02 +08:00
|
|
|
LOCKDEP_SYS_EXIT
|
|
|
|
TRACE_IRQS_ON
|
|
|
|
io_tif:
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_WORK
|
2006-09-28 22:56:37 +08:00
|
|
|
jnz io_work # there is work to do (signals etc.)
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_WORK
|
|
|
|
jnz io_work
|
2007-11-20 18:13:32 +08:00
|
|
|
io_restore:
|
2011-12-27 18:27:15 +08:00
|
|
|
lg %r14,__LC_VDSO_PER_CPU
|
|
|
|
lmg %r0,%r10,__PT_R0(%r11)
|
|
|
|
mvc __LC_RETURN_PSW(16),__PT_PSW(%r11)
|
|
|
|
stpt __LC_EXIT_TIMER
|
|
|
|
mvc __VDSO_ECTG_BASE(16,%r14),__LC_EXIT_TIMER
|
|
|
|
# %r11 is the base register here and is overwritten by this load, so it
# has to be the last access to pt_regs
lmg %r11,%r15,__PT_R11(%r11)
|
|
|
|
lpswe __LC_RETURN_PSW
|
2005-09-04 06:57:56 +08:00
|
|
|
io_done:
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2008-05-07 15:22:52 +08:00
|
|
|
#
|
2010-05-17 16:00:01 +08:00
|
|
|
# There is work to do, find out in which context we have been interrupted:
|
2014-04-15 18:55:07 +08:00
|
|
|
# 1) if we return to user space we can do all _TIF_WORK work
|
2010-05-17 16:00:01 +08:00
|
|
|
# 2) if we return to kernel code and kvm is enabled check if we need to
|
|
|
|
# modify the psw to leave SIE
|
|
|
|
# 3) if we return to kernel code and preemptive scheduling is enabled check
|
|
|
|
# the preemption counter and if it is zero call preempt_schedule_irq
|
|
|
|
# Before any work can be done, a switch to the kernel stack is required.
|
2008-05-07 15:22:52 +08:00
|
|
|
#
|
|
|
|
# io_work: reached from io_tif when a work bit is set.
# A return to problem state is handed to io_work_user.  For a return to
# kernel code the behaviour depends on CONFIG_PREEMPT:
#  - enabled: the interrupted context is resumed through io_restore unless
#    the preempt count is zero and _TIF_NEED_RESCHED is set.  In that case
#    pt_regs is copied to a new frame below the interrupted stack pointer
#    (saved %r15), that frame becomes the current stack and
#    preempt_schedule_irq is called before going back to io_return.
#  - disabled: always resume through io_restore.
io_work:
|
2011-12-27 18:27:15 +08:00
|
|
|
tm __PT_PSW+1(%r11),0x01 # returning to user ?
|
2010-05-17 16:00:01 +08:00
|
|
|
jo io_work_user # yes -> do resched & signal
|
|
|
|
#ifdef CONFIG_PREEMPT
|
2008-05-07 15:22:52 +08:00
|
|
|
# check for preemptive scheduling
|
2010-05-17 16:00:05 +08:00
|
|
|
# icm sets the condition code from the 4 bytes it loads
icm %r0,15,__TI_precount(%r12)
|
2008-05-07 15:22:52 +08:00
|
|
|
jnz io_restore # preemption is disabled
|
2010-05-17 16:00:02 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_NEED_RESCHED
|
|
|
|
jno io_restore
|
2005-04-17 06:20:36 +08:00
|
|
|
# switch to kernel stack
|
2011-12-27 18:27:15 +08:00
|
|
|
lg %r1,__PT_R15(%r11)
|
|
|
|
aghi %r1,-(STACK_FRAME_OVERHEAD + __PT_SIZE)
|
|
|
|
mvc STACK_FRAME_OVERHEAD(__PT_SIZE,%r1),0(%r11)
|
|
|
|
xc __SF_BACKCHAIN(8,%r1),__SF_BACKCHAIN(%r1)
|
|
|
|
la %r11,STACK_FRAME_OVERHEAD(%r1)
|
2005-04-17 06:20:36 +08:00
|
|
|
lgr %r15,%r1
|
2010-05-17 16:00:02 +08:00
|
|
|
# TRACE_IRQS_ON already done at io_return, call
|
|
|
|
# TRACE_IRQS_OFF to keep things symmetrical
|
|
|
|
TRACE_IRQS_OFF
|
|
|
|
brasl %r14,preempt_schedule_irq
|
|
|
|
j io_return
|
|
|
|
#else
|
2010-05-17 16:00:01 +08:00
|
|
|
j io_restore
|
2010-05-17 16:00:02 +08:00
|
|
|
#endif
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2010-05-17 16:00:01 +08:00
|
|
|
#
|
|
|
|
# Need to do work before returning to userspace, switch to kernel stack
|
|
|
|
#
|
2008-05-07 15:22:52 +08:00
|
|
|
# io_work_user: work is pending before a return to user space.
# Copies pt_regs from its current location (%r11) to STACK_FRAME_OVERHEAD
# above the address loaded from __LC_KERNEL_STACK, zeroes the backchain slot
# there and makes that address the current stack pointer, with %r11
# pointing at the copy.  There is no branch at the end: execution continues
# with the code that follows this routine.
io_work_user:
|
2005-04-17 06:20:36 +08:00
|
|
|
lg %r1,__LC_KERNEL_STACK
|
2011-12-27 18:27:15 +08:00
|
|
|
mvc STACK_FRAME_OVERHEAD(__PT_SIZE,%r1),0(%r11)
|
|
|
|
xc __SF_BACKCHAIN(8,%r1),__SF_BACKCHAIN(%r1)
|
|
|
|
la %r11,STACK_FRAME_OVERHEAD(%r1)
|
2005-04-17 06:20:36 +08:00
|
|
|
lgr %r15,%r1
|
2010-05-17 16:00:01 +08:00
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
|
|
|
# One of the work bits is on. Find out which one.
|
|
|
|
#
|
2010-05-17 16:00:02 +08:00
|
|
|
# io_work_tif: dispatch on the pending work bits, tested in this order:
# _CIF_MCCK_PENDING, _TIF_NEED_RESCHED, _TIF_SIGPENDING, _TIF_NOTIFY_RESUME,
# _CIF_ASCE.  The first bit found set selects the routine to run; every one
# of those routines ends with a branch to io_return, as does this routine
# when none of the bits is set.
io_work_tif:
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_MCCK_PENDING
|
2005-06-26 05:55:30 +08:00
|
|
|
jo io_mcck_pending
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_NEED_RESCHED
|
2005-04-17 06:20:36 +08:00
|
|
|
jo io_reschedule
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_SIGPENDING
|
2010-05-17 16:00:01 +08:00
|
|
|
jo io_sigpending
|
2010-05-17 16:00:05 +08:00
|
|
|
tm __TI_flags+7(%r12),_TIF_NOTIFY_RESUME
|
2010-05-17 16:00:01 +08:00
|
|
|
jo io_notify_resume
|
2014-04-15 18:55:07 +08:00
|
|
|
tm __LC_CPU_FLAGS+7,_CIF_ASCE
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
jo io_uaccess
|
2010-05-17 16:00:01 +08:00
|
|
|
j io_return # beware of critical section cleanup
|
2008-05-07 15:22:53 +08:00
|
|
|
|
2005-06-26 05:55:30 +08:00
|
|
|
#
|
2014-04-15 18:55:07 +08:00
|
|
|
# _CIF_MCCK_PENDING is set, call handler
|
2005-06-26 05:55:30 +08:00
|
|
|
#
|
|
|
|
# io_mcck_pending: calls s390_handle_mcck and goes back to io_return.
# NOTE(review): the trailing comment on the call says "TIF bit", but the
# flag that leads here is _CIF_MCCK_PENDING in __LC_CPU_FLAGS (see
# io_work_tif) -- the wording looks like a leftover; confirm and update.
io_mcck_pending:
|
2010-05-17 16:00:02 +08:00
|
|
|
# TRACE_IRQS_ON already done at io_return
|
2007-07-27 18:29:18 +08:00
|
|
|
brasl %r14,s390_handle_mcck # TIF bit will be cleared by handler
|
2010-05-17 16:00:02 +08:00
|
|
|
TRACE_IRQS_OFF
|
|
|
|
j io_return
|
2005-06-26 05:55:30 +08:00
|
|
|
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
#
|
2014-04-15 18:55:07 +08:00
|
|
|
# _CIF_ASCE is set, load user space asce
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
#
|
|
|
|
# io_uaccess: clears _CIF_ASCE in the lowcore CPU flags, loads control
# register 1 from __LC_USER_ASCE and goes back to io_return.
io_uaccess:
|
2014-04-15 18:55:07 +08:00
|
|
|
# and-immediate with the complement of the flag clears just that bit
ni __LC_CPU_FLAGS+7,255-_CIF_ASCE
|
s390/uaccess: rework uaccess code - fix locking issues
The current uaccess code uses a page table walk in some circumstances,
e.g. in case of the in atomic futex operations or if running on old
hardware which doesn't support the mvcos instruction.
However it turned out that the page table walk code does not correctly
lock page tables when accessing page table entries.
In other words: a different cpu may invalidate a page table entry while
the current cpu inspects the pte. This may lead to random data corruption.
Adding correct locking however isn't trivial for all uaccess operations.
Especially copy_in_user() is problematic since that requires to hold at
least two locks, but must be protected against ABBA deadlock when a
different cpu also performs a copy_in_user() operation.
So the solution is a different approach where we change address spaces:
User space runs in primary address mode, or access register mode within
vdso code, like it currently already does.
The kernel usually also runs in home space mode, however when accessing
user space the kernel switches to primary or secondary address mode if
the mvcos instruction is not available or if a compare-and-swap (futex)
instruction on a user space address is performed.
KVM however is special, since that requires the kernel to run in home
address space while implicitly accessing user space with the sie
instruction.
So we end up with:
User space:
- runs in primary or access register mode
- cr1 contains the user asce
- cr7 contains the user asce
- cr13 contains the kernel asce
Kernel space:
- runs in home space mode
- cr1 contains the user or kernel asce
-> the kernel asce is loaded when a uaccess requires primary or
secondary address mode
- cr7 contains the user or kernel asce, (changed with set_fs())
- cr13 contains the kernel asce
In case of uaccess the kernel changes to:
- primary space mode in case of a uaccess (copy_to_user) and uses
e.g. the mvcp instruction to access user space. However the kernel
will stay in home space mode if the mvcos instruction is available
- secondary space mode in case of futex atomic operations, so that the
instructions come from primary address space and data from secondary
space
In case of kvm the kernel runs in home space mode, but cr1 gets switched
to contain the gmap asce before the sie instruction gets executed. When
the sie instruction is finished cr1 will be switched back to contain the
user asce.
A context switch between two processes will always load the kernel asce
for the next process in cr1. So the first exit to user space is a bit
more expensive (one extra load control register instruction) than before,
however keeps the code rather simple.
In sum this means there is no need to perform any error prone page table
walks anymore when accessing user space.
The patch seems to be rather large, however it mainly removes the
the page table walk code and restores the previously deleted "standard"
uaccess code, with a couple of changes.
The uaccess without mvcos mode can be enforced with the "uaccess_primary"
kernel parameter.
Reported-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2014-03-21 17:42:25 +08:00
|
|
|
lctlg %c1,%c1,__LC_USER_ASCE # load primary asce
|
|
|
|
j io_return
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
|
|
|
# _TIF_NEED_RESCHED is set, call schedule
|
2006-09-28 22:56:37 +08:00
|
|
|
#
|
|
|
|
# io_reschedule: sets the system mask from the SVC new PSW, calls schedule,
# sets the system mask from the program-check new PSW again and goes back
# to io_return.
io_reschedule:
|
2010-05-17 16:00:02 +08:00
|
|
|
# TRACE_IRQS_ON already done at io_return
|
2011-12-27 18:27:15 +08:00
|
|
|
ssm __LC_SVC_NEW_PSW # reenable interrupts
|
2006-09-28 22:56:37 +08:00
|
|
|
brasl %r14,schedule # call scheduler
|
2011-12-27 18:27:15 +08:00
|
|
|
ssm __LC_PGM_NEW_PSW # disable I/O and ext. interrupts
|
2007-11-20 18:13:32 +08:00
|
|
|
TRACE_IRQS_OFF
|
2010-05-17 16:00:02 +08:00
|
|
|
j io_return
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
#
|
2008-04-30 15:53:08 +08:00
|
|
|
# _TIF_SIGPENDING is set, call do_signal
|
2005-04-17 06:20:36 +08:00
|
|
|
#
|
2006-09-28 22:56:37 +08:00
|
|
|
# io_sigpending: sets the system mask from the SVC new PSW, calls do_signal
# with %r2 = pt_regs, sets the system mask from the program-check new PSW
# again and goes back to io_return.
io_sigpending:
|
2010-05-17 16:00:02 +08:00
|
|
|
# TRACE_IRQS_ON already done at io_return
|
2011-12-27 18:27:15 +08:00
|
|
|
ssm __LC_SVC_NEW_PSW # reenable interrupts
|
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
brasl %r14,do_signal
|
|
|
|
ssm __LC_PGM_NEW_PSW # disable I/O and ext. interrupts
|
2007-11-20 18:13:32 +08:00
|
|
|
TRACE_IRQS_OFF
|
2010-05-17 16:00:02 +08:00
|
|
|
j io_return
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2008-10-11 03:33:20 +08:00
|
|
|
#
|
|
|
|
# _TIF_NOTIFY_RESUME is set, call do_notify_resume
|
|
|
|
#
|
|
|
|
# io_notify_resume: sets the system mask from the SVC new PSW, calls
# do_notify_resume with %r2 = pt_regs, sets the system mask from the
# program-check new PSW again and goes back to io_return.
io_notify_resume:
|
2010-05-17 16:00:02 +08:00
|
|
|
# TRACE_IRQS_ON already done at io_return
|
2011-12-27 18:27:15 +08:00
|
|
|
ssm __LC_SVC_NEW_PSW # reenable interrupts
|
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
|
|
|
brasl %r14,do_notify_resume
|
|
|
|
ssm __LC_PGM_NEW_PSW # disable I/O and ext. interrupts
|
2008-10-11 03:33:20 +08:00
|
|
|
TRACE_IRQS_OFF
|
2010-05-17 16:00:02 +08:00
|
|
|
j io_return
|
2008-10-11 03:33:20 +08:00
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* External interrupt handler routine
|
|
|
|
*/
|
2011-07-24 16:48:19 +08:00
|
|
|
# ext_int_handler: external interrupt entry.
# Same entry sequence as io_int_handler, but with the external old PSW in
# %r8/%r9.  From ext_skip on pt_regs (%r11) is filled in with the
# registers, the old PSW, 4 bytes starting at __LC_EXT_CPU_ADDR as
# interruption code, 4 bytes of __LC_EXT_PARAMS and 8 bytes of
# __LC_EXT_PARAMS2.  Then do_IRQ(pt_regs, EXT_INTERRUPT) is called and the
# handler leaves through the shared io_return path.
# NOTE(review): %r11 and %r15 are presumably set up by SWITCH_ASYNC, a macro
# defined elsewhere in this file -- confirm there.
ENTRY(ext_int_handler)
|
2012-05-09 22:27:39 +08:00
|
|
|
STCK __LC_INT_CLOCK
|
2008-12-31 22:11:41 +08:00
|
|
|
stpt __LC_ASYNC_ENTER_TIMER
|
2011-12-27 18:27:15 +08:00
|
|
|
stmg %r8,%r15,__LC_SAVE_AREA_ASYNC
|
|
|
|
lg %r10,__LC_LAST_BREAK
|
|
|
|
lg %r12,__LC_THREAD_INFO
|
|
|
|
larl %r13,system_call
|
|
|
|
lmg %r8,%r9,__LC_EXT_OLD_PSW
|
2013-05-17 20:41:37 +08:00
|
|
|
HANDLE_SIE_INTERCEPT %r14,3
|
2011-12-27 18:27:15 +08:00
|
|
|
SWITCH_ASYNC __LC_SAVE_AREA_ASYNC,__LC_ASYNC_STACK,STACK_SHIFT
|
|
|
|
tmhh %r8,0x0001 # interrupting from user ?
|
|
|
|
jz ext_skip
|
|
|
|
UPDATE_VTIME %r14,__LC_ASYNC_ENTER_TIMER
|
|
|
|
LAST_BREAK %r14
|
|
|
|
ext_skip:
|
|
|
|
stmg %r0,%r7,__PT_R0(%r11)
|
|
|
|
# %r8-%r15 of the interrupted context come from the save area
mvc __PT_R8(64,%r11),__LC_SAVE_AREA_ASYNC
|
|
|
|
stmg %r8,%r9,__PT_PSW(%r11)
|
2013-06-17 20:54:02 +08:00
|
|
|
# address __LC_EXT_PARAMS2 through %r1 instead of as a direct operand
# NOTE(review): presumably its offset exceeds the 12-bit displacement
# of mvc -- confirm against the lowcore layout
lghi %r1,__LC_EXT_PARAMS2
|
|
|
|
mvc __PT_INT_CODE(4,%r11),__LC_EXT_CPU_ADDR
|
|
|
|
mvc __PT_INT_PARM(4,%r11),__LC_EXT_PARAMS
|
|
|
|
mvc __PT_INT_PARM_LONG(8,%r11),0(%r1)
|
2014-04-15 18:55:07 +08:00
|
|
|
# clear the 8-byte pt_regs flags field
xc __PT_FLAGS(8,%r11),__PT_FLAGS(%r11)
|
2006-07-03 15:24:46 +08:00
|
|
|
TRACE_IRQS_OFF
|
2012-05-09 22:27:35 +08:00
|
|
|
# zero the backchain slot of the current stack frame
xc __SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
|
2011-12-27 18:27:15 +08:00
|
|
|
lgr %r2,%r11 # pass pointer to pt_regs
|
2013-06-27 15:01:09 +08:00
|
|
|
# second argument of do_IRQ: interrupt class
lghi %r3,EXT_INTERRUPT
|
|
|
|
brasl %r14,do_IRQ
|
2005-04-17 06:20:36 +08:00
|
|
|
j io_return
|
|
|
|
|
2012-03-11 23:59:27 +08:00
|
|
|
/*
|
|
|
|
* Load idle PSW. The second "half" of this function is in cleanup_idle.
|
|
|
|
*/
|
|
|
|
# psw_idle: builds a 16-byte PSW in the __SF_EMPTY area of the current stack
# frame -- first 8 bytes from %r3, second 8 bytes the address
# psw_idle_lpsw+4 -- stores clock and CPU timer at the offsets
# __CLOCK_IDLE_ENTER / __TIMER_IDLE_ENTER from %r2 and loads that PSW.
# psw_idle_lpsw+4 is the address of the "br %r14" that follows the 4-byte
# lpswe.
# NOTE(review): %r2 presumably points at a per-cpu idle data structure and
# %r3 carries the PSW mask chosen by the caller -- confirm against the C
# caller.  psw_idle and psw_idle_end are listed in cleanup_table, so the
# instruction layout between them matters to the critical-section cleanup.
ENTRY(psw_idle)
|
2012-07-20 17:15:08 +08:00
|
|
|
stg %r3,__SF_EMPTY(%r15)
|
2012-03-11 23:59:27 +08:00
|
|
|
larl %r1,psw_idle_lpsw+4
|
|
|
|
stg %r1,__SF_EMPTY+8(%r15)
|
2012-07-20 17:15:08 +08:00
|
|
|
STCK __CLOCK_IDLE_ENTER(%r2)
|
|
|
|
stpt __TIMER_IDLE_ENTER(%r2)
|
2012-03-11 23:59:27 +08:00
|
|
|
psw_idle_lpsw:
|
|
|
|
lpswe __SF_EMPTY(%r15)
|
|
|
|
br %r14
|
|
|
|
psw_idle_end:
|
|
|
|
|
2005-09-04 06:57:56 +08:00
|
|
|
__critical_end:
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* Machine check handler routines
|
|
|
|
*/
|
2011-07-24 16:48:19 +08:00
|
|
|
#
# mcck_int_handler: machine check interrupt entry.
#
# Register roles after the entry sequence, as in the other interrupt
# handlers of this file:
#   %r8/%r9  machine check old PSW
#   %r10     __LC_LAST_BREAK
#   %r11     pointer to pt_regs
#   %r12     thread_info pointer
#   %r13     address of system_call
#
# Flow:
#   1. Revalidate the CPU timer and the general registers from the lowcore
#      save areas.
#   2. System damage reported -> mcck_panic.
#   3. If the stored CPU timer value is not valid, restart the CPU timer
#      from the smallest of the sync-enter, async-enter, exit and
#      last-update timer values and use that as machine check enter time.
#   4. If PSW mask/address of the old PSW are not valid -> mcck_panic.
#   5. mcck_skip: build pt_regs and call s390_do_machine_check(pt_regs).
#   6. When returning to user space, move pt_regs to the kernel stack and
#      call s390_handle_mcck if _CIF_MCCK_PENDING is set.
#   7. mcck_return: restore the registers and resume with
#      lpswe __LC_RETURN_MCCK_PSW.
#
# NOTE(review): HANDLE_SIE_INTERCEPT, SWITCH_ASYNC, UPDATE_VTIME and
# LAST_BREAK are macros defined elsewhere in this file; %r11/%r15 are
# presumably set up by SWITCH_ASYNC -- confirm there.
#
ENTRY(mcck_int_handler)
	STCK	__LC_MCCK_CLOCK
	la	%r1,4095		# revalidate r1
	spt	__LC_CPU_TIMER_SAVE_AREA-4095(%r1)	# revalidate cpu timer
	lmg	%r0,%r15,__LC_GPREGS_SAVE_AREA-4095(%r1)# revalidate gprs
	lg	%r10,__LC_LAST_BREAK
	lg	%r12,__LC_THREAD_INFO
	larl	%r13,system_call
	lmg	%r8,%r9,__LC_MCK_OLD_PSW
	HANDLE_SIE_INTERCEPT %r14,4
	tm	__LC_MCCK_CODE,0x80	# system damage?
	jo	mcck_panic		# yes -> rest of mcck code invalid
	lghi	%r14,__LC_CPU_TIMER_SAVE_AREA
	mvc	__LC_MCCK_ENTER_TIMER(8),0(%r14)
	tm	__LC_MCCK_CODE+5,0x02	# stored cpu timer value valid?
	jo	3f
	# Stored timer value is unusable: let %r14 point at the smallest of
	# the four recorded timer values (clc compares them as unsigned
	# 8-byte quantities) and restart the CPU timer from it.
	la	%r14,__LC_SYNC_ENTER_TIMER
	clc	0(8,%r14),__LC_ASYNC_ENTER_TIMER
	jl	0f
	la	%r14,__LC_ASYNC_ENTER_TIMER
0:	clc	0(8,%r14),__LC_EXIT_TIMER
	jl	1f
	la	%r14,__LC_EXIT_TIMER
1:	clc	0(8,%r14),__LC_LAST_UPDATE_TIMER
	jl	2f
	la	%r14,__LC_LAST_UPDATE_TIMER
2:	spt	0(%r14)
	mvc	__LC_MCCK_ENTER_TIMER(8),0(%r14)
3:	tm	__LC_MCCK_CODE+2,0x09	# mwp + ia of old psw valid?
	jno	mcck_panic		# no -> skip cleanup critical
	SWITCH_ASYNC __LC_GPREGS_SAVE_AREA+64,__LC_PANIC_STACK,PAGE_SHIFT
	# The problem-state bit lives in the old PSW held in %r8, so it has to
	# be tested with the register form tmhh, exactly as io_int_handler and
	# ext_int_handler do.  The previous "tm %r8,0x0001" is a storage
	# operand test and does not look at the PSW in %r8 at all.
	tmhh	%r8,0x0001		# interrupting from user ?
	jz	mcck_skip
	UPDATE_VTIME %r14,__LC_MCCK_ENTER_TIMER
	LAST_BREAK %r14
mcck_skip:
	# %r8-%r15 of the interrupted context are the second half of the
	# general register save area
	lghi	%r14,__LC_GPREGS_SAVE_AREA+64
	stmg	%r0,%r7,__PT_R0(%r11)
	mvc	__PT_R8(64,%r11),0(%r14)
	stmg	%r8,%r9,__PT_PSW(%r11)
	xc	__PT_FLAGS(8,%r11),__PT_FLAGS(%r11)
	xc	__SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15)
	lgr	%r2,%r11		# pass pointer to pt_regs
	brasl	%r14,s390_do_machine_check
	tm	__PT_PSW+1(%r11),0x01	# returning to user ?
	jno	mcck_return
	lg	%r1,__LC_KERNEL_STACK	# switch to kernel stack
	mvc	STACK_FRAME_OVERHEAD(__PT_SIZE,%r1),0(%r11)
	xc	__SF_BACKCHAIN(8,%r1),__SF_BACKCHAIN(%r1)
	la	%r11,STACK_FRAME_OVERHEAD(%r1)
	lgr	%r15,%r1
	ssm	__LC_PGM_NEW_PSW	# turn dat on, keep irqs off
	tm	__LC_CPU_FLAGS+7,_CIF_MCCK_PENDING
	jno	mcck_return
	TRACE_IRQS_OFF
	brasl	%r14,s390_handle_mcck
	TRACE_IRQS_ON
mcck_return:
	lg	%r14,__LC_VDSO_PER_CPU
	lmg	%r0,%r10,__PT_R0(%r11)
	mvc	__LC_RETURN_MCCK_PSW(16),__PT_PSW(%r11) # move return PSW
	tm	__LC_RETURN_MCCK_PSW+1,0x01 # returning to user ?
	jno	0f
	stpt	__LC_EXIT_TIMER
	mvc	__VDSO_ECTG_BASE(16,%r14),__LC_EXIT_TIMER
	# %r11 is the base register of this load and is overwritten by it, so
	# this has to be the last access to pt_regs
0:	lmg	%r11,%r15,__PT_R11(%r11)
	lpswe	__LC_RETURN_MCCK_PSW

	# mcck_panic: the machine check information cannot be trusted.  Make
	# sure %r15 is on the panic stack (keep it when it already is within
	# one page below __LC_PANIC_STACK), reserve frame + pt_regs and join
	# the common path.
	# NOTE(review): this path bypasses SWITCH_ASYNC, so %r11 is not
	# visibly pointed at the new pt_regs before mcck_skip stores through
	# it -- confirm whether %r11 needs to be set up here.
mcck_panic:
	lg	%r14,__LC_PANIC_STACK
	slgr	%r14,%r15
	srag	%r14,%r14,PAGE_SHIFT
	jz	0f
	lg	%r15,__LC_PANIC_STACK
0:	aghi	%r15,-(STACK_FRAME_OVERHEAD + __PT_SIZE)
	j	mcck_skip
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2011-08-03 22:44:19 +08:00
|
|
|
#
|
|
|
|
# PSW restart interrupt handler
|
|
|
|
#
|
2012-03-11 23:59:26 +08:00
|
|
|
# restart_int_handler: PSW restart interrupt entry.
# Switches to __LC_RESTART_STACK, builds a zeroed pt_regs there that holds
# %r0-%r15 and the restart old PSW, adds a zeroed stack frame below it and
# calls the function at __LC_RESTART_FN with %r2 = __LC_RESTART_DATA and
# %r3 = __LC_RESTART_SOURCE.  A non-negative source CPU address is polled
# with SIGP SENSE first.  When the function returns, the CPU issues SIGP
# STOP to its own address and then spins.
ENTRY(restart_int_handler)
|
2011-12-27 18:27:15 +08:00
|
|
|
# park the interrupted %r15 in lowcore before switching stacks
stg %r15,__LC_SAVE_AREA_RESTART
|
2012-03-11 23:59:26 +08:00
|
|
|
lg %r15,__LC_RESTART_STACK
|
2011-12-27 18:27:15 +08:00
|
|
|
aghi %r15,-__PT_SIZE # create pt_regs on stack
|
2012-03-11 23:59:26 +08:00
|
|
|
xc 0(__PT_SIZE,%r15),0(%r15)
|
2011-12-27 18:27:15 +08:00
|
|
|
stmg %r0,%r14,__PT_R0(%r15)
|
|
|
|
mvc __PT_R15(8,%r15),__LC_SAVE_AREA_RESTART
|
|
|
|
mvc __PT_PSW(16,%r15),__LC_RST_OLD_PSW # store restart old psw
|
2012-03-11 23:59:26 +08:00
|
|
|
aghi %r15,-STACK_FRAME_OVERHEAD # create stack frame on stack
|
|
|
|
xc 0(STACK_FRAME_OVERHEAD,%r15),0(%r15)
|
2012-06-05 15:59:52 +08:00
|
|
|
lg %r1,__LC_RESTART_FN # load fn, parm & source cpu
|
|
|
|
lg %r2,__LC_RESTART_DATA
|
|
|
|
lg %r3,__LC_RESTART_SOURCE
|
2012-03-11 23:59:26 +08:00
|
|
|
ltgr %r3,%r3 # test source cpu address
|
|
|
|
jm 1f # negative -> skip source stop
|
2012-06-04 21:05:43 +08:00
|
|
|
0: sigp %r4,%r3,SIGP_SENSE # sigp sense to source cpu
|
2012-03-11 23:59:26 +08:00
|
|
|
# mask 10 = condition codes 0 and 2: repeat until SIGP answers with
# condition code 1 or 3
brc 10,0b # wait for status stored
|
|
|
|
1: basr %r14,%r1 # call function
|
|
|
|
stap __SF_EMPTY(%r15) # store cpu address
|
|
|
|
llgh %r3,__SF_EMPTY(%r15)
|
2012-06-04 21:05:43 +08:00
|
|
|
2: sigp %r4,%r3,SIGP_STOP # sigp stop to current cpu
|
2012-03-11 23:59:26 +08:00
|
|
|
# mask 2 = condition code 2: retry while SIGP reports busy
brc 2,2b
|
|
|
|
3: j 3b
|
2011-08-03 22:44:19 +08:00
|
|
|
|
2011-01-05 19:47:25 +08:00
|
|
|
/* The code that follows is placed in the .kprobes.text section. */
	.section .kprobes.text, "ax"

#ifdef CONFIG_CHECK_STACK
/*
 * Reached when the synchronous or the asynchronous stack has overflowed.
 * The system is going to panic anyway, so the registers are not saved
 * properly. A pt_regs is filled in on the panic stack only so that
 * show_trace can provide a good call trace.
 *
 * Register use as read from the code below: %r8/%r9 are stored into the
 * psw slot, %r10 is the last break value and %r14 points to 64 bytes
 * that are copied into the slots for gprs 8-15.
 */
stack_overflow:
	lg	%r15,__LC_PANIC_STACK		# continue on the panic stack
	la	%r11,STACK_FRAME_OVERHEAD(%r15)	# %r11 = pt_regs
	stmg	%r0,%r7,__PT_R0(%r11)
	stmg	%r8,%r9,__PT_PSW(%r11)
	mvc	__PT_R8(64,%r11),0(%r14)
	stg	%r10,__PT_ORIG_GPR2(%r11)	# last break goes to orig_gpr2
	xc	__SF_BACKCHAIN(8,%r15),__SF_BACKCHAIN(%r15) # zero the backchain
	lgr	%r2,%r11			# pointer to pt_regs for the callee
	jg	kernel_stack_overflow
#endif
|
|
|
|
|
2011-12-27 18:27:15 +08:00
|
|
|
/*
 * Address table used by cleanup_critical. Neighbouring entries delimit
 * the code ranges tested there, so the order of the entries and their
 * 8 byte spacing have to match the offsets used in cleanup_critical.
 */
	.align	8
cleanup_table:
	.quad	system_call		# +0
	.quad	sysc_do_svc		# +8
	.quad	sysc_tif		# +16
	.quad	sysc_restore		# +24
	.quad	sysc_done		# +32
	.quad	io_tif			# +40
	.quad	io_restore		# +48
	.quad	io_done			# +56
	.quad	psw_idle		# +64
	.quad	psw_idle_end		# +72
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
 * cleanup_critical: classify the address in %r9 against the ranges
 * described by cleanup_table and branch to the matching cleanup routine:
 *
 *   [system_call, sysc_do_svc)   -> cleanup_system_call
 *   [sysc_tif, sysc_restore)     -> cleanup_sysc_tif
 *   [sysc_restore, sysc_done)    -> cleanup_sysc_restore
 *   [io_tif, io_restore)         -> cleanup_io_tif
 *   [io_restore, io_done)        -> cleanup_io_restore
 *   [psw_idle, psw_idle_end)     -> cleanup_idle
 *
 * Any other address returns through %r14 without doing anything. The
 * cleanup routines return through %r14 as well.
 */
cleanup_critical:
	clg	%r9,BASED(cleanup_table)	# system_call
	jl	.Lcleanup_critical_none
	clg	%r9,BASED(cleanup_table+8)	# sysc_do_svc
	jl	cleanup_system_call
	clg	%r9,BASED(cleanup_table+16)	# sysc_tif
	jl	.Lcleanup_critical_none
	clg	%r9,BASED(cleanup_table+24)	# sysc_restore
	jl	cleanup_sysc_tif
	clg	%r9,BASED(cleanup_table+32)	# sysc_done
	jl	cleanup_sysc_restore
	clg	%r9,BASED(cleanup_table+40)	# io_tif
	jl	.Lcleanup_critical_none
	clg	%r9,BASED(cleanup_table+48)	# io_restore
	jl	cleanup_io_tif
	clg	%r9,BASED(cleanup_table+56)	# io_done
	jl	cleanup_io_restore
	clg	%r9,BASED(cleanup_table+64)	# psw_idle
	jl	.Lcleanup_critical_none
	clg	%r9,BASED(cleanup_table+72)	# psw_idle_end
	jl	cleanup_idle
.Lcleanup_critical_none:
	br	%r14
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
/*
 * cleanup_system_call: entered from cleanup_critical when the address in
 * %r9 lies in [system_call, sysc_do_svc). The parts of the system call
 * entry sequence that had not been executed yet are carried out here.
 * How far the interrupted code got is decided by comparing %r9 with the
 * addresses in cleanup_system_call_insn.
 *
 * %r11 points to the save area in use. It holds gprs 8-15 in consecutive
 * 8 byte slots, so 16(%r11) is %r10, 24(%r11) is %r11, 32(%r11) is %r12
 * and 56(%r11) is %r15. On return %r9 holds the address of sysc_do_svc.
 */
cleanup_system_call:
	/* check if stpt has been executed */
	clg	%r9,BASED(cleanup_system_call_insn)
	jh	.Lcleanup_sc_stmg
	mvc	__LC_SYNC_ENTER_TIMER(8),__LC_ASYNC_ENTER_TIMER
	cghi	%r11,__LC_SAVE_AREA_ASYNC
	je	.Lcleanup_sc_stmg
	mvc	__LC_SYNC_ENTER_TIMER(8),__LC_MCCK_ENTER_TIMER
.Lcleanup_sc_stmg:
	/* check if stmg has been executed */
	clg	%r9,BASED(cleanup_system_call_insn+8)
	jh	.Lcleanup_sc_regs
	mvc	__LC_SAVE_AREA_SYNC(64),0(%r11)
.Lcleanup_sc_regs:
	/* check if base register setup + TIF bit load has been done */
	clg	%r9,BASED(cleanup_system_call_insn+16)
	jhe	.Lcleanup_sc_utime
	/* set up saved registers r10 and r12 */
	stg	%r10,16(%r11)		# r10 last break
	stg	%r12,32(%r11)		# r12 thread-info pointer
.Lcleanup_sc_utime:
	/* check if the user time update has been done */
	clg	%r9,BASED(cleanup_system_call_insn+24)
	jh	.Lcleanup_sc_stime
	lg	%r15,__LC_EXIT_TIMER
	slg	%r15,__LC_SYNC_ENTER_TIMER
	alg	%r15,__LC_USER_TIMER
	stg	%r15,__LC_USER_TIMER
.Lcleanup_sc_stime:
	/* check if the system time update has been done */
	clg	%r9,BASED(cleanup_system_call_insn+32)
	jh	.Lcleanup_sc_stamp
	lg	%r15,__LC_LAST_UPDATE_TIMER
	slg	%r15,__LC_EXIT_TIMER
	alg	%r15,__LC_SYSTEM_TIMER
	stg	%r15,__LC_SYSTEM_TIMER
.Lcleanup_sc_stamp:
	/* update accounting time stamp */
	mvc	__LC_LAST_UPDATE_TIMER(8),__LC_SYNC_ENTER_TIMER
	/* do LAST_BREAK: skipped when the saved r10 shifted right by 23 is 0 */
	lg	%r9,16(%r11)
	srag	%r9,%r9,23
	jz	.Lcleanup_sc_ptregs
	mvc	__TI_last_break(8,%r12),16(%r11)
.Lcleanup_sc_ptregs:
	/* set up saved register r11 */
	lg	%r15,__LC_KERNEL_STACK
	la	%r9,STACK_FRAME_OVERHEAD(%r15)
	stg	%r9,24(%r11)		# r11 pt_regs pointer
	/* fill pt_regs */
	mvc	__PT_R8(64,%r9),__LC_SAVE_AREA_SYNC
	stmg	%r0,%r7,__PT_R0(%r9)
	mvc	__PT_PSW(16,%r9),__LC_SVC_OLD_PSW
	mvc	__PT_INT_CODE(4,%r9),__LC_SVC_ILC
	xc	__PT_FLAGS(8,%r9),__PT_FLAGS(%r9)
	mvi	__PT_FLAGS+7(%r9),_PIF_SYSCALL
	/* set up saved register r15 */
	stg	%r15,56(%r11)		# r15 stack pointer
	/* set new psw address and exit */
	larl	%r9,sysc_do_svc
	br	%r14
/*
 * Progress markers for cleanup_system_call, indexed in steps of 8 bytes.
 * The last two entries are byte offsets into the code at sysc_vtime and
 * have to be adjusted whenever that instruction sequence changes.
 */
cleanup_system_call_insn:
	.quad	system_call		# +0  stpt check
	.quad	sysc_stmg		# +8  stmg check
	.quad	sysc_per		# +16 register setup check
	.quad	sysc_vtime+18		# +24 user time check
	.quad	sysc_vtime+42		# +32 system time check
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2010-05-17 16:00:02 +08:00
|
|
|
/*
 * cleanup_sysc_tif: entered from cleanup_critical for addresses in
 * [sysc_tif, sysc_restore). Sets the address in %r9 back to sysc_tif.
 */
cleanup_sysc_tif:
	larl	%r9,sysc_tif		# new address is the start of sysc_tif
	br	%r14
|
|
|
|
|
2010-05-17 16:00:02 +08:00
|
|
|
/*
 * cleanup_sysc_restore: entered from cleanup_critical for addresses in
 * [sysc_restore, sysc_done). Unless %r9 is exactly sysc_done - 4, the
 * return psw, gprs 8-15 and gprs 0-7 are taken again from the pt_regs
 * whose pointer was saved in the r11 slot at 24(%r11). In both cases
 * %r8/%r9 are then loaded from __LC_RETURN_PSW.
 * NOTE(review): sysc_done - 4 is presumably the final psw load of the
 * exit path, where everything is already restored - confirm against the
 * code at sysc_done.
 */
cleanup_sysc_restore:
	clg	%r9,BASED(cleanup_sysc_restore_insn)
	je	.Lcleanup_sysc_restore_psw
	lg	%r9,24(%r11)		# saved pointer to pt_regs
	mvc	__LC_RETURN_PSW(16),__PT_PSW(%r9)
	mvc	0(64,%r11),__PT_R8(%r9)	# gprs 8-15 into the save area
	lmg	%r0,%r7,__PT_R0(%r9)
.Lcleanup_sysc_restore_psw:
	lmg	%r8,%r9,__LC_RETURN_PSW
	br	%r14
cleanup_sysc_restore_insn:
	.quad	sysc_done - 4
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2010-05-17 16:00:02 +08:00
|
|
|
/*
 * cleanup_io_tif: entered from cleanup_critical for addresses in
 * [io_tif, io_restore). Sets the address in %r9 back to io_tif.
 */
cleanup_io_tif:
	larl	%r9,io_tif		# new address is the start of io_tif
	br	%r14
|
|
|
|
|
2010-05-17 16:00:02 +08:00
|
|
|
/*
 * cleanup_io_restore: entered from cleanup_critical for addresses in
 * [io_restore, io_done). Unless %r9 is exactly io_done - 4, the return
 * psw, gprs 8-15 and gprs 0-7 are taken again from the pt_regs whose
 * pointer was saved in the r11 slot at 24(%r11). In both cases %r8/%r9
 * are then loaded from __LC_RETURN_PSW.
 * NOTE(review): io_done - 4 is presumably the final psw load of the exit
 * path, where everything is already restored - confirm against the code
 * at io_done.
 */
cleanup_io_restore:
	clg	%r9,BASED(cleanup_io_restore_insn)
	je	.Lcleanup_io_restore_psw
	lg	%r9,24(%r11)		# saved r11 pointer to pt_regs
	mvc	__LC_RETURN_PSW(16),__PT_PSW(%r9)
	mvc	0(64,%r11),__PT_R8(%r9)	# gprs 8-15 into the save area
	lmg	%r0,%r7,__PT_R0(%r9)
.Lcleanup_io_restore_psw:
	lmg	%r8,%r9,__LC_RETURN_PSW
	br	%r14
cleanup_io_restore_insn:
	.quad	io_done - 4
|
2005-09-04 06:57:56 +08:00
|
|
|
|
2012-03-11 23:59:27 +08:00
|
|
|
/*
 * cleanup_idle: entered from cleanup_critical for addresses in
 * [psw_idle, psw_idle_end). Records the idle exit clock and cpu timer,
 * fills in the idle enter values if the interrupt arrived before
 * psw_idle_lpsw, updates the steal and system time accounting and sets
 * up %r8/%r9 so that execution resumes at the address saved in the r14
 * slot at 48(%r11).
 *
 * %r2 is the base for the __CLOCK_IDLE_* and __TIMER_IDLE_* fields.
 * NOTE(review): presumably the idle data pointer handed to psw_idle -
 * confirm against psw_idle.
 */
cleanup_idle:
	/* copy interrupt clock & cpu timer */
	mvc	__CLOCK_IDLE_EXIT(8,%r2),__LC_INT_CLOCK
	mvc	__TIMER_IDLE_EXIT(8,%r2),__LC_ASYNC_ENTER_TIMER
	cghi	%r11,__LC_SAVE_AREA_ASYNC
	je	.Lcleanup_idle_check
	mvc	__CLOCK_IDLE_EXIT(8,%r2),__LC_MCCK_CLOCK
	mvc	__TIMER_IDLE_EXIT(8,%r2),__LC_MCCK_ENTER_TIMER
.Lcleanup_idle_check:
	/* check if stck & stpt have been executed */
	clg	%r9,BASED(cleanup_idle_insn)
	jhe	.Lcleanup_idle_account
	mvc	__CLOCK_IDLE_ENTER(8,%r2),__CLOCK_IDLE_EXIT(%r2)
	mvc	__TIMER_IDLE_ENTER(8,%r2),__TIMER_IDLE_EXIT(%r2)
.Lcleanup_idle_account:
	/*
	 * account system time going idle:
	 *   steal timer  += idle enter clock - last update clock
	 *   system timer += last update timer - idle enter timer
	 * and both last update values move on to the idle exit values
	 */
	lg	%r9,__LC_STEAL_TIMER
	alg	%r9,__CLOCK_IDLE_ENTER(%r2)
	slg	%r9,__LC_LAST_UPDATE_CLOCK
	stg	%r9,__LC_STEAL_TIMER
	mvc	__LC_LAST_UPDATE_CLOCK(8),__CLOCK_IDLE_EXIT(%r2)
	lg	%r9,__LC_SYSTEM_TIMER
	alg	%r9,__LC_LAST_UPDATE_TIMER
	slg	%r9,__TIMER_IDLE_ENTER(%r2)
	stg	%r9,__LC_SYSTEM_TIMER
	mvc	__LC_LAST_UPDATE_TIMER(8),__TIMER_IDLE_EXIT(%r2)
	/* prepare return psw */
	nihh	%r8,0xfcfd		# clear irq & wait state bits
	lg	%r9,48(%r11)		# return from psw_idle
	br	%r14
cleanup_idle_insn:
	.quad	psw_idle_lpsw
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
/*
 * Integer constants
 *
 * Start address and length in bytes of the range that runs from
 * __critical_start to __critical_end.
 */
	.align	8
.Lcritical_start:
	.quad	__critical_start
.Lcritical_length:
	.quad	__critical_end - __critical_start
|
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2013-11-01 17:08:20 +08:00
|
|
|
#if IS_ENABLED(CONFIG_KVM)
/*
 * sie64a calling convention:
 * %r2 pointer to sie control block
 * %r3 guest register save area
 *
 * Returns the exit reason code in %r2. The code is read from
 * __SF_EMPTY+24(%r15), which is zeroed on entry and set to -EFAULT by
 * sie_fault.
 *
 * Stack frame use:
 *   __SF_EMPTY      control block pointer, also the operand of the
 *                   guest id LPP
 *   __SF_EMPTY+8    guest register save area
 *   __SF_EMPTY+16   zeroed, operand of the host id LPP
 *   __SF_EMPTY+24   exit reason code
 */
ENTRY(sie64a)
	stmg	%r6,%r14,__SF_GPRS(%r15)	# save kernel registers
	stg	%r2,__SF_EMPTY(%r15)		# keep control block pointer
	stg	%r3,__SF_EMPTY+8(%r15)		# keep guest register save area
	xc	__SF_EMPTY+16(16,%r15),__SF_EMPTY+16(%r15) # host id & reason
	lmg	%r0,%r13,0(%r3)			# load guest gprs 0-13
	lg	%r14,__LC_GMAP			# gmap pointer
	ltgr	%r14,%r14
	jz	sie_gmap			# no gmap: keep the current asce
	lctlg	%c1,%c1,__GMAP_ASCE(%r14)	# load primary asce
sie_gmap:
	lg	%r14,__SF_EMPTY(%r15)		# control block pointer
	oi	__SIE_PROG0C+3(%r14),1		# we are going into SIE now
	tm	__SIE_PROG20+3(%r14),1		# low bit of the prog20 byte set?
	jnz	sie_done			# yes: do not enter SIE
	LPP	__SF_EMPTY(%r15)		# set guest id
	sie	0(%r14)
sie_done:
	LPP	__SF_EMPTY+16(%r15)		# set host id
	ni	__SIE_PROG0C+3(%r14),0xfe	# no longer in SIE
	lctlg	%c1,%c1,__LC_USER_ASCE		# load primary asce
/*
 * Some program checks are suppressing. C code (e.g.
 * do_protection_exception) will rewind the PSW by the ILC, which is
 * 4 bytes in case of SIE. Other instructions between sie64a and sie_done
 * should not cause program interrupts. So let us use a nop (47 00 00 00)
 * as a landing pad.
 * See also HANDLE_SIE_INTERCEPT
 */
rewind_pad:
	nop	0
	.globl sie_exit
sie_exit:
	lg	%r14,__SF_EMPTY+8(%r15)		# guest register save area
	stmg	%r0,%r13,0(%r14)		# save guest gprs 0-13
	lmg	%r6,%r14,__SF_GPRS(%r15)	# restore kernel registers
	lg	%r2,__SF_EMPTY+24(%r15)		# return exit reason code
	br	%r14
sie_fault:
	lghi	%r14,-EFAULT
	stg	%r14,__SF_EMPTY+24(%r15)	# set exit reason code
	j	sie_exit

/* Start address and length in bytes of the range sie_gmap..sie_done. */
	.align	8
.Lsie_critical:
	.quad	sie_gmap
.Lsie_critical_length:
	.quad	sie_done - sie_gmap

/* Exception table entries: both addresses are fixed up at sie_fault. */
	EX_TABLE(rewind_pad,sie_fault)
	EX_TABLE(sie_exit,sie_fault)
#endif
|
|
|
|
|
2006-09-28 22:56:37 +08:00
|
|
|
/*
 * System call tables, placed in .rodata. syscalls.S is included once per
 * table with SYSCALL redefined to emit a .long of one of its arguments:
 * the second one (esame) for sys_call_table and the third one (emu) for
 * sys_call_table_emu, which only exists with CONFIG_COMPAT.
 * NOTE(review): syscalls.S is presumably a plain list of SYSCALL(...)
 * lines - confirm against that file.
 */
	.section .rodata, "a"
#define SYSCALL(esa,esame,emu) .long esame
	.globl	sys_call_table
sys_call_table:
#include "syscalls.S"
#undef SYSCALL

#ifdef CONFIG_COMPAT

#define SYSCALL(esa,esame,emu) .long emu
	.globl	sys_call_table_emu
sys_call_table_emu:
#include "syscalls.S"
#undef SYSCALL
#endif
|