PERFORCE change 29108 for review

Marcel Moolenaar marcel at FreeBSD.org
Thu Apr 17 00:32:15 PDT 2003


http://perforce.freebsd.org/chv.cgi?CH=29108

Change 29108 by marcel at marcel_nfs on 2003/04/17 00:32:02

	Finish the rudimenary EPC syscall code. Of course this is
	still missing the signal handling, but at least it gets us
	to the first fork(2). This is the point I needed to get to
	so that I can finish fork_trampoline (I now have a quick
	and dirty version that only works for the very first process
	(ie init).
	
	Change the syscall stub to use ar.k5 instead of ar.k3.
	
	Also: we didn't save the frame marker and return pointer
	of the function calling a syscall stub and thus got lost
	in the forest that is code on our way back. To keep the
	stubs small (but mostly generatable) we save the frame
	marker and return pointer of the function calling a
	syscall stub in registers and pass them on to the EPC
	syscall code. There we restore them for the process.
	Note that this is caused by the requirement to use a
	call to go to the EPC gateway page, because we need to
	lower the privilege level on our way back. This can only
	be done by a return. Otherwise I would have avoided the
	call so that we would not clobber the frame marker and
	return pointer.
	
	Oh, and we now use spills to store the syscall argument
	in memory. The reasoning is this: We don't know how many
	arguments a syscall has, but we know that 8 is the max.
	Hence, we may be reading garbage, including NaTs. If we
	don't spill, we could therefore get a NaT consumption fault.
	and since we're already in kernel mode, this is bad. By
	spilling we basicly ignore the NaT bits (if any).

Affected files ...

.. //depot/projects/ia64_epc/sys/ia64/ia64/syscall.s#6 edit
.. //depot/projects/ia64_epc/sys/ia64/include/asm.h#3 edit

Differences ...

==== //depot/projects/ia64_epc/sys/ia64/ia64/syscall.s#6 (text+ko) ====

@@ -30,26 +30,32 @@
 #include <assym.s>
 
 /*
- * A process performs a syscall by calling epc_syscall through the EPC
- * gateway page. The address of the gateway page is passed to the process
- * in ar.k3.
+ * A process performs a syscall by performing an indirect call to the
+ * address stored in ar.k5. The contents ar.pfs and rp should be saved
+ * prior to the syscall in r9 and r10 respectively. The kernel will
+ * restore these values on return. The value of gp is preserved across
+ * the call.
+ * The address in ar.k5 is the start of the EPC gateway page. The code
+ * in the gateway page is primarily responsible for increasing the
+ * privilege level, but will also make sure we have a reliable psr.
  *
- * Syscalls don't follow the calling convention completely. The reason
- * for this is that it would create unnecessary overhead. Arguments to
- * syscalls are:
+ * A process defines:
  *	r8		-	syscall number
  *	r9		-	copy of ar.pfs
+ *	r10		-	copy of rp
  *	in0-in7		-	syscall arguments
- *	b6		-	return address
  *
- * Syscalls return:
+ * A syscall returns:
  *	r8+r9		-	syscall return value(s)
  *	r10		-	syscall error flag
+ *	ar.pfs		-	restored from r9
+ *	rp		-	restored from r10
+ *	gp		-	preserved
  *
- * The EPC gateway code prefetches the following:
- *	r14		-	prefetched ar.k7
- *	r15		-	prefetched ar.k6
- *	p15		-	true for fork(2)
+ * The EPC defines:
+ *	r11		-	copy of psr.l
+ *	r14		-	Kernel memory stack
+ *	r15		-	Kernel register stack
  */
 
 	.section	.text.gateway, "ax"
@@ -63,16 +69,29 @@
 	;;
 }
 {	.mlx
-	add		r30=-1,r0		// XXX
+	mov		r11=psr
 	movl		r31=epc_syscall
 	;;
 }
 {	.mib
-	cmp.eq		p15,p0=r30,r8
+	rum		psr.be
 	mov		b7=r31
 	br		b7
 	;;
 }
+gw_ret:
+{	.mmi
+	mov		ar.rnat=r22
+	mov		ar.rsc=r24
+	mov		ar.pfs=r28
+}
+{	.mib
+	mov		ar.fpsr=r25
+	mov		b0=r29
+	br.sptk		b6
+	;;
+}
+
 	.align		PAGE_SIZE
 
 
@@ -82,99 +101,139 @@
 	.regstk		8,0,0,0
 epc_syscall:
 {	.mmi
-	mov		r17=ar.rsc
-	mov		r18=ar.unat
+	mov		r16=ar.rsc
+	mov		ar.rsc=0
+	mov		r17=r13
+	;;
+}
+{	.mmi
+	mov		r18=ar.bspstore
+	mov		r19=ar.rnat
 	add		r30=-SIZEOF_TRAPFRAME,r14
 	;;
 }
 {	.mmi
-	mov		ar.rsc=0
-	mov		r19=ar.fpsr
+	mov		ar.bspstore=r15
+	mov		r13=ar.k4
 	dep		r30=0,r30,0,10
 	;;
 }
-{	.mmi
-	mov		r21=ar.bspstore
-	mov		r22=ar.rnat
-	mov		r23=r13
+{	.mii
+	mov		r20=sp
+	add		r31=8,r30
+	add		sp=-16,r30
 	;;
 }
 {	.mmi
-	mov		ar.bspstore=r15
-	add		r31=8,r30
-	mov		r20=sp
+	mov		r21=ar.unat
+	mov		r22=ar.fpsr
+	sub		r29=r14,r30
 	;;
 }
 {	.mmi
+	mov		r23=ar.bsp
 	mov		ar.rsc=3
-	add		sp=-16,r30
-	sub		r29=r14,r30
+	add		r28=FRAME_SYSCALL,r0
 	;;
 }
 {	.mmi
 	st8		[r30]=r29,16		// tf_length
-	mov		r24=ar.bsp
-	add		r29=FRAME_SYSCALL,r0
+	st8		[r31]=r28,16		// tf_flags
+	mov		r24=rp
+	;;
+}
+{	.mmi
+	st8		[r30]=r20,16		// sp
+	st8		[r31]=r21,16		// unat
+	mov		r25=pr
+	;;
+}
+{	.mmi
+	st8		[r30]=r24,16		// rp (syscall stub)
+	st8		[r31]=r25,16		// pr
+	mov		r26=ar.pfs
 	;;
 }
 {	.mmi
-	st8		[r31]=r29,16		// tf_flags
-	mov		r27=psr
-	mov		r25=b6
+	st8		[r30]=r26,16		// pfs (syscall stub)
+	st8		[r31]=r18,16		// bspstore
+	sub		r27=r23,r15
 	;;
 }
 {	.mmi
-	st8		[r30]=r20,16		// sp
-	st8		[r31]=r18,16		// unat
-	mov		r26=pr
+	st8		[r30]=r19,16		// rnat
+	st8		[r31]=r0,16		// __spare
+	nop		0
 	;;
 }
 {	.mmi
-	st8		[r30]=r25,16		// rp
-	st8		[r31]=r26,16		// pr
-	sub		r24=r24,r15
+	st8		[r30]=r17,16		// tp
+	st8		[r31]=r16,16		// rsc
+	nop		0
 	;;
 }
 {	.mmi
-	st8		[r30]=r9,16		// pfs
-	st8		[r31]=r21,16		// bspstore
+	st8		[r30]=r22,16		// fpsr
+	st8		[r31]=r11,16		// psr
 	nop		0
 	;;
 }
 {	.mmi
-	st8		[r30]=r22,16		// rnat
-	st8		[r31]=r24,16		// __spare (=ndirty)
+	st8		[r30]=r1,16		// gp
+	st8		[r31]=r27,16		// ndirty
 	nop		0
 	;;
 }
 {	.mmi
-	st8		[r30]=r23,16		// tp
-	st8		[r31]=r17,16		// rsc
+	st8		[r30]=r9,16		// pfs (syscall caller)
+	st8		[r31]=r10,16		// rp (syscall caller)
 	nop		0
 	;;
 }
 {	.mmi
-	st8		[r30]=r19,128		// fpsr
-	st8		[r31]=r27,128		// psr
+	st8		[r30]=r0,80		// ifa
+	st8		[r31]=r0,80		// isr
 	nop		0
 	;;
 }
+{	.mmi
 	st8		[r30]=r8,16		// syscall number (=r15)
-	st8		[r31]=r32,16		// arg0 (=r16)
+	.mem.offset	0,0
+	st8.spill	[r31]=r32,16		// arg0 (=r16)
+	nop		0
 	;;
-	st8		[r30]=r33,16		// arg1 (=r17)
-	st8		[r31]=r34,16		// arg2 (=r18)
+}
+{	.mmi
+	.mem.offset	8,0
+	st8.spill	[r30]=r33,16		// arg1 (=r17)
+	.mem.offset	16,0
+	st8.spill	[r31]=r34,16		// arg2 (=r18)
+	nop		0
 	;;
-	st8		[r30]=r35,16		// arg3 (=r19)
-	st8		[r31]=r36,16		// arg4 (=r20)
+}
+{	.mmi
+	.mem.offset	24,0
+	st8.spill	[r30]=r35,16		// arg3 (=r19)
+	.mem.offset	32,0
+	st8.spill	[r31]=r36,16		// arg4 (=r20)
+	nop		0
 	;;
-	st8		[r30]=r37,16		// arg5 (=r21)
-	st8		[r31]=r38,16		// arg6 (=r22)
+}
+{	.mmi
+	.mem.offset	40,0
+	st8.spill	[r30]=r37,16		// arg5 (=r21)
+	.mem.offset	48,0
+	st8.spill	[r31]=r38,16		// arg6 (=r22)
+	nop		0
 	;;
-	st8		[r30]=r39,8		// arg7 (=r23)
-	mov		r13=ar.k4
+}
+{	.mmi
+	.mem.offset	56,0
+	st8.spill	[r30]=r39,8		// arg7 (=r23)
+	ssm		psr.dfh|psr.ac
+	nop		0
 	;;
-
+}
 {	.mlx
 	alloc		r14=ar.pfs,0,0,3,0
 	movl		gp=__gp
@@ -187,10 +246,109 @@
 	;;
 }
 {	.mfb
-	ssm		psr.dfh
+	srlz.d
 	nop		0
 	br.call.sptk	rp=syscall
 	;;
 }
-	break		0
+
+	.global		syscall_return
+	.type		syscall_return, @function
+syscall_return:
+{	.mmi
+	alloc		r31=ar.pfs,0,0,0,0
+	add		r14=32,sp
+	add		r15=16,sp
+	;;
+}
+{	.mmi
+	ld8		r31=[r15],24		// tf_length
+	ld8		r16=[r14],16		// sp
+	add		sp=16,sp
+	;;
+}
+{	.mmi
+	ld8		r17=[r15],16		// unat (before)
+	ld8		r18=[r14],16		// rp (syscall stub)
+	add		r31=r31,sp
+	;;
+}
+{	.mmi
+	ld8		r19=[r15],16		// pr
+	ld8		r20=[r14],16		// pfs (syscall stub)
+	mov		sp=r16
+	;;
+}
+{	.mmi
+	ld8		r21=[r15],24		// bspstore
+	ld8		r22=[r14],24		// rnat
+	mov		b6=r18
+	;;
+}
+{	.mmi
+	ld8		r23=[r15],16		// tp
+	ld8		r24=[r14],16		// rsc
+	mov		pr=r19,0x1fffe
+	;;
+}
+{	.mmi
+	ld8		r25=[r15],16		// fpsr
+	ld8		r26=[r14],16		// psr
+	mov		ar.pfs=r20
+	;;
+}
+{	.mmi
+	ld8		gp=[r15],16		// gp
+	ld8		r27=[r14],16		// ndirty
+	nop		0
+	;;
+}
+{	.mmi
+	ld8		r28=[r15],56		// pfs (syscall caller)
+	ld8		r29=[r14],56		// rp (syscall caller)
+	shl		r27=r27,16
+	;;
+}
+{	.mmi
+	ld8		r8=[r15],16		// r8
+	mov		ar.rsc=r27
+	nop		0
+	;;
+}
+{	.mmi
+	ld8		r9=[r14]		// r9
+	ld8		r10=[r15]		// r10
+	nop		0
+	;;
+}
+{	.mmi
+	loadrs
+	mov		ar.k7=r31
+	dep		r26=-1,r26,19,1		// Set psr.dfh
+	;;
+}
+{	.mmi
+	mov		r31=ar.bspstore
+	mov		ar.bspstore=r21
+	mov		r13=r23
+	;;
+}
+{	.mmi
+	mov		r14=ar.k5
+	mov		ar.k6=r31
+	nop		0
+	;;
+}
+{	.mmi
+	mov		psr.l=r26
+	mov		ar.unat=r17
+	add		r14=gw_ret-ia64_gateway_page,r14
+	;;
+}
+{	.mib
+	srlz.d
+	mov		b7=r14
+	br.ret.sptk	b7
+	;;
+}
 	.endp		epc_syscall

==== //depot/projects/ia64_epc/sys/ia64/include/asm.h#3 (text+ko) ====

@@ -164,11 +164,12 @@
 #define	EPC_CALLSYS_NOERROR(name)				\
 {	.mmi ;							\
 	alloc		r9 = ar.pfs, 0, 0, 8, 0 ;		\
-	mov		r14 = ar.k3 ;; }			\
+	mov		r31 = ar.k5 ;				\
+	mov		r10 = b0 ;; }				\
 {	.mib ;							\
 	mov		r8 = SYSCALLNUM(name) ;			\
-	mov		b7 = r14 ; 				\
-	br.call.sptk	b6 = b7 }
+	mov		b7 = r31 ; 				\
+	br.call.sptk	b0 = b7 ;; }
 
 
 /*


More information about the p4-projects mailing list