Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/netbsd-8]: src/sys Pull up following revision(s) (requested by maxv in t...



details:   https://anonhg.NetBSD.org/src/rev/4d14f7d1a987
branches:  netbsd-8
changeset: 434285:4d14f7d1a987
user:      snj <snj%NetBSD.org@localhost>
date:      Mon Sep 04 20:41:28 2017 +0000

description:
Pull up following revision(s) (requested by maxv in ticket #257):
        sys/compat/linux/arch/amd64/linux_machdep.c: 1.52
        sys/arch/amd64/amd64/copy.S: 1.21-1.24
        sys/arch/amd64/amd64/locore.S: 1.125
        sys/arch/amd64/amd64/machdep.c: 1.256
Fix a bug in ucas_32 and ucas_64. There is a branch where they don't
initialize %rax.
--
style, reduces an incoming diff
00
Split comment, otherwise it is misleading. kcopy operates on kernel
memory, and must *not* be used with userland pages.
--
Move incq outside of the copy section. No functional change, reduces
my smap diff.
--
Remove dumb debug code and outdated comment.
--
Don't forget to clean l_md.md_flags, otherwise there may be MDL_COMPAT32,
in which case the kernel would always use iret (slower).

diffstat:

 sys/arch/amd64/amd64/copy.S                 |  82 ++++++++++++++++------------
 sys/arch/amd64/amd64/locore.S               |  10 +---
 sys/arch/amd64/amd64/machdep.c              |   6 +-
 sys/compat/linux/arch/amd64/linux_machdep.c |   6 +-
 4 files changed, 57 insertions(+), 47 deletions(-)

diffs (truncated from 334 to 300 lines):

diff -r aa730cafdb1a -r 4d14f7d1a987 sys/arch/amd64/amd64/copy.S
--- a/sys/arch/amd64/amd64/copy.S       Mon Sep 04 16:11:37 2017 +0000
+++ b/sys/arch/amd64/amd64/copy.S       Mon Sep 04 20:41:28 2017 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: copy.S,v 1.20 2015/12/09 16:55:18 maxv Exp $   */
+/*     $NetBSD: copy.S,v 1.20.10.1 2017/09/04 20:41:28 snj Exp $       */
 
 /*
  * Copyright (c) 2001 Wasabi Systems, Inc.
@@ -44,8 +44,8 @@
 #include <machine/frameasm.h>
 
 #define GET_CURPCB(reg)        \
-       movq    CPUVAR(CURLWP), reg; \
-       movq    L_PCB(reg), reg
+       movq    CPUVAR(CURLWP),reg; \
+       movq    L_PCB(reg),reg
 
 /*
  * These are arranged so that the abnormal case is a forwards
@@ -55,10 +55,10 @@
 #define DEFERRED_SWITCH_CHECK \
        CHECK_DEFERRED_SWITCH                   ; \
        jnz     99f                             ; \
-    98:
+98:
 
 #define DEFERRED_SWITCH_CALL \
-    99:                                                ; \
+99:                                            ; \
        call    _C_LABEL(do_pmap_load)          ; \
        jmp     98b
 
@@ -85,18 +85,18 @@
        pushq   %rdx
        pushq   %rcx
        pushq   %rbx
-       movq    CPUVAR(CURLWP), %rbx
+       movq    CPUVAR(CURLWP),%rbx
 1:
        incl    L_NOPREEMPT(%rbx)
        call    _C_LABEL(pmap_load)
        decl    L_NOPREEMPT(%rbx)
        jnz     2f
-       cmpl    $0, L_DOPREEMPT(%rbx)
+       cmpl    $0,L_DOPREEMPT(%rbx)
        jz      2f
-       xorq    %rdi, %rdi
+       xorq    %rdi,%rdi
        call    _C_LABEL(kpreempt)
 2:
-       cmpl    $0, CPUVAR(WANT_PMAPLOAD)
+       cmpl    $0,CPUVAR(WANT_PMAPLOAD)
        jnz     1b
        popq    %rbx
        popq    %rcx
@@ -107,9 +107,6 @@
        ret
 
 /*
- * int kcopy(const void *from, void *to, size_t len);
- * Copy len bytes, abort on fault.
- *
  * Copy routines from and to userland, plus a few more. See the
  * section 9 manpages for info. Some cases can be optimized more.
  *
@@ -125,6 +122,10 @@
  * be ably to do cache-line size copies....
  */
 
+/*
+ * int kcopy(const void *from, void *to, size_t len);
+ * Copy len bytes from and to kernel memory, and abort on fault.
+ */
 ENTRY(kcopy)
        xchgq   %rdi,%rsi
        movq    %rdx,%rcx
@@ -194,6 +195,7 @@
        rep
        movsb                           /* copy remaining bytes */
 .Lcopyout_end:
+
        xorl    %eax,%eax
        ret
        DEFERRED_SWITCH_CALL
@@ -221,6 +223,7 @@
        rep
        movsb
 .Lcopyin_end:
+
        xorl    %eax,%eax
        ret
        DEFERRED_SWITCH_CALL
@@ -256,9 +259,9 @@
        jae     1f
        movq    %rax,%rdx
        movq    %rax,%r8
-.Lcopyoutstr_start:
 1:     incq    %rdx
 
+.Lcopyoutstr_start:
 1:     decq    %rdx
        jz      2f
        lodsb
@@ -266,6 +269,7 @@
        testb   %al,%al
        jnz     1b
 .Lcopyoutstr_end:
+
        /* Success -- 0 byte reached. */
        decq    %rdx
        xorq    %rax,%rax
@@ -295,9 +299,9 @@
        jae     1f
        movq    %rax,%rdx
        movq    %rax,%r8
-.Lcopyinstr_start:
 1:     incq    %rdx
 
+.Lcopyinstr_start:
 1:     decq    %rdx
        jz      2f
        lodsb
@@ -363,7 +367,7 @@
 
 
 ENTRY(fuswintr)
-       cmpl    $TLBSTATE_VALID, CPUVAR(TLBSTATE)
+       cmpl    $TLBSTATE_VALID,CPUVAR(TLBSTATE)
        jnz     _C_LABEL(fusuaddrfault)
        movq    $VM_MAXUSER_ADDRESS-2,%r11
        cmpq    %r11,%rdi
@@ -371,7 +375,9 @@
        GET_CURPCB(%rcx)
        leaq    _C_LABEL(fusuintrfailure)(%rip),%r11
        movq    %r11,PCB_ONFAULT(%rcx)
+
        movzwl  (%rdi),%eax
+
        movq    $0,PCB_ONFAULT(%rcx)
        ret
 
@@ -383,13 +389,15 @@
        GET_CURPCB(%rcx)
        leaq    _C_LABEL(fusufailure)(%rip),%r11
        movq    %r11,PCB_ONFAULT(%rcx)
+
        movzbl  (%rdi),%eax
+
        movq    $0,PCB_ONFAULT(%rcx)
        ret
        DEFERRED_SWITCH_CALL
 
 ENTRY(suswintr)
-       cmpl    $TLBSTATE_VALID, CPUVAR(TLBSTATE)
+       cmpl    $TLBSTATE_VALID,CPUVAR(TLBSTATE)
        jnz     _C_LABEL(fusuaddrfault)
        movq    $VM_MAXUSER_ADDRESS-2,%r11
        cmpq    %r11,%rdi
@@ -397,7 +405,9 @@
        GET_CURPCB(%rcx)
        leaq    _C_LABEL(fusuintrfailure)(%rip),%r11
        movq    %r11,PCB_ONFAULT(%rcx)
+
        movw    %si,(%rdi)
+
        xorq    %rax,%rax
        movq    %rax,PCB_ONFAULT(%rcx)
        ret
@@ -413,6 +423,7 @@
        movq    %r11,PCB_ONFAULT(%rcx)
 
        movb    %sil,(%rdi)
+
        xorq    %rax,%rax
        movq    %rax,PCB_ONFAULT(%rcx)
        ret
@@ -444,21 +455,23 @@
 ENTRY(ucas_64)
        DEFERRED_SWITCH_CHECK
        /* Fail if kernel-space */
-       movq    $VM_MAXUSER_ADDRESS-8, %r8
-       cmpq    %r8, %rdi
-       ja      _C_LABEL(ucas_fault)
-       movq    %rsi, %rax
+       movq    $VM_MAXUSER_ADDRESS-8,%r8
+       cmpq    %r8,%rdi
+       ja      _C_LABEL(ucas_efault)
+       movq    %rsi,%rax
+
 .Lucas64_start:
        /* Perform the CAS */
        lock
-       cmpxchgq %rdx, (%rdi)
+       cmpxchgq %rdx,(%rdi)
 .Lucas64_end:
+
        /*
         * Note: %rax is "old" value.
         * Set the return values.
         */
-       movq    %rax, (%rcx)
-       xorq    %rax, %rax
+       movq    %rax,(%rcx)
+       xorq    %rax,%rax
        ret
        DEFERRED_SWITCH_CALL
 
@@ -468,28 +481,29 @@
 ENTRY(ucas_32)
        DEFERRED_SWITCH_CHECK
        /* Fail if kernel-space */
-       movq    $VM_MAXUSER_ADDRESS-4, %r8
-       cmpq    %r8, %rdi
-       ja      _C_LABEL(ucas_fault)
-       movl    %esi, %eax
+       movq    $VM_MAXUSER_ADDRESS-4,%r8
+       cmpq    %r8,%rdi
+       ja      _C_LABEL(ucas_efault)
+       movl    %esi,%eax
+
 .Lucas32_start:
        /* Perform the CAS */
        lock
-       cmpxchgl %edx, (%rdi)
+       cmpxchgl %edx,(%rdi)
 .Lucas32_end:
+
        /*
         * Note: %eax is "old" value.
         * Set the return values.
         */
-       movl    %eax, (%rcx)
-       xorq    %rax, %rax
+       movl    %eax,(%rcx)
+       xorq    %rax,%rax
        ret
        DEFERRED_SWITCH_CALL
 
-/*
- * Fault handler for ucas_*().
- * Just return the error set by trap().
- */
+ENTRY(ucas_efault)
+       movq    $EFAULT,%rax
+
 NENTRY(ucas_fault)
        ret
 
diff -r aa730cafdb1a -r 4d14f7d1a987 sys/arch/amd64/amd64/locore.S
--- a/sys/arch/amd64/amd64/locore.S     Mon Sep 04 16:11:37 2017 +0000
+++ b/sys/arch/amd64/amd64/locore.S     Mon Sep 04 20:41:28 2017 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: locore.S,v 1.123.6.1 2017/07/05 19:59:29 snj Exp $     */
+/*     $NetBSD: locore.S,v 1.123.6.2 2017/09/04 20:41:28 snj Exp $     */
 
 /*
  * Copyright-o-rama!
@@ -1082,12 +1082,6 @@
 
        /* Switch to newlwp's stack. */
        movq    L_PCB(%r12),%r14
-#ifdef XEN /* XXX debug code */
-       cmpq    $0,PCB_RSP(%r14)
-       jne 999f
-       callq _C_LABEL(cpu_Debugger);
-999:
-#endif
        movq    PCB_RSP(%r14),%rsp
        movq    PCB_RBP(%r14),%rbp
 
@@ -1236,8 +1230,6 @@
  * syscall()
  *
  * syscall insn entry.
- * This currently isn't much faster, but it can be made faster in the future.
- * (Actually we've already saved a few 100 clocks by not loading the trap gate)
  */
 IDTVEC(syscall)
 #ifndef XEN
diff -r aa730cafdb1a -r 4d14f7d1a987 sys/arch/amd64/amd64/machdep.c
--- a/sys/arch/amd64/amd64/machdep.c    Mon Sep 04 16:11:37 2017 +0000
+++ b/sys/arch/amd64/amd64/machdep.c    Mon Sep 04 20:41:28 2017 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: machdep.c,v 1.255 2017/03/24 17:09:36 maxv Exp $       */
+/*     $NetBSD: machdep.c,v 1.255.6.1 2017/09/04 20:41:28 snj Exp $    */
 
 /*-
  * Copyright (c) 1996, 1997, 1998, 2000, 2006, 2007, 2008, 2011
@@ -111,7 +111,7 @@
  */
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: machdep.c,v 1.255 2017/03/24 17:09:36 maxv Exp $");
+__KERNEL_RCSID(0, "$NetBSD: machdep.c,v 1.255.6.1 2017/09/04 20:41:28 snj Exp $");
 
 /* #define XENDEBUG_LOW  */
 
@@ -1325,6 +1325,8 @@
 



Home | Main Index | Thread Index | Old Index