Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/trunk]: src/sys/kern provide some semblance of valid cpu topology for bi...



details:   https://anonhg.NetBSD.org/src/rev/b1057135a9ac
branches:  trunk
changeset: 1006344:b1057135a9ac
user:      mrg <mrg%NetBSD.org@localhost>
date:      Sun Jan 12 09:29:18 2020 +0000

description:
provide some semblance of valid cpu topology for big.little systems.

while attaching cpus, if the FDT provides "capacity-dmips-mhz" track
the fastest set, and call cpu_topology_set() with slow=true for any
cpus that are not the fastest.

bug fix for cpu_topology_set(): actually set ci_is_slow for slow cpus.

with this change, and -current's recent scheduler changes, this means
that long running processes run on the faster cores.  on RK3399 based
systems, i am seeing 20-50% speed ups for many tasks.


XXX: all this can be made common with armv7 big.little.

diffstat:

 sys/arch/aarch64/aarch64/cpu.c     |  50 +++++++++++++++++++++++++++++++++----
 sys/arch/aarch64/aarch64/cpufunc.c |  10 +++---
 sys/arch/aarch64/aarch64/locore.S  |   7 +++--
 sys/arch/aarch64/include/cpu.h     |   5 +++-
 sys/arch/aarch64/include/cpufunc.h |   4 +-
 sys/arch/arm/fdt/cpu_fdt.c         |  15 +++++++++-
 sys/kern/subr_cpu.c                |   5 ++-
 7 files changed, 75 insertions(+), 21 deletions(-)

diffs (268 lines):

diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/aarch64/aarch64/cpu.c
--- a/sys/arch/aarch64/aarch64/cpu.c    Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/aarch64/aarch64/cpu.c    Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/* $NetBSD: cpu.c,v 1.32 2020/01/09 16:23:41 martin Exp $ */
+/* $NetBSD: cpu.c,v 1.33 2020/01/12 09:29:18 mrg Exp $ */
 
 /*
  * Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -27,7 +27,7 @@
  */
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(1, "$NetBSD: cpu.c,v 1.32 2020/01/09 16:23:41 martin Exp $");
+__KERNEL_RCSID(1, "$NetBSD: cpu.c,v 1.33 2020/01/12 09:29:18 mrg Exp $");
 
 #include "locators.h"
 #include "opt_arm_debug.h"
@@ -65,6 +65,7 @@
 static void cpu_identify2(device_t self, struct cpu_info *);
 static void cpu_setup_id(struct cpu_info *);
 static void cpu_setup_sysctl(device_t, struct cpu_info *);
+static void cpu_do_topology(struct cpu_info *);
 
 #ifdef MULTIPROCESSOR
 uint64_t cpu_mpidr[MAXCPUS];
@@ -144,9 +145,9 @@
        ci->ci_dev = dv;
        dv->dv_private = ci;
 
-       aarch64_gettopology(ci, ci->ci_id.ac_mpidr);
+       cpu_do_topology(ci);
+       cpu_identify(ci->ci_dev, ci);
 
-       cpu_identify(ci->ci_dev, ci);
 #ifdef MULTIPROCESSOR
        if (unit != 0) {
                mi_cpu_attach(ci);
@@ -308,8 +309,8 @@
 
        dfr0 = reg_id_aa64dfr0_el1_read();
 
-       aprint_debug_dev(self, "midr=0x%" PRIx32 "\n",
-           (uint32_t)ci->ci_id.ac_midr);
+       aprint_debug_dev(self, "midr=0x%" PRIx32 " mpidr=0x%" PRIx32 "\n",
+           (uint32_t)ci->ci_id.ac_midr, (uint32_t)ci->ci_id.ac_mpidr);
        aprint_normal_dev(self, "revID=0x%" PRIx64, id->ac_revidr);
 
        /* ID_AA64DFR0_EL1 */
@@ -497,6 +498,43 @@
                       CTL_CREATE, CTL_EOL);
 }
 
+static void
+cpu_do_topology(struct cpu_info *newci)
+{
+       struct cpu_info *ci;
+       CPU_INFO_ITERATOR cii;
+       prop_dictionary_t dict;
+       uint32_t capacity_dmips_mhz;
+       static uint32_t best_cap = 0;
+
+       dict = device_properties(newci->ci_dev);
+       if (prop_dictionary_get_uint32(dict, "capacity_dmips_mhz",
+           &capacity_dmips_mhz)) {
+               newci->ci_capacity_dmips_mhz = capacity_dmips_mhz;
+       } else {
+               newci->ci_capacity_dmips_mhz = 0;
+       }
+
+       if (newci->ci_capacity_dmips_mhz > best_cap)
+               best_cap = newci->ci_capacity_dmips_mhz;
+
+       /*
+        * CPU_INFO_FOREACH() doesn't work for this CPU until mi_cpu_attach()
+        * is called and ncpu is bumped, so call it directly here.
+        */
+       aarch64_set_topology(newci, newci->ci_id.ac_mpidr,
+           newci->ci_capacity_dmips_mhz < best_cap);
+
+       /*
+        * Using saved largest capacity, refresh previous topology info.
+        * It's supposed to be OK to re-set topology.
+        */
+       for (CPU_INFO_FOREACH(cii, ci)) {
+               aarch64_set_topology(ci, ci->ci_id.ac_mpidr,
+                   ci->ci_capacity_dmips_mhz < best_cap);
+       }
+}
+
 #ifdef MULTIPROCESSOR
 void
 cpu_boot_secondary_processors(void)
diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/aarch64/aarch64/cpufunc.c
--- a/sys/arch/aarch64/aarch64/cpufunc.c        Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/aarch64/aarch64/cpufunc.c        Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: cpufunc.c,v 1.13 2020/01/09 16:35:03 ad Exp $  */
+/*     $NetBSD: cpufunc.c,v 1.14 2020/01/12 09:29:18 mrg Exp $ */
 
 /*
  * Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -29,7 +29,7 @@
 #include "opt_multiprocessor.h"
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: cpufunc.c,v 1.13 2020/01/09 16:35:03 ad Exp $");
+__KERNEL_RCSID(0, "$NetBSD: cpufunc.c,v 1.14 2020/01/12 09:29:18 mrg Exp $");
 
 #include <sys/param.h>
 #include <sys/types.h>
@@ -89,7 +89,7 @@
 }
 
 void
-aarch64_gettopology(struct cpu_info * const ci, uint64_t mpidr)
+aarch64_set_topology(struct cpu_info * const ci, uint64_t mpidr, bool slow)
 {
 
        if (mpidr & MPIDR_MT) {
@@ -98,14 +98,14 @@
                    __SHIFTOUT(mpidr, MPIDR_AFF1),
                    __SHIFTOUT(mpidr, MPIDR_AFF0),
                    0,
-                   false);
+                   slow);
        } else {
                cpu_topology_set(ci,
                    __SHIFTOUT(mpidr, MPIDR_AFF1),
                    __SHIFTOUT(mpidr, MPIDR_AFF0),
                    0,
                    0,
-                   false);
+                   slow);
        }
 }
 
diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/aarch64/aarch64/locore.S
--- a/sys/arch/aarch64/aarch64/locore.S Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/aarch64/aarch64/locore.S Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: locore.S,v 1.50 2020/01/08 05:41:07 ryo Exp $  */
+/*     $NetBSD: locore.S,v 1.51 2020/01/12 09:29:18 mrg Exp $  */
 
 /*
  * Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -38,7 +38,7 @@
 #include <aarch64/hypervisor.h>
 #include "assym.h"
 
-RCSID("$NetBSD: locore.S,v 1.50 2020/01/08 05:41:07 ryo Exp $")
+RCSID("$NetBSD: locore.S,v 1.51 2020/01/12 09:29:18 mrg Exp $")
 
 #ifdef AARCH64_DEVICE_MEM_STRONGLY_ORDERED
 #define        MAIR_DEVICE_MEM         MAIR_DEVICE_nGnRnE
@@ -187,7 +187,8 @@
        /* get cache configuration */
        mrs     x0, tpidr_el1           /* curcpu */
        mrs     x1, mpidr_el1
-       bl      aarch64_gettopology
+       mov     x2, #0
+       bl      aarch64_set_topology
        mov     x0, xzr
        bl      aarch64_getcacheinfo
 
diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/aarch64/include/cpu.h
--- a/sys/arch/aarch64/include/cpu.h    Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/aarch64/include/cpu.h    Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/* $NetBSD: cpu.h,v 1.17 2020/01/05 20:17:43 ad Exp $ */
+/* $NetBSD: cpu.h,v 1.18 2020/01/12 09:29:18 mrg Exp $ */
 
 /*-
  * Copyright (c) 2014 The NetBSD Foundation, Inc.
@@ -93,6 +93,9 @@
        struct evcnt ci_vfp_save;
        struct evcnt ci_vfp_release;
 
+       /* FDT or similar supplied "cpu capacity" */
+       uint32_t ci_capacity_dmips_mhz;
+
        /* interrupt controller */
        u_int ci_gic_redist;    /* GICv3 redistributor index */
        uint64_t ci_gic_sgir;   /* GICv3 SGIR target */
diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/aarch64/include/cpufunc.h
--- a/sys/arch/aarch64/include/cpufunc.h        Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/aarch64/include/cpufunc.h        Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: cpufunc.h,v 1.9 2019/12/19 09:47:42 ryo Exp $  */
+/*     $NetBSD: cpufunc.h,v 1.10 2020/01/12 09:29:18 mrg Exp $ */
 
 /*
  * Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -69,7 +69,7 @@
 extern u_int cputype;                  /* compat arm */
 
 int set_cpufuncs(void);
-void aarch64_gettopology(struct cpu_info *, uint64_t);
+void aarch64_set_topology(struct cpu_info *, uint64_t, bool);
 void aarch64_getcacheinfo(int);
 void aarch64_printcacheinfo(device_t);
 
diff -r ea2e075bcb5e -r b1057135a9ac sys/arch/arm/fdt/cpu_fdt.c
--- a/sys/arch/arm/fdt/cpu_fdt.c        Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/arch/arm/fdt/cpu_fdt.c        Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/* $NetBSD: cpu_fdt.c,v 1.30 2019/11/01 13:22:08 bad Exp $ */
+/* $NetBSD: cpu_fdt.c,v 1.31 2020/01/12 09:29:18 mrg Exp $ */
 
 /*-
  * Copyright (c) 2017 Jared McNeill <jmcneill%invisible.ca@localhost>
@@ -30,7 +30,7 @@
 #include "psci_fdt.h"
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: cpu_fdt.c,v 1.30 2019/11/01 13:22:08 bad Exp $");
+__KERNEL_RCSID(0, "$NetBSD: cpu_fdt.c,v 1.31 2020/01/12 09:29:18 mrg Exp $");
 
 #include <sys/param.h>
 #include <sys/atomic.h>
@@ -126,10 +126,21 @@
        enum cpu_fdt_type type;
        bus_addr_t mpidr;
        cpuid_t cpuid;
+       const uint32_t *cap_ptr;
+       int len;
 
        sc->sc_dev = self;
        sc->sc_phandle = phandle;
 
+       cap_ptr = fdtbus_get_prop(phandle, "capacity-dmips-mhz", &len);
+       if (cap_ptr && len == 4) {
+               prop_dictionary_t dict = device_properties(self);
+               uint32_t capacity_dmips_mhz = be32toh(*cap_ptr);
+
+               prop_dictionary_set_uint32(dict, "capacity_dmips_mhz",
+                   capacity_dmips_mhz);
+       }
+
        type = of_search_compatible(phandle, compat_data)->data;
 
        switch (type) {
diff -r ea2e075bcb5e -r b1057135a9ac sys/kern/subr_cpu.c
--- a/sys/kern/subr_cpu.c       Sun Jan 12 06:41:02 2020 +0000
+++ b/sys/kern/subr_cpu.c       Sun Jan 12 09:29:18 2020 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: subr_cpu.c,v 1.6 2020/01/09 16:35:03 ad Exp $  */
+/*     $NetBSD: subr_cpu.c,v 1.7 2020/01/12 09:29:18 mrg Exp $ */
 
 /*-
  * Copyright (c) 2007, 2008, 2009, 2010, 2012, 2019, 2020
@@ -61,7 +61,7 @@
  */
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: subr_cpu.c,v 1.6 2020/01/09 16:35:03 ad Exp $");
+__KERNEL_RCSID(0, "$NetBSD: subr_cpu.c,v 1.7 2020/01/12 09:29:18 mrg Exp $");
 
 #include <sys/param.h>
 #include <sys/systm.h>
@@ -152,6 +152,7 @@
        ci->ci_core_id = core_id;
        ci->ci_smt_id = smt_id;
        ci->ci_numa_id = numa_id;
+       ci->ci_is_slow = slow;
        for (rel = 0; rel < __arraycount(ci->ci_sibling); rel++) {
                ci->ci_sibling[rel] = ci;
                ci->ci_nsibling[rel] = 1;



Home | Main Index | Thread Index | Old Index