Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/trunk]: src/sys/arch/aarch64/aarch64 change to minimum invalidation of TLB.



details:   https://anonhg.NetBSD.org/src/rev/a015010d81a6
branches:  trunk
changeset: 363760:a015010d81a6
user:      ryo <ryo%NetBSD.org@localhost>
date:      Sat Aug 11 12:16:34 2018 +0000

description:
change to minimum invalidation of TLB.
specifying not only va but also asid, and not invalidate L0-L2 entry using tlbi_*_ll() if needed.

diffstat:

 sys/arch/aarch64/aarch64/pmap.c |  143 +++++++++++++++++++--------------------
 1 files changed, 68 insertions(+), 75 deletions(-)

diffs (272 lines):

diff -r 801fcac3578a -r a015010d81a6 sys/arch/aarch64/aarch64/pmap.c
--- a/sys/arch/aarch64/aarch64/pmap.c   Sat Aug 11 11:33:10 2018 +0000
+++ b/sys/arch/aarch64/aarch64/pmap.c   Sat Aug 11 12:16:34 2018 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: pmap.c,v 1.18 2018/08/10 21:06:42 ryo Exp $    */
+/*     $NetBSD: pmap.c,v 1.19 2018/08/11 12:16:34 ryo Exp $    */
 
 /*
  * Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -27,7 +27,7 @@
  */
 
 #include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: pmap.c,v 1.18 2018/08/10 21:06:42 ryo Exp $");
+__KERNEL_RCSID(0, "$NetBSD: pmap.c,v 1.19 2018/08/11 12:16:34 ryo Exp $");
 
 #include "opt_arm_debug.h"
 #include "opt_ddb.h"
@@ -154,6 +154,41 @@
 #define LX_BLKPAG_ATTR_DEVICE_MEM      __SHIFTIN(3, LX_BLKPAG_ATTR_INDX)
 #define LX_BLKPAG_ATTR_MASK            LX_BLKPAG_ATTR_INDX
 
+/*
+ * invalidate TLB entry for ASID and VA.
+ * `ll' invalidates only the Last Level (usually L3) of TLB entry
+ */
+#define AARCH64_TLBI_BY_ASID_VA(asid, va, ll)                          \
+       do {                                                            \
+               if ((ll)) {                                             \
+                       if ((asid) == 0)                                \
+                               aarch64_tlbi_by_va_ll((va));            \
+                       else                                            \
+                               aarch64_tlbi_by_asid_va_ll((asid), (va)); \
+               } else {                                                \
+                       if ((asid) == 0)                                \
+                               aarch64_tlbi_by_va((va));               \
+                       else                                            \
+                               aarch64_tlbi_by_asid_va((asid), (va));  \
+               }                                                       \
+       } while (0/*CONSTCOND*/)
+
+/*
+ * aarch64 require write permission in pte to invalidate instruction cache.
+ * changing pte to writable temporarly before cpu_icache_sync_range().
+ * this macro modifies PTE (*ptep). need to update PTE after this.
+ */
+#define PTE_ICACHE_SYNC_PAGE(pte, ptep, pm, va, ll)                    \
+       do {                                                            \
+               pt_entry_t tpte;                                        \
+               tpte = (pte) & ~(LX_BLKPAG_AF|LX_BLKPAG_AP);            \
+               tpte |= (LX_BLKPAG_AF|LX_BLKPAG_AP_RW);                 \
+               tpte |= (LX_BLKPAG_UXN|LX_BLKPAG_PXN);                  \
+               atomic_swap_64((ptep), tpte);                           \
+               AARCH64_TLBI_BY_ASID_VA((pm)->pm_asid, (va), (ll));     \
+               cpu_icache_sync_range((va), PAGE_SIZE);                 \
+       } while (0/*CONSTCOND*/)
+
 struct pv_entry {
        TAILQ_ENTRY(pv_entry) pv_link;
        struct pmap *pv_pmap;
@@ -267,12 +302,19 @@
 
                pte = pa | attr;
 
+               if (prot & VM_PROT_EXECUTE) {
+                       pt_entry_t tpte;
+                       /* need write permission to invalidate icache */
+                       tpte = pte & ~(LX_BLKPAG_AF|LX_BLKPAG_AP);
+                       tpte |= (LX_BLKPAG_AF|LX_BLKPAG_AP_RW);
+                       tpte |= (LX_BLKPAG_UXN|LX_BLKPAG_PXN);
+                       atomic_swap_64(&l2[l2pde_index(va)], tpte);
+                       aarch64_tlbi_by_va(va);
+                       cpu_icache_sync_range(va, L2_SIZE);
+               }
                atomic_swap_64(&l2[l2pde_index(va)], pte);
                aarch64_tlbi_by_va(va);
 
-               if (prot & VM_PROT_EXECUTE)
-                       cpu_icache_sync_range(va, L2_SIZE);
-
                va += L2_SIZE;
                pa += L2_SIZE;
                resid -= L2_SIZE;
@@ -1088,12 +1130,7 @@
        /* new prot = prot & pteprot & mdattr */
        pte = _pmap_pte_adjust_prot(pte, prot & pteprot, mdattr, user);
        atomic_swap_64(ptep, pte);
-
-#if 0
-       aarch64_tlbi_by_asid_va(pv->pv_pmap->pm_asid, pv->pv_va);
-#else
-       aarch64_tlbi_by_va(pv->pv_va);
-#endif
+       AARCH64_TLBI_BY_ASID_VA(pv->pv_pmap->pm_asid, pv->pv_va, true);
 
        pm_unlock(pv->pv_pmap);
 }
@@ -1178,31 +1215,17 @@
                            "pm=%p, va=%016lx, pte: %016lx -> %016lx",
                            pm, va, opte, pte);
                        if (!l3pte_writable(pte)) {
-                               /*
-                                * require write permission for cleaning dcache
-                                * (cpu_icache_sync_range)
-                                */
-                               pt_entry_t tpte;
-
-                               tpte = pte & ~(LX_BLKPAG_AF|LX_BLKPAG_AP);
-                               tpte |= (LX_BLKPAG_AF|LX_BLKPAG_AP_RW);
-                               tpte |= (LX_BLKPAG_UXN|LX_BLKPAG_PXN);
-                               atomic_swap_64(ptep, tpte);
-                               aarch64_tlbi_by_va(va);
-
-                               cpu_icache_sync_range(va, PAGE_SIZE);
-
+                               PTE_ICACHE_SYNC_PAGE(pte, ptep, pm, va, true);
                                atomic_swap_64(ptep, pte);
-                               aarch64_tlbi_by_va(va);
+                               AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
                        } else {
                                atomic_swap_64(ptep, pte);
-                               aarch64_tlbi_by_va(va);
-
+                               AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
                                cpu_icache_sync_range(va, PAGE_SIZE);
                        }
                } else {
                        atomic_swap_64(ptep, pte);
-                       aarch64_tlbi_by_va(va);
+                       AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
                }
        }
 
@@ -1332,6 +1355,7 @@
        int error = 0;
        const bool user = (pm != pmap_kernel());
        bool executable;
+       bool l3only = true;
 
        UVMHIST_FUNC(__func__);
        UVMHIST_CALLED(pmaphist);
@@ -1395,6 +1419,7 @@
                _pmap_alloc_pdp(pm, &pdppa);
                KASSERT(pdppa != POOL_PADDR_INVALID);
                atomic_swap_64(&l0[idx], pdppa | L0_TABLE);
+               l3only = false;
        } else {
                pdppa = l0pde_pa(pde);
        }
@@ -1406,6 +1431,7 @@
                _pmap_alloc_pdp(pm, &pdppa);
                KASSERT(pdppa != POOL_PADDR_INVALID);
                atomic_swap_64(&l1[idx], pdppa | L1_TABLE);
+               l3only = false;
        } else {
                pdppa = l1pde_pa(pde);
        }
@@ -1417,6 +1443,7 @@
                _pmap_alloc_pdp(pm, &pdppa);
                KASSERT(pdppa != POOL_PADDR_INVALID);
                atomic_swap_64(&l2[idx], pdppa | L2_TABLE);
+               l3only = false;
        } else {
                pdppa = l2pde_pa(pde);
        }
@@ -1514,32 +1541,17 @@
                    "icache_sync: pm=%p, va=%016lx, pte: %016lx -> %016lx",
                    pm, va, opte, pte);
                if (!l3pte_writable(pte)) {
-                       /*
-                        * require write permission for cleaning dcache
-                        * (cpu_icache_sync_range)
-                        */
-                       pt_entry_t tpte;
-
-                       tpte = pte & ~(LX_BLKPAG_AF|LX_BLKPAG_AP);
-                       tpte |= (LX_BLKPAG_AF|LX_BLKPAG_AP_RW);
-                       tpte |= (LX_BLKPAG_UXN|LX_BLKPAG_PXN);
-                       atomic_swap_64(ptep, tpte);
-                       aarch64_tlbi_by_va(va);
-
-                       cpu_icache_sync_range(va, PAGE_SIZE);
-
+                       PTE_ICACHE_SYNC_PAGE(pte, ptep, pm, va, l3only);
                        atomic_swap_64(ptep, pte);
-                       aarch64_tlbi_by_va(va);
-
+                       AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va ,true);
                } else {
                        atomic_swap_64(ptep, pte);
-                       aarch64_tlbi_by_va(va);
-
+                       AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, l3only);
                        cpu_icache_sync_range(va, PAGE_SIZE);
                }
        } else {
                atomic_swap_64(ptep, pte);
-               aarch64_tlbi_by_va(va);
+               AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, l3only);
        }
 
        if (pte & LX_BLKPAG_OS_WIRED)
@@ -1607,11 +1619,7 @@
                        opv = _pmap_remove_pv(pg, pm, va, pte);
 
                atomic_swap_64(ptep, 0);
-#if 0
-               aarch64_tlbi_by_asid_va(pm->pm_asid, va);
-#else
-               aarch64_tlbi_by_va(va);
-#endif
+               AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
 
                if ((pte & LX_BLKPAG_OS_WIRED) != 0)
                        pm->pm_stats.wired_count--;
@@ -1661,12 +1669,9 @@
                TAILQ_FOREACH_SAFE(pv, &md->mdpg_pvhead, pv_link, pvtmp) {
 
                        opte = atomic_swap_64(pv->pv_ptep, 0);
-#if 0
-                       aarch64_tlbi_by_asid_va(pv->pv_pmap->pm_asid,
-                           pv->pv_va);
-#else
-                       aarch64_tlbi_by_va(pv->pv_va);
-#endif
+                       AARCH64_TLBI_BY_ASID_VA(pv->pv_pmap->pm_asid,
+                           pv->pv_va, true);
+
                        if ((opte & LX_BLKPAG_OS_WIRED) != 0)
                                pv->pv_pmap->pm_stats.wired_count--;
                        pv->pv_pmap->pm_stats.resident_count--;
@@ -1851,12 +1856,8 @@
        pmap_pv_unlock(md);
 
        atomic_swap_64(ptep, pte);
-#if 0
-       /* didn't work??? */
-       aarch64_tlbi_by_asid_va(pm->pm_asid, va);
-#else
-       aarch64_tlbi_by_va(va);
-#endif
+       AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
+
        fixed = true;
 
  done:
@@ -1909,11 +1910,7 @@
                        goto tryagain;
                }
 
-#if 0
-               aarch64_tlbi_by_asid_va(pv->pv_pmap->pm_asid, va);
-#else
-               aarch64_tlbi_by_va(va);
-#endif
+               AARCH64_TLBI_BY_ASID_VA(pv->pv_pmap->pm_asid, va, true);
 
                UVMHIST_LOG(pmaphist,
                    "va=%016llx, ptep=%p, pa=%016lx, RW -> RO",
@@ -1968,11 +1965,7 @@
                        goto tryagain;
                }
 
-#if 0
-               aarch64_tlbi_by_asid_va(pv->pv_pmap->pm_asid, va);
-#else
-               aarch64_tlbi_by_va(va);
-#endif
+               AARCH64_TLBI_BY_ASID_VA(pv->pv_pmap->pm_asid, va, true);
 
                UVMHIST_LOG(pmaphist, "va=%016llx, ptep=%p, pa=%016lx, unse AF",
                    va, ptep, l3pte_pa(pte), 0);



Home | Main Index | Thread Index | Old Index