Source-Changes-HG archive
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]
[src/trunk]: src/sys/arch/aarch64 improve pmap_remove
details: https://anonhg.NetBSD.org/src/rev/b5ea24e83f29
branches: trunk
changeset: 996657:b5ea24e83f29
user: ryo <ryo%NetBSD.org@localhost>
date: Wed Feb 06 05:33:41 2019 +0000
description:
improve pmap_remove
- don't lock/unlock per page in pmap_remove()
- speedup pte lookup for continuous addresses
- bring out pool_cache_put(&_pmap_pv_pool, pv) from lock/unlock section
diffstat:
sys/arch/aarch64/aarch64/pmap.c | 195 +++++++++++++++++++++------------------
sys/arch/aarch64/include/pmap.h | 11 +-
2 files changed, 110 insertions(+), 96 deletions(-)
diffs (truncated from 461 to 300 lines):
diff -r 97356989ab26 -r b5ea24e83f29 sys/arch/aarch64/aarch64/pmap.c
--- a/sys/arch/aarch64/aarch64/pmap.c Wed Feb 06 05:33:14 2019 +0000
+++ b/sys/arch/aarch64/aarch64/pmap.c Wed Feb 06 05:33:41 2019 +0000
@@ -1,4 +1,4 @@
-/* $NetBSD: pmap.c,v 1.34 2018/12/21 08:01:01 ryo Exp $ */
+/* $NetBSD: pmap.c,v 1.35 2019/02/06 05:33:41 ryo Exp $ */
/*
* Copyright (c) 2017 Ryo Shimizu <ryo%nerv.org@localhost>
@@ -27,7 +27,7 @@
*/
#include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: pmap.c,v 1.34 2018/12/21 08:01:01 ryo Exp $");
+__KERNEL_RCSID(0, "$NetBSD: pmap.c,v 1.35 2019/02/06 05:33:41 ryo Exp $");
#include "opt_arm_debug.h"
#include "opt_ddb.h"
@@ -187,12 +187,15 @@
paddr_t pv_pa; /* debug */
pt_entry_t *pv_ptep; /* for fast pte lookup */
};
+#define pv_next pv_link.tqe_next
+
+#define L3INDEXMASK (L3_SIZE * Ln_ENTRIES - 1)
static pt_entry_t *_pmap_pte_lookup_l3(struct pmap *, vaddr_t);
static pt_entry_t *_pmap_pte_lookup_bs(struct pmap *, vaddr_t, vsize_t *);
static pt_entry_t _pmap_pte_adjust_prot(pt_entry_t, vm_prot_t, vm_prot_t, bool);
static pt_entry_t _pmap_pte_adjust_cacheflags(pt_entry_t, u_int);
-static void _pmap_remove(struct pmap *, vaddr_t, bool);
+static void _pmap_remove(struct pmap *, vaddr_t, vaddr_t, bool, struct pv_entry **);
static int _pmap_enter(struct pmap *, vaddr_t, paddr_t, vm_prot_t, u_int, bool);
static struct pmap kernel_pmap;
@@ -614,7 +617,7 @@
bool
pmap_extract(struct pmap *pm, vaddr_t va, paddr_t *pap)
{
- static pt_entry_t *ptep;
+ static pt_entry_t *ptep, pte;
paddr_t pa;
vsize_t blocksize = 0;
extern char __kernel_text[];
@@ -630,7 +633,10 @@
ptep = _pmap_pte_lookup_bs(pm, va, &blocksize);
if (ptep == NULL)
return false;
- pa = lxpde_pa(*ptep) + (va & (blocksize - 1));
+ pte = *ptep;
+ if (!lxpde_valid(pte))
+ return false;
+ pa = lxpde_pa(pte) + (va & (blocksize - 1));
}
if (pap != NULL)
@@ -676,46 +682,30 @@
blocksize = L0_SIZE;
l0 = pm->pm_l0table;
idx = l0pde_index(va);
- pde = l0[idx];
- if (!l0pde_valid(pde)) {
- ptep = NULL;
+ ptep = &l0[idx];
+ pde = *ptep;
+ if (!l0pde_valid(pde))
goto done;
- }
blocksize = L1_SIZE;
l1 = (pd_entry_t *)AARCH64_PA_TO_KVA(l0pde_pa(pde));
idx = l1pde_index(va);
- pde = l1[idx];
- if (!l1pde_valid(pde)) {
- ptep = NULL;
+ ptep = &l1[idx];
+ pde = *ptep;
+ if (!l1pde_valid(pde) || l1pde_is_block(pde))
goto done;
- }
- if (l1pde_is_block(pde)) {
- ptep = &l1[idx];
- goto done;
- }
blocksize = L2_SIZE;
l2 = (pd_entry_t *)AARCH64_PA_TO_KVA(l1pde_pa(pde));
idx = l2pde_index(va);
- pde = l2[idx];
- if (!l2pde_valid(pde)) {
- ptep = NULL;
+ ptep = &l2[idx];
+ pde = *ptep;
+ if (!l2pde_valid(pde) || l2pde_is_block(pde))
goto done;
- }
- if (l2pde_is_block(pde)) {
- ptep = &l2[idx];
- goto done;
- }
blocksize = L3_SIZE;
l3 = (pd_entry_t *)AARCH64_PA_TO_KVA(l2pde_pa(pde));
idx = l3pte_index(va);
- pde = l3[idx];
- if (!l3pte_valid(pde)) {
- ptep = NULL;
- goto done;
- }
ptep = &l3[idx];
done:
@@ -740,21 +730,27 @@
void
pmap_icache_sync_range(pmap_t pm, vaddr_t sva, vaddr_t eva)
{
- pt_entry_t *ptep, pte;
+ pt_entry_t *ptep = NULL, pte;
vaddr_t va;
vsize_t blocksize = 0;
pm_lock(pm);
- for (va = sva; va < eva; va += blocksize) {
- ptep = _pmap_pte_lookup_bs(pm, va, &blocksize);
- if (blocksize == 0)
- break;
- if (ptep != NULL) {
+ for (va = sva; va < eva; va = (va + blocksize) & ~(blocksize - 1)) {
+ /* va is belong to the same L3 table as before? */
+ if ((blocksize == L3_SIZE) && ((va & L3INDEXMASK) != 0)) {
+ ptep++;
+ } else {
+ ptep = _pmap_pte_lookup_bs(pm, va, &blocksize);
+ if (ptep == NULL)
+ break;
+ }
+
+ pte = *ptep;
+ if (lxpde_valid(pte)) {
vaddr_t eob = (va + blocksize) & ~(blocksize - 1);
vsize_t len = ulmin(eva, eob - va);
- pte = *ptep;
if (l3pte_writable(pte)) {
cpu_icache_sync_range(va, len);
} else {
@@ -771,7 +767,6 @@
atomic_swap_64(ptep, opte);
AARCH64_TLBI_BY_ASID_VA(pm->pm_asid, va, true);
}
- va &= ~(blocksize - 1);
}
}
@@ -826,7 +821,7 @@
/* and either to executable */
xn = user ? LX_BLKPAG_UXN : LX_BLKPAG_PXN;
if (prot & VM_PROT_EXECUTE)
- pte &= ~xn;
+ pte &= ~xn;
return pte;
}
@@ -942,20 +937,22 @@
TAILQ_FOREACH(pv, &md->mdpg_pvhead, pv_link) {
pr(" pv[%d] pv=%p\n",
i, pv);
- pr(" pv[%d].pv_pmap =%p (asid=%d)\n",
+ pr(" pv[%d].pv_pmap = %p (asid=%d)\n",
i, pv->pv_pmap, pv->pv_pmap->pm_asid);
- pr(" pv[%d].pv_va =%016lx (color=%d)\n",
+ pr(" pv[%d].pv_va = %016lx (color=%d)\n",
i, pv->pv_va, _pmap_color(pv->pv_va));
- pr(" pv[%d].pv_pa =%016lx (color=%d)\n",
+ pr(" pv[%d].pv_pa = %016lx (color=%d)\n",
i, pv->pv_pa, _pmap_color(pv->pv_pa));
+ pr(" pv[%d].pv_ptep = %p\n",
+ i, pv->pv_ptep);
i++;
}
}
#endif /* PMAP_PV_DEBUG & DDB */
static int
-_pmap_enter_pv(struct vm_page *pg, struct pmap *pm, struct pv_entry **pvp, vaddr_t va,
- pt_entry_t *ptep, paddr_t pa, u_int flags)
+_pmap_enter_pv(struct vm_page *pg, struct pmap *pm, struct pv_entry **pvp,
+ vaddr_t va, pt_entry_t *ptep, paddr_t pa, u_int flags)
{
struct vm_page_md *md;
struct pv_entry *pv;
@@ -1006,6 +1003,7 @@
}
#endif
}
+
pmap_pv_unlock(md);
return 0;
}
@@ -1024,7 +1022,6 @@
pmap_kremove(vaddr_t va, vsize_t size)
{
struct pmap *kpm = pmap_kernel();
- vaddr_t eva;
int s;
UVMHIST_FUNC(__func__);
@@ -1036,14 +1033,12 @@
KDASSERT((size & PGOFSET) == 0);
KDASSERT(!IN_KSEG_ADDR(va));
-
- eva = va + size;
KDASSERT(IN_RANGE(va, VM_MIN_KERNEL_ADDRESS, VM_MAX_KERNEL_ADDRESS));
s = splvm();
- for (; va < eva; va += PAGE_SIZE) {
- _pmap_remove(kpm, va, true);
- }
+ pm_lock(kpm);
+ _pmap_remove(kpm, va, va + size, true, NULL);
+ pm_unlock(kpm);
splx(s);
}
@@ -1089,7 +1084,9 @@
void
pmap_protect(struct pmap *pm, vaddr_t sva, vaddr_t eva, vm_prot_t prot)
{
+ pt_entry_t *ptep = NULL, pte;
vaddr_t va;
+ vsize_t blocksize = 0;
const bool user = (pm != pmap_kernel());
KASSERT((prot & VM_PROT_READ) || !(prot & VM_PROT_WRITE));
@@ -1115,8 +1112,7 @@
pm_lock(pm);
- for (va = sva; va < eva; va += PAGE_SIZE) {
- pt_entry_t *ptep, pte;
+ for (va = sva; va < eva; va = (va + blocksize) & ~(blocksize - 1)) {
#ifdef UVMHIST
pt_entry_t opte;
#endif
@@ -1125,20 +1121,19 @@
uint32_t mdattr;
bool executable;
- ptep = _pmap_pte_lookup_l3(pm, va);
- if (ptep == NULL) {
+ /* va is belong to the same L3 table as before? */
+ if ((blocksize == L3_SIZE) && ((va & L3INDEXMASK) != 0))
+ ptep++;
+ else
+ ptep = _pmap_pte_lookup_bs(pm, va, &blocksize);
+
+ pte = *ptep;
+ if (!lxpde_valid(pte)) {
PMAP_COUNT(protect_none);
continue;
}
- pte = *ptep;
-
- if (!l3pte_valid(pte)) {
- PMAP_COUNT(protect_none);
- continue;
- }
-
- pa = l3pte_pa(pte);
+ pa = lxpde_pa(pte);
pg = PHYS_TO_VM_PAGE(pa);
if (pg != NULL) {
@@ -1152,7 +1147,6 @@
PMAP_COUNT(protect_unmanaged);
}
- pte = *ptep;
#ifdef UVMHIST
opte = pte;
#endif
@@ -1282,6 +1276,7 @@
_pmap_free_pdp_all(pm);
mutex_destroy(&pm->pm_lock);
+
pool_cache_put(&_pmap_cache, pm);
PMAP_COUNT(destroy);
@@ -1555,37 +1550,46 @@
}
static void
-_pmap_remove(struct pmap *pm, vaddr_t va, bool kremove)
+_pmap_remove(struct pmap *pm, vaddr_t sva, vaddr_t eva, bool kremove,
+ struct pv_entry **pvtofree)
{
Home |
Main Index |
Thread Index |
Old Index