dynamically calculating NKPT [was: Re: huge ktr buffer]
Konstantin Belousov
kostikbel at gmail.com
Tue Feb 5 15:14:24 UTC 2013
On Mon, Feb 04, 2013 at 03:05:15PM -0800, Neel Natu wrote:
> Hi,
>
> I have a patch to dynamically calculate NKPT for amd64 kernels. This
> should fix the various issues that people pointed out in the email
> thread.
>
> Please review and let me know if there are any objections to committing this.
>
> Also, thanks to Alan (alc@) for reviewing and providing feedback on
> the initial version of the patch.
>
> Patch (also available at http://people.freebsd.org/~neel/patches/nkpt_diff.txt):
>
> Index: sys/amd64/include/pmap.h
> ===================================================================
> --- sys/amd64/include/pmap.h (revision 246277)
> +++ sys/amd64/include/pmap.h (working copy)
> @@ -113,13 +113,7 @@
> ((unsigned long)(l2) << PDRSHIFT) | \
> ((unsigned long)(l1) << PAGE_SHIFT))
>
> -/* Initial number of kernel page tables. */
> -#ifndef NKPT
> -#define NKPT 32
> -#endif
> -
> #define NKPML4E 1 /* number of kernel PML4 slots */
> -#define NKPDPE howmany(NKPT, NPDEPG)/* number of kernel PDP slots */
>
> #define NUPML4E (NPML4EPG/2) /* number of userland PML4 pages */
> #define NUPDPE (NUPML4E*NPDPEPG)/* number of userland PDP pages */
> @@ -181,6 +175,7 @@
> #define PML4map ((pd_entry_t *)(addr_PML4map))
> #define PML4pml4e ((pd_entry_t *)(addr_PML4pml4e))
>
> +extern int nkpt; /* Initial number of kernel page tables */
> extern u_int64_t KPDPphys; /* physical address of kernel level 3 */
> extern u_int64_t KPML4phys; /* physical address of kernel level 4 */
>
> Index: sys/amd64/amd64/minidump_machdep.c
> ===================================================================
> --- sys/amd64/amd64/minidump_machdep.c (revision 246277)
> +++ sys/amd64/amd64/minidump_machdep.c (working copy)
> @@ -232,7 +232,7 @@
> /* Walk page table pages, set bits in vm_page_dump */
> pmapsize = 0;
> pdp = (uint64_t *)PHYS_TO_DMAP(KPDPphys);
> - for (va = VM_MIN_KERNEL_ADDRESS; va < MAX(KERNBASE + NKPT * NBPDR,
> + for (va = VM_MIN_KERNEL_ADDRESS; va < MAX(KERNBASE + nkpt * NBPDR,
> kernel_vm_end); ) {
> /*
> * We always write a page, even if it is zero. Each
> @@ -364,7 +364,7 @@
> /* Dump kernel page directory pages */
> bzero(fakepd, sizeof(fakepd));
> pdp = (uint64_t *)PHYS_TO_DMAP(KPDPphys);
> - for (va = VM_MIN_KERNEL_ADDRESS; va < MAX(KERNBASE + NKPT * NBPDR,
> + for (va = VM_MIN_KERNEL_ADDRESS; va < MAX(KERNBASE + nkpt * NBPDR,
> kernel_vm_end); va += NBPDP) {
> i = (va >> PDPSHIFT) & ((1ul << NPDPEPGSHIFT) - 1);
>
> Index: sys/amd64/amd64/pmap.c
> ===================================================================
> --- sys/amd64/amd64/pmap.c (revision 246277)
> +++ sys/amd64/amd64/pmap.c (working copy)
> @@ -202,6 +202,10 @@
> vm_offset_t virtual_avail; /* VA of first avail page (after kernel bss) */
> vm_offset_t virtual_end; /* VA of last avail page (end of kernel AS) */
>
> +int nkpt;
> +SYSCTL_INT(_machdep, OID_AUTO, nkpt, CTLFLAG_RD, &nkpt, 0,
> + "Number of kernel page table pages allocated on bootup");
> +
> static int ndmpdp;
> static vm_paddr_t dmaplimit;
> vm_offset_t kernel_vm_end = VM_MIN_KERNEL_ADDRESS;
> @@ -495,17 +499,42 @@
>
> CTASSERT(powerof2(NDMPML4E));
>
> +/* number of kernel PDP slots */
> +#define NKPDPE(ptpgs) howmany((ptpgs), NPDEPG)
> +
> static void
> +nkpt_init(vm_paddr_t addr)
> +{
> + int pt_pages;
> +
> +#ifdef NKPT
> + pt_pages = NKPT;
> +#else
> + pt_pages = howmany(addr, 1 << PDRSHIFT);
> + pt_pages += NKPDPE(pt_pages);
> +
> + /*
> + * Add some slop beyond the bare minimum required for bootstrapping
> + * the kernel.
> + *
> + * This is quite important when allocating KVA for kernel modules.
> + * The modules are required to be linked in the negative 2GB of
> + * the address space. If we run out of KVA in this region then
> + * pmap_growkernel() will need to allocate page table pages to map
> + * the entire 512GB of KVA space which is an unnecessary tax on
> + * physical memory.
> + */
> + pt_pages += 4; /* 8MB additional slop for kernel modules */
8MB might be too low. I just checked one of my machines with a fully
modularized kernel; it takes slightly more than 6MB to load 50 modules.
I think that 16MB would be safer, but it probably needs to be scaled
down based on the available physical memory. An amd64 kernel can still
be booted on a 128MB machine.
-------------- next part --------------
A non-text attachment was scrubbed...
Name: not available
Type: application/pgp-signature
Size: 834 bytes
Desc: not available
URL: <http://lists.freebsd.org/pipermail/freebsd-hackers/attachments/20130205/72469407/attachment.sig>
More information about the freebsd-hackers
mailing list