Commit 7d35ecab authored by Jeff Dike's avatar Jeff Dike Committed by Linus Torvalds

[PATCH] UML: Three-level page table support

This is the three-level page table support from the x86_64 patch.  It can
be enabled on x86, although it's not particularly needed at this point.
However, it can be used to implement very large physical memory (with
almost all of it in highmem) on UML.
Signed-off-by: default avatarJeff Dike <jdike@addtoit.com>
Signed-off-by: default avatarAndrew Morton <akpm@osdl.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@osdl.org>
parent 2b047b97
...@@ -68,6 +68,8 @@ config MODE_SKAS ...@@ -68,6 +68,8 @@ config MODE_SKAS
to CONFIG_MODE_TT). Otherwise, it is safe to say Y. Disabling this to CONFIG_MODE_TT). Otherwise, it is safe to say Y. Disabling this
option will shrink the UML binary slightly. option will shrink the UML binary slightly.
source "arch/um/Kconfig_arch"
config NET config NET
bool "Networking support" bool "Networking support"
help help
......
config 3_LEVEL_PGTABLES
bool "Three-level pagetables"
default n
help
Three-level pagetables will let UML have more than 4G of physical
memory. All the memory that can't be mapped directly will be treated
as high memory.
...@@ -17,7 +17,7 @@ core-y += $(ARCH_DIR)/kernel/ \ ...@@ -17,7 +17,7 @@ core-y += $(ARCH_DIR)/kernel/ \
# Have to precede the include because the included Makefiles reference them. # Have to precede the include because the included Makefiles reference them.
SYMLINK_HEADERS = archparam.h system.h sigcontext.h processor.h ptrace.h \ SYMLINK_HEADERS = archparam.h system.h sigcontext.h processor.h ptrace.h \
arch-signal.h module.h arch-signal.h module.h vm-flags.h
SYMLINK_HEADERS := $(foreach header,$(SYMLINK_HEADERS),include/asm-um/$(header)) SYMLINK_HEADERS := $(foreach header,$(SYMLINK_HEADERS),include/asm-um/$(header))
ARCH_SYMLINKS = include/asm-um/arch $(ARCH_DIR)/include/sysdep $(ARCH_DIR)/os \ ARCH_SYMLINKS = include/asm-um/arch $(ARCH_DIR)/include/sysdep $(ARCH_DIR)/os \
......
...@@ -17,6 +17,7 @@ CONFIG_GENERIC_CALIBRATE_DELAY=y ...@@ -17,6 +17,7 @@ CONFIG_GENERIC_CALIBRATE_DELAY=y
# #
CONFIG_MODE_TT=y CONFIG_MODE_TT=y
CONFIG_MODE_SKAS=y CONFIG_MODE_SKAS=y
# CONFIG_3_LEVEL_PGTABLES is not set
CONFIG_NET=y CONFIG_NET=y
CONFIG_BINFMT_ELF=y CONFIG_BINFMT_ELF=y
CONFIG_BINFMT_MISC=m CONFIG_BINFMT_MISC=m
......
...@@ -25,7 +25,7 @@ extern char __binary_start; ...@@ -25,7 +25,7 @@ extern char __binary_start;
/* Changed during early boot */ /* Changed during early boot */
unsigned long *empty_zero_page = NULL; unsigned long *empty_zero_page = NULL;
unsigned long *empty_bad_page = NULL; unsigned long *empty_bad_page = NULL;
pgd_t swapper_pg_dir[1024]; pgd_t swapper_pg_dir[PTRS_PER_PGD];
unsigned long highmem; unsigned long highmem;
int kmalloc_ok = 0; int kmalloc_ok = 0;
...@@ -242,6 +242,7 @@ struct page *arch_validate(struct page *page, int mask, int order) ...@@ -242,6 +242,7 @@ struct page *arch_validate(struct page *page, int mask, int order)
} }
addr += PAGE_SIZE; addr += PAGE_SIZE;
} }
if(i == (1 << order)) return(page); if(i == (1 << order)) return(page);
page = alloc_pages(mask, order); page = alloc_pages(mask, order);
goto again; goto again;
...@@ -336,7 +337,7 @@ struct page *pte_alloc_one(struct mm_struct *mm, unsigned long address) ...@@ -336,7 +337,7 @@ struct page *pte_alloc_one(struct mm_struct *mm, unsigned long address)
{ {
struct page *pte; struct page *pte;
pte = alloc_pages(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO, 0); pte = alloc_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO);
return pte; return pte;
} }
......
...@@ -309,7 +309,7 @@ struct page *__virt_to_page(const unsigned long virt) ...@@ -309,7 +309,7 @@ struct page *__virt_to_page(const unsigned long virt)
return(&mem_map[__pa(virt) >> PAGE_SHIFT]); return(&mem_map[__pa(virt) >> PAGE_SHIFT]);
} }
unsigned long page_to_phys(struct page *page) phys_t page_to_phys(struct page *page)
{ {
return((page - mem_map) << PAGE_SHIFT); return((page - mem_map) << PAGE_SHIFT);
} }
...@@ -318,8 +318,9 @@ pte_t mk_pte(struct page *page, pgprot_t pgprot) ...@@ -318,8 +318,9 @@ pte_t mk_pte(struct page *page, pgprot_t pgprot)
{ {
pte_t pte; pte_t pte;
pte_val(pte) = page_to_phys(page) + pgprot_val(pgprot); pte_set_val(pte, page_to_phys(page), pgprot);
if(pte_present(pte)) pte_mknewprot(pte_mknewpage(pte)); if(pte_present(pte))
pte_mknewprot(pte_mknewpage(pte));
return(pte); return(pte);
} }
......
/* /*
* Copyright (C) 2002 Jeff Dike (jdike@karaya.com) * Copyright (C) 2002 Jeff Dike (jdike@karaya.com)
* Copyright 2003 PathScale, Inc.
* Licensed under the GPL * Licensed under the GPL
*/ */
...@@ -18,24 +19,69 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr, ...@@ -18,24 +19,69 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr,
unsigned long end_addr, int force) unsigned long end_addr, int force)
{ {
pgd_t *npgd; pgd_t *npgd;
pmd_t *npud; pud_t *npud;
pmd_t *npmd; pmd_t *npmd;
pte_t *npte; pte_t *npte;
unsigned long addr; unsigned long addr, end;
int r, w, x, err, fd; int r, w, x, err, fd;
if(mm == NULL) return; if(mm == NULL) return;
fd = mm->context.skas.mm_fd; fd = mm->context.skas.mm_fd;
for(addr = start_addr; addr < end_addr;){ for(addr = start_addr; addr < end_addr;){
npgd = pgd_offset(mm, addr); npgd = pgd_offset(mm, addr);
if(!pgd_present(*npgd)){
if(force || pgd_newpage(*npgd)){
end = addr + PGDIR_SIZE;
if(end > end_addr)
end = end_addr;
err = unmap(fd, (void *) addr, end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pgd_mkuptodate(*npgd);
}
addr += PGDIR_SIZE;
continue;
}
npud = pud_offset(npgd, addr); npud = pud_offset(npgd, addr);
if(!pud_present(*npud)){
if(force || pud_newpage(*npud)){
end = addr + PUD_SIZE;
if(end > end_addr)
end = end_addr;
err = unmap(fd, (void *) addr, end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pud_mkuptodate(*npud);
}
addr += PUD_SIZE;
continue;
}
npmd = pmd_offset(npud, addr); npmd = pmd_offset(npud, addr);
if(pmd_present(*npmd)){ if(!pmd_present(*npmd)){
if(force || pmd_newpage(*npmd)){
end = addr + PMD_SIZE;
if(end > end_addr)
end = end_addr;
err = unmap(fd, (void *) addr, end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pmd_mkuptodate(*npmd);
}
addr += PMD_SIZE;
continue;
}
npte = pte_offset_kernel(npmd, addr); npte = pte_offset_kernel(npmd, addr);
r = pte_read(*npte); r = pte_read(*npte);
w = pte_write(*npte); w = pte_write(*npte);
x = pte_exec(*npte); x = pte_exec(*npte);
if(!pte_dirty(*npte)) w = 0; if(!pte_dirty(*npte))
w = 0;
if(!pte_young(*npte)){ if(!pte_young(*npte)){
r = 0; r = 0;
w = 0; w = 0;
...@@ -43,39 +89,27 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr, ...@@ -43,39 +89,27 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr,
if(force || pte_newpage(*npte)){ if(force || pte_newpage(*npte)){
err = unmap(fd, (void *) addr, PAGE_SIZE); err = unmap(fd, (void *) addr, PAGE_SIZE);
if(err < 0) if(err < 0)
panic("munmap failed, errno = %d\n", panic("munmap failed, errno = %d\n", -err);
-err);
if(pte_present(*npte)) if(pte_present(*npte))
map(fd, addr, map(fd, addr, pte_val(*npte) & PAGE_MASK,
pte_val(*npte) & PAGE_MASK,
PAGE_SIZE, r, w, x); PAGE_SIZE, r, w, x);
} }
else if(pte_newprot(*npte)){ else if(pte_newprot(*npte))
protect(fd, addr, PAGE_SIZE, r, w, x, 1); protect(fd, addr, PAGE_SIZE, r, w, x, 1);
}
*npte = pte_mkuptodate(*npte); *npte = pte_mkuptodate(*npte);
addr += PAGE_SIZE; addr += PAGE_SIZE;
} }
else {
if(force || pmd_newpage(*npmd)){
err = unmap(fd, (void *) addr, PMD_SIZE);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pmd_mkuptodate(*npmd);
}
addr += PMD_SIZE;
}
}
} }
void flush_tlb_kernel_range_skas(unsigned long start, unsigned long end) void flush_tlb_kernel_range_skas(unsigned long start, unsigned long end)
{ {
struct mm_struct *mm; struct mm_struct *mm;
pgd_t *pgd; pgd_t *pgd;
pud_t *pud;
pmd_t *pmd; pmd_t *pmd;
pte_t *pte; pte_t *pte;
unsigned long addr; unsigned long addr, last;
int updated = 0, err; int updated = 0, err;
mm = &init_mm; mm = &init_mm;
...@@ -83,36 +117,71 @@ void flush_tlb_kernel_range_skas(unsigned long start, unsigned long end) ...@@ -83,36 +117,71 @@ void flush_tlb_kernel_range_skas(unsigned long start, unsigned long end)
pgd = pgd_offset(mm, addr); pgd = pgd_offset(mm, addr);
pud = pud_offset(pgd, addr); pud = pud_offset(pgd, addr);
pmd = pmd_offset(pud, addr); pmd = pmd_offset(pud, addr);
if(pmd_present(*pmd)){ if(!pgd_present(*pgd)){
pte = pte_offset_kernel(pmd, addr); if(pgd_newpage(*pgd)){
if(!pte_present(*pte) || pte_newpage(*pte)){
updated = 1; updated = 1;
last = addr + PGDIR_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr, err = os_unmap_memory((void *) addr,
PAGE_SIZE); last - addr);
if(err < 0) if(err < 0)
panic("munmap failed, errno = %d\n", panic("munmap failed, errno = %d\n",
-err); -err);
if(pte_present(*pte))
map_memory(addr,
pte_val(*pte) & PAGE_MASK,
PAGE_SIZE, 1, 1, 1);
} }
else if(pte_newprot(*pte)){ addr += PGDIR_SIZE;
continue;
}
pud = pud_offset(pgd, addr);
if(!pud_present(*pud)){
if(pud_newpage(*pud)){
updated = 1; updated = 1;
protect_memory(addr, PAGE_SIZE, 1, 1, 1, 1); last = addr + PUD_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr,
last - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
} }
addr += PAGE_SIZE; addr += PUD_SIZE;
continue;
} }
else {
pmd = pmd_offset(pud, addr);
if(!pmd_present(*pmd)){
if(pmd_newpage(*pmd)){ if(pmd_newpage(*pmd)){
updated = 1; updated = 1;
err = os_unmap_memory((void *) addr, PMD_SIZE); last = addr + PMD_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr,
last - addr);
if(err < 0) if(err < 0)
panic("munmap failed, errno = %d\n", panic("munmap failed, errno = %d\n",
-err); -err);
} }
addr += PMD_SIZE; addr += PMD_SIZE;
continue;
}
pte = pte_offset_kernel(pmd, addr);
if(!pte_present(*pte) || pte_newpage(*pte)){
updated = 1;
err = os_unmap_memory((void *) addr, PAGE_SIZE);
if(err < 0)
panic("munmap failed, errno = %d\n", -err);
if(pte_present(*pte))
map_memory(addr, pte_val(*pte) & PAGE_MASK,
PAGE_SIZE, 1, 1, 1);
}
else if(pte_newprot(*pte)){
updated = 1;
protect_memory(addr, PAGE_SIZE, 1, 1, 1, 1);
} }
addr += PAGE_SIZE;
} }
} }
......
...@@ -56,7 +56,7 @@ int handle_page_fault(unsigned long address, unsigned long ip, ...@@ -56,7 +56,7 @@ int handle_page_fault(unsigned long address, unsigned long ip,
if(is_write && !(vma->vm_flags & VM_WRITE)) if(is_write && !(vma->vm_flags & VM_WRITE))
goto out; goto out;
page = address & PAGE_MASK; page = address & PAGE_MASK;
pgd = pgd_offset(mm); pgd = pgd_offset(mm, page);
pud = pud_offset(pgd, page); pud = pud_offset(pgd, page);
pmd = pmd_offset(pud, page); pmd = pmd_offset(pud, page);
do { do {
...@@ -77,6 +77,9 @@ int handle_page_fault(unsigned long address, unsigned long ip, ...@@ -77,6 +77,9 @@ int handle_page_fault(unsigned long address, unsigned long ip,
default: default:
BUG(); BUG();
} }
pgd = pgd_offset(mm, page);
pud = pud_offset(pgd, page);
pmd = pmd_offset(pud, page);
pte = pte_offset_kernel(pmd, page); pte = pte_offset_kernel(pmd, page);
} while(!pte_present(*pte)); } while(!pte_present(*pte));
err = 0; err = 0;
......
/* /*
* Copyright (C) 2002 Jeff Dike (jdike@karaya.com) * Copyright (C) 2002 Jeff Dike (jdike@karaya.com)
* Copyright 2003 PathScale, Inc.
* Licensed under the GPL * Licensed under the GPL
*/ */
...@@ -22,7 +23,7 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr, ...@@ -22,7 +23,7 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr,
pud_t *npud; pud_t *npud;
pmd_t *npmd; pmd_t *npmd;
pte_t *npte; pte_t *npte;
unsigned long addr; unsigned long addr, end;
int r, w, x, err; int r, w, x, err;
if((current->thread.mode.tt.extern_pid != -1) && if((current->thread.mode.tt.extern_pid != -1) &&
...@@ -42,47 +43,82 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr, ...@@ -42,47 +43,82 @@ static void fix_range(struct mm_struct *mm, unsigned long start_addr,
addr = STACK_TOP - ABOVE_KMEM; addr = STACK_TOP - ABOVE_KMEM;
continue; continue;
} }
npgd = pgd_offset(mm, addr); npgd = pgd_offset(mm, addr);
if(!pgd_present(*npgd)){
if(force || pgd_newpage(*npgd)){
end = addr + PGDIR_SIZE;
if(end > end_addr)
end = end_addr;
err = os_unmap_memory((void *) addr,
end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pgd_mkuptodate(*npgd);
}
addr += PGDIR_SIZE;
continue;
}
npud = pud_offset(npgd, addr); npud = pud_offset(npgd, addr);
if(!pud_present(*npud)){
if(force || pud_newpage(*npud)){
end = addr + PUD_SIZE;
if(end > end_addr)
end = end_addr;
err = os_unmap_memory((void *) addr,
end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pud_mkuptodate(*npud);
}
addr += PUD_SIZE;
continue;
}
npmd = pmd_offset(npud, addr); npmd = pmd_offset(npud, addr);
if(pmd_present(*npmd)){ if(!pmd_present(*npmd)){
if(force || pmd_newpage(*npmd)){
end = addr + PMD_SIZE;
if(end > end_addr)
end = end_addr;
err = os_unmap_memory((void *) addr,
end - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pmd_mkuptodate(*npmd);
}
addr += PMD_SIZE;
continue;
}
npte = pte_offset_kernel(npmd, addr); npte = pte_offset_kernel(npmd, addr);
r = pte_read(*npte); r = pte_read(*npte);
w = pte_write(*npte); w = pte_write(*npte);
x = pte_exec(*npte); x = pte_exec(*npte);
if(!pte_dirty(*npte)) w = 0; if(!pte_dirty(*npte))
w = 0;
if(!pte_young(*npte)){ if(!pte_young(*npte)){
r = 0; r = 0;
w = 0; w = 0;
} }
if(force || pte_newpage(*npte)){ if(force || pte_newpage(*npte)){
err = os_unmap_memory((void *) addr, err = os_unmap_memory((void *) addr, PAGE_SIZE);
PAGE_SIZE);
if(err < 0) if(err < 0)
panic("munmap failed, errno = %d\n", panic("munmap failed, errno = %d\n", -err);
-err);
if(pte_present(*npte)) if(pte_present(*npte))
map_memory(addr, map_memory(addr, pte_val(*npte) & PAGE_MASK,
pte_val(*npte) & PAGE_MASK,
PAGE_SIZE, r, w, x); PAGE_SIZE, r, w, x);
} }
else if(pte_newprot(*npte)){ else if(pte_newprot(*npte))
protect_memory(addr, PAGE_SIZE, r, w, x, 1); protect_memory(addr, PAGE_SIZE, r, w, x, 1);
}
*npte = pte_mkuptodate(*npte); *npte = pte_mkuptodate(*npte);
addr += PAGE_SIZE; addr += PAGE_SIZE;
} }
else {
if(force || pmd_newpage(*npmd)){
err = os_unmap_memory((void *) addr, PMD_SIZE);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
pmd_mkuptodate(*npmd);
}
addr += PMD_SIZE;
}
}
} }
atomic_t vmchange_seq = ATOMIC_INIT(1); atomic_t vmchange_seq = ATOMIC_INIT(1);
...@@ -92,18 +128,65 @@ static void flush_kernel_vm_range(unsigned long start, unsigned long end, ...@@ -92,18 +128,65 @@ static void flush_kernel_vm_range(unsigned long start, unsigned long end,
{ {
struct mm_struct *mm; struct mm_struct *mm;
pgd_t *pgd; pgd_t *pgd;
pud_t *pmd; pud_t *pud;
pmd_t *pmd; pmd_t *pmd;
pte_t *pte; pte_t *pte;
unsigned long addr; unsigned long addr, last;
int updated = 0, err; int updated = 0, err;
mm = &init_mm; mm = &init_mm;
for(addr = start; addr < end;){ for(addr = start; addr < end;){
pgd = pgd_offset(mm, addr); pgd = pgd_offset(mm, addr);
if(!pgd_present(*pgd)){
if(pgd_newpage(*pgd)){
updated = 1;
last = addr + PGDIR_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr,
last - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
}
addr += PGDIR_SIZE;
continue;
}
pud = pud_offset(pgd, addr); pud = pud_offset(pgd, addr);
if(!pud_present(*pud)){
if(pud_newpage(*pud)){
updated = 1;
last = addr + PUD_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr,
last - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
}
addr += PUD_SIZE;
continue;
}
pmd = pmd_offset(pud, addr); pmd = pmd_offset(pud, addr);
if(pmd_present(*pmd)){ if(!pmd_present(*pmd)){
if(pmd_newpage(*pmd)){
updated = 1;
last = addr + PMD_SIZE;
if(last > end)
last = end;
err = os_unmap_memory((void *) addr,
last - addr);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
}
addr += PMD_SIZE;
continue;
}
pte = pte_offset_kernel(pmd, addr); pte = pte_offset_kernel(pmd, addr);
if(!pte_present(*pte) || pte_newpage(*pte)){ if(!pte_present(*pte) || pte_newpage(*pte)){
updated = 1; updated = 1;
...@@ -123,17 +206,6 @@ static void flush_kernel_vm_range(unsigned long start, unsigned long end, ...@@ -123,17 +206,6 @@ static void flush_kernel_vm_range(unsigned long start, unsigned long end,
} }
addr += PAGE_SIZE; addr += PAGE_SIZE;
} }
else {
if(pmd_newpage(*pmd)){
updated = 1;
err = os_unmap_memory((void *) addr, PMD_SIZE);
if(err < 0)
panic("munmap failed, errno = %d\n",
-err);
}
addr += PMD_SIZE;
}
}
if(updated && update_seq) atomic_inc(&vmchange_seq); if(updated && update_seq) atomic_inc(&vmchange_seq);
} }
......
/* /*
* Copyright (C) 2000 - 2003 Jeff Dike (jdike@addtoit.com) * Copyright (C) 2000 - 2003 Jeff Dike (jdike@addtoit.com)
* Copyright 2003 PathScale, Inc.
* Licensed under the GPL * Licensed under the GPL
*/ */
...@@ -8,18 +9,82 @@ ...@@ -8,18 +9,82 @@
struct page; struct page;
#include "asm/arch/page.h" #include <linux/config.h>
#include <asm/vm-flags.h>
#undef __pa /* PAGE_SHIFT determines the page size */
#undef __va #define PAGE_SHIFT 12
#undef pfn_to_page #define PAGE_SIZE (1UL << PAGE_SHIFT)
#undef page_to_pfn #define PAGE_MASK (~(PAGE_SIZE-1))
#undef virt_to_page
#undef pfn_valid /*
#undef virt_addr_valid * These are used to make use of C type-checking..
#undef VALID_PAGE */
#undef PAGE_OFFSET
#undef KERNELBASE #define clear_page(page) memset((void *)(page), 0, PAGE_SIZE)
#define copy_page(to,from) memcpy((void *)(to), (void *)(from), PAGE_SIZE)
#define clear_user_page(page, vaddr, pg) clear_page(page)
#define copy_user_page(to, from, vaddr, pg) copy_page(to, from)
#if defined(CONFIG_3_LEVEL_PGTABLES) && !defined(CONFIG_64_BIT)
typedef struct { unsigned long pte_low, pte_high; } pte_t;
typedef struct { unsigned long long pmd; } pmd_t;
typedef struct { unsigned long pgd; } pgd_t;
#define pte_val(x) ((x).pte_low | ((unsigned long long) (x).pte_high << 32))
#define pte_get_bits(pte, bits) ((pte).pte_low & (bits))
#define pte_set_bits(pte, bits) ((pte).pte_low |= (bits))
#define pte_clear_bits(pte, bits) ((pte).pte_low &= ~(bits))
#define pte_copy(to, from) ({ (to).pte_high = (from).pte_high; \
smp_wmb(); \
(to).pte_low = (from).pte_low; })
#define pte_is_zero(pte) (!((pte).pte_low & ~_PAGE_NEWPAGE) && !(pte).pte_high)
#define pte_set_val(pte, phys, prot) \
({ (pte).pte_high = (phys) >> 32; \
(pte).pte_low = (phys) | pgprot_val(prot); })
typedef unsigned long long pfn_t;
typedef unsigned long long phys_t;
#else
typedef struct { unsigned long pte; } pte_t;
typedef struct { unsigned long pgd; } pgd_t;
#ifdef CONFIG_3_LEVEL_PGTABLES
typedef struct { unsigned long pmd; } pmd_t;
#define pmd_val(x) ((x).pmd)
#define __pmd(x) ((pmd_t) { (x) } )
#endif
#define pte_val(x) ((x).pte)
#define pte_get_bits(p, bits) ((p).pte & (bits))
#define pte_set_bits(p, bits) ((p).pte |= (bits))
#define pte_clear_bits(p, bits) ((p).pte &= ~(bits))
#define pte_copy(to, from) ((to).pte = (from).pte)
#define pte_is_zero(p) (!((p).pte & ~_PAGE_NEWPAGE))
#define pte_set_val(p, phys, prot) (p).pte = (phys | pgprot_val(prot))
typedef unsigned long pfn_t;
typedef unsigned long phys_t;
#endif
typedef struct { unsigned long pgprot; } pgprot_t;
#define pgd_val(x) ((x).pgd)
#define pgprot_val(x) ((x).pgprot)
#define __pte(x) ((pte_t) { (x) } )
#define __pgd(x) ((pgd_t) { (x) } )
#define __pgprot(x) ((pgprot_t) { (x) } )
/* to align the pointer to the (next) page boundary */
#define PAGE_ALIGN(addr) (((addr)+PAGE_SIZE-1)&PAGE_MASK)
extern unsigned long uml_physmem; extern unsigned long uml_physmem;
...@@ -30,7 +95,6 @@ extern unsigned long uml_physmem; ...@@ -30,7 +95,6 @@ extern unsigned long uml_physmem;
extern unsigned long to_phys(void *virt); extern unsigned long to_phys(void *virt);
extern void *to_virt(unsigned long phys); extern void *to_virt(unsigned long phys);
#define __pa(virt) to_phys((void *) virt) #define __pa(virt) to_phys((void *) virt)
#define __va(phys) to_virt((unsigned long) phys) #define __va(phys) to_virt((unsigned long) phys)
...@@ -43,6 +107,20 @@ extern void *to_virt(unsigned long phys); ...@@ -43,6 +107,20 @@ extern void *to_virt(unsigned long phys);
#define pfn_valid(pfn) ((pfn) < max_mapnr) #define pfn_valid(pfn) ((pfn) < max_mapnr)
#define virt_addr_valid(v) pfn_valid(phys_to_pfn(__pa(v))) #define virt_addr_valid(v) pfn_valid(phys_to_pfn(__pa(v)))
/* Pure 2^n version of get_order */
static __inline__ int get_order(unsigned long size)
{
int order;
size = (size-1) >> (PAGE_SHIFT-1);
order = -1;
do {
size >>= 1;
order++;
} while (size);
return order;
}
extern struct page *arch_validate(struct page *page, int mask, int order); extern struct page *arch_validate(struct page *page, int mask, int order);
#define HAVE_ARCH_VALIDATE #define HAVE_ARCH_VALIDATE
......
/* /*
* Copyright (C) 2000, 2001, 2002 Jeff Dike (jdike@karaya.com) * Copyright (C) 2000, 2001, 2002 Jeff Dike (jdike@karaya.com)
* Copyright 2003 PathScale, Inc.
* Derived from include/asm-i386/pgalloc.h and include/asm-i386/pgtable.h * Derived from include/asm-i386/pgalloc.h and include/asm-i386/pgtable.h
* Licensed under the GPL * Licensed under the GPL
*/ */
...@@ -7,6 +8,7 @@ ...@@ -7,6 +8,7 @@
#ifndef __UM_PGALLOC_H #ifndef __UM_PGALLOC_H
#define __UM_PGALLOC_H #define __UM_PGALLOC_H
#include "linux/config.h"
#include "linux/mm.h" #include "linux/mm.h"
#include "asm/fixmap.h" #include "asm/fixmap.h"
...@@ -39,15 +41,13 @@ static inline void pte_free(struct page *pte) ...@@ -39,15 +41,13 @@ static inline void pte_free(struct page *pte)
#define __pte_free_tlb(tlb,pte) tlb_remove_page((tlb),(pte)) #define __pte_free_tlb(tlb,pte) tlb_remove_page((tlb),(pte))
#ifdef CONFIG_3_LEVEL_PGTABLES
/* /*
* allocating and freeing a pmd is trivial: the 1-entry pmd is * In the 3-level case we free the pmds as part of the pgd.
* inside the pgd, so has no extra memory associated with it.
*/ */
#define pmd_alloc_one(mm, addr) ({ BUG(); ((pmd_t *)2); })
#define pmd_free(x) do { } while (0) #define pmd_free(x) do { } while (0)
#define __pmd_free_tlb(tlb,x) do { } while (0) #define __pmd_free_tlb(tlb,x) do { } while (0)
#define pud_populate(mm, pmd, pte) BUG() #endif
#define check_pgt_cache() do { } while (0) #define check_pgt_cache() do { } while (0)
......
/*
* Copyright (C) 2000, 2001, 2002 Jeff Dike (jdike@karaya.com)
* Copyright 2003 PathScale, Inc.
* Derived from include/asm-i386/pgtable.h
* Licensed under the GPL
*/
#ifndef __UM_PGTABLE_2LEVEL_H
#define __UM_PGTABLE_2LEVEL_H
#include <asm-generic/pgtable-nopmd.h>
/* PGDIR_SHIFT determines what a third-level page table entry can map */
#define PGDIR_SHIFT 22
#define PGDIR_SIZE (1UL << PGDIR_SHIFT)
#define PGDIR_MASK (~(PGDIR_SIZE-1))
/*
* entries per page directory level: the i386 is two-level, so
* we don't really have any PMD directory physically.
*/
#define PTRS_PER_PTE 1024
#define PTRS_PER_PMD 1
#define USER_PTRS_PER_PGD ((TASK_SIZE + (PGDIR_SIZE - 1)) / PGDIR_SIZE)
#define PTRS_PER_PGD 1024
#define FIRST_USER_PGD_NR 0
#define pte_ERROR(e) \
printk("%s:%d: bad pte %p(%08lx).\n", __FILE__, __LINE__, &(e), \
pte_val(e))
#define pgd_ERROR(e) \
printk("%s:%d: bad pgd %p(%08lx).\n", __FILE__, __LINE__, &(e), \
pgd_val(e))
static inline int pgd_newpage(pgd_t pgd) { return 0; }
static inline void pgd_mkuptodate(pgd_t pgd) { }
#define pte_present(x) (pte_val(x) & (_PAGE_PRESENT | _PAGE_PROTNONE))
static inline pte_t pte_mknewprot(pte_t pte)
{
pte_val(pte) |= _PAGE_NEWPROT;
return(pte);
}
static inline pte_t pte_mknewpage(pte_t pte)
{
pte_val(pte) |= _PAGE_NEWPAGE;
return(pte);
}
static inline void set_pte(pte_t *pteptr, pte_t pteval)
{
/* If it's a swap entry, it needs to be marked _PAGE_NEWPAGE so
* fix_range knows to unmap it. _PAGE_NEWPROT is specific to
* mapped pages.
*/
*pteptr = pte_mknewpage(pteval);
if(pte_present(*pteptr)) *pteptr = pte_mknewprot(*pteptr);
}
#define set_pmd(pmdptr, pmdval) (*(pmdptr) = (pmdval))
#define pte_page(x) pfn_to_page(pte_pfn(x))
#define pte_none(x) !(pte_val(x) & ~_PAGE_NEWPAGE)
#define pte_pfn(x) phys_to_pfn(pte_val(x))
#define pfn_pte(pfn, prot) __pte(pfn_to_phys(pfn) | pgprot_val(prot))
#define pfn_pmd(pfn, prot) __pmd(pfn_to_phys(pfn) | pgprot_val(prot))
#define pmd_page_kernel(pmd) \
((unsigned long) __va(pmd_val(pmd) & PAGE_MASK))
/*
* Bits 0 through 3 are taken
*/
#define PTE_FILE_MAX_BITS 28
#define pte_to_pgoff(pte) (pte_val(pte) >> 4)
#define pgoff_to_pte(off) ((pte_t) { ((off) << 4) + _PAGE_FILE })
#endif
/*
* Copyright 2003 PathScale Inc
* Derived from include/asm-i386/pgtable.h
* Licensed under the GPL
*/
#ifndef __UM_PGTABLE_3LEVEL_H
#define __UM_PGTABLE_3LEVEL_H
#include <asm-generic/pgtable-nopud.h>
/* PGDIR_SHIFT determines what a third-level page table entry can map */
#define PGDIR_SHIFT 30
#define PGDIR_SIZE (1UL << PGDIR_SHIFT)
#define PGDIR_MASK (~(PGDIR_SIZE-1))
/* PMD_SHIFT determines the size of the area a second-level page table can
* map
*/
#define PMD_SHIFT 21
#define PMD_SIZE (1UL << PMD_SHIFT)
#define PMD_MASK (~(PMD_SIZE-1))
/*
* entries per page directory level
*/
#define PTRS_PER_PTE 512
#define PTRS_PER_PMD 512
#define USER_PTRS_PER_PGD ((TASK_SIZE + (PGDIR_SIZE - 1)) / PGDIR_SIZE)
#define PTRS_PER_PGD 512
#define FIRST_USER_PGD_NR 0
#define pte_ERROR(e) \
printk("%s:%d: bad pte %p(%016lx).\n", __FILE__, __LINE__, &(e), \
pte_val(e))
#define pmd_ERROR(e) \
printk("%s:%d: bad pmd %p(%016lx).\n", __FILE__, __LINE__, &(e), \
pmd_val(e))
#define pgd_ERROR(e) \
printk("%s:%d: bad pgd %p(%016lx).\n", __FILE__, __LINE__, &(e), \
pgd_val(e))
#define pud_none(x) (!(pud_val(x) & ~_PAGE_NEWPAGE))
#define pud_bad(x) ((pud_val(x) & (~PAGE_MASK & ~_PAGE_USER)) != _KERNPG_TABLE)
#define pud_present(x) (pud_val(x) & _PAGE_PRESENT)
#define pud_populate(mm, pud, pmd) \
set_pud(pud, __pud(_PAGE_TABLE + __pa(pmd)))
#define set_pud(pudptr, pudval) set_64bit((phys_t *) (pudptr), pud_val(pudval))
static inline int pgd_newpage(pgd_t pgd)
{
return(pgd_val(pgd) & _PAGE_NEWPAGE);
}
static inline void pgd_mkuptodate(pgd_t pgd) { pgd_val(pgd) &= ~_PAGE_NEWPAGE; }
#define pte_present(x) pte_get_bits(x, (_PAGE_PRESENT | _PAGE_PROTNONE))
static inline pte_t pte_mknewprot(pte_t pte)
{
pte_set_bits(pte, _PAGE_NEWPROT);
return(pte);
}
static inline pte_t pte_mknewpage(pte_t pte)
{
pte_set_bits(pte, _PAGE_NEWPAGE);
return(pte);
}
static inline void set_pte(pte_t *pteptr, pte_t pteval)
{
pte_copy(*pteptr, pteval);
/* If it's a swap entry, it needs to be marked _PAGE_NEWPAGE so
* fix_range knows to unmap it. _PAGE_NEWPROT is specific to
* mapped pages.
*/
*pteptr = pte_mknewpage(*pteptr);
if(pte_present(*pteptr)) *pteptr = pte_mknewprot(*pteptr);
}
#define set_pmd(pmdptr, pmdval) set_64bit((phys_t *) (pmdptr), pmd_val(pmdval))
static inline pmd_t *pmd_alloc_one(struct mm_struct *mm, unsigned long address)
{
pmd_t *pmd = (pmd_t *) __get_free_page(GFP_KERNEL);
if(pmd)
memset(pmd, 0, PAGE_SIZE);
return pmd;
}
static inline void pmd_free(pmd_t *pmd){
free_page((unsigned long) pmd);
}
#define __pmd_free_tlb(tlb,x) do { } while (0)
static inline void pud_clear (pud_t * pud) { }
#define pud_page(pud) \
((struct page *) __va(pud_val(pud) & PAGE_MASK))
/* Find an entry in the second-level page table.. */
#define pmd_offset(pud, address) ((pmd_t *) pud_page(*(pud)) + \
pmd_index(address))
#define pte_page(x) pfn_to_page(pte_pfn(x))
static inline int pte_none(pte_t pte)
{
return pte_is_zero(pte);
}
static inline unsigned long pte_pfn(pte_t pte)
{
return phys_to_pfn(pte_val(pte));
}
static inline pte_t pfn_pte(pfn_t page_nr, pgprot_t pgprot)
{
pte_t pte;
phys_t phys = pfn_to_phys(page_nr);
pte_set_val(pte, phys, pgprot);
return pte;
}
static inline pmd_t pfn_pmd(pfn_t page_nr, pgprot_t pgprot)
{
return __pmd((page_nr << PAGE_SHIFT) | pgprot_val(pgprot));
}
/*
* Bits 0 through 3 are taken in the low part of the pte,
* put the 32 bits of offset into the high part.
*/
#define PTE_FILE_MAX_BITS 32
#ifdef CONFIG_64_BIT
#define pte_to_pgoff(p) ((p).pte >> 32)
#define pgoff_to_pte(off) ((pte_t) { ((off) < 32) | _PAGE_FILE })
#else
#define pte_to_pgoff(pte) ((pte).pte_high)
#define pgoff_to_pte(off) ((pte_t) { _PAGE_FILE, (off) })
#endif
#endif
/*
* Overrides for Emacs so that we follow Linus's tabbing style.
* Emacs will notice this stuff at the end of the file and automatically
* adjust the settings for this buffer only. This must remain at the end
* of the file.
* ---------------------------------------------------------------------------
* Local variables:
* c-file-style: "linux"
* End:
*/
This diff is collapsed.
/*
* Copyright (C) 2004 Jeff Dike (jdike@addtoit.com)
* Licensed under the GPL
*/
#ifndef __VM_FLAGS_I386_H
#define __VM_FLAGS_I386_H
#define VM_DATA_DEFAULT_FLAGS \
(VM_READ | VM_WRITE | \
((current->personality & READ_IMPLIES_EXEC) ? VM_EXEC : 0 ) | \
VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC)
#endif
/*
* Copyright (C) 2004 Jeff Dike (jdike@addtoit.com)
* Copyright 2003 PathScale, Inc.
* Licensed under the GPL
*/
#ifndef __VM_FLAGS_X86_64_H
#define __VM_FLAGS_X86_64_H
#define __VM_DATA_DEFAULT_FLAGS (VM_READ | VM_WRITE | VM_EXEC | \
VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC)
#define __VM_STACK_FLAGS (VM_GROWSDOWN | VM_READ | VM_WRITE | \
VM_EXEC | VM_MAYREAD | VM_MAYWRITE | \
VM_MAYEXEC)
extern unsigned long vm_stack_flags, vm_stack_flags32;
extern unsigned long vm_data_default_flags, vm_data_default_flags32;
extern unsigned long vm_force_exec32;
#define VM_DATA_DEFAULT_FLAGS \
(test_thread_flag(TIF_IA32) ? vm_data_default_flags32 : \
vm_data_default_flags)
#define VM_STACK_DEFAULT_FLAGS \
(test_thread_flag(TIF_IA32) ? vm_stack_flags32 : vm_stack_flags)
#endif
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment