提交 d75586ad 编写于 作者: S Shaohua Li 提交者: Ingo Molnar

x86, pageattr: introduce APIs to change pageattr of a page array

Add array-based interface APIs for pageattr. Page-based cache flushing is
quite slow for a large number of pages, so when 1024 or more pages (4M) are
changed the patch uses wbinvd() instead. In a simple test (running a 3D game,
OpenArena), nearly all AGP memory allocations were small (< 1M), so this is
not expected to impact runtime performance.
Signed-off-by: Dave Airlie <airlied@gmail.com>
Signed-off-by: Shaohua Li <shaohua.li@intel.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
上级 cacf8906
...@@ -25,15 +25,19 @@ ...@@ -25,15 +25,19 @@
* The current flushing context - we pass it instead of 5 arguments: * The current flushing context - we pass it instead of 5 arguments:
*/ */
struct cpa_data { struct cpa_data {
unsigned long vaddr; unsigned long *vaddr;
pgprot_t mask_set; pgprot_t mask_set;
pgprot_t mask_clr; pgprot_t mask_clr;
int numpages; int numpages;
int flushtlb; int flags;
unsigned long pfn; unsigned long pfn;
unsigned force_split : 1; unsigned force_split : 1;
int curpage;
}; };
#define CPA_FLUSHTLB 1
#define CPA_ARRAY 2
#ifdef CONFIG_PROC_FS #ifdef CONFIG_PROC_FS
static unsigned long direct_pages_count[PG_LEVEL_NUM]; static unsigned long direct_pages_count[PG_LEVEL_NUM];
...@@ -184,6 +188,41 @@ static void cpa_flush_range(unsigned long start, int numpages, int cache) ...@@ -184,6 +188,41 @@ static void cpa_flush_range(unsigned long start, int numpages, int cache)
} }
} }
/*
 * Flush TLBs and, if @cache is set, the CPU caches for an array of
 * page-aligned virtual addresses.
 *
 * @start:    array of virtual addresses, one entry per page
 * @numpages: number of entries in @start
 * @cache:    non-zero when the cache attributes changed and the data
 *            caches must be flushed as well
 *
 * Must be called with interrupts enabled (cross-CPU calls are issued).
 */
static void cpa_flush_array(unsigned long *start, int numpages, int cache)
{
	unsigned int level;
	unsigned long *addr;
	int i;

	BUG_ON(irqs_disabled());

	/*
	 * 4M threshold: flushing that many pages line by line is slower
	 * than writing back the whole cache.  wbinvd only acts on the CPU
	 * that executes it, so it has to be issued on every CPU rather
	 * than just the local one.  cpa_flush_all() is the same fallback
	 * change_page_attr_set_clr() uses in place of a range flush; it is
	 * expected to flush the TLBs and write back the caches on all CPUs
	 * (NOTE(review): confirm against its definition).
	 */
	if (cache && numpages >= 1024) {
		cpa_flush_all(cache);
		return;
	}

	on_each_cpu(__cpa_flush_range, NULL, 1);

	if (!cache)
		return;

	/*
	 * We only need to flush on one CPU,
	 * clflush is a MESI-coherent instruction that
	 * will cause all other CPUs to flush the same
	 * cachelines:
	 */
	for (i = 0, addr = start; i < numpages; i++, addr++) {
		pte_t *pte = lookup_address(*addr, &level);

		/*
		 * Only flush present addresses:
		 */
		if (pte && (pte_val(*pte) & _PAGE_PRESENT))
			clflush_cache_range((void *) *addr, PAGE_SIZE);
	}
}
/* /*
* Certain areas of memory on x86 require very specific protection flags, * Certain areas of memory on x86 require very specific protection flags,
* for example the BIOS area or kernel text. Callers don't always get this * for example the BIOS area or kernel text. Callers don't always get this
...@@ -392,7 +431,7 @@ try_preserve_large_page(pte_t *kpte, unsigned long address, ...@@ -392,7 +431,7 @@ try_preserve_large_page(pte_t *kpte, unsigned long address,
*/ */
new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot)); new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot));
__set_pmd_pte(kpte, address, new_pte); __set_pmd_pte(kpte, address, new_pte);
cpa->flushtlb = 1; cpa->flags |= CPA_FLUSHTLB;
do_split = 0; do_split = 0;
} }
...@@ -578,11 +617,16 @@ static int split_large_page(pte_t *kpte, unsigned long address) ...@@ -578,11 +617,16 @@ static int split_large_page(pte_t *kpte, unsigned long address)
static int __change_page_attr(struct cpa_data *cpa, int primary) static int __change_page_attr(struct cpa_data *cpa, int primary)
{ {
unsigned long address = cpa->vaddr; unsigned long address;
int do_split, err; int do_split, err;
unsigned int level; unsigned int level;
pte_t *kpte, old_pte; pte_t *kpte, old_pte;
if (cpa->flags & CPA_ARRAY)
address = cpa->vaddr[cpa->curpage];
else
address = *cpa->vaddr;
repeat: repeat:
kpte = lookup_address(address, &level); kpte = lookup_address(address, &level);
if (!kpte) if (!kpte)
...@@ -594,8 +638,8 @@ static int __change_page_attr(struct cpa_data *cpa, int primary) ...@@ -594,8 +638,8 @@ static int __change_page_attr(struct cpa_data *cpa, int primary)
return 0; return 0;
printk(KERN_WARNING "CPA: called for zero pte. " printk(KERN_WARNING "CPA: called for zero pte. "
"vaddr = %lx cpa->vaddr = %lx\n", address, "vaddr = %lx cpa->vaddr = %lx\n", address,
cpa->vaddr);
WARN_ON(1); WARN_ON(1);
*cpa->vaddr);
return -EINVAL; return -EINVAL;
} }
...@@ -621,7 +665,7 @@ static int __change_page_attr(struct cpa_data *cpa, int primary) ...@@ -621,7 +665,7 @@ static int __change_page_attr(struct cpa_data *cpa, int primary)
*/ */
if (pte_val(old_pte) != pte_val(new_pte)) { if (pte_val(old_pte) != pte_val(new_pte)) {
set_pte_atomic(kpte, new_pte); set_pte_atomic(kpte, new_pte);
cpa->flushtlb = 1; cpa->flags |= CPA_FLUSHTLB;
} }
cpa->numpages = 1; cpa->numpages = 1;
return 0; return 0;
...@@ -645,7 +689,7 @@ static int __change_page_attr(struct cpa_data *cpa, int primary) ...@@ -645,7 +689,7 @@ static int __change_page_attr(struct cpa_data *cpa, int primary)
*/ */
err = split_large_page(kpte, address); err = split_large_page(kpte, address);
if (!err) { if (!err) {
cpa->flushtlb = 1; cpa->flags |= CPA_FLUSHTLB;
goto repeat; goto repeat;
} }
...@@ -658,6 +702,7 @@ static int cpa_process_alias(struct cpa_data *cpa) ...@@ -658,6 +702,7 @@ static int cpa_process_alias(struct cpa_data *cpa)
{ {
struct cpa_data alias_cpa; struct cpa_data alias_cpa;
int ret = 0; int ret = 0;
unsigned long temp_cpa_vaddr, vaddr;
if (cpa->pfn >= max_pfn_mapped) if (cpa->pfn >= max_pfn_mapped)
return 0; return 0;
...@@ -670,16 +715,24 @@ static int cpa_process_alias(struct cpa_data *cpa) ...@@ -670,16 +715,24 @@ static int cpa_process_alias(struct cpa_data *cpa)
* No need to redo, when the primary call touched the direct * No need to redo, when the primary call touched the direct
* mapping already: * mapping already:
*/ */
if (!(within(cpa->vaddr, PAGE_OFFSET, if (cpa->flags & CPA_ARRAY)
vaddr = cpa->vaddr[cpa->curpage];
else
vaddr = *cpa->vaddr;
if (!(within(vaddr, PAGE_OFFSET,
PAGE_OFFSET + (max_low_pfn_mapped << PAGE_SHIFT)) PAGE_OFFSET + (max_low_pfn_mapped << PAGE_SHIFT))
#ifdef CONFIG_X86_64 #ifdef CONFIG_X86_64
|| within(cpa->vaddr, PAGE_OFFSET + (1UL<<32), || within(vaddr, PAGE_OFFSET + (1UL<<32),
PAGE_OFFSET + (max_pfn_mapped << PAGE_SHIFT)) PAGE_OFFSET + (max_pfn_mapped << PAGE_SHIFT))
#endif #endif
)) { )) {
alias_cpa = *cpa; alias_cpa = *cpa;
alias_cpa.vaddr = (unsigned long) __va(cpa->pfn << PAGE_SHIFT); temp_cpa_vaddr = (unsigned long) __va(cpa->pfn << PAGE_SHIFT);
alias_cpa.vaddr = &temp_cpa_vaddr;
alias_cpa.flags &= ~CPA_ARRAY;
ret = __change_page_attr_set_clr(&alias_cpa, 0); ret = __change_page_attr_set_clr(&alias_cpa, 0);
} }
...@@ -691,7 +744,7 @@ static int cpa_process_alias(struct cpa_data *cpa) ...@@ -691,7 +744,7 @@ static int cpa_process_alias(struct cpa_data *cpa)
* No need to redo, when the primary call touched the high * No need to redo, when the primary call touched the high
* mapping already: * mapping already:
*/ */
if (within(cpa->vaddr, (unsigned long) _text, (unsigned long) _end)) if (within(vaddr, (unsigned long) _text, (unsigned long) _end))
return 0; return 0;
/* /*
...@@ -702,8 +755,9 @@ static int cpa_process_alias(struct cpa_data *cpa) ...@@ -702,8 +755,9 @@ static int cpa_process_alias(struct cpa_data *cpa)
return 0; return 0;
alias_cpa = *cpa; alias_cpa = *cpa;
alias_cpa.vaddr = temp_cpa_vaddr = (cpa->pfn << PAGE_SHIFT) + __START_KERNEL_map - phys_base;
(cpa->pfn << PAGE_SHIFT) + __START_KERNEL_map - phys_base; alias_cpa.vaddr = &temp_cpa_vaddr;
alias_cpa.flags &= ~CPA_ARRAY;
/* /*
* The high mapping range is imprecise, so ignore the return value. * The high mapping range is imprecise, so ignore the return value.
...@@ -723,6 +777,9 @@ static int __change_page_attr_set_clr(struct cpa_data *cpa, int checkalias) ...@@ -723,6 +777,9 @@ static int __change_page_attr_set_clr(struct cpa_data *cpa, int checkalias)
* preservation check. * preservation check.
*/ */
cpa->numpages = numpages; cpa->numpages = numpages;
/* for array changes, we can't use large page */
if (cpa->flags & CPA_ARRAY)
cpa->numpages = 1;
ret = __change_page_attr(cpa, checkalias); ret = __change_page_attr(cpa, checkalias);
if (ret) if (ret)
...@@ -741,7 +798,11 @@ static int __change_page_attr_set_clr(struct cpa_data *cpa, int checkalias) ...@@ -741,7 +798,11 @@ static int __change_page_attr_set_clr(struct cpa_data *cpa, int checkalias)
*/ */
BUG_ON(cpa->numpages > numpages); BUG_ON(cpa->numpages > numpages);
numpages -= cpa->numpages; numpages -= cpa->numpages;
cpa->vaddr += cpa->numpages * PAGE_SIZE; if (cpa->flags & CPA_ARRAY)
cpa->curpage++;
else
*cpa->vaddr += cpa->numpages * PAGE_SIZE;
} }
return 0; return 0;
} }
...@@ -752,9 +813,9 @@ static inline int cache_attr(pgprot_t attr) ...@@ -752,9 +813,9 @@ static inline int cache_attr(pgprot_t attr)
(_PAGE_PAT | _PAGE_PAT_LARGE | _PAGE_PWT | _PAGE_PCD); (_PAGE_PAT | _PAGE_PAT_LARGE | _PAGE_PWT | _PAGE_PCD);
} }
static int change_page_attr_set_clr(unsigned long addr, int numpages, static int change_page_attr_set_clr(unsigned long *addr, int numpages,
pgprot_t mask_set, pgprot_t mask_clr, pgprot_t mask_set, pgprot_t mask_clr,
int force_split) int force_split, int array)
{ {
struct cpa_data cpa; struct cpa_data cpa;
int ret, cache, checkalias; int ret, cache, checkalias;
...@@ -769,12 +830,22 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages, ...@@ -769,12 +830,22 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages,
return 0; return 0;
/* Ensure we are PAGE_SIZE aligned */ /* Ensure we are PAGE_SIZE aligned */
if (addr & ~PAGE_MASK) { if (!array) {
addr &= PAGE_MASK; if (*addr & ~PAGE_MASK) {
/* *addr &= PAGE_MASK;
* People should not be passing in unaligned addresses: /*
*/ * People should not be passing in unaligned addresses:
WARN_ON_ONCE(1); */
WARN_ON_ONCE(1);
}
} else {
int i;
for (i = 0; i < numpages; i++) {
if (addr[i] & ~PAGE_MASK) {
addr[i] &= PAGE_MASK;
WARN_ON_ONCE(1);
}
}
} }
/* Must avoid aliasing mappings in the highmem code */ /* Must avoid aliasing mappings in the highmem code */
...@@ -784,9 +855,13 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages, ...@@ -784,9 +855,13 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages,
cpa.numpages = numpages; cpa.numpages = numpages;
cpa.mask_set = mask_set; cpa.mask_set = mask_set;
cpa.mask_clr = mask_clr; cpa.mask_clr = mask_clr;
cpa.flushtlb = 0; cpa.flags = 0;
cpa.curpage = 0;
cpa.force_split = force_split; cpa.force_split = force_split;
if (array)
cpa.flags |= CPA_ARRAY;
/* No alias checking for _NX bit modifications */ /* No alias checking for _NX bit modifications */
checkalias = (pgprot_val(mask_set) | pgprot_val(mask_clr)) != _PAGE_NX; checkalias = (pgprot_val(mask_set) | pgprot_val(mask_clr)) != _PAGE_NX;
...@@ -795,7 +870,7 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages, ...@@ -795,7 +870,7 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages,
/* /*
* Check whether we really changed something: * Check whether we really changed something:
*/ */
if (!cpa.flushtlb) if (!(cpa.flags & CPA_FLUSHTLB))
goto out; goto out;
/* /*
...@@ -810,9 +885,12 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages, ...@@ -810,9 +885,12 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages,
* error case we fall back to cpa_flush_all (which uses * error case we fall back to cpa_flush_all (which uses
* wbindv): * wbindv):
*/ */
if (!ret && cpu_has_clflush) if (!ret && cpu_has_clflush) {
cpa_flush_range(addr, numpages, cache); if (cpa.flags & CPA_ARRAY)
else cpa_flush_array(addr, numpages, cache);
else
cpa_flush_range(*addr, numpages, cache);
} else
cpa_flush_all(cache); cpa_flush_all(cache);
out: out:
...@@ -821,16 +899,18 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages, ...@@ -821,16 +899,18 @@ static int change_page_attr_set_clr(unsigned long addr, int numpages,
return ret; return ret;
} }
static inline int change_page_attr_set(unsigned long addr, int numpages, static inline int change_page_attr_set(unsigned long *addr, int numpages,
pgprot_t mask) pgprot_t mask, int array)
{ {
return change_page_attr_set_clr(addr, numpages, mask, __pgprot(0), 0); return change_page_attr_set_clr(addr, numpages, mask, __pgprot(0), 0,
array);
} }
static inline int change_page_attr_clear(unsigned long addr, int numpages, static inline int change_page_attr_clear(unsigned long *addr, int numpages,
pgprot_t mask) pgprot_t mask, int array)
{ {
return change_page_attr_set_clr(addr, numpages, __pgprot(0), mask, 0); return change_page_attr_set_clr(addr, numpages, __pgprot(0), mask, 0,
array);
} }
int _set_memory_uc(unsigned long addr, int numpages) int _set_memory_uc(unsigned long addr, int numpages)
...@@ -838,8 +918,8 @@ int _set_memory_uc(unsigned long addr, int numpages) ...@@ -838,8 +918,8 @@ int _set_memory_uc(unsigned long addr, int numpages)
/* /*
* for now UC MINUS. see comments in ioremap_nocache() * for now UC MINUS. see comments in ioremap_nocache()
*/ */
return change_page_attr_set(addr, numpages, return change_page_attr_set(&addr, numpages,
__pgprot(_PAGE_CACHE_UC_MINUS)); __pgprot(_PAGE_CACHE_UC_MINUS), 0);
} }
int set_memory_uc(unsigned long addr, int numpages) int set_memory_uc(unsigned long addr, int numpages)
...@@ -855,10 +935,31 @@ int set_memory_uc(unsigned long addr, int numpages) ...@@ -855,10 +935,31 @@ int set_memory_uc(unsigned long addr, int numpages)
} }
EXPORT_SYMBOL(set_memory_uc); EXPORT_SYMBOL(set_memory_uc);
/*
 * Mark every page in an array of kernel virtual addresses as uncached
 * (UC MINUS for now, see comments in ioremap_nocache()).
 *
 * @addr:        array of page virtual addresses
 * @addrinarray: number of entries in @addr
 *
 * A memtype reservation is taken for each page before the page
 * attributes are changed.  On any failure every reservation taken so
 * far is released again, so the call either fully succeeds or leaves no
 * reservation behind.
 *
 * Returns 0 on success or a non-zero error code on failure.
 */
int set_memory_array_uc(unsigned long *addr, int addrinarray)
{
	int i, j;
	int ret;

	/*
	 * reserve_memtype()/free_memtype() track physical address ranges,
	 * so translate each virtual address with __pa() first.
	 */
	for (i = 0; i < addrinarray; i++) {
		ret = reserve_memtype(__pa(addr[i]), __pa(addr[i]) + PAGE_SIZE,
				      _PAGE_CACHE_UC_MINUS, NULL);
		if (ret)
			goto out_free;
	}

	ret = change_page_attr_set(addr, addrinarray,
				   __pgprot(_PAGE_CACHE_UC_MINUS), 1);
	if (ret)
		goto out_free;

	return 0;

out_free:
	/* Entries [0, i) hold a reservation; drop them all. */
	for (j = 0; j < i; j++)
		free_memtype(__pa(addr[j]), __pa(addr[j]) + PAGE_SIZE);

	return ret;
}
EXPORT_SYMBOL(set_memory_array_uc);
int _set_memory_wc(unsigned long addr, int numpages) int _set_memory_wc(unsigned long addr, int numpages)
{ {
return change_page_attr_set(addr, numpages, return change_page_attr_set(&addr, numpages,
__pgprot(_PAGE_CACHE_WC)); __pgprot(_PAGE_CACHE_WC), 0);
} }
int set_memory_wc(unsigned long addr, int numpages) int set_memory_wc(unsigned long addr, int numpages)
...@@ -876,8 +977,8 @@ EXPORT_SYMBOL(set_memory_wc); ...@@ -876,8 +977,8 @@ EXPORT_SYMBOL(set_memory_wc);
int _set_memory_wb(unsigned long addr, int numpages) int _set_memory_wb(unsigned long addr, int numpages)
{ {
return change_page_attr_clear(addr, numpages, return change_page_attr_clear(&addr, numpages,
__pgprot(_PAGE_CACHE_MASK)); __pgprot(_PAGE_CACHE_MASK), 0);
} }
int set_memory_wb(unsigned long addr, int numpages) int set_memory_wb(unsigned long addr, int numpages)
...@@ -888,37 +989,48 @@ int set_memory_wb(unsigned long addr, int numpages) ...@@ -888,37 +989,48 @@ int set_memory_wb(unsigned long addr, int numpages)
} }
EXPORT_SYMBOL(set_memory_wb); EXPORT_SYMBOL(set_memory_wb);
/*
 * Restore write-back caching for every page in an array of kernel
 * virtual addresses and release the matching memtype reservations.
 *
 * @addr:        array of page virtual addresses
 * @addrinarray: number of entries in @addr
 *
 * The page attributes are changed first; the reservations are only
 * released once that succeeded, so a failed call does not leave pages
 * mapped with a cache attribute that no longer has a reservation.
 *
 * Returns 0 on success or the error from change_page_attr_clear().
 */
int set_memory_array_wb(unsigned long *addr, int addrinarray)
{
	int i;
	int ret;

	ret = change_page_attr_clear(addr, addrinarray,
				     __pgprot(_PAGE_CACHE_MASK), 1);
	if (ret)
		return ret;

	/* free_memtype() tracks physical ranges, hence __pa(). */
	for (i = 0; i < addrinarray; i++)
		free_memtype(__pa(addr[i]), __pa(addr[i]) + PAGE_SIZE);

	return 0;
}
EXPORT_SYMBOL(set_memory_array_wb);
int set_memory_x(unsigned long addr, int numpages) int set_memory_x(unsigned long addr, int numpages)
{ {
return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_NX)); return change_page_attr_clear(&addr, numpages, __pgprot(_PAGE_NX), 0);
} }
EXPORT_SYMBOL(set_memory_x); EXPORT_SYMBOL(set_memory_x);
int set_memory_nx(unsigned long addr, int numpages) int set_memory_nx(unsigned long addr, int numpages)
{ {
return change_page_attr_set(addr, numpages, __pgprot(_PAGE_NX)); return change_page_attr_set(&addr, numpages, __pgprot(_PAGE_NX), 0);
} }
EXPORT_SYMBOL(set_memory_nx); EXPORT_SYMBOL(set_memory_nx);
int set_memory_ro(unsigned long addr, int numpages) int set_memory_ro(unsigned long addr, int numpages)
{ {
return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_RW)); return change_page_attr_clear(&addr, numpages, __pgprot(_PAGE_RW), 0);
} }
int set_memory_rw(unsigned long addr, int numpages) int set_memory_rw(unsigned long addr, int numpages)
{ {
return change_page_attr_set(addr, numpages, __pgprot(_PAGE_RW)); return change_page_attr_set(&addr, numpages, __pgprot(_PAGE_RW), 0);
} }
int set_memory_np(unsigned long addr, int numpages) int set_memory_np(unsigned long addr, int numpages)
{ {
return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_PRESENT)); return change_page_attr_clear(&addr, numpages, __pgprot(_PAGE_PRESENT), 0);
} }
int set_memory_4k(unsigned long addr, int numpages) int set_memory_4k(unsigned long addr, int numpages)
{ {
return change_page_attr_set_clr(addr, numpages, __pgprot(0), return change_page_attr_set_clr(&addr, numpages, __pgprot(0),
__pgprot(0), 1); __pgprot(0), 1, 0);
} }
int set_pages_uc(struct page *page, int numpages) int set_pages_uc(struct page *page, int numpages)
...@@ -971,20 +1083,24 @@ int set_pages_rw(struct page *page, int numpages) ...@@ -971,20 +1083,24 @@ int set_pages_rw(struct page *page, int numpages)
static int __set_pages_p(struct page *page, int numpages) static int __set_pages_p(struct page *page, int numpages)
{ {
struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page), unsigned long tempaddr = (unsigned long) page_address(page);
struct cpa_data cpa = { .vaddr = &tempaddr,
.numpages = numpages, .numpages = numpages,
.mask_set = __pgprot(_PAGE_PRESENT | _PAGE_RW), .mask_set = __pgprot(_PAGE_PRESENT | _PAGE_RW),
.mask_clr = __pgprot(0)}; .mask_clr = __pgprot(0),
.flags = 0};
return __change_page_attr_set_clr(&cpa, 1); return __change_page_attr_set_clr(&cpa, 1);
} }
static int __set_pages_np(struct page *page, int numpages) static int __set_pages_np(struct page *page, int numpages)
{ {
struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page), unsigned long tempaddr = (unsigned long) page_address(page);
struct cpa_data cpa = { .vaddr = &tempaddr,
.numpages = numpages, .numpages = numpages,
.mask_set = __pgprot(0), .mask_set = __pgprot(0),
.mask_clr = __pgprot(_PAGE_PRESENT | _PAGE_RW)}; .mask_clr = __pgprot(_PAGE_PRESENT | _PAGE_RW),
.flags = 0};
return __change_page_attr_set_clr(&cpa, 1); return __change_page_attr_set_clr(&cpa, 1);
} }
......
...@@ -66,6 +66,9 @@ int set_memory_rw(unsigned long addr, int numpages); ...@@ -66,6 +66,9 @@ int set_memory_rw(unsigned long addr, int numpages);
int set_memory_np(unsigned long addr, int numpages); int set_memory_np(unsigned long addr, int numpages);
int set_memory_4k(unsigned long addr, int numpages); int set_memory_4k(unsigned long addr, int numpages);
int set_memory_array_uc(unsigned long *addr, int addrinarray);
int set_memory_array_wb(unsigned long *addr, int addrinarray);
/* /*
* For legacy compatibility with the old APIs, a few functions * For legacy compatibility with the old APIs, a few functions
* are provided that work on a "struct page". * are provided that work on a "struct page".
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册