2008-09-16 04:44:55 +08:00
|
|
|
/*
|
|
|
|
* arch/arm/mm/highmem.c -- ARM highmem support
|
|
|
|
*
|
|
|
|
* Author: Nicolas Pitre
|
|
|
|
* Created: september 8, 2008
|
|
|
|
* Copyright: Marvell Semiconductors Inc.
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
|
|
* published by the Free Software Foundation.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/highmem.h>
|
|
|
|
#include <linux/interrupt.h>
|
|
|
|
#include <asm/fixmap.h>
|
|
|
|
#include <asm/cacheflush.h>
|
|
|
|
#include <asm/tlbflush.h>
|
|
|
|
#include "mm.h"
|
|
|
|
|
2014-04-18 16:43:32 +08:00
|
|
|
static inline void set_fixmap_pte(int idx, pte_t pte)
|
|
|
|
{
|
|
|
|
unsigned long vaddr = __fix_to_virt(idx);
|
2014-07-02 15:01:15 +08:00
|
|
|
pte_t *ptep = pte_offset_kernel(pmd_off_k(vaddr), vaddr);
|
|
|
|
|
|
|
|
set_pte_ext(ptep, pte, 0);
|
2014-04-18 16:43:32 +08:00
|
|
|
local_flush_tlb_kernel_page(vaddr);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline pte_t get_fixmap_pte(unsigned long vaddr)
|
|
|
|
{
|
2014-07-02 15:01:15 +08:00
|
|
|
pte_t *ptep = pte_offset_kernel(pmd_off_k(vaddr), vaddr);
|
|
|
|
|
|
|
|
return *ptep;
|
2014-04-18 16:43:32 +08:00
|
|
|
}
|
|
|
|
|
2008-09-16 04:44:55 +08:00
|
|
|
void *kmap(struct page *page)
|
|
|
|
{
|
|
|
|
might_sleep();
|
|
|
|
if (!PageHighMem(page))
|
|
|
|
return page_address(page);
|
|
|
|
return kmap_high(page);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kmap);
|
|
|
|
|
|
|
|
void kunmap(struct page *page)
|
|
|
|
{
|
|
|
|
BUG_ON(in_interrupt());
|
|
|
|
if (!PageHighMem(page))
|
|
|
|
return;
|
|
|
|
kunmap_high(page);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kunmap);
|
|
|
|
|
2011-11-26 10:53:39 +08:00
|
|
|
void *kmap_atomic(struct page *page)
|
2008-09-16 04:44:55 +08:00
|
|
|
{
|
|
|
|
unsigned int idx;
|
|
|
|
unsigned long vaddr;
|
2009-09-04 04:45:59 +08:00
|
|
|
void *kmap;
|
2010-10-27 05:21:51 +08:00
|
|
|
int type;
|
2008-09-16 04:44:55 +08:00
|
|
|
|
2015-05-11 23:52:09 +08:00
|
|
|
preempt_disable();
|
2008-09-16 04:44:55 +08:00
|
|
|
pagefault_disable();
|
|
|
|
if (!PageHighMem(page))
|
|
|
|
return page_address(page);
|
|
|
|
|
2010-06-08 04:28:55 +08:00
|
|
|
#ifdef CONFIG_DEBUG_HIGHMEM
|
|
|
|
/*
|
|
|
|
* There is no cache coherency issue when non VIVT, so force the
|
|
|
|
* dedicated kmap usage for better debugging purposes in that case.
|
|
|
|
*/
|
|
|
|
if (!cache_is_vivt())
|
|
|
|
kmap = NULL;
|
|
|
|
else
|
|
|
|
#endif
|
|
|
|
kmap = kmap_high_get(page);
|
2009-09-04 04:45:59 +08:00
|
|
|
if (kmap)
|
|
|
|
return kmap;
|
|
|
|
|
2010-10-27 05:21:51 +08:00
|
|
|
type = kmap_atomic_idx_push();
|
|
|
|
|
2015-08-13 07:01:52 +08:00
|
|
|
idx = FIX_KMAP_BEGIN + type + KM_TYPE_NR * smp_processor_id();
|
2014-04-18 16:27:01 +08:00
|
|
|
vaddr = __fix_to_virt(idx);
|
2008-09-16 04:44:55 +08:00
|
|
|
#ifdef CONFIG_DEBUG_HIGHMEM
|
|
|
|
/*
|
|
|
|
* With debugging enabled, kunmap_atomic forces that entry to 0.
|
|
|
|
* Make sure it was indeed properly unmapped.
|
|
|
|
*/
|
2014-07-02 15:01:15 +08:00
|
|
|
BUG_ON(!pte_none(get_fixmap_pte(vaddr)));
|
2008-09-16 04:44:55 +08:00
|
|
|
#endif
|
|
|
|
/*
|
|
|
|
* When debugging is off, kunmap_atomic leaves the previous mapping
|
2011-07-02 22:20:44 +08:00
|
|
|
* in place, so the contained TLB flush ensures the TLB is updated
|
|
|
|
* with the new mapping.
|
2008-09-16 04:44:55 +08:00
|
|
|
*/
|
2014-04-18 16:43:32 +08:00
|
|
|
set_fixmap_pte(idx, mk_pte(page, kmap_prot));
|
2008-09-16 04:44:55 +08:00
|
|
|
|
|
|
|
return (void *)vaddr;
|
|
|
|
}
|
2011-11-26 10:53:39 +08:00
|
|
|
EXPORT_SYMBOL(kmap_atomic);
|
2008-09-16 04:44:55 +08:00
|
|
|
|
2010-10-27 05:21:51 +08:00
|
|
|
void __kunmap_atomic(void *kvaddr)
|
2008-09-16 04:44:55 +08:00
|
|
|
{
|
|
|
|
unsigned long vaddr = (unsigned long) kvaddr & PAGE_MASK;
|
2010-10-27 05:21:51 +08:00
|
|
|
int idx, type;
|
2008-09-16 04:44:55 +08:00
|
|
|
|
|
|
|
if (kvaddr >= (void *)FIXADDR_START) {
|
2010-10-28 06:32:58 +08:00
|
|
|
type = kmap_atomic_idx();
|
2015-08-13 07:01:52 +08:00
|
|
|
idx = FIX_KMAP_BEGIN + type + KM_TYPE_NR * smp_processor_id();
|
2010-10-27 05:21:51 +08:00
|
|
|
|
2010-03-30 04:46:02 +08:00
|
|
|
if (cache_is_vivt())
|
|
|
|
__cpuc_flush_dcache_area((void *)vaddr, PAGE_SIZE);
|
2008-09-16 04:44:55 +08:00
|
|
|
#ifdef CONFIG_DEBUG_HIGHMEM
|
2014-04-18 16:27:01 +08:00
|
|
|
BUG_ON(vaddr != __fix_to_virt(idx));
|
2014-04-18 16:43:32 +08:00
|
|
|
set_fixmap_pte(idx, __pte(0));
|
2008-09-16 04:44:55 +08:00
|
|
|
#else
|
|
|
|
(void) idx; /* to kill a warning */
|
|
|
|
#endif
|
2010-10-28 06:32:58 +08:00
|
|
|
kmap_atomic_idx_pop();
|
2009-09-04 04:45:59 +08:00
|
|
|
} else if (vaddr >= PKMAP_ADDR(0) && vaddr < PKMAP_ADDR(LAST_PKMAP)) {
|
|
|
|
/* this address was obtained through kmap_high_get() */
|
|
|
|
kunmap_high(pte_page(pkmap_page_table[PKMAP_NR(vaddr)]));
|
2008-09-16 04:44:55 +08:00
|
|
|
}
|
|
|
|
pagefault_enable();
|
2015-05-11 23:52:09 +08:00
|
|
|
preempt_enable();
|
2008-09-16 04:44:55 +08:00
|
|
|
}
|
2010-10-27 05:21:51 +08:00
|
|
|
EXPORT_SYMBOL(__kunmap_atomic);
|
2008-09-16 04:44:55 +08:00
|
|
|
|
2010-10-27 05:21:51 +08:00
|
|
|
void *kmap_atomic_pfn(unsigned long pfn)
|
2008-09-16 04:44:55 +08:00
|
|
|
{
|
|
|
|
unsigned long vaddr;
|
2010-10-27 05:21:51 +08:00
|
|
|
int idx, type;
|
ARM: 8180/1: mm: implement no-highmem fast path in kmap_atomic_pfn()
Since CONFIG_HIGHMEM got enabled on ARMv5 Kirkwood, we have noticed a
very significant drop in networking performance. The test were
conducted on an OpenBlocks A7 board. Without this patch, the outgoing
performance measured with iperf are:
- highmem OFF, TSO OFF 544 Mbit/s
- highmem OFF, TSO ON 942 Mbit/s
- highmem ON, TSO OFF 306 Mbit/s
- highmem ON, TSO ON 246 Mbit/s
On this Kirkwood platform, the L2 cache is a Feroceon cache, and with
this cache, all the range operations have to be done on virtual
addresses and not physical addresses. Therefore, whenever
CONFIG_HIGHMEM is enabled, the cache maintenance operations call
kmap_atomic_pfn() and kunmap_atomic().
However, kmap_atomic_pfn() does not implement the same fast path for
non-highmem pages as the one implemented in kmap_atomic(), and this is
one of the reason for the performance drop. While this patch does not
fully restore the performances, it clearly improves them a lot:
without patch with patch
- highmem ON, TSO OFF 306 Mbit/s 387 Mbit/s
- highmem ON, TSO ON 246 Mbit/s 434 Mbit/s
We're still far from the !CONFIG_HIGHMEM performances, but it does
improve a bit the situation.
Thanks a lot to Ezequiel Garcia and Gregory Clement for all the
testing work around this topic.
Signed-off-by: Thomas Petazzoni <thomas.petazzoni@free-electrons.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2014-10-21 02:42:18 +08:00
|
|
|
struct page *page = pfn_to_page(pfn);
|
2008-09-16 04:44:55 +08:00
|
|
|
|
2015-05-11 23:52:09 +08:00
|
|
|
preempt_disable();
|
2008-09-16 04:44:55 +08:00
|
|
|
pagefault_disable();
|
ARM: 8180/1: mm: implement no-highmem fast path in kmap_atomic_pfn()
Since CONFIG_HIGHMEM got enabled on ARMv5 Kirkwood, we have noticed a
very significant drop in networking performance. The test were
conducted on an OpenBlocks A7 board. Without this patch, the outgoing
performance measured with iperf are:
- highmem OFF, TSO OFF 544 Mbit/s
- highmem OFF, TSO ON 942 Mbit/s
- highmem ON, TSO OFF 306 Mbit/s
- highmem ON, TSO ON 246 Mbit/s
On this Kirkwood platform, the L2 cache is a Feroceon cache, and with
this cache, all the range operations have to be done on virtual
addresses and not physical addresses. Therefore, whenever
CONFIG_HIGHMEM is enabled, the cache maintenance operations call
kmap_atomic_pfn() and kunmap_atomic().
However, kmap_atomic_pfn() does not implement the same fast path for
non-highmem pages as the one implemented in kmap_atomic(), and this is
one of the reason for the performance drop. While this patch does not
fully restore the performances, it clearly improves them a lot:
without patch with patch
- highmem ON, TSO OFF 306 Mbit/s 387 Mbit/s
- highmem ON, TSO ON 246 Mbit/s 434 Mbit/s
We're still far from the !CONFIG_HIGHMEM performances, but it does
improve a bit the situation.
Thanks a lot to Ezequiel Garcia and Gregory Clement for all the
testing work around this topic.
Signed-off-by: Thomas Petazzoni <thomas.petazzoni@free-electrons.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2014-10-21 02:42:18 +08:00
|
|
|
if (!PageHighMem(page))
|
|
|
|
return page_address(page);
|
2008-09-16 04:44:55 +08:00
|
|
|
|
2010-10-27 05:21:51 +08:00
|
|
|
type = kmap_atomic_idx_push();
|
2015-08-13 07:01:52 +08:00
|
|
|
idx = FIX_KMAP_BEGIN + type + KM_TYPE_NR * smp_processor_id();
|
2014-04-18 16:27:01 +08:00
|
|
|
vaddr = __fix_to_virt(idx);
|
2008-09-16 04:44:55 +08:00
|
|
|
#ifdef CONFIG_DEBUG_HIGHMEM
|
2014-07-02 15:01:15 +08:00
|
|
|
BUG_ON(!pte_none(get_fixmap_pte(vaddr)));
|
2008-09-16 04:44:55 +08:00
|
|
|
#endif
|
2014-04-18 16:43:32 +08:00
|
|
|
set_fixmap_pte(idx, pfn_pte(pfn, kmap_prot));
|
2008-09-16 04:44:55 +08:00
|
|
|
|
|
|
|
return (void *)vaddr;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct page *kmap_atomic_to_page(const void *ptr)
|
|
|
|
{
|
|
|
|
unsigned long vaddr = (unsigned long)ptr;
|
|
|
|
|
|
|
|
if (vaddr < FIXADDR_START)
|
|
|
|
return virt_to_page(ptr);
|
|
|
|
|
2014-04-18 16:43:32 +08:00
|
|
|
return pte_page(get_fixmap_pte(vaddr));
|
2008-09-16 04:44:55 +08:00
|
|
|
}
|