You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
453 lines
12 KiB
453 lines
12 KiB
/*
|
|
* arch/sh/kernel/cpu/sq.c
|
|
*
|
|
* General management API for SH-4 integrated Store Queues
|
|
*
|
|
* Copyright (C) 2001, 2002, 2003, 2004 Paul Mundt
|
|
* Copyright (C) 2001, 2002 M. R. Brown
|
|
*
|
|
* Some of this code has been adopted directly from the old arch/sh/mm/sq.c
|
|
* hack that was part of the LinuxDC project. For all intents and purposes,
|
|
* this is a completely new interface that really doesn't have much in common
|
|
* with the old zone-based approach at all. In fact, it's only listed here for
|
|
* general completeness.
|
|
*
|
|
* This file is subject to the terms and conditions of the GNU General Public
|
|
* License. See the file "COPYING" in the main directory of this archive
|
|
* for more details.
|
|
*/
|
|
#include <linux/init.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/module.h>
|
|
#include <linux/config.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/list.h>
|
|
#include <linux/proc_fs.h>
|
|
#include <linux/miscdevice.h>
|
|
#include <linux/vmalloc.h>
|
|
|
|
#include <asm/io.h>
|
|
#include <asm/page.h>
|
|
#include <asm/mmu_context.h>
|
|
#include <asm/cpu/sq.h>
|
|
|
|
static LIST_HEAD(sq_mapping_list);
|
|
static DEFINE_SPINLOCK(sq_mapping_lock);
|
|
|
|
/**
|
|
* sq_flush - Flush (prefetch) the store queue cache
|
|
* @addr: the store queue address to flush
|
|
*
|
|
* Executes a prefetch instruction on the specified store queue cache,
|
|
* so that the cached data is written to physical memory.
|
|
*/
|
|
inline void sq_flush(void *addr)
|
|
{
|
|
__asm__ __volatile__ ("pref @%0" : : "r" (addr) : "memory");
|
|
}
|
|
|
|
/**
|
|
* sq_flush_range - Flush (prefetch) a specific SQ range
|
|
* @start: the store queue address to start flushing from
|
|
* @len: the length to flush
|
|
*
|
|
* Flushes the store queue cache from @start to @start + @len in a
|
|
* linear fashion.
|
|
*/
|
|
void sq_flush_range(unsigned long start, unsigned int len)
|
|
{
|
|
volatile unsigned long *sq = (unsigned long *)start;
|
|
unsigned long dummy;
|
|
|
|
/* Flush the queues */
|
|
for (len >>= 5; len--; sq += 8)
|
|
sq_flush((void *)sq);
|
|
|
|
/* Wait for completion */
|
|
dummy = ctrl_inl(P4SEG_STORE_QUE);
|
|
|
|
ctrl_outl(0, P4SEG_STORE_QUE + 0);
|
|
ctrl_outl(0, P4SEG_STORE_QUE + 8);
|
|
}
|
|
|
|
static struct sq_mapping *__sq_alloc_mapping(unsigned long virt, unsigned long phys, unsigned long size, const char *name)
|
|
{
|
|
struct sq_mapping *map;
|
|
|
|
if (virt + size > SQ_ADDRMAX)
|
|
return ERR_PTR(-ENOSPC);
|
|
|
|
map = kmalloc(sizeof(struct sq_mapping), GFP_KERNEL);
|
|
if (!map)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
INIT_LIST_HEAD(&map->list);
|
|
|
|
map->sq_addr = virt;
|
|
map->addr = phys;
|
|
map->size = size + 1;
|
|
map->name = name;
|
|
|
|
list_add(&map->list, &sq_mapping_list);
|
|
|
|
return map;
|
|
}
|
|
|
|
static unsigned long __sq_get_next_addr(void)
|
|
{
|
|
if (!list_empty(&sq_mapping_list)) {
|
|
struct list_head *pos, *tmp;
|
|
|
|
/*
|
|
* Read one off the list head, as it will have the highest
|
|
* mapped allocation. Set the next one up right above it.
|
|
*
|
|
* This is somewhat sub-optimal, as we don't look at
|
|
* gaps between allocations or anything lower then the
|
|
* highest-level allocation.
|
|
*
|
|
* However, in the interest of performance and the general
|
|
* lack of desire to do constant list rebalancing, we don't
|
|
* worry about it.
|
|
*/
|
|
list_for_each_safe(pos, tmp, &sq_mapping_list) {
|
|
struct sq_mapping *entry;
|
|
|
|
entry = list_entry(pos, typeof(*entry), list);
|
|
|
|
return entry->sq_addr + entry->size;
|
|
}
|
|
}
|
|
|
|
return P4SEG_STORE_QUE;
|
|
}
|
|
|
|
/**
|
|
* __sq_remap - Perform a translation from the SQ to a phys addr
|
|
* @map: sq mapping containing phys and store queue addresses.
|
|
*
|
|
* Maps the store queue address specified in the mapping to the physical
|
|
* address specified in the mapping.
|
|
*/
|
|
static struct sq_mapping *__sq_remap(struct sq_mapping *map)
|
|
{
|
|
unsigned long flags, pteh, ptel;
|
|
struct vm_struct *vma;
|
|
pgprot_t pgprot;
|
|
|
|
/*
|
|
* Without an MMU (or with it turned off), this is much more
|
|
* straightforward, as we can just load up each queue's QACR with
|
|
* the physical address appropriately masked.
|
|
*/
|
|
|
|
ctrl_outl(((map->addr >> 26) << 2) & 0x1c, SQ_QACR0);
|
|
ctrl_outl(((map->addr >> 26) << 2) & 0x1c, SQ_QACR1);
|
|
|
|
#ifdef CONFIG_MMU
|
|
/*
|
|
* With an MMU on the other hand, things are slightly more involved.
|
|
* Namely, we have to have a direct mapping between the SQ addr and
|
|
* the associated physical address in the UTLB by way of setting up
|
|
* a virt<->phys translation by hand. We do this by simply specifying
|
|
* the SQ addr in UTLB.VPN and the associated physical address in
|
|
* UTLB.PPN.
|
|
*
|
|
* Notably, even though this is a special case translation, and some
|
|
* of the configuration bits are meaningless, we're still required
|
|
* to have a valid ASID context in PTEH.
|
|
*
|
|
* We could also probably get by without explicitly setting PTEA, but
|
|
* we do it here just for good measure.
|
|
*/
|
|
spin_lock_irqsave(&sq_mapping_lock, flags);
|
|
|
|
pteh = map->sq_addr;
|
|
ctrl_outl((pteh & MMU_VPN_MASK) | get_asid(), MMU_PTEH);
|
|
|
|
ptel = map->addr & PAGE_MASK;
|
|
ctrl_outl(((ptel >> 28) & 0xe) | (ptel & 0x1), MMU_PTEA);
|
|
|
|
pgprot = pgprot_noncached(PAGE_KERNEL);
|
|
|
|
ptel &= _PAGE_FLAGS_HARDWARE_MASK;
|
|
ptel |= pgprot_val(pgprot);
|
|
ctrl_outl(ptel, MMU_PTEL);
|
|
|
|
__asm__ __volatile__ ("ldtlb" : : : "memory");
|
|
|
|
spin_unlock_irqrestore(&sq_mapping_lock, flags);
|
|
|
|
/*
|
|
* Next, we need to map ourselves in the kernel page table, so that
|
|
* future accesses after a TLB flush will be handled when we take a
|
|
* page fault.
|
|
*
|
|
* Theoretically we could just do this directly and not worry about
|
|
* setting up the translation by hand ahead of time, but for the
|
|
* cases where we want a one-shot SQ mapping followed by a quick
|
|
* writeout before we hit the TLB flush, we do it anyways. This way
|
|
* we at least save ourselves the initial page fault overhead.
|
|
*/
|
|
vma = __get_vm_area(map->size, VM_ALLOC, map->sq_addr, SQ_ADDRMAX);
|
|
if (!vma)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
vma->phys_addr = map->addr;
|
|
|
|
if (remap_area_pages((unsigned long)vma->addr, vma->phys_addr,
|
|
map->size, pgprot_val(pgprot))) {
|
|
vunmap(vma->addr);
|
|
return NULL;
|
|
}
|
|
#endif /* CONFIG_MMU */
|
|
|
|
return map;
|
|
}
|
|
|
|
/**
|
|
* sq_remap - Map a physical address through the Store Queues
|
|
* @phys: Physical address of mapping.
|
|
* @size: Length of mapping.
|
|
* @name: User invoking mapping.
|
|
*
|
|
* Remaps the physical address @phys through the next available store queue
|
|
* address of @size length. @name is logged at boot time as well as through
|
|
* the procfs interface.
|
|
*
|
|
* A pre-allocated and filled sq_mapping pointer is returned, and must be
|
|
* cleaned up with a call to sq_unmap() when the user is done with the
|
|
* mapping.
|
|
*/
|
|
struct sq_mapping *sq_remap(unsigned long phys, unsigned int size, const char *name)
|
|
{
|
|
struct sq_mapping *map;
|
|
unsigned long virt, end;
|
|
unsigned int psz;
|
|
|
|
/* Don't allow wraparound or zero size */
|
|
end = phys + size - 1;
|
|
if (!size || end < phys)
|
|
return NULL;
|
|
/* Don't allow anyone to remap normal memory.. */
|
|
if (phys < virt_to_phys(high_memory))
|
|
return NULL;
|
|
|
|
phys &= PAGE_MASK;
|
|
|
|
size = PAGE_ALIGN(end + 1) - phys;
|
|
virt = __sq_get_next_addr();
|
|
psz = (size + (PAGE_SIZE - 1)) / PAGE_SIZE;
|
|
map = __sq_alloc_mapping(virt, phys, size, name);
|
|
|
|
printk("sqremap: %15s [%4d page%s] va 0x%08lx pa 0x%08lx\n",
|
|
map->name ? map->name : "???",
|
|
psz, psz == 1 ? " " : "s",
|
|
map->sq_addr, map->addr);
|
|
|
|
return __sq_remap(map);
|
|
}
|
|
|
|
/**
|
|
* sq_unmap - Unmap a Store Queue allocation
|
|
* @map: Pre-allocated Store Queue mapping.
|
|
*
|
|
* Unmaps the store queue allocation @map that was previously created by
|
|
* sq_remap(). Also frees up the pte that was previously inserted into
|
|
* the kernel page table and discards the UTLB translation.
|
|
*/
|
|
void sq_unmap(struct sq_mapping *map)
|
|
{
|
|
if (map->sq_addr > (unsigned long)high_memory)
|
|
vfree((void *)(map->sq_addr & PAGE_MASK));
|
|
|
|
list_del(&map->list);
|
|
kfree(map);
|
|
}
|
|
|
|
/**
|
|
* sq_clear - Clear a store queue range
|
|
* @addr: Address to start clearing from.
|
|
* @len: Length to clear.
|
|
*
|
|
* A quick zero-fill implementation for clearing out memory that has been
|
|
* remapped through the store queues.
|
|
*/
|
|
void sq_clear(unsigned long addr, unsigned int len)
|
|
{
|
|
int i;
|
|
|
|
/* Clear out both queues linearly */
|
|
for (i = 0; i < 8; i++) {
|
|
ctrl_outl(0, addr + i + 0);
|
|
ctrl_outl(0, addr + i + 8);
|
|
}
|
|
|
|
sq_flush_range(addr, len);
|
|
}
|
|
|
|
/**
|
|
* sq_vma_unmap - Unmap a VMA range
|
|
* @area: VMA containing range.
|
|
* @addr: Start of range.
|
|
* @len: Length of range.
|
|
*
|
|
* Searches the sq_mapping_list for a mapping matching the sq addr @addr,
|
|
* and subsequently frees up the entry. Further cleanup is done by generic
|
|
* code.
|
|
*/
|
|
static void sq_vma_unmap(struct vm_area_struct *area,
|
|
unsigned long addr, size_t len)
|
|
{
|
|
struct list_head *pos, *tmp;
|
|
|
|
list_for_each_safe(pos, tmp, &sq_mapping_list) {
|
|
struct sq_mapping *entry;
|
|
|
|
entry = list_entry(pos, typeof(*entry), list);
|
|
|
|
if (entry->sq_addr == addr) {
|
|
/*
|
|
* We could probably get away without doing the tlb flush
|
|
* here, as generic code should take care of most of this
|
|
* when unmapping the rest of the VMA range for us. Leave
|
|
* it in for added sanity for the time being..
|
|
*/
|
|
__flush_tlb_page(get_asid(), entry->sq_addr & PAGE_MASK);
|
|
|
|
list_del(&entry->list);
|
|
kfree(entry);
|
|
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* sq_vma_sync - Sync a VMA range
|
|
* @area: VMA containing range.
|
|
* @start: Start of range.
|
|
* @len: Length of range.
|
|
* @flags: Additional flags.
|
|
*
|
|
* Synchronizes an sq mapped range by flushing the store queue cache for
|
|
* the duration of the mapping.
|
|
*
|
|
* Used internally for user mappings, which must use msync() to prefetch
|
|
* the store queue cache.
|
|
*/
|
|
static int sq_vma_sync(struct vm_area_struct *area,
|
|
unsigned long start, size_t len, unsigned int flags)
|
|
{
|
|
sq_flush_range(start, len);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static struct vm_operations_struct sq_vma_ops = {
|
|
.unmap = sq_vma_unmap,
|
|
.sync = sq_vma_sync,
|
|
};
|
|
|
|
/**
|
|
* sq_mmap - mmap() for /dev/cpu/sq
|
|
* @file: unused.
|
|
* @vma: VMA to remap.
|
|
*
|
|
* Remap the specified vma @vma through the store queues, and setup associated
|
|
* information for the new mapping. Also build up the page tables for the new
|
|
* area.
|
|
*/
|
|
static int sq_mmap(struct file *file, struct vm_area_struct *vma)
|
|
{
|
|
unsigned long offset = vma->vm_pgoff << PAGE_SHIFT;
|
|
unsigned long size = vma->vm_end - vma->vm_start;
|
|
struct sq_mapping *map;
|
|
|
|
/*
|
|
* We're not interested in any arbitrary virtual address that has
|
|
* been stuck in the VMA, as we already know what addresses we
|
|
* want. Save off the size, and reposition the VMA to begin at
|
|
* the next available sq address.
|
|
*/
|
|
vma->vm_start = __sq_get_next_addr();
|
|
vma->vm_end = vma->vm_start + size;
|
|
|
|
vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot);
|
|
|
|
vma->vm_flags |= VM_IO | VM_RESERVED;
|
|
|
|
map = __sq_alloc_mapping(vma->vm_start, offset, size, "Userspace");
|
|
|
|
if (io_remap_pfn_range(vma, map->sq_addr, map->addr >> PAGE_SHIFT,
|
|
size, vma->vm_page_prot))
|
|
return -EAGAIN;
|
|
|
|
vma->vm_ops = &sq_vma_ops;
|
|
|
|
return 0;
|
|
}
|
|
|
|
#ifdef CONFIG_PROC_FS
|
|
static int sq_mapping_read_proc(char *buf, char **start, off_t off,
|
|
int len, int *eof, void *data)
|
|
{
|
|
struct list_head *pos;
|
|
char *p = buf;
|
|
|
|
list_for_each_prev(pos, &sq_mapping_list) {
|
|
struct sq_mapping *entry;
|
|
|
|
entry = list_entry(pos, typeof(*entry), list);
|
|
|
|
p += sprintf(p, "%08lx-%08lx [%08lx]: %s\n", entry->sq_addr,
|
|
entry->sq_addr + entry->size - 1, entry->addr,
|
|
entry->name);
|
|
}
|
|
|
|
return p - buf;
|
|
}
|
|
#endif
|
|
|
|
static struct file_operations sq_fops = {
|
|
.owner = THIS_MODULE,
|
|
.mmap = sq_mmap,
|
|
};
|
|
|
|
static struct miscdevice sq_dev = {
|
|
.minor = STORE_QUEUE_MINOR,
|
|
.name = "sq",
|
|
.devfs_name = "cpu/sq",
|
|
.fops = &sq_fops,
|
|
};
|
|
|
|
static int __init sq_api_init(void)
|
|
{
|
|
printk(KERN_NOTICE "sq: Registering store queue API.\n");
|
|
|
|
#ifdef CONFIG_PROC_FS
|
|
create_proc_read_entry("sq_mapping", 0, 0, sq_mapping_read_proc, 0);
|
|
#endif
|
|
|
|
return misc_register(&sq_dev);
|
|
}
|
|
|
|
static void __exit sq_api_exit(void)
|
|
{
|
|
misc_deregister(&sq_dev);
|
|
}
|
|
|
|
module_init(sq_api_init);
|
|
module_exit(sq_api_exit);
|
|
|
|
MODULE_AUTHOR("Paul Mundt <lethal@linux-sh.org>, M. R. Brown <mrbrown@0xd6.org>");
|
|
MODULE_DESCRIPTION("Simple API for SH-4 integrated Store Queues");
|
|
MODULE_LICENSE("GPL");
|
|
MODULE_ALIAS_MISCDEV(STORE_QUEUE_MINOR);
|
|
|
|
EXPORT_SYMBOL(sq_remap);
|
|
EXPORT_SYMBOL(sq_unmap);
|
|
EXPORT_SYMBOL(sq_clear);
|
|
EXPORT_SYMBOL(sq_flush);
|
|
EXPORT_SYMBOL(sq_flush_range);
|
|
|
|
|