aboutsummaryrefslogtreecommitdiffstats
path: root/linux-2.6-xen-sparse/arch/xen/x86_64/mm/ioremap.c
blob: c3d6ee395930097c55b74599a447466ac3a07936 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
/*
 * arch/x86_64/mm/ioremap.c
 *
 * Re-map IO memory to kernel address space so that we can access it.
 * This is needed for high PCI addresses that aren't mapped in the
 * 640k-1MB IO memory area on PC's
 *
 * (C) Copyright 1995 1996 Linus Torvalds
 */

#include <linux/vmalloc.h>
#include <linux/init.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <asm/io.h>
#include <asm/fixmap.h>
#include <asm/cacheflush.h>
#include <asm/tlbflush.h>
#include <asm/pgtable.h>
#include <asm/pgalloc.h>

/*
 * Reuse arch/xen/i396/mm/ioremap.c. Need to merge later
 */
#ifndef CONFIG_XEN_PHYSDEV_ACCESS

void * __ioremap(unsigned long phys_addr, unsigned long size,
		 unsigned long flags)
{
	return NULL;
}

void *ioremap_nocache (unsigned long phys_addr, unsigned long size)
{
	return NULL;
}

void iounmap(volatile void __iomem *addr)
{
}

void __init *bt_ioremap(unsigned long phys_addr, unsigned long size)
{
	return NULL;
}

void __init bt_iounmap(void *addr, unsigned long size)
{
}

#else

#if defined(__i386__)
/*
 * Does @address reside within a non-highmem page that is local to this virtual
 * machine (i.e., not an I/O page, nor a memory page belonging to another VM).
 * See the comment that accompanies pte_pfn() in pgtable-2level.h to understand
 * why this works.
 */
static inline int is_local_lowmem(unsigned long address)
{
	extern unsigned long max_low_pfn;
	unsigned long mfn = address >> PAGE_SHIFT;
	unsigned long pfn = mfn_to_pfn(mfn);
	return ((pfn < max_low_pfn) && (pfn_to_mfn(pfn) == mfn));
}
#elif defined(__x86_64__)
/*
 * 
 */
static inline int is_local_lowmem(unsigned long address)
{
        return 0;
}
#endif

/*
 * Generic mapping function (not visible outside):
 */

/*
 * Remap an arbitrary physical address space into the kernel virtual
 * address space. Needed when the kernel wants to access high addresses
 * directly.
 *
 * NOTE! We need to allow non-page-aligned mappings too: we will obviously
 * have to convert them into an offset in a page-aligned mapping, but the
 * caller shouldn't need to know that small detail.
 */
void __iomem * __ioremap(unsigned long phys_addr, unsigned long size, unsigned long flags)
{
	void __iomem * addr;
	struct vm_struct * area;
	unsigned long offset, last_addr;
	domid_t domid = DOMID_IO;

	/* Don't allow wraparound or zero size */
	last_addr = phys_addr + size - 1;
	if (!size || last_addr < phys_addr)
		return NULL;

#ifdef CONFIG_XEN_PRIVILEGED_GUEST
	/*
	 * Don't remap the low PCI/ISA area, it's always mapped..
	 */
	if (phys_addr >= 0x0 && last_addr < 0x100000)
		return isa_bus_to_virt(phys_addr);
#endif

	/*
	 * Don't allow anybody to remap normal RAM that we're using..
	 */
	if (is_local_lowmem(phys_addr)) {
		char *t_addr, *t_end;
 		struct page *page;

		t_addr = bus_to_virt(phys_addr);
		t_end = t_addr + (size - 1);
	   
		for(page = virt_to_page(t_addr); page <= virt_to_page(t_end); page++)
			if(!PageReserved(page))
				return NULL;

		domid = DOMID_LOCAL;
	}

	/*
	 * Mappings have to be page-aligned
	 */
	offset = phys_addr & ~PAGE_MASK;
	phys_addr &= PAGE_MASK;
	size = PAGE_ALIGN(last_addr+1) - phys_addr;

	/*
	 * Ok, go for it..
	 */
	area = get_vm_area(size, VM_IOREMAP | (flags << 20));
	if (!area)
		return NULL;
	area->phys_addr = phys_addr;
	addr = (void __iomem *) area->addr;
	if (direct_remap_area_pages(&init_mm, (unsigned long) addr, phys_addr,
				    size, __pgprot(_PAGE_PRESENT | _PAGE_RW |
						   _PAGE_DIRTY | _PAGE_ACCESSED
#if defined(__x86_64__)
                                                   | _PAGE_USER
#endif
						   | flags), domid)) {
		vunmap((void __force *) addr);
		return NULL;
	}
	return (void __iomem *) (offset + (char __iomem *)addr);
}


/**
 * ioremap_nocache     -   map bus memory into CPU space
 * @offset:    bus address of the memory
 * @size:      size of the resource to map
 *
 * ioremap_nocache performs a platform specific sequence of operations to
 * make bus memory CPU accessible via the readb/readw/readl/writeb/
 * writew/writel functions and the other mmio helpers. The returned
 * address is not guaranteed to be usable directly as a virtual
 * address. 
 *
 * This version of ioremap ensures that the memory is marked uncachable
 * on the CPU as well as honouring existing caching rules from things like
 * the PCI bus. Note that there are other caches and buffers on many 
 * busses. In particular driver authors should read up on PCI writes
 *
 * It's useful if some control registers are in such an area and
 * write combining or read caching is not desirable:
 * 
 * Must be freed with iounmap.
 */

void __iomem *ioremap_nocache (unsigned long phys_addr, unsigned long size)
{
	unsigned long last_addr;
	void __iomem *p = __ioremap(phys_addr, size, _PAGE_PCD);
	if (!p) 
		return p; 

	/* Guaranteed to be > phys_addr, as per __ioremap() */
	last_addr = phys_addr + size - 1;

	if (is_local_lowmem(last_addr)) { 
		struct page *ppage = virt_to_page(bus_to_virt(phys_addr));
		unsigned long npages;

		phys_addr &= PAGE_MASK;

		/* This might overflow and become zero.. */
		last_addr = PAGE_ALIGN(last_addr);

		/* .. but that's ok, because modulo-2**n arithmetic will make
	 	* the page-aligned "last - first" come out right.
	 	*/
		npages = (last_addr - phys_addr) >> PAGE_SHIFT;

		if (change_page_attr(ppage, npages, PAGE_KERNEL_NOCACHE) < 0) { 
			iounmap(p); 
			p = NULL;
		}
		global_flush_tlb();
	}

	return p;					
}

void iounmap(volatile void __iomem *addr)
{
	struct vm_struct *p;
	if ((void __force *) addr <= high_memory) 
		return; 
#ifdef CONFIG_XEN_PRIVILEGED_GUEST
	if ((unsigned long) addr >= fix_to_virt(FIX_ISAMAP_BEGIN))
		return;
#endif
	p = remove_vm_area((void *) (PAGE_MASK & (unsigned long __force) addr));
	if (!p) { 
		printk("__iounmap: bad address %p\n", addr);
		return;
	}

	if ((p->flags >> 20) && is_local_lowmem(p->phys_addr)) {
		/* p->size includes the guard page, but cpa doesn't like that */
		change_page_attr(virt_to_page(bus_to_virt(p->phys_addr)),
				 (p->size - PAGE_SIZE) >> PAGE_SHIFT,
				 PAGE_KERNEL); 				 
		global_flush_tlb();
	} 
	kfree(p); 
}

#if defined(__i386__)
void __init *bt_ioremap(unsigned long phys_addr, unsigned long size)
{
	unsigned long offset, last_addr;
	unsigned int nrpages;
	enum fixed_addresses idx;

	/* Don't allow wraparound or zero size */
	last_addr = phys_addr + size - 1;
	if (!size || last_addr < phys_addr)
		return NULL;

#ifdef CONFIG_XEN_PRIVILEGED_GUEST
	/*
	 * Don't remap the low PCI/ISA area, it's always mapped..
	 */
	if (phys_addr >= 0x0 && last_addr < 0x100000)
		return isa_bus_to_virt(phys_addr);
#endif

	/*
	 * Mappings have to be page-aligned
	 */
	offset = phys_addr & ~PAGE_MASK;
	phys_addr &= PAGE_MASK;
	size = PAGE_ALIGN(last_addr) - phys_addr;

	/*
	 * Mappings have to fit in the FIX_BTMAP area.
	 */
	nrpages = size >> PAGE_SHIFT;
	if (nrpages > NR_FIX_BTMAPS)
		return NULL;

	/*
	 * Ok, go for it..
	 */
	idx = FIX_BTMAP_BEGIN;
	while (nrpages > 0) {
		set_fixmap(idx, phys_addr);
		phys_addr += PAGE_SIZE;
		--idx;
		--nrpages;
	}
	return (void*) (offset + fix_to_virt(FIX_BTMAP_BEGIN));
}

void __init bt_iounmap(void *addr, unsigned long size)
{
	unsigned long virt_addr;
	unsigned long offset;
	unsigned int nrpages;
	enum fixed_addresses idx;

	virt_addr = (unsigned long)addr;
	if (virt_addr < fix_to_virt(FIX_BTMAP_BEGIN))
		return;
#ifdef CONFIG_XEN_PRIVILEGED_GUEST
	if (virt_addr >= fix_to_virt(FIX_ISAMAP_BEGIN))
		return;
#endif
	offset = virt_addr & ~PAGE_MASK;
	nrpages = PAGE_ALIGN(offset + size - 1) >> PAGE_SHIFT;

	idx = FIX_BTMAP_BEGIN;
	while (nrpages > 0) {
		clear_fixmap(idx);
		--idx;
		--nrpages;
	}
}
#endif /* defined(__i386__) */

#endif /* CONFIG_XEN_PHYSDEV_ACCESS */

/* These hacky macros avoid phys->machine translations. */
#define __direct_pte(x) ((pte_t) { (x) } )
#define __direct_mk_pte(page_nr,pgprot) \
  __direct_pte(((page_nr) << PAGE_SHIFT) | pgprot_val(pgprot))
#define direct_mk_pte_phys(physpage, pgprot) \
  __direct_mk_pte((physpage) >> PAGE_SHIFT, pgprot)

static inline void direct_remap_area_pte(pte_t *pte, 
					 unsigned long address, 
					 unsigned long size,
					 mmu_update_t **v)
{
	unsigned long end;

	address &= ~PMD_MASK;
	end = address + size;
	if (end > PMD_SIZE)
		end = PMD_SIZE;
	if (address >= end)
		BUG();

	do {
		(*v)->ptr = virt_to_machine(pte);
		(*v)++;
		address += PAGE_SIZE;
		pte++;
	} while (address && (address < end));
}

static inline int direct_remap_area_pmd(struct mm_struct *mm,
					pmd_t *pmd, 
					unsigned long address, 
					unsigned long size,
					mmu_update_t **v)
{
	unsigned long end;

	address &= ~PGDIR_MASK;
	end = address + size;
	if (end > PGDIR_SIZE)
		end = PGDIR_SIZE;
	if (address >= end)
		BUG();
	do {
		pte_t *pte = (mm == &init_mm) ? 
			pte_alloc_kernel(mm, pmd, address) :
			pte_alloc_map(mm, pmd, address);
		if (!pte)
			return -ENOMEM;
		direct_remap_area_pte(pte, address, end - address, v);
		pte_unmap(pte);
		address = (address + PMD_SIZE) & PMD_MASK;
		pmd++;
	} while (address && (address < end));
	return 0;
}
 
int __direct_remap_area_pages(struct mm_struct *mm,
			      unsigned long address, 
			      unsigned long size, 
			      mmu_update_t *v)
{
	pgd_t * dir;
	unsigned long end = address + size;
	int error;

#if defined(__i386__)
	dir = pgd_offset(mm, address);
#elif defined (__x86_64)
        dir = (mm == &init_mm) ?
		pgd_offset_k(address):
		pgd_offset(mm, address);
#endif
	if (address >= end)
		BUG();
	spin_lock(&mm->page_table_lock);
	do {
		pud_t *pud;
		pmd_t *pmd;

		error = -ENOMEM;
		pud = pud_alloc(mm, dir, address);
		if (!pud)
			break;
		pmd = pmd_alloc(mm, pud, address);
		if (!pmd)
			break;
		error = 0;
		direct_remap_area_pmd(mm, pmd, address, end - address, &v);
		address = (address + PGDIR_SIZE) & PGDIR_MASK;
		dir++;

	} while (address && (address < end));
	spin_unlock(&mm->page_table_lock);
	return error;
}


int direct_remap_area_pages(struct mm_struct *mm,
			    unsigned long address, 
			    unsigned long machine_addr,
			    unsigned long size, 
			    pgprot_t prot,
			    domid_t  domid)
{
	int i;
	unsigned long start_address;
#define MAX_DIRECTMAP_MMU_QUEUE 130
	mmu_update_t u[MAX_DIRECTMAP_MMU_QUEUE], *v = u;

	start_address = address;

	flush_cache_all();

	for (i = 0; i < size; i += PAGE_SIZE) {
		if ((v - u) == MAX_DIRECTMAP_MMU_QUEUE) {
			/* Fill in the PTE pointers. */
			__direct_remap_area_pages(mm,
						  start_address, 
						  address-start_address, 
						  u);
 
			if (HYPERVISOR_mmu_update(u, v - u, NULL, domid) < 0)
				return -EFAULT;
			v = u;
			start_address = address;
		}

		/*
		 * Fill in the machine address: PTE ptr is done later by
		 * __direct_remap_area_pages(). 
		 */
		v->val = (machine_addr & PAGE_MASK) | pgprot_val(prot);

		machine_addr += PAGE_SIZE;
		address += PAGE_SIZE; 
		v++;
	}

	if (v != u) {
		/* get the ptep's filled in */
		__direct_remap_area_pages(mm,
					  start_address, 
					  address-start_address, 
					  u);
		if (unlikely(HYPERVISOR_mmu_update(u, v - u, NULL, domid) < 0))
			return -EFAULT;
	}

	flush_tlb_all();

	return 0;
}

EXPORT_SYMBOL(direct_remap_area_pages);

int create_lookup_pte_addr(struct mm_struct *mm, 
                           unsigned long address,
                           unsigned long *ptep)
{
    int f(pte_t *pte, struct page *pte_page, unsigned long addr, void *data) 
    {
        unsigned long *ptep = (unsigned long *)data;
        if (ptep) *ptep = (pfn_to_mfn(page_to_pfn(pte_page)) << PAGE_SHIFT)
                       | ((unsigned long)pte & ~PAGE_MASK);
        return 0;
    }

    return generic_page_range(mm, address, PAGE_SIZE, f, ptep);
}

EXPORT_SYMBOL(create_lookup_pte_addr);

int touch_pte_range(struct mm_struct *mm,
                    unsigned long address,
                    unsigned long size)
{
    int f(pte_t *pte, struct page *pte_page, unsigned long addr, void *data) 
    {
        return 0;
    }

    return generic_page_range(mm, address, size, f, NULL);
}                 

EXPORT_SYMBOL(touch_pte_range);