1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 * PS3 address space management.
4 *
5 * Copyright (C) 2006 Sony Computer Entertainment Inc.
6 * Copyright 2006 Sony Corp.
7 */
8
9 #include <linux/kernel.h>
10 #include <linux/export.h>
11 #include <linux/memblock.h>
12 #include <linux/slab.h>
13
14 #include <asm/cell-regs.h>
15 #include <asm/firmware.h>
16 #include <asm/prom.h>
17 #include <asm/udbg.h>
18 #include <asm/lv1call.h>
19 #include <asm/setup.h>
20
21 #include "platform.h"
22
23 #if defined(DEBUG)
24 #define DBG udbg_printf
25 #else
26 #define DBG pr_devel
27 #endif
28
29 enum {
30 #if defined(CONFIG_PS3_DYNAMIC_DMA)
31 USE_DYNAMIC_DMA = 1,
32 #else
33 USE_DYNAMIC_DMA = 0,
34 #endif
35 };
36
37 enum {
38 PAGE_SHIFT_4K = 12U,
39 PAGE_SHIFT_64K = 16U,
40 PAGE_SHIFT_16M = 24U,
41 };
42
make_page_sizes(unsigned long a,unsigned long b)43 static unsigned long make_page_sizes(unsigned long a, unsigned long b)
44 {
45 return (a << 56) | (b << 48);
46 }
47
48 enum {
49 ALLOCATE_MEMORY_TRY_ALT_UNIT = 0X04,
50 ALLOCATE_MEMORY_ADDR_ZERO = 0X08,
51 };
52
53 /* valid htab sizes are {18,19,20} = 256K, 512K, 1M */
54
55 enum {
56 HTAB_SIZE_MAX = 20U, /* HV limit of 1MB */
57 HTAB_SIZE_MIN = 18U, /* CPU limit of 256KB */
58 };
59
60 /*============================================================================*/
61 /* virtual address space routines */
62 /*============================================================================*/
63
64 /**
65 * struct mem_region - memory region structure
66 * @base: base address
67 * @size: size in bytes
68 * @offset: difference between base and rm.size
69 * @destroy: flag if region should be destroyed upon shutdown
70 */
71
72 struct mem_region {
73 u64 base;
74 u64 size;
75 unsigned long offset;
76 int destroy;
77 };
78
79 /**
80 * struct map - address space state variables holder
81 * @total: total memory available as reported by HV
82 * @vas_id - HV virtual address space id
83 * @htab_size: htab size in bytes
84 *
85 * The HV virtual address space (vas) allows for hotplug memory regions.
86 * Memory regions can be created and destroyed in the vas at runtime.
87 * @rm: real mode (bootmem) region
88 * @r1: highmem region(s)
89 *
90 * ps3 addresses
91 * virt_addr: a cpu 'translated' effective address
92 * phys_addr: an address in what Linux thinks is the physical address space
93 * lpar_addr: an address in the HV virtual address space
94 * bus_addr: an io controller 'translated' address on a device bus
95 */
96
97 struct map {
98 u64 total;
99 u64 vas_id;
100 u64 htab_size;
101 struct mem_region rm;
102 struct mem_region r1;
103 };
104
105 #define debug_dump_map(x) _debug_dump_map(x, __func__, __LINE__)
_debug_dump_map(const struct map * m,const char * func,int line)106 static void __maybe_unused _debug_dump_map(const struct map *m,
107 const char *func, int line)
108 {
109 DBG("%s:%d: map.total = %llxh\n", func, line, m->total);
110 DBG("%s:%d: map.rm.size = %llxh\n", func, line, m->rm.size);
111 DBG("%s:%d: map.vas_id = %llu\n", func, line, m->vas_id);
112 DBG("%s:%d: map.htab_size = %llxh\n", func, line, m->htab_size);
113 DBG("%s:%d: map.r1.base = %llxh\n", func, line, m->r1.base);
114 DBG("%s:%d: map.r1.offset = %lxh\n", func, line, m->r1.offset);
115 DBG("%s:%d: map.r1.size = %llxh\n", func, line, m->r1.size);
116 }
117
118 static struct map map;
119
120 /**
121 * ps3_mm_phys_to_lpar - translate a linux physical address to lpar address
122 * @phys_addr: linux physical address
123 */
124
ps3_mm_phys_to_lpar(unsigned long phys_addr)125 unsigned long ps3_mm_phys_to_lpar(unsigned long phys_addr)
126 {
127 BUG_ON(is_kernel_addr(phys_addr));
128 return (phys_addr < map.rm.size || phys_addr >= map.total)
129 ? phys_addr : phys_addr + map.r1.offset;
130 }
131
132 EXPORT_SYMBOL(ps3_mm_phys_to_lpar);
133
134 /**
135 * ps3_mm_vas_create - create the virtual address space
136 */
137
ps3_mm_vas_create(unsigned long * htab_size)138 void __init ps3_mm_vas_create(unsigned long* htab_size)
139 {
140 int result;
141 u64 start_address;
142 u64 size;
143 u64 access_right;
144 u64 max_page_size;
145 u64 flags;
146
147 result = lv1_query_logical_partition_address_region_info(0,
148 &start_address, &size, &access_right, &max_page_size,
149 &flags);
150
151 if (result) {
152 DBG("%s:%d: lv1_query_logical_partition_address_region_info "
153 "failed: %s\n", __func__, __LINE__,
154 ps3_result(result));
155 goto fail;
156 }
157
158 if (max_page_size < PAGE_SHIFT_16M) {
159 DBG("%s:%d: bad max_page_size %llxh\n", __func__, __LINE__,
160 max_page_size);
161 goto fail;
162 }
163
164 BUILD_BUG_ON(CONFIG_PS3_HTAB_SIZE > HTAB_SIZE_MAX);
165 BUILD_BUG_ON(CONFIG_PS3_HTAB_SIZE < HTAB_SIZE_MIN);
166
167 result = lv1_construct_virtual_address_space(CONFIG_PS3_HTAB_SIZE,
168 2, make_page_sizes(PAGE_SHIFT_16M, PAGE_SHIFT_64K),
169 &map.vas_id, &map.htab_size);
170
171 if (result) {
172 DBG("%s:%d: lv1_construct_virtual_address_space failed: %s\n",
173 __func__, __LINE__, ps3_result(result));
174 goto fail;
175 }
176
177 result = lv1_select_virtual_address_space(map.vas_id);
178
179 if (result) {
180 DBG("%s:%d: lv1_select_virtual_address_space failed: %s\n",
181 __func__, __LINE__, ps3_result(result));
182 goto fail;
183 }
184
185 *htab_size = map.htab_size;
186
187 debug_dump_map(&map);
188
189 return;
190
191 fail:
192 panic("ps3_mm_vas_create failed");
193 }
194
195 /**
196 * ps3_mm_vas_destroy -
197 */
198
ps3_mm_vas_destroy(void)199 void ps3_mm_vas_destroy(void)
200 {
201 int result;
202
203 DBG("%s:%d: map.vas_id = %llu\n", __func__, __LINE__, map.vas_id);
204
205 if (map.vas_id) {
206 result = lv1_select_virtual_address_space(0);
207 BUG_ON(result);
208 result = lv1_destruct_virtual_address_space(map.vas_id);
209 BUG_ON(result);
210 map.vas_id = 0;
211 }
212 }
213
ps3_mm_get_repository_highmem(struct mem_region * r)214 static int ps3_mm_get_repository_highmem(struct mem_region *r)
215 {
216 int result;
217
218 /* Assume a single highmem region. */
219
220 result = ps3_repository_read_highmem_info(0, &r->base, &r->size);
221
222 if (result)
223 goto zero_region;
224
225 if (!r->base || !r->size) {
226 result = -1;
227 goto zero_region;
228 }
229
230 r->offset = r->base - map.rm.size;
231
232 DBG("%s:%d: Found high region in repository: %llxh %llxh\n",
233 __func__, __LINE__, r->base, r->size);
234
235 return 0;
236
237 zero_region:
238 DBG("%s:%d: No high region in repository.\n", __func__, __LINE__);
239
240 r->size = r->base = r->offset = 0;
241 return result;
242 }
243
ps3_mm_set_repository_highmem(const struct mem_region * r)244 static int ps3_mm_set_repository_highmem(const struct mem_region *r)
245 {
246 /* Assume a single highmem region. */
247
248 return r ? ps3_repository_write_highmem_info(0, r->base, r->size) :
249 ps3_repository_write_highmem_info(0, 0, 0);
250 }
251
252 /**
253 * ps3_mm_region_create - create a memory region in the vas
254 * @r: pointer to a struct mem_region to accept initialized values
255 * @size: requested region size
256 *
257 * This implementation creates the region with the vas large page size.
258 * @size is rounded down to a multiple of the vas large page size.
259 */
260
ps3_mm_region_create(struct mem_region * r,unsigned long size)261 static int ps3_mm_region_create(struct mem_region *r, unsigned long size)
262 {
263 int result;
264 u64 muid;
265
266 r->size = _ALIGN_DOWN(size, 1 << PAGE_SHIFT_16M);
267
268 DBG("%s:%d requested %lxh\n", __func__, __LINE__, size);
269 DBG("%s:%d actual %llxh\n", __func__, __LINE__, r->size);
270 DBG("%s:%d difference %llxh (%lluMB)\n", __func__, __LINE__,
271 size - r->size, (size - r->size) / 1024 / 1024);
272
273 if (r->size == 0) {
274 DBG("%s:%d: size == 0\n", __func__, __LINE__);
275 result = -1;
276 goto zero_region;
277 }
278
279 result = lv1_allocate_memory(r->size, PAGE_SHIFT_16M, 0,
280 ALLOCATE_MEMORY_TRY_ALT_UNIT, &r->base, &muid);
281
282 if (result || r->base < map.rm.size) {
283 DBG("%s:%d: lv1_allocate_memory failed: %s\n",
284 __func__, __LINE__, ps3_result(result));
285 goto zero_region;
286 }
287
288 r->destroy = 1;
289 r->offset = r->base - map.rm.size;
290 return result;
291
292 zero_region:
293 r->size = r->base = r->offset = 0;
294 return result;
295 }
296
297 /**
298 * ps3_mm_region_destroy - destroy a memory region
299 * @r: pointer to struct mem_region
300 */
301
ps3_mm_region_destroy(struct mem_region * r)302 static void ps3_mm_region_destroy(struct mem_region *r)
303 {
304 int result;
305
306 if (!r->destroy) {
307 pr_info("%s:%d: Not destroying high region: %llxh %llxh\n",
308 __func__, __LINE__, r->base, r->size);
309 return;
310 }
311
312 DBG("%s:%d: r->base = %llxh\n", __func__, __LINE__, r->base);
313
314 if (r->base) {
315 result = lv1_release_memory(r->base);
316 BUG_ON(result);
317 r->size = r->base = r->offset = 0;
318 map.total = map.rm.size;
319 }
320 ps3_mm_set_repository_highmem(NULL);
321 }
322
323 /*============================================================================*/
324 /* dma routines */
325 /*============================================================================*/
326
327 /**
328 * dma_sb_lpar_to_bus - Translate an lpar address to ioc mapped bus address.
329 * @r: pointer to dma region structure
330 * @lpar_addr: HV lpar address
331 */
332
dma_sb_lpar_to_bus(struct ps3_dma_region * r,unsigned long lpar_addr)333 static unsigned long dma_sb_lpar_to_bus(struct ps3_dma_region *r,
334 unsigned long lpar_addr)
335 {
336 if (lpar_addr >= map.rm.size)
337 lpar_addr -= map.r1.offset;
338 BUG_ON(lpar_addr < r->offset);
339 BUG_ON(lpar_addr >= r->offset + r->len);
340 return r->bus_addr + lpar_addr - r->offset;
341 }
342
343 #define dma_dump_region(_a) _dma_dump_region(_a, __func__, __LINE__)
_dma_dump_region(const struct ps3_dma_region * r,const char * func,int line)344 static void __maybe_unused _dma_dump_region(const struct ps3_dma_region *r,
345 const char *func, int line)
346 {
347 DBG("%s:%d: dev %llu:%llu\n", func, line, r->dev->bus_id,
348 r->dev->dev_id);
349 DBG("%s:%d: page_size %u\n", func, line, r->page_size);
350 DBG("%s:%d: bus_addr %lxh\n", func, line, r->bus_addr);
351 DBG("%s:%d: len %lxh\n", func, line, r->len);
352 DBG("%s:%d: offset %lxh\n", func, line, r->offset);
353 }
354
355 /**
356 * dma_chunk - A chunk of dma pages mapped by the io controller.
357 * @region - The dma region that owns this chunk.
358 * @lpar_addr: Starting lpar address of the area to map.
359 * @bus_addr: Starting ioc bus address of the area to map.
360 * @len: Length in bytes of the area to map.
361 * @link: A struct list_head used with struct ps3_dma_region.chunk_list, the
362 * list of all chuncks owned by the region.
363 *
364 * This implementation uses a very simple dma page manager
365 * based on the dma_chunk structure. This scheme assumes
366 * that all drivers use very well behaved dma ops.
367 */
368
369 struct dma_chunk {
370 struct ps3_dma_region *region;
371 unsigned long lpar_addr;
372 unsigned long bus_addr;
373 unsigned long len;
374 struct list_head link;
375 unsigned int usage_count;
376 };
377
378 #define dma_dump_chunk(_a) _dma_dump_chunk(_a, __func__, __LINE__)
_dma_dump_chunk(const struct dma_chunk * c,const char * func,int line)379 static void _dma_dump_chunk (const struct dma_chunk* c, const char* func,
380 int line)
381 {
382 DBG("%s:%d: r.dev %llu:%llu\n", func, line,
383 c->region->dev->bus_id, c->region->dev->dev_id);
384 DBG("%s:%d: r.bus_addr %lxh\n", func, line, c->region->bus_addr);
385 DBG("%s:%d: r.page_size %u\n", func, line, c->region->page_size);
386 DBG("%s:%d: r.len %lxh\n", func, line, c->region->len);
387 DBG("%s:%d: r.offset %lxh\n", func, line, c->region->offset);
388 DBG("%s:%d: c.lpar_addr %lxh\n", func, line, c->lpar_addr);
389 DBG("%s:%d: c.bus_addr %lxh\n", func, line, c->bus_addr);
390 DBG("%s:%d: c.len %lxh\n", func, line, c->len);
391 }
392
dma_find_chunk(struct ps3_dma_region * r,unsigned long bus_addr,unsigned long len)393 static struct dma_chunk * dma_find_chunk(struct ps3_dma_region *r,
394 unsigned long bus_addr, unsigned long len)
395 {
396 struct dma_chunk *c;
397 unsigned long aligned_bus = _ALIGN_DOWN(bus_addr, 1 << r->page_size);
398 unsigned long aligned_len = _ALIGN_UP(len+bus_addr-aligned_bus,
399 1 << r->page_size);
400
401 list_for_each_entry(c, &r->chunk_list.head, link) {
402 /* intersection */
403 if (aligned_bus >= c->bus_addr &&
404 aligned_bus + aligned_len <= c->bus_addr + c->len)
405 return c;
406
407 /* below */
408 if (aligned_bus + aligned_len <= c->bus_addr)
409 continue;
410
411 /* above */
412 if (aligned_bus >= c->bus_addr + c->len)
413 continue;
414
415 /* we don't handle the multi-chunk case for now */
416 dma_dump_chunk(c);
417 BUG();
418 }
419 return NULL;
420 }
421
dma_find_chunk_lpar(struct ps3_dma_region * r,unsigned long lpar_addr,unsigned long len)422 static struct dma_chunk *dma_find_chunk_lpar(struct ps3_dma_region *r,
423 unsigned long lpar_addr, unsigned long len)
424 {
425 struct dma_chunk *c;
426 unsigned long aligned_lpar = _ALIGN_DOWN(lpar_addr, 1 << r->page_size);
427 unsigned long aligned_len = _ALIGN_UP(len + lpar_addr - aligned_lpar,
428 1 << r->page_size);
429
430 list_for_each_entry(c, &r->chunk_list.head, link) {
431 /* intersection */
432 if (c->lpar_addr <= aligned_lpar &&
433 aligned_lpar < c->lpar_addr + c->len) {
434 if (aligned_lpar + aligned_len <= c->lpar_addr + c->len)
435 return c;
436 else {
437 dma_dump_chunk(c);
438 BUG();
439 }
440 }
441 /* below */
442 if (aligned_lpar + aligned_len <= c->lpar_addr) {
443 continue;
444 }
445 /* above */
446 if (c->lpar_addr + c->len <= aligned_lpar) {
447 continue;
448 }
449 }
450 return NULL;
451 }
452
dma_sb_free_chunk(struct dma_chunk * c)453 static int dma_sb_free_chunk(struct dma_chunk *c)
454 {
455 int result = 0;
456
457 if (c->bus_addr) {
458 result = lv1_unmap_device_dma_region(c->region->dev->bus_id,
459 c->region->dev->dev_id, c->bus_addr, c->len);
460 BUG_ON(result);
461 }
462
463 kfree(c);
464 return result;
465 }
466
dma_ioc0_free_chunk(struct dma_chunk * c)467 static int dma_ioc0_free_chunk(struct dma_chunk *c)
468 {
469 int result = 0;
470 int iopage;
471 unsigned long offset;
472 struct ps3_dma_region *r = c->region;
473
474 DBG("%s:start\n", __func__);
475 for (iopage = 0; iopage < (c->len >> r->page_size); iopage++) {
476 offset = (1 << r->page_size) * iopage;
477 /* put INVALID entry */
478 result = lv1_put_iopte(0,
479 c->bus_addr + offset,
480 c->lpar_addr + offset,
481 r->ioid,
482 0);
483 DBG("%s: bus=%#lx, lpar=%#lx, ioid=%d\n", __func__,
484 c->bus_addr + offset,
485 c->lpar_addr + offset,
486 r->ioid);
487
488 if (result) {
489 DBG("%s:%d: lv1_put_iopte failed: %s\n", __func__,
490 __LINE__, ps3_result(result));
491 }
492 }
493 kfree(c);
494 DBG("%s:end\n", __func__);
495 return result;
496 }
497
498 /**
499 * dma_sb_map_pages - Maps dma pages into the io controller bus address space.
500 * @r: Pointer to a struct ps3_dma_region.
501 * @phys_addr: Starting physical address of the area to map.
502 * @len: Length in bytes of the area to map.
503 * c_out: A pointer to receive an allocated struct dma_chunk for this area.
504 *
505 * This is the lowest level dma mapping routine, and is the one that will
506 * make the HV call to add the pages into the io controller address space.
507 */
508
dma_sb_map_pages(struct ps3_dma_region * r,unsigned long phys_addr,unsigned long len,struct dma_chunk ** c_out,u64 iopte_flag)509 static int dma_sb_map_pages(struct ps3_dma_region *r, unsigned long phys_addr,
510 unsigned long len, struct dma_chunk **c_out, u64 iopte_flag)
511 {
512 int result;
513 struct dma_chunk *c;
514
515 c = kzalloc(sizeof(*c), GFP_ATOMIC);
516 if (!c) {
517 result = -ENOMEM;
518 goto fail_alloc;
519 }
520
521 c->region = r;
522 c->lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
523 c->bus_addr = dma_sb_lpar_to_bus(r, c->lpar_addr);
524 c->len = len;
525
526 BUG_ON(iopte_flag != 0xf800000000000000UL);
527 result = lv1_map_device_dma_region(c->region->dev->bus_id,
528 c->region->dev->dev_id, c->lpar_addr,
529 c->bus_addr, c->len, iopte_flag);
530 if (result) {
531 DBG("%s:%d: lv1_map_device_dma_region failed: %s\n",
532 __func__, __LINE__, ps3_result(result));
533 goto fail_map;
534 }
535
536 list_add(&c->link, &r->chunk_list.head);
537
538 *c_out = c;
539 return 0;
540
541 fail_map:
542 kfree(c);
543 fail_alloc:
544 *c_out = NULL;
545 DBG(" <- %s:%d\n", __func__, __LINE__);
546 return result;
547 }
548
dma_ioc0_map_pages(struct ps3_dma_region * r,unsigned long phys_addr,unsigned long len,struct dma_chunk ** c_out,u64 iopte_flag)549 static int dma_ioc0_map_pages(struct ps3_dma_region *r, unsigned long phys_addr,
550 unsigned long len, struct dma_chunk **c_out,
551 u64 iopte_flag)
552 {
553 int result;
554 struct dma_chunk *c, *last;
555 int iopage, pages;
556 unsigned long offset;
557
558 DBG(KERN_ERR "%s: phy=%#lx, lpar%#lx, len=%#lx\n", __func__,
559 phys_addr, ps3_mm_phys_to_lpar(phys_addr), len);
560 c = kzalloc(sizeof(*c), GFP_ATOMIC);
561 if (!c) {
562 result = -ENOMEM;
563 goto fail_alloc;
564 }
565
566 c->region = r;
567 c->len = len;
568 c->lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
569 /* allocate IO address */
570 if (list_empty(&r->chunk_list.head)) {
571 /* first one */
572 c->bus_addr = r->bus_addr;
573 } else {
574 /* derive from last bus addr*/
575 last = list_entry(r->chunk_list.head.next,
576 struct dma_chunk, link);
577 c->bus_addr = last->bus_addr + last->len;
578 DBG("%s: last bus=%#lx, len=%#lx\n", __func__,
579 last->bus_addr, last->len);
580 }
581
582 /* FIXME: check whether length exceeds region size */
583
584 /* build ioptes for the area */
585 pages = len >> r->page_size;
586 DBG("%s: pgsize=%#x len=%#lx pages=%#x iopteflag=%#llx\n", __func__,
587 r->page_size, r->len, pages, iopte_flag);
588 for (iopage = 0; iopage < pages; iopage++) {
589 offset = (1 << r->page_size) * iopage;
590 result = lv1_put_iopte(0,
591 c->bus_addr + offset,
592 c->lpar_addr + offset,
593 r->ioid,
594 iopte_flag);
595 if (result) {
596 pr_warn("%s:%d: lv1_put_iopte failed: %s\n",
597 __func__, __LINE__, ps3_result(result));
598 goto fail_map;
599 }
600 DBG("%s: pg=%d bus=%#lx, lpar=%#lx, ioid=%#x\n", __func__,
601 iopage, c->bus_addr + offset, c->lpar_addr + offset,
602 r->ioid);
603 }
604
605 /* be sure that last allocated one is inserted at head */
606 list_add(&c->link, &r->chunk_list.head);
607
608 *c_out = c;
609 DBG("%s: end\n", __func__);
610 return 0;
611
612 fail_map:
613 for (iopage--; 0 <= iopage; iopage--) {
614 lv1_put_iopte(0,
615 c->bus_addr + offset,
616 c->lpar_addr + offset,
617 r->ioid,
618 0);
619 }
620 kfree(c);
621 fail_alloc:
622 *c_out = NULL;
623 return result;
624 }
625
626 /**
627 * dma_sb_region_create - Create a device dma region.
628 * @r: Pointer to a struct ps3_dma_region.
629 *
630 * This is the lowest level dma region create routine, and is the one that
631 * will make the HV call to create the region.
632 */
633
dma_sb_region_create(struct ps3_dma_region * r)634 static int dma_sb_region_create(struct ps3_dma_region *r)
635 {
636 int result;
637 u64 bus_addr;
638
639 DBG(" -> %s:%d:\n", __func__, __LINE__);
640
641 BUG_ON(!r);
642
643 if (!r->dev->bus_id) {
644 pr_info("%s:%d: %llu:%llu no dma\n", __func__, __LINE__,
645 r->dev->bus_id, r->dev->dev_id);
646 return 0;
647 }
648
649 DBG("%s:%u: len = 0x%lx, page_size = %u, offset = 0x%lx\n", __func__,
650 __LINE__, r->len, r->page_size, r->offset);
651
652 BUG_ON(!r->len);
653 BUG_ON(!r->page_size);
654 BUG_ON(!r->region_ops);
655
656 INIT_LIST_HEAD(&r->chunk_list.head);
657 spin_lock_init(&r->chunk_list.lock);
658
659 result = lv1_allocate_device_dma_region(r->dev->bus_id, r->dev->dev_id,
660 roundup_pow_of_two(r->len), r->page_size, r->region_type,
661 &bus_addr);
662 r->bus_addr = bus_addr;
663
664 if (result) {
665 DBG("%s:%d: lv1_allocate_device_dma_region failed: %s\n",
666 __func__, __LINE__, ps3_result(result));
667 r->len = r->bus_addr = 0;
668 }
669
670 return result;
671 }
672
dma_ioc0_region_create(struct ps3_dma_region * r)673 static int dma_ioc0_region_create(struct ps3_dma_region *r)
674 {
675 int result;
676 u64 bus_addr;
677
678 INIT_LIST_HEAD(&r->chunk_list.head);
679 spin_lock_init(&r->chunk_list.lock);
680
681 result = lv1_allocate_io_segment(0,
682 r->len,
683 r->page_size,
684 &bus_addr);
685 r->bus_addr = bus_addr;
686 if (result) {
687 DBG("%s:%d: lv1_allocate_io_segment failed: %s\n",
688 __func__, __LINE__, ps3_result(result));
689 r->len = r->bus_addr = 0;
690 }
691 DBG("%s: len=%#lx, pg=%d, bus=%#lx\n", __func__,
692 r->len, r->page_size, r->bus_addr);
693 return result;
694 }
695
696 /**
697 * dma_region_free - Free a device dma region.
698 * @r: Pointer to a struct ps3_dma_region.
699 *
700 * This is the lowest level dma region free routine, and is the one that
701 * will make the HV call to free the region.
702 */
703
dma_sb_region_free(struct ps3_dma_region * r)704 static int dma_sb_region_free(struct ps3_dma_region *r)
705 {
706 int result;
707 struct dma_chunk *c;
708 struct dma_chunk *tmp;
709
710 BUG_ON(!r);
711
712 if (!r->dev->bus_id) {
713 pr_info("%s:%d: %llu:%llu no dma\n", __func__, __LINE__,
714 r->dev->bus_id, r->dev->dev_id);
715 return 0;
716 }
717
718 list_for_each_entry_safe(c, tmp, &r->chunk_list.head, link) {
719 list_del(&c->link);
720 dma_sb_free_chunk(c);
721 }
722
723 result = lv1_free_device_dma_region(r->dev->bus_id, r->dev->dev_id,
724 r->bus_addr);
725
726 if (result)
727 DBG("%s:%d: lv1_free_device_dma_region failed: %s\n",
728 __func__, __LINE__, ps3_result(result));
729
730 r->bus_addr = 0;
731
732 return result;
733 }
734
dma_ioc0_region_free(struct ps3_dma_region * r)735 static int dma_ioc0_region_free(struct ps3_dma_region *r)
736 {
737 int result;
738 struct dma_chunk *c, *n;
739
740 DBG("%s: start\n", __func__);
741 list_for_each_entry_safe(c, n, &r->chunk_list.head, link) {
742 list_del(&c->link);
743 dma_ioc0_free_chunk(c);
744 }
745
746 result = lv1_release_io_segment(0, r->bus_addr);
747
748 if (result)
749 DBG("%s:%d: lv1_free_device_dma_region failed: %s\n",
750 __func__, __LINE__, ps3_result(result));
751
752 r->bus_addr = 0;
753 DBG("%s: end\n", __func__);
754
755 return result;
756 }
757
758 /**
759 * dma_sb_map_area - Map an area of memory into a device dma region.
760 * @r: Pointer to a struct ps3_dma_region.
761 * @virt_addr: Starting virtual address of the area to map.
762 * @len: Length in bytes of the area to map.
763 * @bus_addr: A pointer to return the starting ioc bus address of the area to
764 * map.
765 *
766 * This is the common dma mapping routine.
767 */
768
dma_sb_map_area(struct ps3_dma_region * r,unsigned long virt_addr,unsigned long len,dma_addr_t * bus_addr,u64 iopte_flag)769 static int dma_sb_map_area(struct ps3_dma_region *r, unsigned long virt_addr,
770 unsigned long len, dma_addr_t *bus_addr,
771 u64 iopte_flag)
772 {
773 int result;
774 unsigned long flags;
775 struct dma_chunk *c;
776 unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
777 : virt_addr;
778 unsigned long aligned_phys = _ALIGN_DOWN(phys_addr, 1 << r->page_size);
779 unsigned long aligned_len = _ALIGN_UP(len + phys_addr - aligned_phys,
780 1 << r->page_size);
781 *bus_addr = dma_sb_lpar_to_bus(r, ps3_mm_phys_to_lpar(phys_addr));
782
783 if (!USE_DYNAMIC_DMA) {
784 unsigned long lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
785 DBG(" -> %s:%d\n", __func__, __LINE__);
786 DBG("%s:%d virt_addr %lxh\n", __func__, __LINE__,
787 virt_addr);
788 DBG("%s:%d phys_addr %lxh\n", __func__, __LINE__,
789 phys_addr);
790 DBG("%s:%d lpar_addr %lxh\n", __func__, __LINE__,
791 lpar_addr);
792 DBG("%s:%d len %lxh\n", __func__, __LINE__, len);
793 DBG("%s:%d bus_addr %llxh (%lxh)\n", __func__, __LINE__,
794 *bus_addr, len);
795 }
796
797 spin_lock_irqsave(&r->chunk_list.lock, flags);
798 c = dma_find_chunk(r, *bus_addr, len);
799
800 if (c) {
801 DBG("%s:%d: reusing mapped chunk", __func__, __LINE__);
802 dma_dump_chunk(c);
803 c->usage_count++;
804 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
805 return 0;
806 }
807
808 result = dma_sb_map_pages(r, aligned_phys, aligned_len, &c, iopte_flag);
809
810 if (result) {
811 *bus_addr = 0;
812 DBG("%s:%d: dma_sb_map_pages failed (%d)\n",
813 __func__, __LINE__, result);
814 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
815 return result;
816 }
817
818 c->usage_count = 1;
819
820 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
821 return result;
822 }
823
dma_ioc0_map_area(struct ps3_dma_region * r,unsigned long virt_addr,unsigned long len,dma_addr_t * bus_addr,u64 iopte_flag)824 static int dma_ioc0_map_area(struct ps3_dma_region *r, unsigned long virt_addr,
825 unsigned long len, dma_addr_t *bus_addr,
826 u64 iopte_flag)
827 {
828 int result;
829 unsigned long flags;
830 struct dma_chunk *c;
831 unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
832 : virt_addr;
833 unsigned long aligned_phys = _ALIGN_DOWN(phys_addr, 1 << r->page_size);
834 unsigned long aligned_len = _ALIGN_UP(len + phys_addr - aligned_phys,
835 1 << r->page_size);
836
837 DBG(KERN_ERR "%s: vaddr=%#lx, len=%#lx\n", __func__,
838 virt_addr, len);
839 DBG(KERN_ERR "%s: ph=%#lx a_ph=%#lx a_l=%#lx\n", __func__,
840 phys_addr, aligned_phys, aligned_len);
841
842 spin_lock_irqsave(&r->chunk_list.lock, flags);
843 c = dma_find_chunk_lpar(r, ps3_mm_phys_to_lpar(phys_addr), len);
844
845 if (c) {
846 /* FIXME */
847 BUG();
848 *bus_addr = c->bus_addr + phys_addr - aligned_phys;
849 c->usage_count++;
850 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
851 return 0;
852 }
853
854 result = dma_ioc0_map_pages(r, aligned_phys, aligned_len, &c,
855 iopte_flag);
856
857 if (result) {
858 *bus_addr = 0;
859 DBG("%s:%d: dma_ioc0_map_pages failed (%d)\n",
860 __func__, __LINE__, result);
861 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
862 return result;
863 }
864 *bus_addr = c->bus_addr + phys_addr - aligned_phys;
865 DBG("%s: va=%#lx pa=%#lx a_pa=%#lx bus=%#llx\n", __func__,
866 virt_addr, phys_addr, aligned_phys, *bus_addr);
867 c->usage_count = 1;
868
869 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
870 return result;
871 }
872
873 /**
874 * dma_sb_unmap_area - Unmap an area of memory from a device dma region.
875 * @r: Pointer to a struct ps3_dma_region.
876 * @bus_addr: The starting ioc bus address of the area to unmap.
877 * @len: Length in bytes of the area to unmap.
878 *
879 * This is the common dma unmap routine.
880 */
881
dma_sb_unmap_area(struct ps3_dma_region * r,dma_addr_t bus_addr,unsigned long len)882 static int dma_sb_unmap_area(struct ps3_dma_region *r, dma_addr_t bus_addr,
883 unsigned long len)
884 {
885 unsigned long flags;
886 struct dma_chunk *c;
887
888 spin_lock_irqsave(&r->chunk_list.lock, flags);
889 c = dma_find_chunk(r, bus_addr, len);
890
891 if (!c) {
892 unsigned long aligned_bus = _ALIGN_DOWN(bus_addr,
893 1 << r->page_size);
894 unsigned long aligned_len = _ALIGN_UP(len + bus_addr
895 - aligned_bus, 1 << r->page_size);
896 DBG("%s:%d: not found: bus_addr %llxh\n",
897 __func__, __LINE__, bus_addr);
898 DBG("%s:%d: not found: len %lxh\n",
899 __func__, __LINE__, len);
900 DBG("%s:%d: not found: aligned_bus %lxh\n",
901 __func__, __LINE__, aligned_bus);
902 DBG("%s:%d: not found: aligned_len %lxh\n",
903 __func__, __LINE__, aligned_len);
904 BUG();
905 }
906
907 c->usage_count--;
908
909 if (!c->usage_count) {
910 list_del(&c->link);
911 dma_sb_free_chunk(c);
912 }
913
914 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
915 return 0;
916 }
917
dma_ioc0_unmap_area(struct ps3_dma_region * r,dma_addr_t bus_addr,unsigned long len)918 static int dma_ioc0_unmap_area(struct ps3_dma_region *r,
919 dma_addr_t bus_addr, unsigned long len)
920 {
921 unsigned long flags;
922 struct dma_chunk *c;
923
924 DBG("%s: start a=%#llx l=%#lx\n", __func__, bus_addr, len);
925 spin_lock_irqsave(&r->chunk_list.lock, flags);
926 c = dma_find_chunk(r, bus_addr, len);
927
928 if (!c) {
929 unsigned long aligned_bus = _ALIGN_DOWN(bus_addr,
930 1 << r->page_size);
931 unsigned long aligned_len = _ALIGN_UP(len + bus_addr
932 - aligned_bus,
933 1 << r->page_size);
934 DBG("%s:%d: not found: bus_addr %llxh\n",
935 __func__, __LINE__, bus_addr);
936 DBG("%s:%d: not found: len %lxh\n",
937 __func__, __LINE__, len);
938 DBG("%s:%d: not found: aligned_bus %lxh\n",
939 __func__, __LINE__, aligned_bus);
940 DBG("%s:%d: not found: aligned_len %lxh\n",
941 __func__, __LINE__, aligned_len);
942 BUG();
943 }
944
945 c->usage_count--;
946
947 if (!c->usage_count) {
948 list_del(&c->link);
949 dma_ioc0_free_chunk(c);
950 }
951
952 spin_unlock_irqrestore(&r->chunk_list.lock, flags);
953 DBG("%s: end\n", __func__);
954 return 0;
955 }
956
957 /**
958 * dma_sb_region_create_linear - Setup a linear dma mapping for a device.
959 * @r: Pointer to a struct ps3_dma_region.
960 *
961 * This routine creates an HV dma region for the device and maps all available
962 * ram into the io controller bus address space.
963 */
964
dma_sb_region_create_linear(struct ps3_dma_region * r)965 static int dma_sb_region_create_linear(struct ps3_dma_region *r)
966 {
967 int result;
968 unsigned long virt_addr, len;
969 dma_addr_t tmp;
970
971 if (r->len > 16*1024*1024) { /* FIXME: need proper fix */
972 /* force 16M dma pages for linear mapping */
973 if (r->page_size != PS3_DMA_16M) {
974 pr_info("%s:%d: forcing 16M pages for linear map\n",
975 __func__, __LINE__);
976 r->page_size = PS3_DMA_16M;
977 r->len = _ALIGN_UP(r->len, 1 << r->page_size);
978 }
979 }
980
981 result = dma_sb_region_create(r);
982 BUG_ON(result);
983
984 if (r->offset < map.rm.size) {
985 /* Map (part of) 1st RAM chunk */
986 virt_addr = map.rm.base + r->offset;
987 len = map.rm.size - r->offset;
988 if (len > r->len)
989 len = r->len;
990 result = dma_sb_map_area(r, virt_addr, len, &tmp,
991 CBE_IOPTE_PP_W | CBE_IOPTE_PP_R | CBE_IOPTE_SO_RW |
992 CBE_IOPTE_M);
993 BUG_ON(result);
994 }
995
996 if (r->offset + r->len > map.rm.size) {
997 /* Map (part of) 2nd RAM chunk */
998 virt_addr = map.rm.size;
999 len = r->len;
1000 if (r->offset >= map.rm.size)
1001 virt_addr += r->offset - map.rm.size;
1002 else
1003 len -= map.rm.size - r->offset;
1004 result = dma_sb_map_area(r, virt_addr, len, &tmp,
1005 CBE_IOPTE_PP_W | CBE_IOPTE_PP_R | CBE_IOPTE_SO_RW |
1006 CBE_IOPTE_M);
1007 BUG_ON(result);
1008 }
1009
1010 return result;
1011 }
1012
1013 /**
1014 * dma_sb_region_free_linear - Free a linear dma mapping for a device.
1015 * @r: Pointer to a struct ps3_dma_region.
1016 *
1017 * This routine will unmap all mapped areas and free the HV dma region.
1018 */
1019
dma_sb_region_free_linear(struct ps3_dma_region * r)1020 static int dma_sb_region_free_linear(struct ps3_dma_region *r)
1021 {
1022 int result;
1023 dma_addr_t bus_addr;
1024 unsigned long len, lpar_addr;
1025
1026 if (r->offset < map.rm.size) {
1027 /* Unmap (part of) 1st RAM chunk */
1028 lpar_addr = map.rm.base + r->offset;
1029 len = map.rm.size - r->offset;
1030 if (len > r->len)
1031 len = r->len;
1032 bus_addr = dma_sb_lpar_to_bus(r, lpar_addr);
1033 result = dma_sb_unmap_area(r, bus_addr, len);
1034 BUG_ON(result);
1035 }
1036
1037 if (r->offset + r->len > map.rm.size) {
1038 /* Unmap (part of) 2nd RAM chunk */
1039 lpar_addr = map.r1.base;
1040 len = r->len;
1041 if (r->offset >= map.rm.size)
1042 lpar_addr += r->offset - map.rm.size;
1043 else
1044 len -= map.rm.size - r->offset;
1045 bus_addr = dma_sb_lpar_to_bus(r, lpar_addr);
1046 result = dma_sb_unmap_area(r, bus_addr, len);
1047 BUG_ON(result);
1048 }
1049
1050 result = dma_sb_region_free(r);
1051 BUG_ON(result);
1052
1053 return result;
1054 }
1055
1056 /**
1057 * dma_sb_map_area_linear - Map an area of memory into a device dma region.
1058 * @r: Pointer to a struct ps3_dma_region.
1059 * @virt_addr: Starting virtual address of the area to map.
1060 * @len: Length in bytes of the area to map.
1061 * @bus_addr: A pointer to return the starting ioc bus address of the area to
1062 * map.
1063 *
1064 * This routine just returns the corresponding bus address. Actual mapping
1065 * occurs in dma_region_create_linear().
1066 */
1067
dma_sb_map_area_linear(struct ps3_dma_region * r,unsigned long virt_addr,unsigned long len,dma_addr_t * bus_addr,u64 iopte_flag)1068 static int dma_sb_map_area_linear(struct ps3_dma_region *r,
1069 unsigned long virt_addr, unsigned long len, dma_addr_t *bus_addr,
1070 u64 iopte_flag)
1071 {
1072 unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
1073 : virt_addr;
1074 *bus_addr = dma_sb_lpar_to_bus(r, ps3_mm_phys_to_lpar(phys_addr));
1075 return 0;
1076 }
1077
1078 /**
1079 * dma_unmap_area_linear - Unmap an area of memory from a device dma region.
1080 * @r: Pointer to a struct ps3_dma_region.
1081 * @bus_addr: The starting ioc bus address of the area to unmap.
1082 * @len: Length in bytes of the area to unmap.
1083 *
1084 * This routine does nothing. Unmapping occurs in dma_sb_region_free_linear().
1085 */
1086
dma_sb_unmap_area_linear(struct ps3_dma_region * r,dma_addr_t bus_addr,unsigned long len)1087 static int dma_sb_unmap_area_linear(struct ps3_dma_region *r,
1088 dma_addr_t bus_addr, unsigned long len)
1089 {
1090 return 0;
1091 };
1092
1093 static const struct ps3_dma_region_ops ps3_dma_sb_region_ops = {
1094 .create = dma_sb_region_create,
1095 .free = dma_sb_region_free,
1096 .map = dma_sb_map_area,
1097 .unmap = dma_sb_unmap_area
1098 };
1099
1100 static const struct ps3_dma_region_ops ps3_dma_sb_region_linear_ops = {
1101 .create = dma_sb_region_create_linear,
1102 .free = dma_sb_region_free_linear,
1103 .map = dma_sb_map_area_linear,
1104 .unmap = dma_sb_unmap_area_linear
1105 };
1106
1107 static const struct ps3_dma_region_ops ps3_dma_ioc0_region_ops = {
1108 .create = dma_ioc0_region_create,
1109 .free = dma_ioc0_region_free,
1110 .map = dma_ioc0_map_area,
1111 .unmap = dma_ioc0_unmap_area
1112 };
1113
ps3_dma_region_init(struct ps3_system_bus_device * dev,struct ps3_dma_region * r,enum ps3_dma_page_size page_size,enum ps3_dma_region_type region_type,void * addr,unsigned long len)1114 int ps3_dma_region_init(struct ps3_system_bus_device *dev,
1115 struct ps3_dma_region *r, enum ps3_dma_page_size page_size,
1116 enum ps3_dma_region_type region_type, void *addr, unsigned long len)
1117 {
1118 unsigned long lpar_addr;
1119
1120 lpar_addr = addr ? ps3_mm_phys_to_lpar(__pa(addr)) : 0;
1121
1122 r->dev = dev;
1123 r->page_size = page_size;
1124 r->region_type = region_type;
1125 r->offset = lpar_addr;
1126 if (r->offset >= map.rm.size)
1127 r->offset -= map.r1.offset;
1128 r->len = len ? len : _ALIGN_UP(map.total, 1 << r->page_size);
1129
1130 switch (dev->dev_type) {
1131 case PS3_DEVICE_TYPE_SB:
1132 r->region_ops = (USE_DYNAMIC_DMA)
1133 ? &ps3_dma_sb_region_ops
1134 : &ps3_dma_sb_region_linear_ops;
1135 break;
1136 case PS3_DEVICE_TYPE_IOC0:
1137 r->region_ops = &ps3_dma_ioc0_region_ops;
1138 break;
1139 default:
1140 BUG();
1141 return -EINVAL;
1142 }
1143 return 0;
1144 }
1145 EXPORT_SYMBOL(ps3_dma_region_init);
1146
ps3_dma_region_create(struct ps3_dma_region * r)1147 int ps3_dma_region_create(struct ps3_dma_region *r)
1148 {
1149 BUG_ON(!r);
1150 BUG_ON(!r->region_ops);
1151 BUG_ON(!r->region_ops->create);
1152 return r->region_ops->create(r);
1153 }
1154 EXPORT_SYMBOL(ps3_dma_region_create);
1155
ps3_dma_region_free(struct ps3_dma_region * r)1156 int ps3_dma_region_free(struct ps3_dma_region *r)
1157 {
1158 BUG_ON(!r);
1159 BUG_ON(!r->region_ops);
1160 BUG_ON(!r->region_ops->free);
1161 return r->region_ops->free(r);
1162 }
1163 EXPORT_SYMBOL(ps3_dma_region_free);
1164
ps3_dma_map(struct ps3_dma_region * r,unsigned long virt_addr,unsigned long len,dma_addr_t * bus_addr,u64 iopte_flag)1165 int ps3_dma_map(struct ps3_dma_region *r, unsigned long virt_addr,
1166 unsigned long len, dma_addr_t *bus_addr,
1167 u64 iopte_flag)
1168 {
1169 return r->region_ops->map(r, virt_addr, len, bus_addr, iopte_flag);
1170 }
1171
ps3_dma_unmap(struct ps3_dma_region * r,dma_addr_t bus_addr,unsigned long len)1172 int ps3_dma_unmap(struct ps3_dma_region *r, dma_addr_t bus_addr,
1173 unsigned long len)
1174 {
1175 return r->region_ops->unmap(r, bus_addr, len);
1176 }
1177
1178 /*============================================================================*/
1179 /* system startup routines */
1180 /*============================================================================*/
1181
1182 /**
1183 * ps3_mm_init - initialize the address space state variables
1184 */
1185
ps3_mm_init(void)1186 void __init ps3_mm_init(void)
1187 {
1188 int result;
1189
1190 DBG(" -> %s:%d\n", __func__, __LINE__);
1191
1192 result = ps3_repository_read_mm_info(&map.rm.base, &map.rm.size,
1193 &map.total);
1194
1195 if (result)
1196 panic("ps3_repository_read_mm_info() failed");
1197
1198 map.rm.offset = map.rm.base;
1199 map.vas_id = map.htab_size = 0;
1200
1201 /* this implementation assumes map.rm.base is zero */
1202
1203 BUG_ON(map.rm.base);
1204 BUG_ON(!map.rm.size);
1205
1206 /* Check if we got the highmem region from an earlier boot step */
1207
1208 if (ps3_mm_get_repository_highmem(&map.r1)) {
1209 result = ps3_mm_region_create(&map.r1, map.total - map.rm.size);
1210
1211 if (!result)
1212 ps3_mm_set_repository_highmem(&map.r1);
1213 }
1214
1215 /* correct map.total for the real total amount of memory we use */
1216 map.total = map.rm.size + map.r1.size;
1217
1218 if (!map.r1.size) {
1219 DBG("%s:%d: No highmem region found\n", __func__, __LINE__);
1220 } else {
1221 DBG("%s:%d: Adding highmem region: %llxh %llxh\n",
1222 __func__, __LINE__, map.rm.size,
1223 map.total - map.rm.size);
1224 memblock_add(map.rm.size, map.total - map.rm.size);
1225 }
1226
1227 DBG(" <- %s:%d\n", __func__, __LINE__);
1228 }
1229
1230 /**
1231 * ps3_mm_shutdown - final cleanup of address space
1232 */
1233
ps3_mm_shutdown(void)1234 void ps3_mm_shutdown(void)
1235 {
1236 ps3_mm_region_destroy(&map.r1);
1237 }
1238