// SPDX-License-Identifier: GPL-2.0-only
/*
 * PS3 address space management.
 *
 * Copyright (C) 2006 Sony Computer Entertainment Inc.
 * Copyright 2006 Sony Corp.
 */

#include <linux/dma-mapping.h>
#include <linux/kernel.h>
#include <linux/export.h>
#include <linux/memblock.h>
#include <linux/slab.h>

#include <asm/cell-regs.h>
#include <asm/firmware.h>
#include <asm/prom.h>
#include <asm/udbg.h>
#include <asm/lv1call.h>
#include <asm/setup.h>

#include "platform.h"

#if defined(DEBUG)
#define DBG udbg_printf
#else
#define DBG pr_devel
#endif

enum {
#if defined(CONFIG_PS3_DYNAMIC_DMA)
	USE_DYNAMIC_DMA = 1,
#else
	USE_DYNAMIC_DMA = 0,
#endif
};

enum {
	PAGE_SHIFT_4K = 12U,
	PAGE_SHIFT_64K = 16U,
	PAGE_SHIFT_16M = 24U,
};

static unsigned long __init make_page_sizes(unsigned long a, unsigned long b)
{
	return (a << 56) | (b << 48);
}

enum {
	ALLOCATE_MEMORY_TRY_ALT_UNIT = 0X04,
	ALLOCATE_MEMORY_ADDR_ZERO = 0X08,
};

/* valid htab sizes are {18,19,20} = 256K, 512K, 1M */

enum {
	HTAB_SIZE_MAX = 20U, /* HV limit of 1MB */
	HTAB_SIZE_MIN = 18U, /* CPU limit of 256KB */
};

/*============================================================================*/
/* virtual address space routines */
/*============================================================================*/

/**
 * struct mem_region - memory region structure
 * @base: base address
 * @size: size in bytes
 * @offset: difference between base and rm.size
 * @destroy: flag if region should be destroyed upon shutdown
 */

struct mem_region {
	u64 base;
	u64 size;
	unsigned long offset;
	int destroy;
};

/**
 * struct map - address space state variables holder
 * @total: total memory available as reported by HV
 * @vas_id: HV virtual address space id
 * @htab_size: htab size in bytes
 *
 * The HV virtual address space (vas) allows for hotplug memory regions.
 * Memory regions can be created and destroyed in the vas at runtime.
 * @rm: real mode (bootmem) region
 * @r1: highmem region(s)
 *
 * ps3 addresses
 * virt_addr: a cpu 'translated' effective address
 * phys_addr: an address in what Linux thinks is the physical address space
 * lpar_addr: an address in the HV virtual address space
 * bus_addr: an io controller 'translated' address on a device bus
 */

struct map {
	u64 total;
	u64 vas_id;
	u64 htab_size;
	struct mem_region rm;
	struct mem_region r1;
};
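
/*
 * Illustrative layout (example numbers only, not actual sizes): if the HV
 * reports map.rm.size = 0x8000000 (128 MiB of real mode memory at lpar 0)
 * and a highmem region is created at lpar map.r1.base = 0x28000000, then
 * map.r1.offset = map.r1.base - map.rm.size = 0x20000000.  Linux sees one
 * contiguous physical space: phys addresses below map.rm.size translate to
 * lpar addresses 1:1, and phys addresses in [map.rm.size, map.total)
 * translate by adding map.r1.offset (see ps3_mm_phys_to_lpar() below).
 */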

#define debug_dump_map(x) _debug_dump_map(x, __func__, __LINE__)
static void __maybe_unused _debug_dump_map(const struct map *m,
	const char *func, int line)
{
	DBG("%s:%d: map.total = %llxh\n", func, line, m->total);
	DBG("%s:%d: map.rm.size = %llxh\n", func, line, m->rm.size);
	DBG("%s:%d: map.vas_id = %llu\n", func, line, m->vas_id);
	DBG("%s:%d: map.htab_size = %llxh\n", func, line, m->htab_size);
	DBG("%s:%d: map.r1.base = %llxh\n", func, line, m->r1.base);
	DBG("%s:%d: map.r1.offset = %lxh\n", func, line, m->r1.offset);
	DBG("%s:%d: map.r1.size = %llxh\n", func, line, m->r1.size);
}

static struct map map;

/**
 * ps3_mm_phys_to_lpar - translate a linux physical address to lpar address
 * @phys_addr: linux physical address
 */

unsigned long ps3_mm_phys_to_lpar(unsigned long phys_addr)
{
	BUG_ON(is_kernel_addr(phys_addr));
	return (phys_addr < map.rm.size || phys_addr >= map.total)
		? phys_addr : phys_addr + map.r1.offset;
}

EXPORT_SYMBOL(ps3_mm_phys_to_lpar);

/**
 * ps3_mm_vas_create - create the virtual address space
 */

void __init ps3_mm_vas_create(unsigned long* htab_size)
{
	int result;
	u64 start_address;
	u64 size;
	u64 access_right;
	u64 max_page_size;
	u64 flags;

	result = lv1_query_logical_partition_address_region_info(0,
			&start_address, &size, &access_right, &max_page_size,
			&flags);

	if (result) {
		DBG("%s:%d: lv1_query_logical_partition_address_region_info "
			"failed: %s\n", __func__, __LINE__,
			ps3_result(result));
		goto fail;
	}

	if (max_page_size < PAGE_SHIFT_16M) {
		DBG("%s:%d: bad max_page_size %llxh\n", __func__, __LINE__,
			max_page_size);
		goto fail;
	}

	BUILD_BUG_ON(CONFIG_PS3_HTAB_SIZE > HTAB_SIZE_MAX);
	BUILD_BUG_ON(CONFIG_PS3_HTAB_SIZE < HTAB_SIZE_MIN);

	result = lv1_construct_virtual_address_space(CONFIG_PS3_HTAB_SIZE,
			2, make_page_sizes(PAGE_SHIFT_16M, PAGE_SHIFT_64K),
			&map.vas_id, &map.htab_size);

	if (result) {
		DBG("%s:%d: lv1_construct_virtual_address_space failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		goto fail;
	}

	result = lv1_select_virtual_address_space(map.vas_id);

	if (result) {
		DBG("%s:%d: lv1_select_virtual_address_space failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		goto fail;
	}

	*htab_size = map.htab_size;

	debug_dump_map(&map);

	return;

fail:
	panic("ps3_mm_vas_create failed");
}

/**
 * ps3_mm_vas_destroy - destroy the virtual address space
 *
 * called during kexec sequence with MMU off.
 */

notrace void ps3_mm_vas_destroy(void)
{
	int result;

	if (map.vas_id) {
		result = lv1_select_virtual_address_space(0);
		result += lv1_destruct_virtual_address_space(map.vas_id);

		if (result) {
			lv1_panic(0);
		}

		map.vas_id = 0;
	}
}

static int __init ps3_mm_get_repository_highmem(struct mem_region *r)
{
	int result;

	/* Assume a single highmem region. */

	result = ps3_repository_read_highmem_info(0, &r->base, &r->size);

	if (result)
		goto zero_region;

	if (!r->base || !r->size) {
		result = -1;
		goto zero_region;
	}

	r->offset = r->base - map.rm.size;

	DBG("%s:%d: Found high region in repository: %llxh %llxh\n",
		__func__, __LINE__, r->base, r->size);

	return 0;

zero_region:
	DBG("%s:%d: No high region in repository.\n", __func__, __LINE__);

	r->size = r->base = r->offset = 0;
	return result;
}

static int ps3_mm_set_repository_highmem(const struct mem_region *r)
{
	/* Assume a single highmem region. */

	return r ? ps3_repository_write_highmem_info(0, r->base, r->size) :
		ps3_repository_write_highmem_info(0, 0, 0);
}

/**
 * ps3_mm_region_create - create a memory region in the vas
 * @r: pointer to a struct mem_region to accept initialized values
 * @size: requested region size
 *
 * This implementation creates the region with the vas large page size.
 * @size is rounded down to a multiple of the vas large page size.
 */

static int ps3_mm_region_create(struct mem_region *r, unsigned long size)
{
	int result;
	u64 muid;

	r->size = ALIGN_DOWN(size, 1 << PAGE_SHIFT_16M);

	DBG("%s:%d requested %lxh\n", __func__, __LINE__, size);
	DBG("%s:%d actual %llxh\n", __func__, __LINE__, r->size);
	DBG("%s:%d difference %llxh (%lluMB)\n", __func__, __LINE__,
		size - r->size, (size - r->size) / 1024 / 1024);

	if (r->size == 0) {
		DBG("%s:%d: size == 0\n", __func__, __LINE__);
		result = -1;
		goto zero_region;
	}

	result = lv1_allocate_memory(r->size, PAGE_SHIFT_16M, 0,
		ALLOCATE_MEMORY_TRY_ALT_UNIT, &r->base, &muid);

	if (result || r->base < map.rm.size) {
		DBG("%s:%d: lv1_allocate_memory failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		goto zero_region;
	}

	r->destroy = 1;
	r->offset = r->base - map.rm.size;
	return result;

zero_region:
	r->size = r->base = r->offset = 0;
	return result;
}

/**
 * ps3_mm_region_destroy - destroy a memory region
 * @r: pointer to struct mem_region
 */

static void ps3_mm_region_destroy(struct mem_region *r)
{
	int result;

	if (!r->destroy) {
		return;
	}

	if (r->base) {
		result = lv1_release_memory(r->base);

		if (result) {
			lv1_panic(0);
		}

		r->size = r->base = r->offset = 0;
		map.total = map.rm.size;
	}

	ps3_mm_set_repository_highmem(NULL);
}

/*============================================================================*/
/* dma routines */
/*============================================================================*/
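
/*
 * Overview: two flavours of dma region are implemented below.  The dma_sb_*
 * routines manage per-device regions (PS3_DEVICE_TYPE_SB devices), using
 * lv1_allocate_device_dma_region() and lv1_map_device_dma_region() keyed by
 * the device's bus_id/dev_id.  The dma_ioc0_* routines manage io segments
 * for PS3_DEVICE_TYPE_IOC0 devices, building individual ioptes with
 * lv1_put_iopte().  ps3_dma_region_init() selects the appropriate ops table.
 */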

/**
 * dma_sb_lpar_to_bus - Translate an lpar address to ioc mapped bus address.
 * @r: pointer to dma region structure
 * @lpar_addr: HV lpar address
 */

static unsigned long dma_sb_lpar_to_bus(struct ps3_dma_region *r,
	unsigned long lpar_addr)
{
	if (lpar_addr >= map.rm.size)
		lpar_addr -= map.r1.offset;
	BUG_ON(lpar_addr < r->offset);
	BUG_ON(lpar_addr >= r->offset + r->len);
	return r->bus_addr + lpar_addr - r->offset;
}

#define dma_dump_region(_a) _dma_dump_region(_a, __func__, __LINE__)
static void __maybe_unused _dma_dump_region(const struct ps3_dma_region *r,
	const char *func, int line)
{
	DBG("%s:%d: dev %llu:%llu\n", func, line, r->dev->bus_id,
		r->dev->dev_id);
	DBG("%s:%d: page_size %u\n", func, line, r->page_size);
	DBG("%s:%d: bus_addr %lxh\n", func, line, r->bus_addr);
	DBG("%s:%d: len %lxh\n", func, line, r->len);
	DBG("%s:%d: offset %lxh\n", func, line, r->offset);
}

/**
 * dma_chunk - A chunk of dma pages mapped by the io controller.
 * @region: The dma region that owns this chunk.
 * @lpar_addr: Starting lpar address of the area to map.
 * @bus_addr: Starting ioc bus address of the area to map.
 * @len: Length in bytes of the area to map.
 * @link: A struct list_head used with struct ps3_dma_region.chunk_list, the
 * list of all chunks owned by the region.
 *
 * This implementation uses a very simple dma page manager
 * based on the dma_chunk structure. This scheme assumes
 * that all drivers use very well behaved dma ops.
 */

struct dma_chunk {
	struct ps3_dma_region *region;
	unsigned long lpar_addr;
	unsigned long bus_addr;
	unsigned long len;
	struct list_head link;
	unsigned int usage_count;
};

#define dma_dump_chunk(_a) _dma_dump_chunk(_a, __func__, __LINE__)
static void _dma_dump_chunk(const struct dma_chunk *c, const char *func,
	int line)
{
	DBG("%s:%d: r.dev %llu:%llu\n", func, line,
		c->region->dev->bus_id, c->region->dev->dev_id);
	DBG("%s:%d: r.bus_addr %lxh\n", func, line, c->region->bus_addr);
	DBG("%s:%d: r.page_size %u\n", func, line, c->region->page_size);
	DBG("%s:%d: r.len %lxh\n", func, line, c->region->len);
	DBG("%s:%d: r.offset %lxh\n", func, line, c->region->offset);
	DBG("%s:%d: c.lpar_addr %lxh\n", func, line, c->lpar_addr);
	DBG("%s:%d: c.bus_addr %lxh\n", func, line, c->bus_addr);
	DBG("%s:%d: c.len %lxh\n", func, line, c->len);
}

static struct dma_chunk *dma_find_chunk(struct ps3_dma_region *r,
	unsigned long bus_addr, unsigned long len)
{
	struct dma_chunk *c;
	unsigned long aligned_bus = ALIGN_DOWN(bus_addr, 1 << r->page_size);
	unsigned long aligned_len = ALIGN(len + bus_addr - aligned_bus,
		1 << r->page_size);

	list_for_each_entry(c, &r->chunk_list.head, link) {
		/* intersection */
		if (aligned_bus >= c->bus_addr &&
		    aligned_bus + aligned_len <= c->bus_addr + c->len)
			return c;

		/* below */
		if (aligned_bus + aligned_len <= c->bus_addr)
			continue;

		/* above */
		if (aligned_bus >= c->bus_addr + c->len)
			continue;

		/* we don't handle the multi-chunk case for now */
		dma_dump_chunk(c);
		BUG();
	}
	return NULL;
}

static struct dma_chunk *dma_find_chunk_lpar(struct ps3_dma_region *r,
	unsigned long lpar_addr, unsigned long len)
{
	struct dma_chunk *c;
	unsigned long aligned_lpar = ALIGN_DOWN(lpar_addr, 1 << r->page_size);
	unsigned long aligned_len = ALIGN(len + lpar_addr - aligned_lpar,
		1 << r->page_size);

	list_for_each_entry(c, &r->chunk_list.head, link) {
		/* intersection */
		if (c->lpar_addr <= aligned_lpar &&
		    aligned_lpar < c->lpar_addr + c->len) {
			if (aligned_lpar + aligned_len <= c->lpar_addr + c->len)
				return c;
			else {
				dma_dump_chunk(c);
				BUG();
			}
		}
		/* below */
		if (aligned_lpar + aligned_len <= c->lpar_addr) {
			continue;
		}
		/* above */
		if (c->lpar_addr + c->len <= aligned_lpar) {
			continue;
		}
	}
	return NULL;
}

static int dma_sb_free_chunk(struct dma_chunk *c)
{
	int result = 0;

	if (c->bus_addr) {
		result = lv1_unmap_device_dma_region(c->region->dev->bus_id,
			c->region->dev->dev_id, c->bus_addr, c->len);
		BUG_ON(result);
	}

	kfree(c);
	return result;
}

static int dma_ioc0_free_chunk(struct dma_chunk *c)
{
	int result = 0;
	int iopage;
	unsigned long offset;
	struct ps3_dma_region *r = c->region;

	DBG("%s:start\n", __func__);
	for (iopage = 0; iopage < (c->len >> r->page_size); iopage++) {
		offset = (1 << r->page_size) * iopage;
		/* put INVALID entry */
		result = lv1_put_iopte(0,
				       c->bus_addr + offset,
				       c->lpar_addr + offset,
				       r->ioid,
				       0);
		DBG("%s: bus=%#lx, lpar=%#lx, ioid=%d\n", __func__,
			c->bus_addr + offset,
			c->lpar_addr + offset,
			r->ioid);

		if (result) {
			DBG("%s:%d: lv1_put_iopte failed: %s\n", __func__,
				__LINE__, ps3_result(result));
		}
	}
	kfree(c);
	DBG("%s:end\n", __func__);
	return result;
}

/**
 * dma_sb_map_pages - Maps dma pages into the io controller bus address space.
 * @r: Pointer to a struct ps3_dma_region.
 * @phys_addr: Starting physical address of the area to map.
 * @len: Length in bytes of the area to map.
 * @c_out: A pointer to receive an allocated struct dma_chunk for this area.
 *
 * This is the lowest level dma mapping routine, and is the one that will
 * make the HV call to add the pages into the io controller address space.
 */

static int dma_sb_map_pages(struct ps3_dma_region *r, unsigned long phys_addr,
	unsigned long len, struct dma_chunk **c_out, u64 iopte_flag)
{
	int result;
	struct dma_chunk *c;

	c = kzalloc(sizeof(*c), GFP_ATOMIC);
	if (!c) {
		result = -ENOMEM;
		goto fail_alloc;
	}

	c->region = r;
	c->lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
	c->bus_addr = dma_sb_lpar_to_bus(r, c->lpar_addr);
	c->len = len;

	BUG_ON(iopte_flag != 0xf800000000000000UL);
	result = lv1_map_device_dma_region(c->region->dev->bus_id,
					   c->region->dev->dev_id, c->lpar_addr,
					   c->bus_addr, c->len, iopte_flag);
	if (result) {
		DBG("%s:%d: lv1_map_device_dma_region failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		goto fail_map;
	}

	list_add(&c->link, &r->chunk_list.head);

	*c_out = c;
	return 0;

fail_map:
	kfree(c);
fail_alloc:
	*c_out = NULL;
	DBG(" <- %s:%d\n", __func__, __LINE__);
	return result;
}

static int dma_ioc0_map_pages(struct ps3_dma_region *r, unsigned long phys_addr,
			      unsigned long len, struct dma_chunk **c_out,
			      u64 iopte_flag)
{
	int result;
	struct dma_chunk *c, *last;
	int iopage, pages;
	unsigned long offset;

	DBG(KERN_ERR "%s: phy=%#lx, lpar=%#lx, len=%#lx\n", __func__,
		phys_addr, ps3_mm_phys_to_lpar(phys_addr), len);
	c = kzalloc(sizeof(*c), GFP_ATOMIC);
	if (!c) {
		result = -ENOMEM;
		goto fail_alloc;
	}

	c->region = r;
	c->len = len;
	c->lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
	/* allocate IO address */
	if (list_empty(&r->chunk_list.head)) {
		/* first one */
		c->bus_addr = r->bus_addr;
	} else {
		/* derive from last bus addr */
		last = list_entry(r->chunk_list.head.next,
				  struct dma_chunk, link);
		c->bus_addr = last->bus_addr + last->len;
		DBG("%s: last bus=%#lx, len=%#lx\n", __func__,
			last->bus_addr, last->len);
	}

	/* FIXME: check whether length exceeds region size */

	/* build ioptes for the area */
	pages = len >> r->page_size;
	DBG("%s: pgsize=%#x len=%#lx pages=%#x iopteflag=%#llx\n", __func__,
		r->page_size, r->len, pages, iopte_flag);
	for (iopage = 0; iopage < pages; iopage++) {
		offset = (1 << r->page_size) * iopage;
		result = lv1_put_iopte(0,
				       c->bus_addr + offset,
				       c->lpar_addr + offset,
				       r->ioid,
				       iopte_flag);
		if (result) {
			pr_warn("%s:%d: lv1_put_iopte failed: %s\n",
				__func__, __LINE__, ps3_result(result));
			goto fail_map;
		}
		DBG("%s: pg=%d bus=%#lx, lpar=%#lx, ioid=%#x\n", __func__,
			iopage, c->bus_addr + offset, c->lpar_addr + offset,
			r->ioid);
	}

	/* be sure that last allocated one is inserted at head */
	list_add(&c->link, &r->chunk_list.head);

	*c_out = c;
	DBG("%s: end\n", __func__);
	return 0;

fail_map:
	for (iopage--; 0 <= iopage; iopage--) {
		/* recompute the offset of each page being invalidated */
		offset = (1 << r->page_size) * iopage;
		lv1_put_iopte(0,
			      c->bus_addr + offset,
			      c->lpar_addr + offset,
			      r->ioid,
			      0);
	}
	kfree(c);
fail_alloc:
	*c_out = NULL;
	return result;
}

/**
 * dma_sb_region_create - Create a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 *
 * This is the lowest level dma region create routine, and is the one that
 * will make the HV call to create the region.
 */

static int dma_sb_region_create(struct ps3_dma_region *r)
{
	int result;
	u64 bus_addr;

	DBG(" -> %s:%d:\n", __func__, __LINE__);

	BUG_ON(!r);

	if (!r->dev->bus_id) {
		pr_info("%s:%d: %llu:%llu no dma\n", __func__, __LINE__,
			r->dev->bus_id, r->dev->dev_id);
		return 0;
	}

	DBG("%s:%u: len = 0x%lx, page_size = %u, offset = 0x%lx\n", __func__,
		__LINE__, r->len, r->page_size, r->offset);

	BUG_ON(!r->len);
	BUG_ON(!r->page_size);
	BUG_ON(!r->region_ops);

	INIT_LIST_HEAD(&r->chunk_list.head);
	spin_lock_init(&r->chunk_list.lock);

	result = lv1_allocate_device_dma_region(r->dev->bus_id, r->dev->dev_id,
		roundup_pow_of_two(r->len), r->page_size, r->region_type,
		&bus_addr);
	r->bus_addr = bus_addr;

	if (result) {
		DBG("%s:%d: lv1_allocate_device_dma_region failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		r->len = r->bus_addr = 0;
	}

	return result;
}

static int dma_ioc0_region_create(struct ps3_dma_region *r)
{
	int result;
	u64 bus_addr;

	INIT_LIST_HEAD(&r->chunk_list.head);
	spin_lock_init(&r->chunk_list.lock);

	result = lv1_allocate_io_segment(0,
					 r->len,
					 r->page_size,
					 &bus_addr);
	r->bus_addr = bus_addr;
	if (result) {
		DBG("%s:%d: lv1_allocate_io_segment failed: %s\n",
			__func__, __LINE__, ps3_result(result));
		r->len = r->bus_addr = 0;
	}
	DBG("%s: len=%#lx, pg=%d, bus=%#lx\n", __func__,
		r->len, r->page_size, r->bus_addr);
	return result;
}

/**
 * dma_sb_region_free - Free a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 *
 * This is the lowest level dma region free routine, and is the one that
 * will make the HV call to free the region.
 */

static int dma_sb_region_free(struct ps3_dma_region *r)
{
	int result;
	struct dma_chunk *c;
	struct dma_chunk *tmp;

	BUG_ON(!r);

	if (!r->dev->bus_id) {
		pr_info("%s:%d: %llu:%llu no dma\n", __func__, __LINE__,
			r->dev->bus_id, r->dev->dev_id);
		return 0;
	}

	list_for_each_entry_safe(c, tmp, &r->chunk_list.head, link) {
		list_del(&c->link);
		dma_sb_free_chunk(c);
	}

	result = lv1_free_device_dma_region(r->dev->bus_id, r->dev->dev_id,
					    r->bus_addr);

	if (result)
		DBG("%s:%d: lv1_free_device_dma_region failed: %s\n",
			__func__, __LINE__, ps3_result(result));

	r->bus_addr = 0;

	return result;
}

static int dma_ioc0_region_free(struct ps3_dma_region *r)
{
	int result;
	struct dma_chunk *c, *n;

	DBG("%s: start\n", __func__);
	list_for_each_entry_safe(c, n, &r->chunk_list.head, link) {
		list_del(&c->link);
		dma_ioc0_free_chunk(c);
	}

	result = lv1_release_io_segment(0, r->bus_addr);

	if (result)
		DBG("%s:%d: lv1_release_io_segment failed: %s\n",
			__func__, __LINE__, ps3_result(result));

	r->bus_addr = 0;
	DBG("%s: end\n", __func__);

	return result;
}

/**
 * dma_sb_map_area - Map an area of memory into a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 * @virt_addr: Starting virtual address of the area to map.
 * @len: Length in bytes of the area to map.
 * @bus_addr: A pointer to return the starting ioc bus address of the area to
 * map.
 *
 * This is the common dma mapping routine.
 */

static int dma_sb_map_area(struct ps3_dma_region *r, unsigned long virt_addr,
	unsigned long len, dma_addr_t *bus_addr,
	u64 iopte_flag)
{
	int result;
	unsigned long flags;
	struct dma_chunk *c;
	unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
		: virt_addr;
	unsigned long aligned_phys = ALIGN_DOWN(phys_addr, 1 << r->page_size);
	unsigned long aligned_len = ALIGN(len + phys_addr - aligned_phys,
		1 << r->page_size);
	*bus_addr = dma_sb_lpar_to_bus(r, ps3_mm_phys_to_lpar(phys_addr));

	if (!USE_DYNAMIC_DMA) {
		unsigned long lpar_addr = ps3_mm_phys_to_lpar(phys_addr);
		DBG(" -> %s:%d\n", __func__, __LINE__);
		DBG("%s:%d virt_addr %lxh\n", __func__, __LINE__,
			virt_addr);
		DBG("%s:%d phys_addr %lxh\n", __func__, __LINE__,
			phys_addr);
		DBG("%s:%d lpar_addr %lxh\n", __func__, __LINE__,
			lpar_addr);
		DBG("%s:%d len %lxh\n", __func__, __LINE__, len);
		DBG("%s:%d bus_addr %llxh (%lxh)\n", __func__, __LINE__,
			*bus_addr, len);
	}

	spin_lock_irqsave(&r->chunk_list.lock, flags);
	c = dma_find_chunk(r, *bus_addr, len);

	if (c) {
		DBG("%s:%d: reusing mapped chunk\n", __func__, __LINE__);
		dma_dump_chunk(c);
		c->usage_count++;
		spin_unlock_irqrestore(&r->chunk_list.lock, flags);
		return 0;
	}

	result = dma_sb_map_pages(r, aligned_phys, aligned_len, &c, iopte_flag);

	if (result) {
		*bus_addr = 0;
		DBG("%s:%d: dma_sb_map_pages failed (%d)\n",
			__func__, __LINE__, result);
		spin_unlock_irqrestore(&r->chunk_list.lock, flags);
		return result;
	}

	c->usage_count = 1;

	spin_unlock_irqrestore(&r->chunk_list.lock, flags);
	return result;
}

static int dma_ioc0_map_area(struct ps3_dma_region *r, unsigned long virt_addr,
			     unsigned long len, dma_addr_t *bus_addr,
			     u64 iopte_flag)
{
	int result;
	unsigned long flags;
	struct dma_chunk *c;
	unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
		: virt_addr;
	unsigned long aligned_phys = ALIGN_DOWN(phys_addr, 1 << r->page_size);
	unsigned long aligned_len = ALIGN(len + phys_addr - aligned_phys,
		1 << r->page_size);

	DBG(KERN_ERR "%s: vaddr=%#lx, len=%#lx\n", __func__,
		virt_addr, len);
	DBG(KERN_ERR "%s: ph=%#lx a_ph=%#lx a_l=%#lx\n", __func__,
		phys_addr, aligned_phys, aligned_len);

	spin_lock_irqsave(&r->chunk_list.lock, flags);
	c = dma_find_chunk_lpar(r, ps3_mm_phys_to_lpar(phys_addr), len);

	if (c) {
		/* FIXME */
		BUG();
		*bus_addr = c->bus_addr + phys_addr - aligned_phys;
		c->usage_count++;
		spin_unlock_irqrestore(&r->chunk_list.lock, flags);
		return 0;
	}

	result = dma_ioc0_map_pages(r, aligned_phys, aligned_len, &c,
				    iopte_flag);

	if (result) {
		*bus_addr = 0;
		DBG("%s:%d: dma_ioc0_map_pages failed (%d)\n",
			__func__, __LINE__, result);
		spin_unlock_irqrestore(&r->chunk_list.lock, flags);
		return result;
	}
	*bus_addr = c->bus_addr + phys_addr - aligned_phys;
	DBG("%s: va=%#lx pa=%#lx a_pa=%#lx bus=%#llx\n", __func__,
		virt_addr, phys_addr, aligned_phys, *bus_addr);
	c->usage_count = 1;

	spin_unlock_irqrestore(&r->chunk_list.lock, flags);
	return result;
}

/**
 * dma_sb_unmap_area - Unmap an area of memory from a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 * @bus_addr: The starting ioc bus address of the area to unmap.
 * @len: Length in bytes of the area to unmap.
 *
 * This is the common dma unmap routine.
 */

static int dma_sb_unmap_area(struct ps3_dma_region *r, dma_addr_t bus_addr,
	unsigned long len)
{
	unsigned long flags;
	struct dma_chunk *c;

	spin_lock_irqsave(&r->chunk_list.lock, flags);
	c = dma_find_chunk(r, bus_addr, len);

	if (!c) {
		unsigned long aligned_bus = ALIGN_DOWN(bus_addr,
			1 << r->page_size);
		unsigned long aligned_len = ALIGN(len + bus_addr
			- aligned_bus, 1 << r->page_size);
		DBG("%s:%d: not found: bus_addr %llxh\n",
			__func__, __LINE__, bus_addr);
		DBG("%s:%d: not found: len %lxh\n",
			__func__, __LINE__, len);
		DBG("%s:%d: not found: aligned_bus %lxh\n",
			__func__, __LINE__, aligned_bus);
		DBG("%s:%d: not found: aligned_len %lxh\n",
			__func__, __LINE__, aligned_len);
		BUG();
	}

	c->usage_count--;

	if (!c->usage_count) {
		list_del(&c->link);
		dma_sb_free_chunk(c);
	}

	spin_unlock_irqrestore(&r->chunk_list.lock, flags);
	return 0;
}

static int dma_ioc0_unmap_area(struct ps3_dma_region *r,
			       dma_addr_t bus_addr, unsigned long len)
{
	unsigned long flags;
	struct dma_chunk *c;

	DBG("%s: start a=%#llx l=%#lx\n", __func__, bus_addr, len);
	spin_lock_irqsave(&r->chunk_list.lock, flags);
	c = dma_find_chunk(r, bus_addr, len);

	if (!c) {
		unsigned long aligned_bus = ALIGN_DOWN(bus_addr,
			1 << r->page_size);
		unsigned long aligned_len = ALIGN(len + bus_addr
			- aligned_bus,
			1 << r->page_size);
		DBG("%s:%d: not found: bus_addr %llxh\n",
			__func__, __LINE__, bus_addr);
		DBG("%s:%d: not found: len %lxh\n",
			__func__, __LINE__, len);
		DBG("%s:%d: not found: aligned_bus %lxh\n",
			__func__, __LINE__, aligned_bus);
		DBG("%s:%d: not found: aligned_len %lxh\n",
			__func__, __LINE__, aligned_len);
		BUG();
	}

	c->usage_count--;

	if (!c->usage_count) {
		list_del(&c->link);
		dma_ioc0_free_chunk(c);
	}

	spin_unlock_irqrestore(&r->chunk_list.lock, flags);
	DBG("%s: end\n", __func__);
	return 0;
}

/**
 * dma_sb_region_create_linear - Setup a linear dma mapping for a device.
 * @r: Pointer to a struct ps3_dma_region.
 *
 * This routine creates an HV dma region for the device and maps all available
 * ram into the io controller bus address space.
 */

static int dma_sb_region_create_linear(struct ps3_dma_region *r)
{
	int result;
	unsigned long virt_addr, len;
	dma_addr_t tmp;

	if (r->len > 16*1024*1024) {	/* FIXME: need proper fix */
		/* force 16M dma pages for linear mapping */
		if (r->page_size != PS3_DMA_16M) {
			pr_info("%s:%d: forcing 16M pages for linear map\n",
				__func__, __LINE__);
			r->page_size = PS3_DMA_16M;
			r->len = ALIGN(r->len, 1 << r->page_size);
		}
	}

	result = dma_sb_region_create(r);
	BUG_ON(result);

	if (r->offset < map.rm.size) {
		/* Map (part of) 1st RAM chunk */
		virt_addr = map.rm.base + r->offset;
		len = map.rm.size - r->offset;
		if (len > r->len)
			len = r->len;
		result = dma_sb_map_area(r, virt_addr, len, &tmp,
			CBE_IOPTE_PP_W | CBE_IOPTE_PP_R | CBE_IOPTE_SO_RW |
			CBE_IOPTE_M);
		BUG_ON(result);
	}

	if (r->offset + r->len > map.rm.size) {
		/* Map (part of) 2nd RAM chunk */
		virt_addr = map.rm.size;
		len = r->len;
		if (r->offset >= map.rm.size)
			virt_addr += r->offset - map.rm.size;
		else
			len -= map.rm.size - r->offset;
		result = dma_sb_map_area(r, virt_addr, len, &tmp,
			CBE_IOPTE_PP_W | CBE_IOPTE_PP_R | CBE_IOPTE_SO_RW |
			CBE_IOPTE_M);
		BUG_ON(result);
	}

	return result;
}

/**
 * dma_sb_region_free_linear - Free a linear dma mapping for a device.
 * @r: Pointer to a struct ps3_dma_region.
 *
 * This routine will unmap all mapped areas and free the HV dma region.
 */

static int dma_sb_region_free_linear(struct ps3_dma_region *r)
{
	int result;
	dma_addr_t bus_addr;
	unsigned long len, lpar_addr;

	if (r->offset < map.rm.size) {
		/* Unmap (part of) 1st RAM chunk */
		lpar_addr = map.rm.base + r->offset;
		len = map.rm.size - r->offset;
		if (len > r->len)
			len = r->len;
		bus_addr = dma_sb_lpar_to_bus(r, lpar_addr);
		result = dma_sb_unmap_area(r, bus_addr, len);
		BUG_ON(result);
	}

	if (r->offset + r->len > map.rm.size) {
		/* Unmap (part of) 2nd RAM chunk */
		lpar_addr = map.r1.base;
		len = r->len;
		if (r->offset >= map.rm.size)
			lpar_addr += r->offset - map.rm.size;
		else
			len -= map.rm.size - r->offset;
		bus_addr = dma_sb_lpar_to_bus(r, lpar_addr);
		result = dma_sb_unmap_area(r, bus_addr, len);
		BUG_ON(result);
	}

	result = dma_sb_region_free(r);
	BUG_ON(result);

	return result;
}

/**
 * dma_sb_map_area_linear - Map an area of memory into a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 * @virt_addr: Starting virtual address of the area to map.
 * @len: Length in bytes of the area to map.
 * @bus_addr: A pointer to return the starting ioc bus address of the area to
 * map.
 *
 * This routine just returns the corresponding bus address. Actual mapping
 * occurs in dma_sb_region_create_linear().
 */

static int dma_sb_map_area_linear(struct ps3_dma_region *r,
	unsigned long virt_addr, unsigned long len, dma_addr_t *bus_addr,
	u64 iopte_flag)
{
	unsigned long phys_addr = is_kernel_addr(virt_addr) ? __pa(virt_addr)
		: virt_addr;
	*bus_addr = dma_sb_lpar_to_bus(r, ps3_mm_phys_to_lpar(phys_addr));
	return 0;
}

/**
 * dma_sb_unmap_area_linear - Unmap an area of memory from a device dma region.
 * @r: Pointer to a struct ps3_dma_region.
 * @bus_addr: The starting ioc bus address of the area to unmap.
 * @len: Length in bytes of the area to unmap.
 *
 * This routine does nothing. Unmapping occurs in dma_sb_region_free_linear().
 */

static int dma_sb_unmap_area_linear(struct ps3_dma_region *r,
	dma_addr_t bus_addr, unsigned long len)
{
	return 0;
}

static const struct ps3_dma_region_ops ps3_dma_sb_region_ops = {
	.create = dma_sb_region_create,
	.free = dma_sb_region_free,
	.map = dma_sb_map_area,
	.unmap = dma_sb_unmap_area
};

static const struct ps3_dma_region_ops ps3_dma_sb_region_linear_ops = {
	.create = dma_sb_region_create_linear,
	.free = dma_sb_region_free_linear,
	.map = dma_sb_map_area_linear,
	.unmap = dma_sb_unmap_area_linear
};

static const struct ps3_dma_region_ops ps3_dma_ioc0_region_ops = {
	.create = dma_ioc0_region_create,
	.free = dma_ioc0_region_free,
	.map = dma_ioc0_map_area,
	.unmap = dma_ioc0_unmap_area
};
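
/*
 * Typical driver usage of the region api below (illustrative sketch only;
 * the page size, region type and iopte flag values depend on the device,
 * see enum ps3_dma_page_size and enum ps3_dma_region_type in asm/ps3.h):
 *
 *	struct ps3_dma_region dma_region;
 *	dma_addr_t bus_addr;
 *
 *	ps3_dma_region_init(dev, &dma_region, PS3_DMA_64K, PS3_DMA_INTERNAL,
 *		NULL, 0);
 *	ps3_dma_region_create(&dma_region);
 *	ps3_dma_map(&dma_region, (unsigned long)buf, buf_len, &bus_addr,
 *		CBE_IOPTE_PP_W | CBE_IOPTE_PP_R | CBE_IOPTE_M);
 *	...
 *	ps3_dma_unmap(&dma_region, bus_addr, buf_len);
 *	ps3_dma_region_free(&dma_region);
 */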

int ps3_dma_region_init(struct ps3_system_bus_device *dev,
	struct ps3_dma_region *r, enum ps3_dma_page_size page_size,
	enum ps3_dma_region_type region_type, void *addr, unsigned long len)
{
	unsigned long lpar_addr;
	int result;

	lpar_addr = addr ? ps3_mm_phys_to_lpar(__pa(addr)) : 0;

	r->dev = dev;
	r->page_size = page_size;
	r->region_type = region_type;
	r->offset = lpar_addr;
	if (r->offset >= map.rm.size)
		r->offset -= map.r1.offset;
	r->len = len ? len : ALIGN(map.total, 1 << r->page_size);

	dev->core.dma_mask = &r->dma_mask;

	result = dma_set_mask_and_coherent(&dev->core, DMA_BIT_MASK(32));

	if (result < 0) {
		dev_err(&dev->core, "%s:%d: dma_set_mask_and_coherent failed: %d\n",
			__func__, __LINE__, result);
		return result;
	}

	switch (dev->dev_type) {
	case PS3_DEVICE_TYPE_SB:
		r->region_ops = (USE_DYNAMIC_DMA)
			? &ps3_dma_sb_region_ops
			: &ps3_dma_sb_region_linear_ops;
		break;
	case PS3_DEVICE_TYPE_IOC0:
		r->region_ops = &ps3_dma_ioc0_region_ops;
		break;
	default:
		BUG();
		return -EINVAL;
	}
	return 0;
}
EXPORT_SYMBOL(ps3_dma_region_init);

int ps3_dma_region_create(struct ps3_dma_region *r)
{
	BUG_ON(!r);
	BUG_ON(!r->region_ops);
	BUG_ON(!r->region_ops->create);
	return r->region_ops->create(r);
}
EXPORT_SYMBOL(ps3_dma_region_create);

int ps3_dma_region_free(struct ps3_dma_region *r)
{
	BUG_ON(!r);
	BUG_ON(!r->region_ops);
	BUG_ON(!r->region_ops->free);
	return r->region_ops->free(r);
}
EXPORT_SYMBOL(ps3_dma_region_free);

int ps3_dma_map(struct ps3_dma_region *r, unsigned long virt_addr,
	unsigned long len, dma_addr_t *bus_addr,
	u64 iopte_flag)
{
	return r->region_ops->map(r, virt_addr, len, bus_addr, iopte_flag);
}

int ps3_dma_unmap(struct ps3_dma_region *r, dma_addr_t bus_addr,
	unsigned long len)
{
	return r->region_ops->unmap(r, bus_addr, len);
}

/*============================================================================*/
/* system startup routines */
/*============================================================================*/

/**
 * ps3_mm_init - initialize the address space state variables
 */

void __init ps3_mm_init(void)
{
	int result;

	DBG(" -> %s:%d\n", __func__, __LINE__);

	result = ps3_repository_read_mm_info(&map.rm.base, &map.rm.size,
		&map.total);

	if (result)
		panic("ps3_repository_read_mm_info() failed");

	map.rm.offset = map.rm.base;
	map.vas_id = map.htab_size = 0;

	/* this implementation assumes map.rm.base is zero */

	BUG_ON(map.rm.base);
	BUG_ON(!map.rm.size);

	/* Check if we got the highmem region from an earlier boot step */

	if (ps3_mm_get_repository_highmem(&map.r1)) {
		result = ps3_mm_region_create(&map.r1, map.total - map.rm.size);

		if (!result)
			ps3_mm_set_repository_highmem(&map.r1);
	}

	/* correct map.total for the real total amount of memory we use */
	map.total = map.rm.size + map.r1.size;

	if (!map.r1.size) {
		DBG("%s:%d: No highmem region found\n", __func__, __LINE__);
	} else {
		DBG("%s:%d: Adding highmem region: %llxh %llxh\n",
			__func__, __LINE__, map.rm.size,
			map.total - map.rm.size);
		memblock_add(map.rm.size, map.total - map.rm.size);
	}

	DBG(" <- %s:%d\n", __func__, __LINE__);
}

/**
 * ps3_mm_shutdown - final cleanup of address space
 *
 * called during kexec sequence with MMU off.
 */

notrace void ps3_mm_shutdown(void)
{
	ps3_mm_region_destroy(&map.r1);
}