/**************************************************************************
 *
 * Copyright (c) 2007-2009 VMware, Inc., Palo Alto, CA., USA
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
/*
 * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com>
 */

#include "ttm/ttm_bo_driver.h"
#include "ttm/ttm_placement.h"
#include <linux/io.h>
#include <linux/highmem.h>
#include <linux/wait.h>
#include <linux/vmalloc.h>
#include <linux/module.h>

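/*
 * ttm_bo_free_old_node - release the memory node backing the old placement.
 *
 * Returns the drm_mm block referenced by bo->mem to the manager under the
 * global LRU lock and clears the mm_node pointer.
 */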
void ttm_bo_free_old_node(struct ttm_buffer_object *bo)
{
        struct ttm_mem_reg *old_mem = &bo->mem;

        if (old_mem->mm_node) {
                spin_lock(&bo->glob->lru_lock);
                drm_mm_put_block(old_mem->mm_node);
                spin_unlock(&bo->glob->lru_lock);
        }
        old_mem->mm_node = NULL;
}

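/*
 * ttm_bo_move_ttm - move a buffer through its TTM (system) pages.
 *
 * If the buffer currently lives outside system memory, unbind the TTM and
 * release the old memory node, then rebind the TTM at the new placement
 * with the requested caching state.
 */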
int ttm_bo_move_ttm(struct ttm_buffer_object *bo,
                    bool evict, bool no_wait_reserve,
                    bool no_wait_gpu, struct ttm_mem_reg *new_mem)
{
        struct ttm_tt *ttm = bo->ttm;
        struct ttm_mem_reg *old_mem = &bo->mem;
        int ret;

        if (old_mem->mem_type != TTM_PL_SYSTEM) {
                ttm_tt_unbind(ttm);
                ttm_bo_free_old_node(bo);
                ttm_flag_masked(&old_mem->placement, TTM_PL_FLAG_SYSTEM,
                                TTM_PL_MASK_MEM);
                old_mem->mem_type = TTM_PL_SYSTEM;
        }

        ret = ttm_tt_set_placement_caching(ttm, new_mem->placement);
        if (unlikely(ret != 0))
                return ret;

        if (new_mem->mem_type != TTM_PL_SYSTEM) {
                ret = ttm_tt_bind(ttm, new_mem);
                if (unlikely(ret != 0))
                        return ret;
        }

        *old_mem = *new_mem;
        new_mem->mm_node = NULL;

        return 0;
}
EXPORT_SYMBOL(ttm_bo_move_ttm);

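/*
 * ttm_mem_io_reserve - set up the I/O memory description for a placement.
 *
 * Prefers the driver's io_mem_reserve() callback when one is provided;
 * otherwise falls back to ttm_bo_pci_offset() and fills in mem->bus
 * directly, mapping through man->io_addr when no ioremap is required.
 */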
int ttm_mem_io_reserve(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
{
        struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
        int ret;

        if (bdev->driver->io_mem_reserve) {
                if (!mem->bus.io_reserved) {
                        mem->bus.io_reserved = true;
                        ret = bdev->driver->io_mem_reserve(bdev, mem);
                        if (unlikely(ret != 0))
                                return ret;
                }
        } else {
                ret = ttm_bo_pci_offset(bdev, mem, &mem->bus.base,
                                        &mem->bus.offset, &mem->bus.size);
                if (unlikely(ret != 0))
                        return ret;
                mem->bus.addr = NULL;
                if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
                        mem->bus.addr = (void *)(((u8 *)man->io_addr) + mem->bus.offset);
                mem->bus.is_iomem = (mem->bus.size > 0) ? 1 : 0;
        }
        return 0;
}

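/*
 * ttm_mem_io_free - undo ttm_mem_io_reserve for driver-managed apertures.
 *
 * Only calls back into the driver when it implemented io_mem_reserve()
 * and the region is currently reserved; the PCI-offset fallback path has
 * nothing to release.
 */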
void ttm_mem_io_free(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
{
        if (bdev->driver->io_mem_reserve) {
                if (mem->bus.io_reserved) {
                        mem->bus.io_reserved = false;
                        bdev->driver->io_mem_free(bdev, mem);
                }
        }
}

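/*
 * ttm_mem_reg_ioremap - obtain a kernel virtual address for an I/O region.
 *
 * Reuses mem->bus.addr when the region is already mapped; otherwise
 * ioremaps it write-combined or uncached depending on the placement flags.
 */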
int ttm_mem_reg_ioremap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
                        void **virtual)
{
        int ret;
        void *addr;

        *virtual = NULL;
        ret = ttm_mem_io_reserve(bdev, mem);
        if (ret)
                return ret;

        if (mem->bus.addr) {
                addr = mem->bus.addr;
        } else {
                if (mem->placement & TTM_PL_FLAG_WC)
                        addr = ioremap_wc(mem->bus.base + mem->bus.offset,
                                          mem->bus.size);
                else
                        addr = ioremap_nocache(mem->bus.base + mem->bus.offset,
                                               mem->bus.size);
                if (!addr) {
                        ttm_mem_io_free(bdev, mem);
                        return -ENOMEM;
                }
        }
        *virtual = addr;
        return 0;
}

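/*
 * ttm_mem_reg_iounmap - release a mapping set up by ttm_mem_reg_ioremap.
 *
 * Only iounmaps when the region was actually ioremapped (as opposed to
 * using a premapped bus address), then drops the I/O reservation.
 */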
void ttm_mem_reg_iounmap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
                         void *virtual)
{
        struct ttm_mem_type_manager *man;

        man = &bdev->man[mem->mem_type];

        if (virtual && (man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP ||
                        mem->bus.addr == NULL))
                iounmap(virtual);
        ttm_mem_io_free(bdev, mem);
}

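/*
 * ttm_copy_io_page - copy one page between two I/O mappings, 32 bits at a
 * time, using ioread32()/iowrite32().
 */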
static int ttm_copy_io_page(void *dst, void *src, unsigned long page)
{
        uint32_t *dstP =
            (uint32_t *) ((unsigned long)dst + (page << PAGE_SHIFT));
        uint32_t *srcP =
            (uint32_t *) ((unsigned long)src + (page << PAGE_SHIFT));
        int i;

        for (i = 0; i < PAGE_SIZE / sizeof(uint32_t); ++i)
                iowrite32(ioread32(srcP++), dstP++);
        return 0;
}

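/*
 * ttm_copy_io_ttm_page - copy one page from an I/O mapping into a TTM page.
 *
 * The destination page is mapped with the requested protection: via
 * kmap_atomic_prot() on x86, and via vmap()/kmap() elsewhere depending on
 * whether a non-default pgprot is needed.
 */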
static int ttm_copy_io_ttm_page(struct ttm_tt *ttm, void *src,
                                unsigned long page,
                                pgprot_t prot)
{
        struct page *d = ttm_tt_get_page(ttm, page);
        void *dst;

        if (!d)
                return -ENOMEM;

        src = (void *)((unsigned long)src + (page << PAGE_SHIFT));

#ifdef CONFIG_X86
        dst = kmap_atomic_prot(d, KM_USER0, prot);
#else
        if (pgprot_val(prot) != pgprot_val(PAGE_KERNEL))
                dst = vmap(&d, 1, 0, prot);
        else
                dst = kmap(d);
#endif
        if (!dst)
                return -ENOMEM;

        memcpy_fromio(dst, src, PAGE_SIZE);

#ifdef CONFIG_X86
        kunmap_atomic(dst, KM_USER0);
#else
        if (pgprot_val(prot) != pgprot_val(PAGE_KERNEL))
                vunmap(dst);
        else
                kunmap(d);
#endif

        return 0;
}

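/*
 * ttm_copy_ttm_io_page - copy one page from a TTM page into an I/O mapping.
 *
 * Mirror of ttm_copy_io_ttm_page(): the source page is mapped with the
 * requested protection and copied out with memcpy_toio().
 */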
static int ttm_copy_ttm_io_page(struct ttm_tt *ttm, void *dst,
                                unsigned long page,
                                pgprot_t prot)
{
        struct page *s = ttm_tt_get_page(ttm, page);
        void *src;

        if (!s)
                return -ENOMEM;

        dst = (void *)((unsigned long)dst + (page << PAGE_SHIFT));
#ifdef CONFIG_X86
        src = kmap_atomic_prot(s, KM_USER0, prot);
#else
        if (pgprot_val(prot) != pgprot_val(PAGE_KERNEL))
                src = vmap(&s, 1, 0, prot);
        else
                src = kmap(s);
#endif
        if (!src)
                return -ENOMEM;

        memcpy_toio(dst, src, PAGE_SIZE);

#ifdef CONFIG_X86
        kunmap_atomic(src, KM_USER0);
#else
        if (pgprot_val(prot) != pgprot_val(PAGE_KERNEL))
                vunmap(src);
        else
                kunmap(s);
#endif

        return 0;
}

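/*
 * ttm_bo_move_memcpy - fallback move that copies a buffer page by page.
 *
 * Maps the old and new placements (when they are I/O regions), copies the
 * contents front to back, or back to front when the regions may overlap
 * within the same memory type, and then frees the old node. When the
 * destination memory type is fixed, the TTM is unbound and destroyed.
 */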
int ttm_bo_move_memcpy(struct ttm_buffer_object *bo,
                       bool evict, bool no_wait_reserve, bool no_wait_gpu,
                       struct ttm_mem_reg *new_mem)
{
        struct ttm_bo_device *bdev = bo->bdev;
        struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
        struct ttm_tt *ttm = bo->ttm;
        struct ttm_mem_reg *old_mem = &bo->mem;
        struct ttm_mem_reg old_copy = *old_mem;
        void *old_iomap;
        void *new_iomap;
        int ret;
        unsigned long i;
        unsigned long page;
        unsigned long add = 0;
        int dir;

        ret = ttm_mem_reg_ioremap(bdev, old_mem, &old_iomap);
        if (ret)
                return ret;
        ret = ttm_mem_reg_ioremap(bdev, new_mem, &new_iomap);
        if (ret)
                goto out;

        if (old_iomap == NULL && new_iomap == NULL)
                goto out2;
        if (old_iomap == NULL && ttm == NULL)
                goto out2;

        add = 0;
        dir = 1;

        if ((old_mem->mem_type == new_mem->mem_type) &&
            (new_mem->mm_node->start <
             old_mem->mm_node->start + old_mem->mm_node->size)) {
                dir = -1;
                add = new_mem->num_pages - 1;
        }

        for (i = 0; i < new_mem->num_pages; ++i) {
                page = i * dir + add;
                if (old_iomap == NULL) {
                        pgprot_t prot = ttm_io_prot(old_mem->placement,
                                                    PAGE_KERNEL);
                        ret = ttm_copy_ttm_io_page(ttm, new_iomap, page,
                                                   prot);
                } else if (new_iomap == NULL) {
                        pgprot_t prot = ttm_io_prot(new_mem->placement,
                                                    PAGE_KERNEL);
                        ret = ttm_copy_io_ttm_page(ttm, old_iomap, page,
                                                   prot);
                } else
                        ret = ttm_copy_io_page(new_iomap, old_iomap, page);
                if (ret)
                        goto out1;
        }
        mb();
out2:
        ttm_bo_free_old_node(bo);

        *old_mem = *new_mem;
        new_mem->mm_node = NULL;

        if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) && (ttm != NULL)) {
                ttm_tt_unbind(ttm);
                ttm_tt_destroy(ttm);
                bo->ttm = NULL;
        }

out1:
        ttm_mem_reg_iounmap(bdev, new_mem, new_iomap);
out:
        ttm_mem_reg_iounmap(bdev, &old_copy, old_iomap);
        return ret;
}
EXPORT_SYMBOL(ttm_bo_move_memcpy);

static void ttm_transfered_destroy(struct ttm_buffer_object *bo)
{
        kfree(bo);
}

/**
 * ttm_buffer_object_transfer
 *
 * @bo: A pointer to a struct ttm_buffer_object.
 * @new_obj: A pointer to a pointer to a newly created ttm_buffer_object,
 * holding the data of @bo with the old placement.
 *
 * This is a utility function that may be called after an accelerated move
 * has been scheduled. A new buffer object is created as a placeholder for
 * the old data while it's being copied. When that buffer object is idle,
 * it can be destroyed, releasing the space of the old placement.
 * Returns:
 * !0: Failure.
 */

static int ttm_buffer_object_transfer(struct ttm_buffer_object *bo,
                                      struct ttm_buffer_object **new_obj)
{
        struct ttm_buffer_object *fbo;
        struct ttm_bo_device *bdev = bo->bdev;
        struct ttm_bo_driver *driver = bdev->driver;

        fbo = kzalloc(sizeof(*fbo), GFP_KERNEL);
        if (!fbo)
                return -ENOMEM;

        *fbo = *bo;

        /**
         * Fix up members that we shouldn't copy directly:
         * TODO: Explicit member copy would probably be better here.
         */

        spin_lock_init(&fbo->lock);
        init_waitqueue_head(&fbo->event_queue);
        INIT_LIST_HEAD(&fbo->ddestroy);
        INIT_LIST_HEAD(&fbo->lru);
        INIT_LIST_HEAD(&fbo->swap);
        fbo->vm_node = NULL;

        fbo->sync_obj = driver->sync_obj_ref(bo->sync_obj);
        if (fbo->mem.mm_node)
                fbo->mem.mm_node->private = (void *)fbo;
        kref_init(&fbo->list_kref);
        kref_init(&fbo->kref);
        fbo->destroy = &ttm_transfered_destroy;

        *new_obj = fbo;
        return 0;
}

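/*
 * ttm_io_prot - derive a page protection value from TTM caching flags.
 *
 * Adjusts @tmp to a write-combined or uncached protection as dictated by
 * the caching flags and the architecture.
 */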
pgprot_t ttm_io_prot(uint32_t caching_flags, pgprot_t tmp)
{
#if defined(__i386__) || defined(__x86_64__)
        if (caching_flags & TTM_PL_FLAG_WC)
                tmp = pgprot_writecombine(tmp);
        else if (boot_cpu_data.x86 > 3)
                tmp = pgprot_noncached(tmp);

#elif defined(__powerpc__)
        if (!(caching_flags & TTM_PL_FLAG_CACHED)) {
                pgprot_val(tmp) |= _PAGE_NO_CACHE;
                if (caching_flags & TTM_PL_FLAG_UNCACHED)
                        pgprot_val(tmp) |= _PAGE_GUARDED;
        }
#endif
#if defined(__ia64__)
        if (caching_flags & TTM_PL_FLAG_WC)
                tmp = pgprot_writecombine(tmp);
        else
                tmp = pgprot_noncached(tmp);
#endif
#if defined(__sparc__)
        if (!(caching_flags & TTM_PL_FLAG_CACHED))
                tmp = pgprot_noncached(tmp);
#endif
        return tmp;
}
EXPORT_SYMBOL(ttm_io_prot);

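/*
 * ttm_bo_ioremap - kmap helper for buffers that live in I/O memory.
 *
 * Uses the premapped bus address when one exists; otherwise ioremaps the
 * requested range write-combined or uncached based on the placement.
 */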
static int ttm_bo_ioremap(struct ttm_buffer_object *bo,
                          unsigned long offset,
                          unsigned long size,
                          struct ttm_bo_kmap_obj *map)
{
        struct ttm_mem_reg *mem = &bo->mem;

        if (bo->mem.bus.addr) {
                map->bo_kmap_type = ttm_bo_map_premapped;
                map->virtual = (void *)(((u8 *)bo->mem.bus.addr) + offset);
        } else {
                map->bo_kmap_type = ttm_bo_map_iomap;
                if (mem->placement & TTM_PL_FLAG_WC)
                        map->virtual = ioremap_wc(bo->mem.bus.base + bo->mem.bus.offset + offset,
                                                  size);
                else
                        map->virtual = ioremap_nocache(bo->mem.bus.base + bo->mem.bus.offset + offset,
                                                       size);
        }
        return (!map->virtual) ? -ENOMEM : 0;
}

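/*
 * ttm_bo_kmap_ttm - kmap helper for buffers backed by TTM (system) pages.
 *
 * A single cached page is mapped with kmap(); anything else goes through
 * vmap() so the mapping can be made virtually contiguous and carry the
 * page protection implied by the placement.
 */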
static int ttm_bo_kmap_ttm(struct ttm_buffer_object *bo,
                           unsigned long start_page,
                           unsigned long num_pages,
                           struct ttm_bo_kmap_obj *map)
{
        struct ttm_mem_reg *mem = &bo->mem;
        pgprot_t prot;
        struct ttm_tt *ttm = bo->ttm;
        struct page *d;
        int i;

        BUG_ON(!ttm);
        if (num_pages == 1 && (mem->placement & TTM_PL_FLAG_CACHED)) {
                /*
                 * We're mapping a single page, and the desired
                 * page protection is consistent with the bo.
                 */

                map->bo_kmap_type = ttm_bo_map_kmap;
                map->page = ttm_tt_get_page(ttm, start_page);
                map->virtual = kmap(map->page);
        } else {
                /*
                 * Populate the part we're mapping.
                 */
                for (i = start_page; i < start_page + num_pages; ++i) {
                        d = ttm_tt_get_page(ttm, i);
                        if (!d)
                                return -ENOMEM;
                }

                /*
                 * We need to use vmap to get the desired page protection
                 * or to make the buffer object look contiguous.
                 */
                prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
                        PAGE_KERNEL :
                        ttm_io_prot(mem->placement, PAGE_KERNEL);
                map->bo_kmap_type = ttm_bo_map_vmap;
                map->virtual = vmap(ttm->pages + start_page, num_pages,
                                    0, prot);
        }
        return (!map->virtual) ? -ENOMEM : 0;
}

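/*
 * ttm_bo_kmap - map part of a buffer object into kernel address space.
 *
 * Reserves the I/O region if needed, then dispatches to ttm_bo_kmap_ttm()
 * for system-memory buffers or ttm_bo_ioremap() for I/O-memory buffers.
 * Undo with ttm_bo_kunmap().
 */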
int ttm_bo_kmap(struct ttm_buffer_object *bo,
                unsigned long start_page, unsigned long num_pages,
                struct ttm_bo_kmap_obj *map)
{
        unsigned long offset, size;
        int ret;

        BUG_ON(!list_empty(&bo->swap));
        map->virtual = NULL;
        map->bo = bo;
        if (num_pages > bo->num_pages)
                return -EINVAL;
        if (start_page > bo->num_pages)
                return -EINVAL;
#if 0
        if (num_pages > 1 && !DRM_SUSER(DRM_CURPROC))
                return -EPERM;
#endif
        ret = ttm_mem_io_reserve(bo->bdev, &bo->mem);
        if (ret)
                return ret;
        if (!bo->mem.bus.is_iomem) {
                return ttm_bo_kmap_ttm(bo, start_page, num_pages, map);
        } else {
                offset = start_page << PAGE_SHIFT;
                size = num_pages << PAGE_SHIFT;
                return ttm_bo_ioremap(bo, offset, size, map);
        }
}
EXPORT_SYMBOL(ttm_bo_kmap);

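/*
 * ttm_bo_kunmap - tear down a mapping created by ttm_bo_kmap.
 *
 * Uses the recorded bo_kmap_type to pick the matching unmap primitive
 * (iounmap, vunmap, kunmap, or nothing for premapped regions).
 */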
void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map)
{
        if (!map->virtual)
                return;
        switch (map->bo_kmap_type) {
        case ttm_bo_map_iomap:
                iounmap(map->virtual);
                ttm_mem_io_free(map->bo->bdev, &map->bo->mem);
                break;
        case ttm_bo_map_vmap:
                vunmap(map->virtual);
                break;
        case ttm_bo_map_kmap:
                kunmap(map->page);
                break;
        case ttm_bo_map_premapped:
                break;
        default:
                BUG();
        }
        map->virtual = NULL;
        map->page = NULL;
}
EXPORT_SYMBOL(ttm_bo_kunmap);

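/*
 * ttm_bo_move_accel_cleanup - finish an accelerated (GPU-copy) move.
 *
 * Attaches the driver's sync object to the buffer. On eviction it waits
 * for idle and frees the old node immediately; otherwise the old memory
 * is handed to a ghost buffer object via ttm_buffer_object_transfer() so
 * it can be released once the copy has completed.
 */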
int ttm_bo_move_accel_cleanup(struct ttm_buffer_object *bo,
                              void *sync_obj,
                              void *sync_obj_arg,
                              bool evict, bool no_wait_reserve,
                              bool no_wait_gpu,
                              struct ttm_mem_reg *new_mem)
{
        struct ttm_bo_device *bdev = bo->bdev;
        struct ttm_bo_driver *driver = bdev->driver;
        struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
        struct ttm_mem_reg *old_mem = &bo->mem;
        int ret;
        struct ttm_buffer_object *ghost_obj;
        void *tmp_obj = NULL;

        spin_lock(&bo->lock);
        if (bo->sync_obj) {
                tmp_obj = bo->sync_obj;
                bo->sync_obj = NULL;
        }
        bo->sync_obj = driver->sync_obj_ref(sync_obj);
        bo->sync_obj_arg = sync_obj_arg;
        if (evict) {
                ret = ttm_bo_wait(bo, false, false, false);
                spin_unlock(&bo->lock);
                if (tmp_obj)
                        driver->sync_obj_unref(&tmp_obj);
                if (ret)
                        return ret;

                ttm_bo_free_old_node(bo);
                if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) &&
                    (bo->ttm != NULL)) {
                        ttm_tt_unbind(bo->ttm);
                        ttm_tt_destroy(bo->ttm);
                        bo->ttm = NULL;
                }
        } else {
                /**
                 * This should help pipeline ordinary buffer moves.
                 *
                 * Hang old buffer memory on a new buffer object,
                 * and leave it to be released when the GPU
                 * operation has completed.
                 */

                set_bit(TTM_BO_PRIV_FLAG_MOVING, &bo->priv_flags);
                spin_unlock(&bo->lock);
                if (tmp_obj)
                        driver->sync_obj_unref(&tmp_obj);

                ret = ttm_buffer_object_transfer(bo, &ghost_obj);
                if (ret)
                        return ret;

                /**
                 * If we're not moving to fixed memory, the TTM object
                 * needs to stay alive. Otherwise hang it on the ghost
                 * bo to be unbound and destroyed.
                 */

                if (!(man->flags & TTM_MEMTYPE_FLAG_FIXED))
                        ghost_obj->ttm = NULL;
                else
                        bo->ttm = NULL;

                ttm_bo_unreserve(ghost_obj);
                ttm_bo_unref(&ghost_obj);
        }

        *old_mem = *new_mem;
        new_mem->mm_node = NULL;

        return 0;
}
EXPORT_SYMBOL(ttm_bo_move_accel_cleanup);