/*
 * Copyright 2008 Red Hat Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
#include "drmP.h"
#include "radeon_drm.h"
#include "radeon_drv.h"

static int radeon_gem_ib_init(struct drm_device *dev);
static int radeon_gem_ib_destroy(struct drm_device *dev);
static int radeon_gem_dma_bufs_init(struct drm_device *dev);
static void radeon_gem_dma_bufs_destroy(struct drm_device *dev);

int radeon_gem_init_object(struct drm_gem_object *obj)
{
        struct drm_radeon_gem_object *obj_priv;

        obj_priv = drm_calloc(1, sizeof(*obj_priv), DRM_MEM_DRIVER);
        if (!obj_priv)
                return -ENOMEM;

        obj->driver_private = obj_priv;
        return 0;
}

void radeon_gem_free_object(struct drm_gem_object *obj)
{
        struct drm_radeon_gem_object *obj_priv = obj->driver_private;

        /* tear down the buffer object - gem holds struct mutex */
        drm_bo_takedown_vm_locked(obj_priv->bo);
        drm_bo_usage_deref_locked(&obj_priv->bo);
        drm_free(obj->driver_private, sizeof(*obj_priv), DRM_MEM_DRIVER);
}

int radeon_gem_info_ioctl(struct drm_device *dev, void *data,
                          struct drm_file *file_priv)
{
        struct drm_radeon_private *dev_priv = dev->dev_private;
        struct drm_radeon_gem_info *args = data;

        args->vram_start = dev_priv->mm.vram_offset;
        args->vram_size = dev_priv->mm.vram_size;
        args->vram_visible = dev_priv->mm.vram_visible;

        args->gart_start = dev_priv->mm.gart_start;
        args->gart_size = dev_priv->mm.gart_useable;

        return 0;
}

struct drm_gem_object *radeon_gem_object_alloc(struct drm_device *dev, int size, int alignment,
                                               int initial_domain, bool discardable)
{
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        uint32_t flags;
        int page_align;
        int ret;

        obj = drm_gem_object_alloc(dev, size);
        if (!obj)
                return NULL;

        obj_priv = obj->driver_private;
        flags = DRM_BO_FLAG_MAPPABLE;
        if (initial_domain == RADEON_GEM_DOMAIN_VRAM)
                flags |= DRM_BO_FLAG_MEM_VRAM;
        else if (initial_domain == RADEON_GEM_DOMAIN_GTT)
                flags |= DRM_BO_FLAG_MEM_TT;
        else
                flags |= DRM_BO_FLAG_MEM_LOCAL | DRM_BO_FLAG_CACHED;

        flags |= DRM_BO_FLAG_READ | DRM_BO_FLAG_WRITE | DRM_BO_FLAG_EXE;

        if (discardable)
                flags |= DRM_BO_FLAG_DISCARDABLE;

        if (alignment == 0)
                alignment = PAGE_SIZE;

        page_align = alignment >> PAGE_SHIFT;
        /* create a TTM BO */
        ret = drm_buffer_object_create(dev,
                                       size, drm_bo_type_device,
                                       flags, 0, page_align,
                                       0, &obj_priv->bo);
        if (ret) {
                mutex_lock(&dev->struct_mutex);
                drm_gem_object_unreference(obj);
                mutex_unlock(&dev->struct_mutex);
                return NULL;
        }

        DRM_DEBUG("%p : size 0x%x, alignment %d, initial_domain %d\n", obj_priv->bo, size, alignment, initial_domain);
        return obj;
}

int radeon_gem_create_ioctl(struct drm_device *dev, void *data,
                            struct drm_file *file_priv)
{
        struct drm_radeon_gem_create *args = data;
        struct drm_radeon_gem_object *obj_priv;
        struct drm_gem_object *obj;
        uint32_t handle;
        int ret = 0;

        /* create a gem object to contain this object in */
        args->size = roundup(args->size, PAGE_SIZE);

        obj = radeon_gem_object_alloc(dev, args->size, args->alignment, args->initial_domain, args->no_backing_store);
        if (!obj)
                return -EINVAL;

        obj_priv = obj->driver_private;
        DRM_DEBUG("obj is %p bo is %p, %d\n", obj, obj_priv->bo, obj_priv->bo->num_pages);
        ret = drm_gem_handle_create(file_priv, obj, &handle);
        mutex_lock(&dev->struct_mutex);
        drm_gem_object_handle_unreference(obj);
        mutex_unlock(&dev->struct_mutex);

        if (ret)
                goto fail;

        args->handle = handle;
        return 0;

fail:
        drm_gem_object_unreference(obj);
        return ret;
}

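/*
 * Note: as in other GEM drivers of this era, the object comes back from
 * radeon_gem_object_alloc() holding the allocation reference, and
 * drm_gem_handle_create() takes a reference of its own for the handle.
 * The handle_unreference above drops the allocation reference, so on
 * success the userspace handle ends up owning the object.
 */
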
int radeon_gem_set_domain(struct drm_gem_object *obj, uint32_t read_domains, uint32_t write_domain, uint32_t *flags_p, bool unfenced)
{
        struct drm_radeon_gem_object *obj_priv;
        uint32_t flags = 0;
        int ret;

        obj_priv = obj->driver_private;

        /* work out where to validate the buffer to */
        if (write_domain) { /* write domains always win */
                if (write_domain == RADEON_GEM_DOMAIN_VRAM)
                        flags = DRM_BO_FLAG_MEM_VRAM;
                else if (write_domain == RADEON_GEM_DOMAIN_GTT)
                        flags = DRM_BO_FLAG_MEM_TT; // need a can-write-to-gart check
                else
                        return -EINVAL; // we can't write to system RAM
        } else {
                /* okay for a read domain - prefer wherever the object is now or close enough */
                if (read_domains == 0)
                        return -EINVAL;

                /* if it's already in local memory and CPU is a valid domain, do nothing */
                if (read_domains & RADEON_GEM_DOMAIN_CPU) {
                        if (obj_priv->bo->mem.mem_type == DRM_BO_MEM_LOCAL)
                                return 0;
                        if (read_domains == RADEON_GEM_DOMAIN_CPU)
                                return -EINVAL;
                }

                /* simple case no choice in domains */
                if (read_domains == RADEON_GEM_DOMAIN_VRAM)
                        flags = DRM_BO_FLAG_MEM_VRAM;
                else if (read_domains == RADEON_GEM_DOMAIN_GTT)
                        flags = DRM_BO_FLAG_MEM_TT;
                else if ((obj_priv->bo->mem.mem_type == DRM_BO_MEM_VRAM) && (read_domains & RADEON_GEM_DOMAIN_VRAM))
                        flags = DRM_BO_FLAG_MEM_VRAM;
                else if ((obj_priv->bo->mem.mem_type == DRM_BO_MEM_TT) && (read_domains & RADEON_GEM_DOMAIN_GTT))
                        flags = DRM_BO_FLAG_MEM_TT;
                else if ((obj_priv->bo->mem.mem_type == DRM_BO_MEM_LOCAL) && (read_domains & RADEON_GEM_DOMAIN_GTT))
                        flags = DRM_BO_FLAG_MEM_TT;

                /* no clear winner - just take whatever domains we were given */
                if (flags == 0) {
                        if (read_domains & RADEON_GEM_DOMAIN_VRAM)
                                flags |= DRM_BO_FLAG_MEM_VRAM;
                        if (read_domains & RADEON_GEM_DOMAIN_GTT)
                                flags |= DRM_BO_FLAG_MEM_TT;
                }
        }

        /* if this BO is pinned we're not moving it anywhere */
        if (obj_priv->bo->pinned_mem_type && unfenced)
                return 0;

        DRM_DEBUG("validating %p from %d into %x %d %d\n", obj_priv->bo, obj_priv->bo->mem.mem_type, flags, read_domains, write_domain);
        ret = drm_bo_do_validate(obj_priv->bo, flags, DRM_BO_MASK_MEM | DRM_BO_FLAG_CACHED,
                                 unfenced ? DRM_BO_HINT_DONT_FENCE : 0, 0);
        if (ret)
                return ret;

        if (flags_p)
                *flags_p = flags;
        return 0;
}

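/*
 * Example of how the rules above resolve (illustrative): a BO sitting in
 * the GTT with read_domains = VRAM | GTT and no write domain stays put
 * (flags ends up DRM_BO_FLAG_MEM_TT), so read-only users never force a
 * copy; a write_domain of VRAM always wins and validates the BO into VRAM.
 */
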
int radeon_gem_set_domain_ioctl(struct drm_device *dev, void *data,
                                struct drm_file *file_priv)
{
        /* transition the BO to a domain - just validate the BO into a certain domain */
        struct drm_radeon_gem_set_domain *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        int ret;

        /* for now if someone requests domain CPU - just make sure the buffer is finished with */

        /* just do a BO wait for now */
        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        obj_priv = obj->driver_private;

        ret = radeon_gem_set_domain(obj, args->read_domains, args->write_domain, NULL, true);

        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);
        return ret;
}

int radeon_gem_pread_ioctl(struct drm_device *dev, void *data,
                           struct drm_file *file_priv)
{
        /* not implemented yet */
        return -ENOSYS;
}

int radeon_gem_pwrite_ioctl(struct drm_device *dev, void *data,
                            struct drm_file *file_priv)
{
        struct drm_radeon_gem_pwrite *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        int ret = 0;

        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        obj_priv = obj->driver_private;

        /* check where the buffer is first - if not in VRAM
           fall back to userspace copying for now */
        mutex_lock(&obj_priv->bo->mutex);
        if (obj_priv->bo->mem.mem_type != DRM_BO_MEM_VRAM) {
                ret = -EINVAL;
                goto out_unlock;
        }

        DRM_ERROR("pwriting data->size %lld %llx\n", args->size, args->offset);

#if 0   /* disabled: the blit geometry/source setup (cpp, w, x, y, h,
         * dst_pitch_off, src, src_pitch) is not wired up in this snapshot */
        /* so need to grab an IB, copy the data into it in a loop
           and send it to VRAM using the host data blit (HDB) */
        while ((buf = radeon_host_data_blit(dev, cpp, w, dst_pitch_off, &buf_pitch,
                                            x, &y, (unsigned int *)&h, &hpass)) != 0) {
                radeon_host_data_blit_copy_pass(dev, cpp, buf, (uint8_t *)src,
                                                hpass, buf_pitch, src_pitch);
                src += hpass * src_pitch;
        }
#endif

out_unlock:
        mutex_unlock(&obj_priv->bo->mutex);
        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);

        return ret;
}

int radeon_gem_mmap_ioctl(struct drm_device *dev, void *data,
                          struct drm_file *file_priv)
{
        struct drm_radeon_gem_mmap *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        loff_t offset;
        unsigned long addr;

        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        offset = args->offset;

        DRM_DEBUG("got here %p\n", obj);
        obj_priv = obj->driver_private;

        if (!obj_priv->bo) {
                mutex_lock(&dev->struct_mutex);
                drm_gem_object_unreference(obj);
                mutex_unlock(&dev->struct_mutex);
                return -EINVAL;
        }

        DRM_DEBUG("got here %p %p %lld %ld\n", obj, obj_priv->bo, args->size, obj_priv->bo->num_pages);

        down_write(&current->mm->mmap_sem);
        addr = do_mmap_pgoff(file_priv->filp, 0, args->size,
                             PROT_READ | PROT_WRITE, MAP_SHARED,
                             obj_priv->bo->map_list.hash.key);
        up_write(&current->mm->mmap_sem);

        DRM_DEBUG("got here %p %d\n", obj, obj_priv->bo->mem.mem_type);
        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);
        if (IS_ERR((void *)addr))
                return addr;

        args->addr_ptr = (uint64_t) addr;

        return 0;
}

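/*
 * The value returned in addr_ptr is a ready-to-use CPU pointer: the ioctl
 * has already performed the equivalent of an mmap() of the DRM fd at the
 * BO's fake mmap offset (map_list.hash.key), so userspace does not need a
 * separate mmap() call of its own.
 */
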
int radeon_gem_pin_ioctl(struct drm_device *dev, void *data,
                         struct drm_file *file_priv)
{
        struct drm_radeon_gem_pin *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        int ret = 0;
        int flags = DRM_BO_FLAG_NO_EVICT;
        int mask = DRM_BO_FLAG_NO_EVICT;

        /* check for valid args */
        if (args->pin_domain) {
                mask |= DRM_BO_MASK_MEM;
                if (args->pin_domain == RADEON_GEM_DOMAIN_GTT)
                        flags |= DRM_BO_FLAG_MEM_TT;
                else if (args->pin_domain == RADEON_GEM_DOMAIN_VRAM)
                        flags |= DRM_BO_FLAG_MEM_VRAM;
                else /* hand back the offset we currently have if no args supplied
                        - this is to allow old mesa to work - it's a hack */
                        flags = mask = 0;
        }

        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        obj_priv = obj->driver_private;

        /* validate into a pin with no fence */
        DRM_DEBUG("got here %p %p %d\n", obj, obj_priv->bo, atomic_read(&obj_priv->bo->usage));
        if (flags && !(obj_priv->bo->type != drm_bo_type_kernel && !DRM_SUSER(DRM_CURPROC))) {
                ret = drm_bo_do_validate(obj_priv->bo, flags, mask,
                                         DRM_BO_HINT_DONT_FENCE, 0);
        }

        args->offset = obj_priv->bo->offset;
        DRM_DEBUG("got here %p %p %x\n", obj, obj_priv->bo, obj_priv->bo->offset);

        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);
        return ret;
}

int radeon_gem_unpin_ioctl(struct drm_device *dev, void *data,
                           struct drm_file *file_priv)
{
        struct drm_radeon_gem_unpin *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        int ret;

        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        obj_priv = obj->driver_private;

        /* clear the NO_EVICT (pin) flag - validate with no fence */
        ret = drm_bo_do_validate(obj_priv->bo, 0, DRM_BO_FLAG_NO_EVICT,
                                 DRM_BO_HINT_DONT_FENCE, 0);

        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);
        return ret;
}

int radeon_gem_busy(struct drm_device *dev, void *data,
                    struct drm_file *file_priv)
{
        /* stub - report idle for now */
        return 0;
}

int radeon_gem_wait_rendering(struct drm_device *dev, void *data,
                              struct drm_file *file_priv)
{
        struct drm_radeon_gem_wait_rendering *args = data;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        int ret;

        obj = drm_gem_object_lookup(dev, file_priv, args->handle);
        if (obj == NULL)
                return -EINVAL;

        obj_priv = obj->driver_private;

        mutex_lock(&obj_priv->bo->mutex);
        ret = drm_bo_wait(obj_priv->bo, 0, 1, 1, 0);
        mutex_unlock(&obj_priv->bo->mutex);

        mutex_lock(&dev->struct_mutex);
        drm_gem_object_unreference(obj);
        mutex_unlock(&dev->struct_mutex);

        return ret;
}

/*
 * Depending on card generation, chipset bugs, etc... the amount of vram
 * accessible to the CPU can vary. This function is our best shot at figuring
 * it out. Returns a value in KB.
 */
static uint32_t radeon_get_accessible_vram(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t aper_size;
        u8 byte;

        if (dev_priv->chip_family >= CHIP_R600)
                aper_size = RADEON_READ(R600_CONFIG_APER_SIZE) / 1024;
        else
                aper_size = RADEON_READ(RADEON_CONFIG_APER_SIZE) / 1024;

        /* Set HDP_APER_CNTL only on cards that are known not to be broken,
         * that is, has the 2nd generation multifunction PCI interface
         */
        if (dev_priv->chip_family == CHIP_RV280 ||
            dev_priv->chip_family == CHIP_RV350 ||
            dev_priv->chip_family == CHIP_RV380 ||
            dev_priv->chip_family == CHIP_R420 ||
            dev_priv->chip_family == CHIP_R423 ||
            dev_priv->chip_family == CHIP_RV410 ||
            radeon_is_avivo(dev_priv)) {
                uint32_t temp = RADEON_READ(RADEON_HOST_PATH_CNTL);
                temp |= RADEON_HDP_APER_CNTL;
                RADEON_WRITE(RADEON_HOST_PATH_CNTL, temp);
                return aper_size * 2;
        }

        /* Older cards have all sorts of funny issues to deal with. First
         * check if it's a multifunction card by reading the PCI config
         * header type... Limit those to one aperture size
         */
        pci_read_config_byte(dev->pdev, 0xe, &byte);
        if (byte & 0x80)
                return aper_size;

        /* Single function older card. We read HDP_APER_CNTL to see how the
         * BIOS has set it up. We don't write this as it's broken on some
         * ASICs but we expect the BIOS to have done the right thing (might
         * be too optimistic...)
         */
        if (RADEON_READ(RADEON_HOST_PATH_CNTL) & RADEON_HDP_APER_CNTL)
                return aper_size * 2;

        return aper_size;
}

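/*
 * Worked example (illustrative numbers): a card reporting a 128MB
 * CONFIG_APER_SIZE yields aper_size = 131072 (KB); on a chip where
 * HDP_APER_CNTL can be set, the CPU window covers two apertures, so
 * 262144 KB is returned instead.
 */
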
/* code from the DDX - do memory sizing */
void radeon_vram_setup(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t vram;
        uint32_t accessible, bar_size;

        if (!radeon_is_avivo(dev_priv) && (dev_priv->flags & RADEON_IS_IGP)) {
                uint32_t tom = RADEON_READ(RADEON_NB_TOM);

                vram = (((tom >> 16) - (tom & 0xffff) + 1) << 6);
                RADEON_WRITE(RADEON_CONFIG_MEMSIZE, vram * 1024);
        } else {
                if (dev_priv->chip_family >= CHIP_R600)
                        vram = RADEON_READ(R600_CONFIG_MEMSIZE) / 1024;
                else
                        vram = RADEON_READ(RADEON_CONFIG_MEMSIZE) / 1024;

                /* Some production boards of m6 will return 0 if it's 8 MB */
                if (vram == 0) {
                        vram = 8192;
                        RADEON_WRITE(RADEON_CONFIG_MEMSIZE, 0x800000);
                }
        }

        accessible = radeon_get_accessible_vram(dev);

        bar_size = drm_get_resource_len(dev, 0) / 1024;

        if (accessible > bar_size)
                accessible = bar_size;

        if (accessible > vram)
                accessible = vram;

        DRM_INFO("Detected VRAM RAM=%dK, accessible=%uK, BAR=%uK\n",
                 vram, accessible, bar_size);

        dev_priv->mm.vram_offset = dev_priv->fb_aper_offset;
        dev_priv->mm.vram_size = vram * 1024;
        dev_priv->mm.vram_visible = accessible * 1024;
}

static int radeon_gart_init(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        u32 base = 0;
        int ret;

        /* setup a 32MB GART */
        dev_priv->gart_size = dev_priv->mm.gart_size;

        dev_priv->gart_info.table_size = RADEON_PCIGART_TABLE_SIZE;

        /* setup VRAM vs GART here */
        if (dev_priv->flags & RADEON_IS_AGP) {
                base = dev->agp->base;
                if ((base + dev_priv->gart_size - 1) >= dev_priv->fb_location &&
                    base < (dev_priv->fb_location + dev_priv->fb_size - 1)) {
                        DRM_INFO("Can't use agp base @0x%08lx, won't fit\n",
                                 dev->agp->base);
                        base = 0;
                }
        }

        if (base == 0) {
                base = dev_priv->fb_location + dev_priv->fb_size;
                if (base < dev_priv->fb_location ||
                    ((base + dev_priv->gart_size) & 0xfffffffful) < base)
                        base = dev_priv->fb_location
                                - dev_priv->gart_size;
        }
        /* start on the card */
        dev_priv->gart_vm_start = base & 0xffc00000u;
        if (dev_priv->gart_vm_start != base)
                DRM_INFO("GART aligned down from 0x%08x to 0x%08x\n",
                         base, dev_priv->gart_vm_start);
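        /*
         * 0xffc00000 aligns the GART base down to a 4MB boundary, e.g. a
         * base of 0x08500000 becomes a gart_vm_start of 0x08400000
         * (illustrative values).
         */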

        /* if on PCIE we need to allocate an fb object for the PCIE GART table */
        if (dev_priv->flags & RADEON_IS_PCIE) {
                ret = drm_buffer_object_create(dev, RADEON_PCIGART_TABLE_SIZE,
                                               drm_bo_type_kernel,
                                               DRM_BO_FLAG_READ | DRM_BO_FLAG_MEM_VRAM | DRM_BO_FLAG_MAPPABLE | DRM_BO_FLAG_NO_EVICT,
                                               0, 1, 0, &dev_priv->mm.pcie_table.bo);
                if (ret)
                        return -EINVAL;

                /* subtract from VRAM value reporting to userspace */
                dev_priv->mm.vram_visible -= RADEON_PCIGART_TABLE_SIZE;

                dev_priv->mm.pcie_table_backup = kzalloc(RADEON_PCIGART_TABLE_SIZE, GFP_KERNEL);
                if (!dev_priv->mm.pcie_table_backup)
                        return -EINVAL;

                ret = drm_bo_kmap(dev_priv->mm.pcie_table.bo, 0, RADEON_PCIGART_TABLE_SIZE >> PAGE_SHIFT,
                                  &dev_priv->mm.pcie_table.kmap);
                if (ret)
                        return -EINVAL;

                dev_priv->pcigart_offset_set = 2;
                dev_priv->gart_info.bus_addr = dev_priv->fb_location + dev_priv->mm.pcie_table.bo->offset;
                dev_priv->gart_info.addr = dev_priv->mm.pcie_table.kmap.virtual;
                dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCIE;
                dev_priv->gart_info.gart_table_location = DRM_ATI_GART_FB;
                memset(dev_priv->gart_info.addr, 0, RADEON_PCIGART_TABLE_SIZE);
        } else if (!(dev_priv->flags & RADEON_IS_AGP)) {
                /* allocate PCI GART table */
                dev_priv->gart_info.table_mask = DMA_BIT_MASK(32);
                dev_priv->gart_info.gart_table_location = DRM_ATI_GART_MAIN;
                if (dev_priv->flags & RADEON_IS_IGPGART)
                        dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_IGP;
                else
                        dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCI;

                ret = drm_ati_alloc_pcigart_table(dev, &dev_priv->gart_info);
                if (ret) {
                        DRM_ERROR("cannot allocate PCI GART page!\n");
                        return -EINVAL;
                }

                dev_priv->gart_info.addr = dev_priv->gart_info.table_handle->vaddr;
                dev_priv->gart_info.bus_addr = dev_priv->gart_info.table_handle->busaddr;
        }

        /* gart values setup - start the GART */
        if (dev_priv->flags & RADEON_IS_AGP) {
                radeon_set_pcigart(dev_priv, 0);
        } else {
                radeon_set_pcigart(dev_priv, 1);
        }

        return 0;
}

int radeon_alloc_gart_objects(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        int ret;

        ret = drm_buffer_object_create(dev, RADEON_DEFAULT_RING_SIZE,
                                       drm_bo_type_kernel,
                                       DRM_BO_FLAG_READ | DRM_BO_FLAG_MEM_TT |
                                       DRM_BO_FLAG_MAPPABLE | DRM_BO_FLAG_NO_EVICT,
                                       0, 1, 0, &dev_priv->mm.ring.bo);
        if (ret) {
                if (dev_priv->flags & RADEON_IS_AGP)
                        DRM_ERROR("failed to allocate ring - most likely an AGP driver bug\n");
                else
                        DRM_ERROR("failed to allocate ring\n");
                return -EINVAL;
        }

        ret = drm_bo_kmap(dev_priv->mm.ring.bo, 0, RADEON_DEFAULT_RING_SIZE >> PAGE_SHIFT,
                          &dev_priv->mm.ring.kmap);
        if (ret) {
                DRM_ERROR("failed to map ring\n");
                return -EINVAL;
        }

        ret = drm_buffer_object_create(dev, PAGE_SIZE,
                                       drm_bo_type_kernel,
                                       DRM_BO_FLAG_WRITE | DRM_BO_FLAG_READ | DRM_BO_FLAG_MEM_TT |
                                       DRM_BO_FLAG_MAPPABLE | DRM_BO_FLAG_NO_EVICT,
                                       0, 1, 0, &dev_priv->mm.ring_read.bo);
        if (ret) {
                DRM_ERROR("failed to allocate ring read\n");
                return -EINVAL;
        }

        ret = drm_bo_kmap(dev_priv->mm.ring_read.bo, 0,
                          PAGE_SIZE >> PAGE_SHIFT,
                          &dev_priv->mm.ring_read.kmap);
        if (ret) {
                DRM_ERROR("failed to map ring read\n");
                return -EINVAL;
        }

        DRM_DEBUG("Ring ptr %p mapped at %ld %p, read ptr %p mapped at %ld %p\n",
                  dev_priv->mm.ring.bo, dev_priv->mm.ring.bo->offset, dev_priv->mm.ring.kmap.virtual,
                  dev_priv->mm.ring_read.bo, dev_priv->mm.ring_read.bo->offset, dev_priv->mm.ring_read.kmap.virtual);

        dev_priv->mm.gart_useable -= RADEON_DEFAULT_RING_SIZE + PAGE_SIZE;

        /* init the indirect buffers */
        radeon_gem_ib_init(dev);
        radeon_gem_dma_bufs_init(dev);
        return 0;
}

static bool avivo_get_mc_idle(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;

        if (dev_priv->chip_family >= CHIP_R600) {
                /* no idea where this is on r600 yet */
                return true;
        } else if (dev_priv->chip_family == CHIP_RV515) {
                if (radeon_read_mc_reg(dev_priv, RV515_MC_STATUS) & RV515_MC_STATUS_IDLE)
                        return true;
                else
                        return false;
        } else if (dev_priv->chip_family == CHIP_RS600) {
                if (radeon_read_mc_reg(dev_priv, RS600_MC_STATUS) & RS600_MC_STATUS_IDLE)
                        return true;
                else
                        return false;
        } else if ((dev_priv->chip_family == CHIP_RS690) ||
                   (dev_priv->chip_family == CHIP_RS740)) {
                if (radeon_read_mc_reg(dev_priv, RS690_MC_STATUS) & RS690_MC_STATUS_IDLE)
                        return true;
                else
                        return false;
        } else {
                if (radeon_read_mc_reg(dev_priv, R520_MC_STATUS) & R520_MC_STATUS_IDLE)
                        return true;
                else
                        return false;
        }
}

static void avivo_disable_mc_clients(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t tmp;
        int timeout = 0;

        radeon_do_wait_for_idle(dev_priv);

        RADEON_WRITE(AVIVO_D1VGA_CONTROL, RADEON_READ(AVIVO_D1VGA_CONTROL) & ~AVIVO_DVGA_CONTROL_MODE_ENABLE);
        RADEON_WRITE(AVIVO_D2VGA_CONTROL, RADEON_READ(AVIVO_D2VGA_CONTROL) & ~AVIVO_DVGA_CONTROL_MODE_ENABLE);

        tmp = RADEON_READ(AVIVO_D1CRTC_CONTROL);
        RADEON_WRITE(AVIVO_D1CRTC_CONTROL, tmp & ~AVIVO_CRTC_EN);

        tmp = RADEON_READ(AVIVO_D2CRTC_CONTROL);
        RADEON_WRITE(AVIVO_D2CRTC_CONTROL, tmp & ~AVIVO_CRTC_EN);

        tmp = RADEON_READ(AVIVO_D2CRTC_CONTROL);

        while (!(avivo_get_mc_idle(dev))) {
                if (++timeout > 100000) {
                        DRM_ERROR("Timeout waiting for memory controller to update settings\n");
                        DRM_ERROR("Bad things may or may not happen\n");
                        return;
                }
                udelay(10);
        }
}

static inline u32 radeon_busy_wait(struct drm_device *dev, uint32_t reg, uint32_t bits,
                                   unsigned int timeout)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        u32 status;

        do {
                udelay(10);
                status = RADEON_READ(reg);
                timeout--;
        } while (status != 0xffffffff && (status & bits) && (timeout > 0));

        if (timeout == 0)
                status = 0xffffffff;

        return status;
}

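/*
 * Callers treat a return of 0xffffffff as "timed out or the device fell
 * off the bus" (an all-ones value is also what a read from a dead PCI
 * device returns); any other value is the last register read with the
 * waited-on bits clear.
 */
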
/* Wait for vertical sync on primary CRTC */
static void radeon_wait_for_vsync(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t crtc_gen_cntl;

        crtc_gen_cntl = RADEON_READ(RADEON_CRTC_GEN_CNTL);
        if ((crtc_gen_cntl & RADEON_CRTC_DISP_REQ_EN_B) ||
            !(crtc_gen_cntl & RADEON_CRTC_EN))
                return;

        /* Clear the CRTC_VBLANK_SAVE bit */
        RADEON_WRITE(RADEON_CRTC_STATUS, RADEON_CRTC_VBLANK_SAVE_CLEAR);

        radeon_busy_wait(dev, RADEON_CRTC_STATUS, RADEON_CRTC_VBLANK_SAVE, 2000);
}

/* Wait for vertical sync on secondary CRTC */
static void radeon_wait_for_vsync2(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t crtc2_gen_cntl;

        crtc2_gen_cntl = RADEON_READ(RADEON_CRTC2_GEN_CNTL);
        if ((crtc2_gen_cntl & RADEON_CRTC2_DISP_REQ_EN_B) ||
            !(crtc2_gen_cntl & RADEON_CRTC2_EN))
                return;

        /* Clear the CRTC2_VBLANK_SAVE bit */
        RADEON_WRITE(RADEON_CRTC2_STATUS, RADEON_CRTC2_VBLANK_SAVE_CLEAR);

        radeon_busy_wait(dev, RADEON_CRTC2_STATUS, RADEON_CRTC2_VBLANK_SAVE, 2000);
}

static void legacy_disable_mc_clients(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        uint32_t old_mc_status, status_idle;
        uint32_t ov0_scale_cntl, crtc_ext_cntl, crtc_gen_cntl, crtc2_gen_cntl;
        uint32_t status;

        radeon_do_wait_for_idle(dev_priv);

        if (dev_priv->flags & RADEON_IS_IGP)
                return;

        old_mc_status = RADEON_READ(RADEON_MC_STATUS);

        /* stop display and memory access */
        ov0_scale_cntl = RADEON_READ(RADEON_OV0_SCALE_CNTL);
        RADEON_WRITE(RADEON_OV0_SCALE_CNTL, ov0_scale_cntl & ~RADEON_SCALER_ENABLE);
        crtc_ext_cntl = RADEON_READ(RADEON_CRTC_EXT_CNTL);
        RADEON_WRITE(RADEON_CRTC_EXT_CNTL, crtc_ext_cntl | RADEON_CRTC_DISPLAY_DIS);
        crtc_gen_cntl = RADEON_READ(RADEON_CRTC_GEN_CNTL);

        radeon_wait_for_vsync(dev);

        RADEON_WRITE(RADEON_CRTC_GEN_CNTL,
                     (crtc_gen_cntl & ~(RADEON_CRTC_CUR_EN | RADEON_CRTC_ICON_EN)) |
                     RADEON_CRTC_DISP_REQ_EN_B | RADEON_CRTC_EXT_DISP_EN);

        if (!(dev_priv->flags & RADEON_SINGLE_CRTC)) {
                crtc2_gen_cntl = RADEON_READ(RADEON_CRTC2_GEN_CNTL);

                radeon_wait_for_vsync2(dev);
                RADEON_WRITE(RADEON_CRTC2_GEN_CNTL,
                             (crtc2_gen_cntl &
                              ~(RADEON_CRTC2_CUR_EN | RADEON_CRTC2_ICON_EN)) |
                             RADEON_CRTC2_DISP_REQ_EN_B);
        }

        if (radeon_is_r300(dev_priv))
                status_idle = R300_MC_IDLE;
        else
                status_idle = RADEON_MC_IDLE;

        status = radeon_busy_wait(dev, RADEON_MC_STATUS, status_idle, 200000);
        if (status == 0xffffffff) {
                DRM_ERROR("Timeout waiting for memory controller to update settings\n");
                DRM_ERROR("Bad things may or may not happen\n");
        }
}

void radeon_init_memory_map(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        u32 mem_size, aper_size;
        u32 aper0_base;

        dev_priv->mc_fb_location = radeon_read_fb_location(dev_priv);
        radeon_read_agp_location(dev_priv, &dev_priv->mc_agp_loc_lo, &dev_priv->mc_agp_loc_hi);

        if (dev_priv->chip_family >= CHIP_R600) {
                mem_size = RADEON_READ(R600_CONFIG_MEMSIZE);
                aper_size = RADEON_READ(R600_CONFIG_APER_SIZE);
        } else {
                mem_size = RADEON_READ(RADEON_CONFIG_MEMSIZE);
                aper_size = RADEON_READ(RADEON_CONFIG_APER_SIZE);
        }

        /* M6s report illegal memory size */
        if (mem_size == 0)
                mem_size = 8 * 1024 * 1024;

        /* for RN50/M6/M7 - Novell bug 204882 */
        if (aper_size > mem_size)
                mem_size = aper_size;

        if ((dev_priv->chip_family != CHIP_RS600) &&
            (dev_priv->chip_family != CHIP_RS690) &&
            (dev_priv->chip_family != CHIP_RS740)) {
                if (dev_priv->flags & RADEON_IS_IGP)
                        dev_priv->mc_fb_location = RADEON_READ(RADEON_NB_TOM);
                else {
                        if (dev_priv->chip_family >= CHIP_R600)
                                aper0_base = RADEON_READ(R600_CONFIG_F0_BASE);
                        else
                                aper0_base = RADEON_READ(RADEON_CONFIG_APER_0_BASE);

                        /* Some chips have an "issue" with the memory controller, the
                         * location must be aligned to the size. We just align it down,
                         * too bad if we walk over the top of system memory, we don't
                         * use DMA without a remapping anyway.
                         * Affected chips are rv280, all r3xx, and all r4xx, but not IGP
                         */
                        if (dev_priv->chip_family == CHIP_RV280 ||
                            dev_priv->chip_family == CHIP_R300 ||
                            dev_priv->chip_family == CHIP_R350 ||
                            dev_priv->chip_family == CHIP_RV350 ||
                            dev_priv->chip_family == CHIP_RV380 ||
                            dev_priv->chip_family == CHIP_R420 ||
                            dev_priv->chip_family == CHIP_R423 ||
                            dev_priv->chip_family == CHIP_RV410)
                                aper0_base &= ~(mem_size - 1);
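                        /*
                         * Example (illustrative): with 128MB of VRAM
                         * (mem_size = 0x08000000), a BIOS-assigned aperture
                         * at 0xd4000000 is aligned down to 0xd0000000;
                         * mem_size must be a power of two for the mask
                         * above to work.
                         */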

                        if (dev_priv->chip_family >= CHIP_R600) {
                                dev_priv->mc_fb_location = (aper0_base >> 24) |
                                        (((aper0_base + mem_size - 1) & 0xff000000U) >> 8);
                        } else {
                                dev_priv->mc_fb_location = (aper0_base >> 16) |
                                        ((aper0_base + mem_size - 1) & 0xffff0000U);
                        }
                }
        }

        if (dev_priv->chip_family >= CHIP_R600)
                dev_priv->fb_location = (dev_priv->mc_fb_location & 0xffff) << 24;
        else
                dev_priv->fb_location = (dev_priv->mc_fb_location & 0xffff) << 16;

        /* updating mc regs here */
        if (radeon_is_avivo(dev_priv))
                avivo_disable_mc_clients(dev);
        else
                legacy_disable_mc_clients(dev);

        radeon_write_fb_location(dev_priv, dev_priv->mc_fb_location);

        if (radeon_is_avivo(dev_priv)) {
                if (dev_priv->chip_family >= CHIP_R600)
                        RADEON_WRITE(R600_HDP_NONSURFACE_BASE, (dev_priv->mc_fb_location << 16) & 0xff0000);
                else
                        RADEON_WRITE(AVIVO_HDP_FB_LOCATION, dev_priv->mc_fb_location);
        }

        if (dev_priv->chip_family >= CHIP_R600) {
                dev_priv->fb_location = (radeon_read_fb_location(dev_priv) & 0xffffff) << 24;
                dev_priv->fb_size = ((radeon_read_fb_location(dev_priv) & 0xff000000u) + 0x1000000)
                        - dev_priv->fb_location;
        } else {
                dev_priv->fb_location = (radeon_read_fb_location(dev_priv) & 0xffff) << 16;
                dev_priv->fb_size =
                        ((radeon_read_fb_location(dev_priv) & 0xffff0000u) + 0x10000)
                        - dev_priv->fb_location;
        }

        /* add an MTRR for the VRAM */
        dev_priv->aper_size = aper_size;
        dev_priv->vram_mtrr = mtrr_add(dev_priv->fb_aper_offset, dev_priv->aper_size, MTRR_TYPE_WRCOMB, 1);
}

/* init memory manager - start with all of VRAM and a 32MB GART aperture for now */
int radeon_gem_mm_init(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        u32 pg_offset;
        int ret;

        /* init TTM underneath */
        drm_bo_driver_init(dev);

        /* use the uncached allocator */
        dev->bm.allocator_type = _DRM_BM_ALLOCATOR_UNCACHED;

        /* size the mappable VRAM memory for now */
        radeon_vram_setup(dev);

        radeon_init_memory_map(dev);

#define VRAM_RESERVE_TEXT (256*1024) /* need to reserve 256k for text mode for now */
        dev_priv->mm.vram_visible -= VRAM_RESERVE_TEXT;
        pg_offset = VRAM_RESERVE_TEXT >> PAGE_SHIFT;
        drm_bo_init_mm(dev, DRM_BO_MEM_VRAM, pg_offset, /*dev_priv->mm.vram_offset >> PAGE_SHIFT,*/
                       ((dev_priv->mm.vram_visible) >> PAGE_SHIFT) - 16,
                       1);

        if (dev_priv->chip_family > CHIP_R600) {
                dev_priv->mm_enabled = true;
                return 0;
        }

        dev_priv->mm.gart_size = (32 * 1024 * 1024);
        dev_priv->mm.gart_start = 0;
        dev_priv->mm.gart_useable = dev_priv->mm.gart_size;
        ret = radeon_gart_init(dev);
        if (ret)
                return -EINVAL;

        drm_bo_init_mm(dev, DRM_BO_MEM_TT, 0,
                       dev_priv->mm.gart_size >> PAGE_SHIFT,
                       1);

        /* need to allocate some objects in the GART */
        /* ring + ring read ptr */
        ret = radeon_alloc_gart_objects(dev);
        if (ret) {
                radeon_gem_mm_fini(dev);
                return -EINVAL;
        }

        dev_priv->mm_enabled = true;
        return 0;
}

void radeon_gem_mm_fini(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;

        radeon_gem_dma_bufs_destroy(dev);
        radeon_gem_ib_destroy(dev);

        mutex_lock(&dev->struct_mutex);

        if (dev_priv->mm.ring_read.bo) {
                drm_bo_kunmap(&dev_priv->mm.ring_read.kmap);
                drm_bo_usage_deref_locked(&dev_priv->mm.ring_read.bo);
        }

        if (dev_priv->mm.ring.bo) {
                drm_bo_kunmap(&dev_priv->mm.ring.kmap);
                drm_bo_usage_deref_locked(&dev_priv->mm.ring.bo);
        }

        if (drm_bo_clean_mm(dev, DRM_BO_MEM_TT, 1)) {
                DRM_DEBUG("delaying takedown of TTM memory\n");
        }

        if (dev_priv->flags & RADEON_IS_PCIE) {
                if (dev_priv->mm.pcie_table_backup) {
                        kfree(dev_priv->mm.pcie_table_backup);
                        dev_priv->mm.pcie_table_backup = NULL;
                }
                if (dev_priv->mm.pcie_table.bo) {
                        drm_bo_kunmap(&dev_priv->mm.pcie_table.kmap);
                        drm_bo_usage_deref_locked(&dev_priv->mm.pcie_table.bo);
                }
        }

        if (drm_bo_clean_mm(dev, DRM_BO_MEM_VRAM, 1)) {
                DRM_DEBUG("delaying takedown of VRAM memory\n");
        }

        if (dev_priv->vram_mtrr)
                mtrr_del(dev_priv->vram_mtrr, dev_priv->fb_aper_offset, dev_priv->aper_size);
        mutex_unlock(&dev->struct_mutex);

        drm_bo_driver_finish(dev);
        dev_priv->mm_enabled = false;
}

int radeon_gem_object_pin(struct drm_gem_object *obj,
                          uint32_t alignment, uint32_t pin_domain)
{
        struct drm_radeon_gem_object *obj_priv;
        uint32_t flags = DRM_BO_FLAG_NO_EVICT;
        uint32_t mask = DRM_BO_FLAG_NO_EVICT;
        int ret;

        obj_priv = obj->driver_private;

        if (pin_domain) {
                mask |= DRM_BO_MASK_MEM;
                if (pin_domain == RADEON_GEM_DOMAIN_GTT)
                        flags |= DRM_BO_FLAG_MEM_TT;
                else if (pin_domain == RADEON_GEM_DOMAIN_VRAM)
                        flags |= DRM_BO_FLAG_MEM_VRAM;
                else
                        return -EINVAL;
        }

        ret = drm_bo_do_validate(obj_priv->bo, flags, mask,
                                 DRM_BO_HINT_DONT_FENCE, 0);
        return ret;
}

int radeon_gem_object_unpin(struct drm_gem_object *obj)
{
        struct drm_radeon_gem_object *obj_priv;
        int ret;

        obj_priv = obj->driver_private;

        ret = drm_bo_do_validate(obj_priv->bo, 0, DRM_BO_FLAG_NO_EVICT,
                                 DRM_BO_HINT_DONT_FENCE, 0);
        return ret;
}

#define RADEON_IB_MEMORY (1*1024*1024)
#define RADEON_IB_SIZE (65536)

#define RADEON_NUM_IB (RADEON_IB_MEMORY / RADEON_IB_SIZE)

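/*
 * 1MB of IB memory split into 64k IBs gives RADEON_NUM_IB == 16, which is
 * why a simple bitmask (ib_alloc_bitmap) is enough to track which IBs are
 * in flight.
 */
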
int radeon_gem_ib_get(struct drm_radeon_cs_parser *parser)
{
        int i, index = -1;
        int ret;
        drm_radeon_private_t *dev_priv = parser->dev->dev_private;

        for (i = 0; i < RADEON_NUM_IB; i++) {
                if (!(dev_priv->ib_alloc_bitmap & (1 << i))) {
                        index = i;
                        break;
                }
        }

        /* if all in use we need to wait */
        if (index == -1) {
                for (i = 0; i < RADEON_NUM_IB; i++) {
                        if (dev_priv->ib_alloc_bitmap & (1 << i)) {
                                mutex_lock(&dev_priv->ib_objs[i]->bo->mutex);
                                ret = drm_bo_wait(dev_priv->ib_objs[i]->bo, 0, 1, 0, 0);
                                mutex_unlock(&dev_priv->ib_objs[i]->bo->mutex);
                                if (ret)
                                        continue;
                                dev_priv->ib_alloc_bitmap &= ~(1 << i);
                                index = i;
                                break;
                        }
                }
        }

        if (index == -1) {
                DRM_ERROR("Failed to allocate IB from freelist %llx\n", dev_priv->ib_alloc_bitmap);
                return -EINVAL;
        }

        if (parser->chunks[parser->ib_index].length_dw > RADEON_IB_SIZE / sizeof(uint32_t))
                return -EINVAL;

        ret = drm_bo_do_validate(dev_priv->ib_objs[index]->bo, 0,
                                 DRM_BO_FLAG_NO_EVICT,
                                 0, 0);
        if (ret) {
                DRM_ERROR("Failed to validate IB %d\n", index);
                return -EINVAL;
        }

        parser->ib = dev_priv->ib_objs[index]->kmap.virtual;
        parser->card_offset = dev_priv->gart_vm_start + dev_priv->ib_objs[index]->bo->offset;
        dev_priv->ib_alloc_bitmap |= (1 << index);
        return 0;
}

static void radeon_gem_ib_free(struct drm_radeon_cs_parser *parser)
{
        struct drm_device *dev = parser->dev;
        drm_radeon_private_t *dev_priv = dev->dev_private;
        struct drm_fence_object *fence;
        int ret;
        int i;

        for (i = 0; i < RADEON_NUM_IB; i++) {
                if (dev_priv->ib_objs[i]->kmap.virtual == parser->ib) {
                        /* emit a fence object */
                        ret = drm_fence_buffer_objects(dev, NULL, 0, NULL, &fence);
                        dev_priv->irq_emitted = 0;
                        if (ret) {
                                drm_putback_buffer_objects(dev);
                        }
                        /* dereference the fence object */
                        if (fence)
                                drm_fence_usage_deref_unlocked(&fence);
                        break;
                }
        }
}

static int radeon_gem_ib_destroy(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        int i;

        if (dev_priv->ib_objs) {
                for (i = 0; i < RADEON_NUM_IB; i++) {
                        if (dev_priv->ib_objs[i]) {
                                drm_bo_kunmap(&dev_priv->ib_objs[i]->kmap);
                                drm_bo_usage_deref_unlocked(&dev_priv->ib_objs[i]->bo);
                        }
                        drm_free(dev_priv->ib_objs[i], sizeof(struct radeon_mm_obj), DRM_MEM_DRIVER);
                }
                drm_free(dev_priv->ib_objs, RADEON_NUM_IB * sizeof(struct radeon_mm_obj *), DRM_MEM_DRIVER);
        }
        dev_priv->ib_objs = NULL;
        return 0;
}

static int radeon_gem_find_reloc(struct drm_radeon_cs_parser *parser,
                                 uint32_t offset, uint32_t *handle,
                                 uint32_t *read_domains, uint32_t *write_domain)
{
        struct drm_device *dev = parser->dev;
        drm_radeon_private_t *dev_priv = dev->dev_private;
        struct drm_radeon_kernel_chunk *reloc_chunk = &parser->chunks[parser->reloc_index];

        if (!reloc_chunk->kdata)
                return -EINVAL;

        if (offset > reloc_chunk->length_dw) {
                DRM_ERROR("Offset larger than chunk %d %d\n", offset, reloc_chunk->length_dw);
                return -EINVAL;
        }

        *handle = reloc_chunk->kdata[offset];
        *read_domains = reloc_chunk->kdata[offset + 1];
        *write_domain = reloc_chunk->kdata[offset + 2];
        return 0;
}

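/*
 * Layout of a reloc as consumed below: reloc[1] is either a GEM handle
 * directly (old-style, parser->reloc_index == -1) or an offset into the
 * separate reloc chunk, in which case the chunk supplies the handle, the
 * read domains and the write domain as three consecutive dwords.
 */
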
static int radeon_gem_relocate(struct drm_radeon_cs_parser *parser,
                               uint32_t *reloc, uint32_t *offset)
{
        struct drm_device *dev = parser->dev;
        drm_radeon_private_t *dev_priv = dev->dev_private;
        /* relocate the handle */
        uint32_t read_domains, write_domain;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;
        uint32_t flags = 0;
        uint32_t handle;
        int ret;

        if (parser->reloc_index == -1) {
                obj = drm_gem_object_lookup(dev, parser->file_priv, reloc[1]);
                if (!obj)
                        return -EINVAL;
                read_domains = reloc[2];
                write_domain = reloc[3];
        } else {
                /* have to lookup handle in other chunk */
                ret = radeon_gem_find_reloc(parser, reloc[1], &handle,
                                            &read_domains, &write_domain);
                if (ret)
                        return ret;

                obj = drm_gem_object_lookup(dev, parser->file_priv, handle);
                if (!obj)
                        return -EINVAL;
        }

        obj_priv = obj->driver_private;
        radeon_gem_set_domain(obj, read_domains, write_domain, &flags, false);

        obj_priv->bo->mem.flags &= ~DRM_BO_FLAG_CLEAN;
        obj_priv->bo->mem.proposed_flags &= ~DRM_BO_FLAG_CLEAN;

        if (flags == DRM_BO_FLAG_MEM_VRAM)
                *offset = obj_priv->bo->offset + dev_priv->fb_location;
        else if (flags == DRM_BO_FLAG_MEM_TT)
                *offset = obj_priv->bo->offset + dev_priv->gart_vm_start;

        /* BAD BAD BAD - LINKED LIST THE OBJS and UNREF ONCE IB is SUBMITTED */
        drm_gem_object_unreference(obj);
        return 0;
}

/* allocate 1MB of 64k IBs that the kernel can keep mapped */
static int radeon_gem_ib_init(struct drm_device *dev)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        int i;
        int ret;

        dev_priv->ib_objs = drm_calloc(RADEON_NUM_IB, sizeof(struct radeon_mm_obj *), DRM_MEM_DRIVER);
        if (!dev_priv->ib_objs)
                goto free_all;

        for (i = 0; i < RADEON_NUM_IB; i++) {
                dev_priv->ib_objs[i] = drm_calloc(1, sizeof(struct radeon_mm_obj), DRM_MEM_DRIVER);
                if (!dev_priv->ib_objs[i])
                        goto free_all;

                ret = drm_buffer_object_create(dev, RADEON_IB_SIZE,
                                               drm_bo_type_kernel,
                                               DRM_BO_FLAG_READ | DRM_BO_FLAG_MEM_TT |
                                               DRM_BO_FLAG_MAPPABLE, 0,
                                               0, 0, &dev_priv->ib_objs[i]->bo);
                if (ret)
                        goto free_all;

                ret = drm_bo_kmap(dev_priv->ib_objs[i]->bo, 0, RADEON_IB_SIZE >> PAGE_SHIFT,
                                  &dev_priv->ib_objs[i]->kmap);
                if (ret)
                        goto free_all;
        }

        dev_priv->mm.gart_useable -= RADEON_IB_SIZE * RADEON_NUM_IB;
        dev_priv->ib_alloc_bitmap = 0;

        dev_priv->cs.ib_get = radeon_gem_ib_get;
        dev_priv->cs.ib_free = radeon_gem_ib_free;

        radeon_cs_init(dev);
        dev_priv->cs.relocate = radeon_gem_relocate;
        return 0;

free_all:
        radeon_gem_ib_destroy(dev);
        return -ENOMEM;
}

#define RADEON_DMA_BUFFER_SIZE (64 * 1024)
#define RADEON_DMA_BUFFER_COUNT (16)

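/*
 * 16 buffers of 64k each - the whole pool lives in a single 1MB BO pinned
 * into the GART, which radeon_gem_addbufs() below carves up into
 * individual drm_bufs.
 */
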
/**
 * Cleanup after an error on one of the addbufs() functions.
 *
 * \param dev DRM device.
 * \param entry buffer entry where the error occurred.
 *
 * Frees any pages and buffers associated with the given entry.
 */
static void drm_cleanup_buf_error(struct drm_device *dev,
                                  struct drm_buf_entry *entry)
{
        int i;

        if (entry->seg_count) {
                for (i = 0; i < entry->seg_count; i++) {
                        if (entry->seglist[i]) {
                                drm_pci_free(dev, entry->seglist[i]);
                        }
                }
                drm_free(entry->seglist,
                         entry->seg_count *
                         sizeof(*entry->seglist), DRM_MEM_SEGS);

                entry->seg_count = 0;
        }

        if (entry->buf_count) {
                for (i = 0; i < entry->buf_count; i++) {
                        if (entry->buflist[i].dev_private) {
                                drm_free(entry->buflist[i].dev_private,
                                         entry->buflist[i].dev_priv_size,
                                         DRM_MEM_BUFS);
                        }
                }
                drm_free(entry->buflist,
                         entry->buf_count *
                         sizeof(*entry->buflist), DRM_MEM_BUFS);

                entry->buf_count = 0;
        }
}

static int radeon_gem_addbufs(struct drm_device *dev)
{
        struct drm_radeon_private *dev_priv = dev->dev_private;
        struct drm_device_dma *dma = dev->dma;
        struct drm_buf_entry *entry;
        struct drm_buf *buf;
        unsigned long offset;
        unsigned long agp_offset;
        int count;
        int order;
        int size;
        int alignment;
        int page_order;
        int total;
        int byte_count;
        int i;
        struct drm_buf **temp_buflist;

        if (!dma)
                return -EINVAL;

        count = RADEON_DMA_BUFFER_COUNT;
        order = drm_order(RADEON_DMA_BUFFER_SIZE);
        size = 1 << order;

        alignment = PAGE_ALIGN(size);
        page_order = order - PAGE_SHIFT > 0 ? order - PAGE_SHIFT : 0;
        total = PAGE_SIZE << page_order;
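        /*
         * With RADEON_DMA_BUFFER_SIZE = 64k and 4k pages this works out to
         * order = 16, size = alignment = 64k, page_order = 4 and
         * total = 64k, i.e. each buffer is a naturally aligned 16-page
         * chunk (illustrative for PAGE_SHIFT == 12).
         */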

        byte_count = 0;
        agp_offset = dev_priv->mm.dma_bufs.bo->offset;

        DRM_DEBUG("count: %d\n", count);
        DRM_DEBUG("order: %d\n", order);
        DRM_DEBUG("size: %d\n", size);
        DRM_DEBUG("agp_offset: %lu\n", agp_offset);
        DRM_DEBUG("alignment: %d\n", alignment);
        DRM_DEBUG("page_order: %d\n", page_order);
        DRM_DEBUG("total: %d\n", total);

        if (order < DRM_MIN_ORDER || order > DRM_MAX_ORDER)
                return -EINVAL;
        if (dev->queue_count)
                return -EBUSY;  /* Not while in use */

        spin_lock(&dev->count_lock);
        if (dev->buf_use) {
                spin_unlock(&dev->count_lock);
                return -EBUSY;
        }
        atomic_inc(&dev->buf_alloc);
        spin_unlock(&dev->count_lock);

        mutex_lock(&dev->struct_mutex);
        entry = &dma->bufs[order];
        if (entry->buf_count) {
                mutex_unlock(&dev->struct_mutex);
                atomic_dec(&dev->buf_alloc);
                return -ENOMEM; /* May only call once for each order */
        }

        if (count < 0 || count > 4096) {
                mutex_unlock(&dev->struct_mutex);
                atomic_dec(&dev->buf_alloc);
                return -EINVAL;
        }

        entry->buflist = drm_alloc(count * sizeof(*entry->buflist),
                                   DRM_MEM_BUFS);
        if (!entry->buflist) {
                mutex_unlock(&dev->struct_mutex);
                atomic_dec(&dev->buf_alloc);
                return -ENOMEM;
        }
        memset(entry->buflist, 0, count * sizeof(*entry->buflist));

        entry->buf_size = size;
        entry->page_order = page_order;

        offset = 0;

        while (entry->buf_count < count) {
                buf = &entry->buflist[entry->buf_count];
                buf->idx = dma->buf_count + entry->buf_count;
                buf->total = alignment;
                buf->order = order;
                buf->used = 0;

                buf->offset = (dma->byte_count + offset);
                buf->bus_address = dev_priv->gart_vm_start + agp_offset + offset;
                buf->address = (void *)(agp_offset + offset);
                buf->next = NULL;
                buf->waiting = 0;
                buf->pending = 0;
                init_waitqueue_head(&buf->dma_wait);
                buf->file_priv = NULL;

                buf->dev_priv_size = dev->driver->dev_priv_size;
                buf->dev_private = drm_alloc(buf->dev_priv_size, DRM_MEM_BUFS);
                if (!buf->dev_private) {
                        /* Set count correctly so we free the proper amount. */
                        entry->buf_count = count;
                        drm_cleanup_buf_error(dev, entry);
                        mutex_unlock(&dev->struct_mutex);
                        atomic_dec(&dev->buf_alloc);
                        return -ENOMEM;
                }

                memset(buf->dev_private, 0, buf->dev_priv_size);

                DRM_DEBUG("buffer %d @ %p\n", entry->buf_count, buf->address);

                offset += alignment;
                entry->buf_count++;
                byte_count += PAGE_SIZE << page_order;
        }

        DRM_DEBUG("byte_count: %d\n", byte_count);

        temp_buflist = drm_realloc(dma->buflist,
                                   dma->buf_count * sizeof(*dma->buflist),
                                   (dma->buf_count + entry->buf_count)
                                   * sizeof(*dma->buflist), DRM_MEM_BUFS);
        if (!temp_buflist) {
                /* Free the entry because it isn't valid */
                drm_cleanup_buf_error(dev, entry);
                mutex_unlock(&dev->struct_mutex);
                atomic_dec(&dev->buf_alloc);
                return -ENOMEM;
        }
        dma->buflist = temp_buflist;

        for (i = 0; i < entry->buf_count; i++) {
                dma->buflist[i + dma->buf_count] = &entry->buflist[i];
        }

        dma->buf_count += entry->buf_count;
        dma->seg_count += entry->seg_count;
        dma->page_count += byte_count >> PAGE_SHIFT;
        dma->byte_count += byte_count;

        DRM_DEBUG("dma->buf_count : %d\n", dma->buf_count);
        DRM_DEBUG("entry->buf_count : %d\n", entry->buf_count);

        mutex_unlock(&dev->struct_mutex);

        dma->flags = _DRM_DMA_USE_SG;
        atomic_dec(&dev->buf_alloc);
        return 0;
}

static int radeon_gem_dma_bufs_init(struct drm_device *dev)
{
        struct drm_radeon_private *dev_priv = dev->dev_private;
        int size = RADEON_DMA_BUFFER_SIZE * RADEON_DMA_BUFFER_COUNT;
        int ret;

        ret = drm_dma_setup(dev);
        if (ret < 0)
                return ret;

        ret = drm_buffer_object_create(dev, size, drm_bo_type_kernel,
                                       DRM_BO_FLAG_READ | DRM_BO_FLAG_WRITE | DRM_BO_FLAG_NO_EVICT |
                                       DRM_BO_FLAG_MEM_TT | DRM_BO_FLAG_MAPPABLE, 0,
                                       0, 0, &dev_priv->mm.dma_bufs.bo);
        if (ret) {
                DRM_ERROR("Failed to create DMA bufs\n");
                return -ENOMEM;
        }

        ret = drm_bo_kmap(dev_priv->mm.dma_bufs.bo, 0, size >> PAGE_SHIFT,
                          &dev_priv->mm.dma_bufs.kmap);
        if (ret) {
                DRM_ERROR("Failed to map DMA buffers\n");
                return -ENOMEM;
        }
        dev_priv->mm.gart_useable -= size;

        radeon_gem_addbufs(dev);

        DRM_DEBUG("%lx %d\n", dev_priv->mm.dma_bufs.bo->map_list.hash.key, size);
        dev->agp_buffer_token = dev_priv->mm.dma_bufs.bo->map_list.hash.key << PAGE_SHIFT;
        dev_priv->mm.fake_agp_map.handle = dev_priv->mm.dma_bufs.kmap.virtual;
        dev_priv->mm.fake_agp_map.size = size;

        dev->agp_buffer_map = &dev_priv->mm.fake_agp_map;
        dev_priv->gart_buffers_offset = dev_priv->mm.dma_bufs.bo->offset + dev_priv->gart_vm_start;
        return 0;
}

static void radeon_gem_dma_bufs_destroy(struct drm_device *dev)
{
        struct drm_radeon_private *dev_priv = dev->dev_private;

        drm_dma_takedown(dev);

        if (dev_priv->mm.dma_bufs.bo) {
                drm_bo_kunmap(&dev_priv->mm.dma_bufs.kmap);
                drm_bo_usage_deref_unlocked(&dev_priv->mm.dma_bufs.bo);
        }
}

static struct drm_gem_object *gem_object_get(struct drm_device *dev, uint32_t name)
{
        struct drm_gem_object *obj;

        spin_lock(&dev->object_name_lock);
        obj = idr_find(&dev->object_name_idr, name);
        if (obj)
                drm_gem_object_reference(obj);
        spin_unlock(&dev->object_name_lock);
        return obj;
}

void radeon_gem_update_offsets(struct drm_device *dev, struct drm_master *master)
{
        drm_radeon_private_t *dev_priv = dev->dev_private;
        struct drm_radeon_master_private *master_priv = master->driver_priv;
        drm_radeon_sarea_t *sarea_priv = master_priv->sarea_priv;
        struct drm_gem_object *obj;
        struct drm_radeon_gem_object *obj_priv;

        /* update front_pitch_offset and back_pitch_offset */
        obj = gem_object_get(dev, sarea_priv->front_handle);
        if (obj) {
                obj_priv = obj->driver_private;

                dev_priv->front_offset = obj_priv->bo->offset;
                dev_priv->front_pitch_offset = (((sarea_priv->front_pitch / 64) << 22) |
                                                ((obj_priv->bo->offset
                                                  + dev_priv->fb_location) >> 10));
                drm_gem_object_unreference(obj);
        }
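        /*
         * The encoding above matches the usual radeon pitch/offset register
         * format: the card-relative address in 1k units in the low 22 bits
         * and the pitch in 64-byte units above it.
         */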

        obj = gem_object_get(dev, sarea_priv->back_handle);
        if (obj) {
                obj_priv = obj->driver_private;
                dev_priv->back_offset = obj_priv->bo->offset;
                dev_priv->back_pitch_offset = (((sarea_priv->back_pitch / 64) << 22) |
                                               ((obj_priv->bo->offset
                                                 + dev_priv->fb_location) >> 10));
                drm_gem_object_unreference(obj);
        }

        dev_priv->color_fmt = RADEON_COLOR_FORMAT_ARGB8888;
}