1 /*
2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 *
24 * Authors: Dave Airlie
25 * Alex Deucher
26 * Jerome Glisse
27 */
28 #include <linux/seq_file.h>
29 #include <linux/slab.h>
30 #include "drmP.h"
31 #include "radeon_drm.h"
32 #include "radeon_reg.h"
33 #include "radeon.h"
34 #include "atom.h"
35
36 int radeon_debugfs_ib_init(struct radeon_device *rdev);
37 int radeon_debugfs_ring_init(struct radeon_device *rdev);
38
radeon_get_ib_value(struct radeon_cs_parser * p,int idx)39 u32 radeon_get_ib_value(struct radeon_cs_parser *p, int idx)
40 {
41 struct radeon_cs_chunk *ibc = &p->chunks[p->chunk_ib_idx];
42 u32 pg_idx, pg_offset;
43 u32 idx_value = 0;
44 int new_page;
45
46 pg_idx = (idx * 4) / PAGE_SIZE;
47 pg_offset = (idx * 4) % PAGE_SIZE;
48
49 if (ibc->kpage_idx[0] == pg_idx)
50 return ibc->kpage[0][pg_offset/4];
51 if (ibc->kpage_idx[1] == pg_idx)
52 return ibc->kpage[1][pg_offset/4];
53
54 new_page = radeon_cs_update_pages(p, pg_idx);
55 if (new_page < 0) {
56 p->parser_error = new_page;
57 return 0;
58 }
59
60 idx_value = ibc->kpage[new_page][pg_offset/4];
61 return idx_value;
62 }
63
radeon_ring_write(struct radeon_ring * ring,uint32_t v)64 void radeon_ring_write(struct radeon_ring *ring, uint32_t v)
65 {
66 #if DRM_DEBUG_CODE
67 if (ring->count_dw <= 0) {
68 DRM_ERROR("radeon: writting more dword to ring than expected !\n");
69 }
70 #endif
71 ring->ring[ring->wptr++] = v;
72 ring->wptr &= ring->ptr_mask;
73 ring->count_dw--;
74 ring->ring_free_dw--;
75 }
76
77 /*
78 * IB.
79 */
radeon_ib_try_free(struct radeon_device * rdev,struct radeon_ib * ib)80 bool radeon_ib_try_free(struct radeon_device *rdev, struct radeon_ib *ib)
81 {
82 bool done = false;
83
84 /* only free ib which have been emited */
85 if (ib->fence && ib->fence->emitted) {
86 if (radeon_fence_signaled(ib->fence)) {
87 radeon_fence_unref(&ib->fence);
88 radeon_sa_bo_free(rdev, &ib->sa_bo);
89 done = true;
90 }
91 }
92 return done;
93 }
94
radeon_ib_get(struct radeon_device * rdev,int ring,struct radeon_ib ** ib,unsigned size)95 int radeon_ib_get(struct radeon_device *rdev, int ring,
96 struct radeon_ib **ib, unsigned size)
97 {
98 struct radeon_fence *fence;
99 unsigned cretry = 0;
100 int r = 0, i, idx;
101
102 *ib = NULL;
103 /* align size on 256 bytes */
104 size = ALIGN(size, 256);
105
106 r = radeon_fence_create(rdev, &fence, ring);
107 if (r) {
108 dev_err(rdev->dev, "failed to create fence for new IB\n");
109 return r;
110 }
111
112 radeon_mutex_lock(&rdev->ib_pool.mutex);
113 idx = rdev->ib_pool.head_id;
114 retry:
115 if (cretry > 5) {
116 dev_err(rdev->dev, "failed to get an ib after 5 retry\n");
117 radeon_mutex_unlock(&rdev->ib_pool.mutex);
118 radeon_fence_unref(&fence);
119 return -ENOMEM;
120 }
121 cretry++;
122 for (i = 0; i < RADEON_IB_POOL_SIZE; i++) {
123 radeon_ib_try_free(rdev, &rdev->ib_pool.ibs[idx]);
124 if (rdev->ib_pool.ibs[idx].fence == NULL) {
125 r = radeon_sa_bo_new(rdev, &rdev->ib_pool.sa_manager,
126 &rdev->ib_pool.ibs[idx].sa_bo,
127 size, 256);
128 if (!r) {
129 *ib = &rdev->ib_pool.ibs[idx];
130 (*ib)->ptr = rdev->ib_pool.sa_manager.cpu_ptr;
131 (*ib)->ptr += ((*ib)->sa_bo.offset >> 2);
132 (*ib)->gpu_addr = rdev->ib_pool.sa_manager.gpu_addr;
133 (*ib)->gpu_addr += (*ib)->sa_bo.offset;
134 (*ib)->fence = fence;
135 (*ib)->vm_id = 0;
136 (*ib)->is_const_ib = false;
137 /* ib are most likely to be allocated in a ring fashion
138 * thus rdev->ib_pool.head_id should be the id of the
139 * oldest ib
140 */
141 rdev->ib_pool.head_id = (1 + idx);
142 rdev->ib_pool.head_id &= (RADEON_IB_POOL_SIZE - 1);
143 radeon_mutex_unlock(&rdev->ib_pool.mutex);
144 return 0;
145 }
146 }
147 idx = (idx + 1) & (RADEON_IB_POOL_SIZE - 1);
148 }
149 /* this should be rare event, ie all ib scheduled none signaled yet.
150 */
151 for (i = 0; i < RADEON_IB_POOL_SIZE; i++) {
152 if (rdev->ib_pool.ibs[idx].fence && rdev->ib_pool.ibs[idx].fence->emitted) {
153 r = radeon_fence_wait(rdev->ib_pool.ibs[idx].fence, false);
154 if (!r) {
155 goto retry;
156 }
157 /* an error happened */
158 break;
159 }
160 idx = (idx + 1) & (RADEON_IB_POOL_SIZE - 1);
161 }
162 radeon_mutex_unlock(&rdev->ib_pool.mutex);
163 radeon_fence_unref(&fence);
164 return r;
165 }
166
radeon_ib_free(struct radeon_device * rdev,struct radeon_ib ** ib)167 void radeon_ib_free(struct radeon_device *rdev, struct radeon_ib **ib)
168 {
169 struct radeon_ib *tmp = *ib;
170
171 *ib = NULL;
172 if (tmp == NULL) {
173 return;
174 }
175 radeon_mutex_lock(&rdev->ib_pool.mutex);
176 if (tmp->fence && !tmp->fence->emitted) {
177 radeon_sa_bo_free(rdev, &tmp->sa_bo);
178 radeon_fence_unref(&tmp->fence);
179 }
180 radeon_mutex_unlock(&rdev->ib_pool.mutex);
181 }
182
radeon_ib_schedule(struct radeon_device * rdev,struct radeon_ib * ib)183 int radeon_ib_schedule(struct radeon_device *rdev, struct radeon_ib *ib)
184 {
185 struct radeon_ring *ring = &rdev->ring[ib->fence->ring];
186 int r = 0;
187
188 if (!ib->length_dw || !ring->ready) {
189 /* TODO: Nothings in the ib we should report. */
190 DRM_ERROR("radeon: couldn't schedule IB(%u).\n", ib->idx);
191 return -EINVAL;
192 }
193
194 /* 64 dwords should be enough for fence too */
195 r = radeon_ring_lock(rdev, ring, 64);
196 if (r) {
197 DRM_ERROR("radeon: scheduling IB failed (%d).\n", r);
198 return r;
199 }
200 radeon_ring_ib_execute(rdev, ib->fence->ring, ib);
201 radeon_fence_emit(rdev, ib->fence);
202 radeon_ring_unlock_commit(rdev, ring);
203 return 0;
204 }
205
radeon_ib_pool_init(struct radeon_device * rdev)206 int radeon_ib_pool_init(struct radeon_device *rdev)
207 {
208 struct radeon_sa_manager tmp;
209 int i, r;
210
211 r = radeon_sa_bo_manager_init(rdev, &tmp,
212 RADEON_IB_POOL_SIZE*64*1024,
213 RADEON_GEM_DOMAIN_GTT);
214 if (r) {
215 return r;
216 }
217
218 radeon_mutex_lock(&rdev->ib_pool.mutex);
219 if (rdev->ib_pool.ready) {
220 radeon_mutex_unlock(&rdev->ib_pool.mutex);
221 radeon_sa_bo_manager_fini(rdev, &tmp);
222 return 0;
223 }
224
225 rdev->ib_pool.sa_manager = tmp;
226 INIT_LIST_HEAD(&rdev->ib_pool.sa_manager.sa_bo);
227 for (i = 0; i < RADEON_IB_POOL_SIZE; i++) {
228 rdev->ib_pool.ibs[i].fence = NULL;
229 rdev->ib_pool.ibs[i].idx = i;
230 rdev->ib_pool.ibs[i].length_dw = 0;
231 INIT_LIST_HEAD(&rdev->ib_pool.ibs[i].sa_bo.list);
232 }
233 rdev->ib_pool.head_id = 0;
234 rdev->ib_pool.ready = true;
235 DRM_INFO("radeon: ib pool ready.\n");
236
237 if (radeon_debugfs_ib_init(rdev)) {
238 DRM_ERROR("Failed to register debugfs file for IB !\n");
239 }
240 if (radeon_debugfs_ring_init(rdev)) {
241 DRM_ERROR("Failed to register debugfs file for rings !\n");
242 }
243 radeon_mutex_unlock(&rdev->ib_pool.mutex);
244 return 0;
245 }
246
radeon_ib_pool_fini(struct radeon_device * rdev)247 void radeon_ib_pool_fini(struct radeon_device *rdev)
248 {
249 unsigned i;
250
251 radeon_mutex_lock(&rdev->ib_pool.mutex);
252 if (rdev->ib_pool.ready) {
253 for (i = 0; i < RADEON_IB_POOL_SIZE; i++) {
254 radeon_sa_bo_free(rdev, &rdev->ib_pool.ibs[i].sa_bo);
255 radeon_fence_unref(&rdev->ib_pool.ibs[i].fence);
256 }
257 radeon_sa_bo_manager_fini(rdev, &rdev->ib_pool.sa_manager);
258 rdev->ib_pool.ready = false;
259 }
260 radeon_mutex_unlock(&rdev->ib_pool.mutex);
261 }
262
radeon_ib_pool_start(struct radeon_device * rdev)263 int radeon_ib_pool_start(struct radeon_device *rdev)
264 {
265 return radeon_sa_bo_manager_start(rdev, &rdev->ib_pool.sa_manager);
266 }
267
radeon_ib_pool_suspend(struct radeon_device * rdev)268 int radeon_ib_pool_suspend(struct radeon_device *rdev)
269 {
270 return radeon_sa_bo_manager_suspend(rdev, &rdev->ib_pool.sa_manager);
271 }
272
273 /*
274 * Ring.
275 */
radeon_ring_index(struct radeon_device * rdev,struct radeon_ring * ring)276 int radeon_ring_index(struct radeon_device *rdev, struct radeon_ring *ring)
277 {
278 /* r1xx-r5xx only has CP ring */
279 if (rdev->family < CHIP_R600)
280 return RADEON_RING_TYPE_GFX_INDEX;
281
282 if (rdev->family >= CHIP_CAYMAN) {
283 if (ring == &rdev->ring[CAYMAN_RING_TYPE_CP1_INDEX])
284 return CAYMAN_RING_TYPE_CP1_INDEX;
285 else if (ring == &rdev->ring[CAYMAN_RING_TYPE_CP2_INDEX])
286 return CAYMAN_RING_TYPE_CP2_INDEX;
287 }
288 return RADEON_RING_TYPE_GFX_INDEX;
289 }
290
radeon_ring_free_size(struct radeon_device * rdev,struct radeon_ring * ring)291 void radeon_ring_free_size(struct radeon_device *rdev, struct radeon_ring *ring)
292 {
293 u32 rptr;
294
295 if (rdev->wb.enabled)
296 rptr = le32_to_cpu(rdev->wb.wb[ring->rptr_offs/4]);
297 else
298 rptr = RREG32(ring->rptr_reg);
299 ring->rptr = (rptr & ring->ptr_reg_mask) >> ring->ptr_reg_shift;
300 /* This works because ring_size is a power of 2 */
301 ring->ring_free_dw = (ring->rptr + (ring->ring_size / 4));
302 ring->ring_free_dw -= ring->wptr;
303 ring->ring_free_dw &= ring->ptr_mask;
304 if (!ring->ring_free_dw) {
305 ring->ring_free_dw = ring->ring_size / 4;
306 }
307 }
308
309
radeon_ring_alloc(struct radeon_device * rdev,struct radeon_ring * ring,unsigned ndw)310 int radeon_ring_alloc(struct radeon_device *rdev, struct radeon_ring *ring, unsigned ndw)
311 {
312 int r;
313
314 /* make sure we aren't trying to allocate more space than there is on the ring */
315 if (ndw > (ring->ring_size / 4))
316 return -ENOMEM;
317 /* Align requested size with padding so unlock_commit can
318 * pad safely */
319 ndw = (ndw + ring->align_mask) & ~ring->align_mask;
320 while (ndw > (ring->ring_free_dw - 1)) {
321 radeon_ring_free_size(rdev, ring);
322 if (ndw < ring->ring_free_dw) {
323 break;
324 }
325 r = radeon_fence_wait_next(rdev, radeon_ring_index(rdev, ring));
326 if (r)
327 return r;
328 }
329 ring->count_dw = ndw;
330 ring->wptr_old = ring->wptr;
331 return 0;
332 }
333
radeon_ring_lock(struct radeon_device * rdev,struct radeon_ring * ring,unsigned ndw)334 int radeon_ring_lock(struct radeon_device *rdev, struct radeon_ring *ring, unsigned ndw)
335 {
336 int r;
337
338 mutex_lock(&ring->mutex);
339 r = radeon_ring_alloc(rdev, ring, ndw);
340 if (r) {
341 mutex_unlock(&ring->mutex);
342 return r;
343 }
344 return 0;
345 }
346
radeon_ring_commit(struct radeon_device * rdev,struct radeon_ring * ring)347 void radeon_ring_commit(struct radeon_device *rdev, struct radeon_ring *ring)
348 {
349 unsigned count_dw_pad;
350 unsigned i;
351
352 /* We pad to match fetch size */
353 count_dw_pad = (ring->align_mask + 1) -
354 (ring->wptr & ring->align_mask);
355 for (i = 0; i < count_dw_pad; i++) {
356 radeon_ring_write(ring, ring->nop);
357 }
358 DRM_MEMORYBARRIER();
359 WREG32(ring->wptr_reg, (ring->wptr << ring->ptr_reg_shift) & ring->ptr_reg_mask);
360 (void)RREG32(ring->wptr_reg);
361 }
362
radeon_ring_unlock_commit(struct radeon_device * rdev,struct radeon_ring * ring)363 void radeon_ring_unlock_commit(struct radeon_device *rdev, struct radeon_ring *ring)
364 {
365 radeon_ring_commit(rdev, ring);
366 mutex_unlock(&ring->mutex);
367 }
368
radeon_ring_unlock_undo(struct radeon_device * rdev,struct radeon_ring * ring)369 void radeon_ring_unlock_undo(struct radeon_device *rdev, struct radeon_ring *ring)
370 {
371 ring->wptr = ring->wptr_old;
372 mutex_unlock(&ring->mutex);
373 }
374
radeon_ring_init(struct radeon_device * rdev,struct radeon_ring * ring,unsigned ring_size,unsigned rptr_offs,unsigned rptr_reg,unsigned wptr_reg,u32 ptr_reg_shift,u32 ptr_reg_mask,u32 nop)375 int radeon_ring_init(struct radeon_device *rdev, struct radeon_ring *ring, unsigned ring_size,
376 unsigned rptr_offs, unsigned rptr_reg, unsigned wptr_reg,
377 u32 ptr_reg_shift, u32 ptr_reg_mask, u32 nop)
378 {
379 int r;
380
381 ring->ring_size = ring_size;
382 ring->rptr_offs = rptr_offs;
383 ring->rptr_reg = rptr_reg;
384 ring->wptr_reg = wptr_reg;
385 ring->ptr_reg_shift = ptr_reg_shift;
386 ring->ptr_reg_mask = ptr_reg_mask;
387 ring->nop = nop;
388 /* Allocate ring buffer */
389 if (ring->ring_obj == NULL) {
390 r = radeon_bo_create(rdev, ring->ring_size, PAGE_SIZE, true,
391 RADEON_GEM_DOMAIN_GTT,
392 &ring->ring_obj);
393 if (r) {
394 dev_err(rdev->dev, "(%d) ring create failed\n", r);
395 return r;
396 }
397 r = radeon_bo_reserve(ring->ring_obj, false);
398 if (unlikely(r != 0))
399 return r;
400 r = radeon_bo_pin(ring->ring_obj, RADEON_GEM_DOMAIN_GTT,
401 &ring->gpu_addr);
402 if (r) {
403 radeon_bo_unreserve(ring->ring_obj);
404 dev_err(rdev->dev, "(%d) ring pin failed\n", r);
405 return r;
406 }
407 r = radeon_bo_kmap(ring->ring_obj,
408 (void **)&ring->ring);
409 radeon_bo_unreserve(ring->ring_obj);
410 if (r) {
411 dev_err(rdev->dev, "(%d) ring map failed\n", r);
412 return r;
413 }
414 }
415 ring->ptr_mask = (ring->ring_size / 4) - 1;
416 ring->ring_free_dw = ring->ring_size / 4;
417 return 0;
418 }
419
radeon_ring_fini(struct radeon_device * rdev,struct radeon_ring * ring)420 void radeon_ring_fini(struct radeon_device *rdev, struct radeon_ring *ring)
421 {
422 int r;
423 struct radeon_bo *ring_obj;
424
425 mutex_lock(&ring->mutex);
426 ring_obj = ring->ring_obj;
427 ring->ring = NULL;
428 ring->ring_obj = NULL;
429 mutex_unlock(&ring->mutex);
430
431 if (ring_obj) {
432 r = radeon_bo_reserve(ring_obj, false);
433 if (likely(r == 0)) {
434 radeon_bo_kunmap(ring_obj);
435 radeon_bo_unpin(ring_obj);
436 radeon_bo_unreserve(ring_obj);
437 }
438 radeon_bo_unref(&ring_obj);
439 }
440 }
441
442 /*
443 * Debugfs info
444 */
445 #if defined(CONFIG_DEBUG_FS)
446
radeon_debugfs_ring_info(struct seq_file * m,void * data)447 static int radeon_debugfs_ring_info(struct seq_file *m, void *data)
448 {
449 struct drm_info_node *node = (struct drm_info_node *) m->private;
450 struct drm_device *dev = node->minor->dev;
451 struct radeon_device *rdev = dev->dev_private;
452 int ridx = *(int*)node->info_ent->data;
453 struct radeon_ring *ring = &rdev->ring[ridx];
454 unsigned count, i, j;
455
456 radeon_ring_free_size(rdev, ring);
457 count = (ring->ring_size / 4) - ring->ring_free_dw;
458 seq_printf(m, "wptr(0x%04x): 0x%08x\n", ring->wptr_reg, RREG32(ring->wptr_reg));
459 seq_printf(m, "rptr(0x%04x): 0x%08x\n", ring->rptr_reg, RREG32(ring->rptr_reg));
460 seq_printf(m, "driver's copy of the wptr: 0x%08x\n", ring->wptr);
461 seq_printf(m, "driver's copy of the rptr: 0x%08x\n", ring->rptr);
462 seq_printf(m, "%u free dwords in ring\n", ring->ring_free_dw);
463 seq_printf(m, "%u dwords in ring\n", count);
464 i = ring->rptr;
465 for (j = 0; j <= count; j++) {
466 seq_printf(m, "r[%04d]=0x%08x\n", i, ring->ring[i]);
467 i = (i + 1) & ring->ptr_mask;
468 }
469 return 0;
470 }
471
472 static int radeon_ring_type_gfx_index = RADEON_RING_TYPE_GFX_INDEX;
473 static int cayman_ring_type_cp1_index = CAYMAN_RING_TYPE_CP1_INDEX;
474 static int cayman_ring_type_cp2_index = CAYMAN_RING_TYPE_CP2_INDEX;
475
476 static struct drm_info_list radeon_debugfs_ring_info_list[] = {
477 {"radeon_ring_gfx", radeon_debugfs_ring_info, 0, &radeon_ring_type_gfx_index},
478 {"radeon_ring_cp1", radeon_debugfs_ring_info, 0, &cayman_ring_type_cp1_index},
479 {"radeon_ring_cp2", radeon_debugfs_ring_info, 0, &cayman_ring_type_cp2_index},
480 };
481
radeon_debugfs_ib_info(struct seq_file * m,void * data)482 static int radeon_debugfs_ib_info(struct seq_file *m, void *data)
483 {
484 struct drm_info_node *node = (struct drm_info_node *) m->private;
485 struct drm_device *dev = node->minor->dev;
486 struct radeon_device *rdev = dev->dev_private;
487 struct radeon_ib *ib = &rdev->ib_pool.ibs[*((unsigned*)node->info_ent->data)];
488 unsigned i;
489
490 if (ib == NULL) {
491 return 0;
492 }
493 seq_printf(m, "IB %04u\n", ib->idx);
494 seq_printf(m, "IB fence %p\n", ib->fence);
495 seq_printf(m, "IB size %05u dwords\n", ib->length_dw);
496 for (i = 0; i < ib->length_dw; i++) {
497 seq_printf(m, "[%05u]=0x%08X\n", i, ib->ptr[i]);
498 }
499 return 0;
500 }
501
502 static struct drm_info_list radeon_debugfs_ib_list[RADEON_IB_POOL_SIZE];
503 static char radeon_debugfs_ib_names[RADEON_IB_POOL_SIZE][32];
504 static unsigned radeon_debugfs_ib_idx[RADEON_IB_POOL_SIZE];
505 #endif
506
radeon_debugfs_ring_init(struct radeon_device * rdev)507 int radeon_debugfs_ring_init(struct radeon_device *rdev)
508 {
509 #if defined(CONFIG_DEBUG_FS)
510 if (rdev->family >= CHIP_CAYMAN)
511 return radeon_debugfs_add_files(rdev, radeon_debugfs_ring_info_list,
512 ARRAY_SIZE(radeon_debugfs_ring_info_list));
513 else
514 return radeon_debugfs_add_files(rdev, radeon_debugfs_ring_info_list, 1);
515 #else
516 return 0;
517 #endif
518 }
519
radeon_debugfs_ib_init(struct radeon_device * rdev)520 int radeon_debugfs_ib_init(struct radeon_device *rdev)
521 {
522 #if defined(CONFIG_DEBUG_FS)
523 unsigned i;
524
525 for (i = 0; i < RADEON_IB_POOL_SIZE; i++) {
526 sprintf(radeon_debugfs_ib_names[i], "radeon_ib_%04u", i);
527 radeon_debugfs_ib_idx[i] = i;
528 radeon_debugfs_ib_list[i].name = radeon_debugfs_ib_names[i];
529 radeon_debugfs_ib_list[i].show = &radeon_debugfs_ib_info;
530 radeon_debugfs_ib_list[i].driver_features = 0;
531 radeon_debugfs_ib_list[i].data = &radeon_debugfs_ib_idx[i];
532 }
533 return radeon_debugfs_add_files(rdev, radeon_debugfs_ib_list,
534 RADEON_IB_POOL_SIZE);
535 #else
536 return 0;
537 #endif
538 }
539