3beb26d747196b74700c08e2cb51a324868581bf
[safe/jmp/linux-2.6] / drivers / gpu / drm / radeon / radeon_fence.c
1 /*
2  * Copyright 2009 Jerome Glisse.
3  * All Rights Reserved.
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the
7  * "Software"), to deal in the Software without restriction, including
8  * without limitation the rights to use, copy, modify, merge, publish,
9  * distribute, sub license, and/or sell copies of the Software, and to
10  * permit persons to whom the Software is furnished to do so, subject to
11  * the following conditions:
12  *
13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
16  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
17  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
18  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19  * USE OR OTHER DEALINGS IN THE SOFTWARE.
20  *
21  * The above copyright notice and this permission notice (including the
22  * next paragraph) shall be included in all copies or substantial portions
23  * of the Software.
24  *
25  */
26 /*
27  * Authors:
28  *    Jerome Glisse <glisse@freedesktop.org>
29  *    Dave Airlie
30  */
31 #include <linux/seq_file.h>
32 #include <asm/atomic.h>
33 #include <linux/wait.h>
34 #include <linux/list.h>
35 #include <linux/kref.h>
36 #include "drmP.h"
37 #include "drm.h"
38 #include "radeon_reg.h"
39 #include "radeon.h"
40
41 int radeon_fence_emit(struct radeon_device *rdev, struct radeon_fence *fence)
42 {
43         unsigned long irq_flags;
44
45         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
46         if (fence->emited) {
47                 write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
48                 return 0;
49         }
50         fence->seq = atomic_add_return(1, &rdev->fence_drv.seq);
51         if (!rdev->cp.ready) {
52                 /* FIXME: cp is not running assume everythings is done right
53                  * away
54                  */
55                 WREG32(rdev->fence_drv.scratch_reg, fence->seq);
56         } else
57                 radeon_fence_ring_emit(rdev, fence);
58
59         fence->emited = true;
60         fence->timeout = jiffies + ((2000 * HZ) / 1000);
61         list_del(&fence->list);
62         list_add_tail(&fence->list, &rdev->fence_drv.emited);
63         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
64         return 0;
65 }
66
67 static bool radeon_fence_poll_locked(struct radeon_device *rdev)
68 {
69         struct radeon_fence *fence;
70         struct list_head *i, *n;
71         uint32_t seq;
72         bool wake = false;
73
74         if (rdev == NULL) {
75                 return true;
76         }
77         if (rdev->shutdown) {
78                 return true;
79         }
80         seq = RREG32(rdev->fence_drv.scratch_reg);
81         rdev->fence_drv.last_seq = seq;
82         n = NULL;
83         list_for_each(i, &rdev->fence_drv.emited) {
84                 fence = list_entry(i, struct radeon_fence, list);
85                 if (fence->seq == seq) {
86                         n = i;
87                         break;
88                 }
89         }
90         /* all fence previous to this one are considered as signaled */
91         if (n) {
92                 i = n;
93                 do {
94                         n = i->prev;
95                         list_del(i);
96                         list_add_tail(i, &rdev->fence_drv.signaled);
97                         fence = list_entry(i, struct radeon_fence, list);
98                         fence->signaled = true;
99                         i = n;
100                 } while (i != &rdev->fence_drv.emited);
101                 wake = true;
102         }
103         return wake;
104 }
105
106 static void radeon_fence_destroy(struct kref *kref)
107 {
108         unsigned long irq_flags;
109         struct radeon_fence *fence;
110
111         fence = container_of(kref, struct radeon_fence, kref);
112         write_lock_irqsave(&fence->rdev->fence_drv.lock, irq_flags);
113         list_del(&fence->list);
114         fence->emited = false;
115         write_unlock_irqrestore(&fence->rdev->fence_drv.lock, irq_flags);
116         kfree(fence);
117 }
118
119 int radeon_fence_create(struct radeon_device *rdev, struct radeon_fence **fence)
120 {
121         unsigned long irq_flags;
122
123         *fence = kmalloc(sizeof(struct radeon_fence), GFP_KERNEL);
124         if ((*fence) == NULL) {
125                 return -ENOMEM;
126         }
127         kref_init(&((*fence)->kref));
128         (*fence)->rdev = rdev;
129         (*fence)->emited = false;
130         (*fence)->signaled = false;
131         (*fence)->seq = 0;
132         INIT_LIST_HEAD(&(*fence)->list);
133
134         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
135         list_add_tail(&(*fence)->list, &rdev->fence_drv.created);
136         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
137         return 0;
138 }
139
140
141 bool radeon_fence_signaled(struct radeon_fence *fence)
142 {
143         struct radeon_device *rdev = fence->rdev;
144         unsigned long irq_flags;
145         bool signaled = false;
146
147         if (rdev->gpu_lockup) {
148                 return true;
149         }
150         if (fence == NULL) {
151                 return true;
152         }
153         write_lock_irqsave(&fence->rdev->fence_drv.lock, irq_flags);
154         signaled = fence->signaled;
155         /* if we are shuting down report all fence as signaled */
156         if (fence->rdev->shutdown) {
157                 signaled = true;
158         }
159         if (!fence->emited) {
160                 WARN(1, "Querying an unemited fence : %p !\n", fence);
161                 signaled = true;
162         }
163         if (!signaled) {
164                 radeon_fence_poll_locked(fence->rdev);
165                 signaled = fence->signaled;
166         }
167         write_unlock_irqrestore(&fence->rdev->fence_drv.lock, irq_flags);
168         return signaled;
169 }
170
171 int r600_fence_wait(struct radeon_fence *fence,  bool intr, bool lazy)
172 {
173         struct radeon_device *rdev;
174         int ret = 0;
175
176         rdev = fence->rdev;
177
178         __set_current_state(intr ? TASK_INTERRUPTIBLE : TASK_UNINTERRUPTIBLE);
179
180         while (1) {
181                 if (radeon_fence_signaled(fence))
182                         break;
183
184                 if (time_after_eq(jiffies, fence->timeout)) {
185                         ret = -EBUSY;
186                         break;
187                 }
188
189                 if (lazy)
190                         schedule_timeout(1);
191
192                 if (intr && signal_pending(current)) {
193                         ret = -ERESTARTSYS;
194                         break;
195                 }
196         }
197         __set_current_state(TASK_RUNNING);
198         return ret;
199 }
200
201
202 int radeon_fence_wait(struct radeon_fence *fence, bool intr)
203 {
204         struct radeon_device *rdev;
205         unsigned long cur_jiffies;
206         unsigned long timeout;
207         bool expired = false;
208         int r;
209
210         if (fence == NULL) {
211                 WARN(1, "Querying an invalid fence : %p !\n", fence);
212                 return 0;
213         }
214         rdev = fence->rdev;
215         if (radeon_fence_signaled(fence)) {
216                 return 0;
217         }
218
219         if (rdev->family >= CHIP_R600) {
220                 r = r600_fence_wait(fence, intr, 0);
221                 if (r == -ERESTARTSYS)
222                         return -EBUSY;
223                 return r;
224         }
225
226 retry:
227         cur_jiffies = jiffies;
228         timeout = HZ / 100;
229         if (time_after(fence->timeout, cur_jiffies)) {
230                 timeout = fence->timeout - cur_jiffies;
231         }
232
233         if (intr) {
234                 r = wait_event_interruptible_timeout(rdev->fence_drv.queue,
235                                 radeon_fence_signaled(fence), timeout);
236                 if (unlikely(r == -ERESTARTSYS)) {
237                         return -EBUSY;
238                 }
239         } else {
240                 r = wait_event_timeout(rdev->fence_drv.queue,
241                          radeon_fence_signaled(fence), timeout);
242         }
243         if (unlikely(!radeon_fence_signaled(fence))) {
244                 if (unlikely(r == 0)) {
245                         expired = true;
246                 }
247                 if (unlikely(expired)) {
248                         timeout = 1;
249                         if (time_after(cur_jiffies, fence->timeout)) {
250                                 timeout = cur_jiffies - fence->timeout;
251                         }
252                         timeout = jiffies_to_msecs(timeout);
253                         if (timeout > 500) {
254                                 DRM_ERROR("fence(%p:0x%08X) %lums timeout "
255                                           "going to reset GPU\n",
256                                           fence, fence->seq, timeout);
257                                 radeon_gpu_reset(rdev);
258                                 WREG32(rdev->fence_drv.scratch_reg, fence->seq);
259                         }
260                 }
261                 goto retry;
262         }
263         if (unlikely(expired)) {
264                 rdev->fence_drv.count_timeout++;
265                 cur_jiffies = jiffies;
266                 timeout = 1;
267                 if (time_after(cur_jiffies, fence->timeout)) {
268                         timeout = cur_jiffies - fence->timeout;
269                 }
270                 timeout = jiffies_to_msecs(timeout);
271                 DRM_ERROR("fence(%p:0x%08X) %lums timeout\n",
272                           fence, fence->seq, timeout);
273                 DRM_ERROR("last signaled fence(0x%08X)\n",
274                           rdev->fence_drv.last_seq);
275         }
276         return 0;
277 }
278
279 int radeon_fence_wait_next(struct radeon_device *rdev)
280 {
281         unsigned long irq_flags;
282         struct radeon_fence *fence;
283         int r;
284
285         if (rdev->gpu_lockup) {
286                 return 0;
287         }
288         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
289         if (list_empty(&rdev->fence_drv.emited)) {
290                 write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
291                 return 0;
292         }
293         fence = list_entry(rdev->fence_drv.emited.next,
294                            struct radeon_fence, list);
295         radeon_fence_ref(fence);
296         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
297         r = radeon_fence_wait(fence, false);
298         radeon_fence_unref(&fence);
299         return r;
300 }
301
302 int radeon_fence_wait_last(struct radeon_device *rdev)
303 {
304         unsigned long irq_flags;
305         struct radeon_fence *fence;
306         int r;
307
308         if (rdev->gpu_lockup) {
309                 return 0;
310         }
311         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
312         if (list_empty(&rdev->fence_drv.emited)) {
313                 write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
314                 return 0;
315         }
316         fence = list_entry(rdev->fence_drv.emited.prev,
317                            struct radeon_fence, list);
318         radeon_fence_ref(fence);
319         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
320         r = radeon_fence_wait(fence, false);
321         radeon_fence_unref(&fence);
322         return r;
323 }
324
325 struct radeon_fence *radeon_fence_ref(struct radeon_fence *fence)
326 {
327         kref_get(&fence->kref);
328         return fence;
329 }
330
331 void radeon_fence_unref(struct radeon_fence **fence)
332 {
333         struct radeon_fence *tmp = *fence;
334
335         *fence = NULL;
336         if (tmp) {
337                 kref_put(&tmp->kref, &radeon_fence_destroy);
338         }
339 }
340
341 void radeon_fence_process(struct radeon_device *rdev)
342 {
343         unsigned long irq_flags;
344         bool wake;
345
346         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
347         wake = radeon_fence_poll_locked(rdev);
348         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
349         if (wake) {
350                 wake_up_all(&rdev->fence_drv.queue);
351         }
352 }
353
354 int radeon_fence_driver_init(struct radeon_device *rdev)
355 {
356         unsigned long irq_flags;
357         int r;
358
359         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
360         r = radeon_scratch_get(rdev, &rdev->fence_drv.scratch_reg);
361         if (r) {
362                 DRM_ERROR("Fence failed to get a scratch register.");
363                 write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
364                 return r;
365         }
366         WREG32(rdev->fence_drv.scratch_reg, 0);
367         atomic_set(&rdev->fence_drv.seq, 0);
368         INIT_LIST_HEAD(&rdev->fence_drv.created);
369         INIT_LIST_HEAD(&rdev->fence_drv.emited);
370         INIT_LIST_HEAD(&rdev->fence_drv.signaled);
371         rdev->fence_drv.count_timeout = 0;
372         init_waitqueue_head(&rdev->fence_drv.queue);
373         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
374         if (radeon_debugfs_fence_init(rdev)) {
375                 DRM_ERROR("Failed to register debugfs file for fence !\n");
376         }
377         return 0;
378 }
379
380 void radeon_fence_driver_fini(struct radeon_device *rdev)
381 {
382         unsigned long irq_flags;
383
384         wake_up_all(&rdev->fence_drv.queue);
385         write_lock_irqsave(&rdev->fence_drv.lock, irq_flags);
386         radeon_scratch_free(rdev, rdev->fence_drv.scratch_reg);
387         write_unlock_irqrestore(&rdev->fence_drv.lock, irq_flags);
388         DRM_INFO("radeon: fence finalized\n");
389 }
390
391
392 /*
393  * Fence debugfs
394  */
395 #if defined(CONFIG_DEBUG_FS)
396 static int radeon_debugfs_fence_info(struct seq_file *m, void *data)
397 {
398         struct drm_info_node *node = (struct drm_info_node *)m->private;
399         struct drm_device *dev = node->minor->dev;
400         struct radeon_device *rdev = dev->dev_private;
401         struct radeon_fence *fence;
402
403         seq_printf(m, "Last signaled fence 0x%08X\n",
404                    RREG32(rdev->fence_drv.scratch_reg));
405         if (!list_empty(&rdev->fence_drv.emited)) {
406                    fence = list_entry(rdev->fence_drv.emited.prev,
407                                       struct radeon_fence, list);
408                    seq_printf(m, "Last emited fence %p with 0x%08X\n",
409                               fence,  fence->seq);
410         }
411         return 0;
412 }
413
414 static struct drm_info_list radeon_debugfs_fence_list[] = {
415         {"radeon_fence_info", &radeon_debugfs_fence_info, 0, NULL},
416 };
417 #endif
418
419 int radeon_debugfs_fence_init(struct radeon_device *rdev)
420 {
421 #if defined(CONFIG_DEBUG_FS)
422         return radeon_debugfs_add_files(rdev, radeon_debugfs_fence_list, 1);
423 #else
424         return 0;
425 #endif
426 }