1 // SPDX-License-Identifier: GPL-2.0 OR MIT
2 /**************************************************************************
3 *
4 * Copyright 2009-2015 VMware, Inc., Palo Alto, CA., USA
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
22 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24 * USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include <linux/sched/signal.h>
29
30 #include "vmwgfx_drv.h"
31
32 #define VMW_FENCE_WRAP (1 << 24)
33
34 /**
35 * vmw_thread_fn - Deferred (process context) irq handler
36 *
37 * @irq: irq number
38 * @arg: Closure argument. Pointer to a struct drm_device cast to void *
39 *
40 * This function implements the deferred part of irq processing.
41 * The function is guaranteed to run at least once after the
42 * vmw_irq_handler has returned with IRQ_WAKE_THREAD.
43 *
44 */
vmw_thread_fn(int irq,void * arg)45 static irqreturn_t vmw_thread_fn(int irq, void *arg)
46 {
47 struct drm_device *dev = (struct drm_device *)arg;
48 struct vmw_private *dev_priv = vmw_priv(dev);
49 irqreturn_t ret = IRQ_NONE;
50
51 if (test_and_clear_bit(VMW_IRQTHREAD_FENCE,
52 dev_priv->irqthread_pending)) {
53 vmw_fences_update(dev_priv->fman);
54 wake_up_all(&dev_priv->fence_queue);
55 ret = IRQ_HANDLED;
56 }
57
58 if (test_and_clear_bit(VMW_IRQTHREAD_CMDBUF,
59 dev_priv->irqthread_pending)) {
60 vmw_cmdbuf_irqthread(dev_priv->cman);
61 ret = IRQ_HANDLED;
62 }
63
64 return ret;
65 }
66
67 /**
68 * vmw_irq_handler irq handler
69 *
70 * @irq: irq number
71 * @arg: Closure argument. Pointer to a struct drm_device cast to void *
72 *
73 * This function implements the quick part of irq processing.
74 * The function performs fast actions like clearing the device interrupt
75 * flags and also reasonably quick actions like waking processes waiting for
76 * FIFO space. Other IRQ actions are deferred to the IRQ thread.
77 */
vmw_irq_handler(int irq,void * arg)78 static irqreturn_t vmw_irq_handler(int irq, void *arg)
79 {
80 struct drm_device *dev = (struct drm_device *)arg;
81 struct vmw_private *dev_priv = vmw_priv(dev);
82 uint32_t status, masked_status;
83 irqreturn_t ret = IRQ_HANDLED;
84
85 status = inl(dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
86 masked_status = status & READ_ONCE(dev_priv->irq_mask);
87
88 if (likely(status))
89 outl(status, dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
90
91 if (!status)
92 return IRQ_NONE;
93
94 if (masked_status & SVGA_IRQFLAG_FIFO_PROGRESS)
95 wake_up_all(&dev_priv->fifo_queue);
96
97 if ((masked_status & (SVGA_IRQFLAG_ANY_FENCE |
98 SVGA_IRQFLAG_FENCE_GOAL)) &&
99 !test_and_set_bit(VMW_IRQTHREAD_FENCE, dev_priv->irqthread_pending))
100 ret = IRQ_WAKE_THREAD;
101
102 if ((masked_status & (SVGA_IRQFLAG_COMMAND_BUFFER |
103 SVGA_IRQFLAG_ERROR)) &&
104 !test_and_set_bit(VMW_IRQTHREAD_CMDBUF,
105 dev_priv->irqthread_pending))
106 ret = IRQ_WAKE_THREAD;
107
108 return ret;
109 }
110
vmw_fifo_idle(struct vmw_private * dev_priv,uint32_t seqno)111 static bool vmw_fifo_idle(struct vmw_private *dev_priv, uint32_t seqno)
112 {
113
114 return (vmw_read(dev_priv, SVGA_REG_BUSY) == 0);
115 }
116
vmw_update_seqno(struct vmw_private * dev_priv,struct vmw_fifo_state * fifo_state)117 void vmw_update_seqno(struct vmw_private *dev_priv,
118 struct vmw_fifo_state *fifo_state)
119 {
120 u32 *fifo_mem = dev_priv->mmio_virt;
121 uint32_t seqno = vmw_mmio_read(fifo_mem + SVGA_FIFO_FENCE);
122
123 if (dev_priv->last_read_seqno != seqno) {
124 dev_priv->last_read_seqno = seqno;
125 vmw_marker_pull(&fifo_state->marker_queue, seqno);
126 vmw_fences_update(dev_priv->fman);
127 }
128 }
129
vmw_seqno_passed(struct vmw_private * dev_priv,uint32_t seqno)130 bool vmw_seqno_passed(struct vmw_private *dev_priv,
131 uint32_t seqno)
132 {
133 struct vmw_fifo_state *fifo_state;
134 bool ret;
135
136 if (likely(dev_priv->last_read_seqno - seqno < VMW_FENCE_WRAP))
137 return true;
138
139 fifo_state = &dev_priv->fifo;
140 vmw_update_seqno(dev_priv, fifo_state);
141 if (likely(dev_priv->last_read_seqno - seqno < VMW_FENCE_WRAP))
142 return true;
143
144 if (!(fifo_state->capabilities & SVGA_FIFO_CAP_FENCE) &&
145 vmw_fifo_idle(dev_priv, seqno))
146 return true;
147
148 /**
149 * Then check if the seqno is higher than what we've actually
150 * emitted. Then the fence is stale and signaled.
151 */
152
153 ret = ((atomic_read(&dev_priv->marker_seq) - seqno)
154 > VMW_FENCE_WRAP);
155
156 return ret;
157 }
158
vmw_fallback_wait(struct vmw_private * dev_priv,bool lazy,bool fifo_idle,uint32_t seqno,bool interruptible,unsigned long timeout)159 int vmw_fallback_wait(struct vmw_private *dev_priv,
160 bool lazy,
161 bool fifo_idle,
162 uint32_t seqno,
163 bool interruptible,
164 unsigned long timeout)
165 {
166 struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
167
168 uint32_t count = 0;
169 uint32_t signal_seq;
170 int ret;
171 unsigned long end_jiffies = jiffies + timeout;
172 bool (*wait_condition)(struct vmw_private *, uint32_t);
173 DEFINE_WAIT(__wait);
174
175 wait_condition = (fifo_idle) ? &vmw_fifo_idle :
176 &vmw_seqno_passed;
177
178 /**
179 * Block command submission while waiting for idle.
180 */
181
182 if (fifo_idle) {
183 down_read(&fifo_state->rwsem);
184 if (dev_priv->cman) {
185 ret = vmw_cmdbuf_idle(dev_priv->cman, interruptible,
186 10*HZ);
187 if (ret)
188 goto out_err;
189 }
190 }
191
192 signal_seq = atomic_read(&dev_priv->marker_seq);
193 ret = 0;
194
195 for (;;) {
196 prepare_to_wait(&dev_priv->fence_queue, &__wait,
197 (interruptible) ?
198 TASK_INTERRUPTIBLE : TASK_UNINTERRUPTIBLE);
199 if (wait_condition(dev_priv, seqno))
200 break;
201 if (time_after_eq(jiffies, end_jiffies)) {
202 DRM_ERROR("SVGA device lockup.\n");
203 break;
204 }
205 if (lazy)
206 schedule_timeout(1);
207 else if ((++count & 0x0F) == 0) {
208 /**
209 * FIXME: Use schedule_hr_timeout here for
210 * newer kernels and lower CPU utilization.
211 */
212
213 __set_current_state(TASK_RUNNING);
214 schedule();
215 __set_current_state((interruptible) ?
216 TASK_INTERRUPTIBLE :
217 TASK_UNINTERRUPTIBLE);
218 }
219 if (interruptible && signal_pending(current)) {
220 ret = -ERESTARTSYS;
221 break;
222 }
223 }
224 finish_wait(&dev_priv->fence_queue, &__wait);
225 if (ret == 0 && fifo_idle) {
226 u32 *fifo_mem = dev_priv->mmio_virt;
227
228 vmw_mmio_write(signal_seq, fifo_mem + SVGA_FIFO_FENCE);
229 }
230 wake_up_all(&dev_priv->fence_queue);
231 out_err:
232 if (fifo_idle)
233 up_read(&fifo_state->rwsem);
234
235 return ret;
236 }
237
vmw_generic_waiter_add(struct vmw_private * dev_priv,u32 flag,int * waiter_count)238 void vmw_generic_waiter_add(struct vmw_private *dev_priv,
239 u32 flag, int *waiter_count)
240 {
241 spin_lock_bh(&dev_priv->waiter_lock);
242 if ((*waiter_count)++ == 0) {
243 outl(flag, dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
244 dev_priv->irq_mask |= flag;
245 vmw_write(dev_priv, SVGA_REG_IRQMASK, dev_priv->irq_mask);
246 }
247 spin_unlock_bh(&dev_priv->waiter_lock);
248 }
249
vmw_generic_waiter_remove(struct vmw_private * dev_priv,u32 flag,int * waiter_count)250 void vmw_generic_waiter_remove(struct vmw_private *dev_priv,
251 u32 flag, int *waiter_count)
252 {
253 spin_lock_bh(&dev_priv->waiter_lock);
254 if (--(*waiter_count) == 0) {
255 dev_priv->irq_mask &= ~flag;
256 vmw_write(dev_priv, SVGA_REG_IRQMASK, dev_priv->irq_mask);
257 }
258 spin_unlock_bh(&dev_priv->waiter_lock);
259 }
260
vmw_seqno_waiter_add(struct vmw_private * dev_priv)261 void vmw_seqno_waiter_add(struct vmw_private *dev_priv)
262 {
263 vmw_generic_waiter_add(dev_priv, SVGA_IRQFLAG_ANY_FENCE,
264 &dev_priv->fence_queue_waiters);
265 }
266
vmw_seqno_waiter_remove(struct vmw_private * dev_priv)267 void vmw_seqno_waiter_remove(struct vmw_private *dev_priv)
268 {
269 vmw_generic_waiter_remove(dev_priv, SVGA_IRQFLAG_ANY_FENCE,
270 &dev_priv->fence_queue_waiters);
271 }
272
vmw_goal_waiter_add(struct vmw_private * dev_priv)273 void vmw_goal_waiter_add(struct vmw_private *dev_priv)
274 {
275 vmw_generic_waiter_add(dev_priv, SVGA_IRQFLAG_FENCE_GOAL,
276 &dev_priv->goal_queue_waiters);
277 }
278
vmw_goal_waiter_remove(struct vmw_private * dev_priv)279 void vmw_goal_waiter_remove(struct vmw_private *dev_priv)
280 {
281 vmw_generic_waiter_remove(dev_priv, SVGA_IRQFLAG_FENCE_GOAL,
282 &dev_priv->goal_queue_waiters);
283 }
284
vmw_wait_seqno(struct vmw_private * dev_priv,bool lazy,uint32_t seqno,bool interruptible,unsigned long timeout)285 int vmw_wait_seqno(struct vmw_private *dev_priv,
286 bool lazy, uint32_t seqno,
287 bool interruptible, unsigned long timeout)
288 {
289 long ret;
290 struct vmw_fifo_state *fifo = &dev_priv->fifo;
291
292 if (likely(dev_priv->last_read_seqno - seqno < VMW_FENCE_WRAP))
293 return 0;
294
295 if (likely(vmw_seqno_passed(dev_priv, seqno)))
296 return 0;
297
298 vmw_fifo_ping_host(dev_priv, SVGA_SYNC_GENERIC);
299
300 if (!(fifo->capabilities & SVGA_FIFO_CAP_FENCE))
301 return vmw_fallback_wait(dev_priv, lazy, true, seqno,
302 interruptible, timeout);
303
304 if (!(dev_priv->capabilities & SVGA_CAP_IRQMASK))
305 return vmw_fallback_wait(dev_priv, lazy, false, seqno,
306 interruptible, timeout);
307
308 vmw_seqno_waiter_add(dev_priv);
309
310 if (interruptible)
311 ret = wait_event_interruptible_timeout
312 (dev_priv->fence_queue,
313 vmw_seqno_passed(dev_priv, seqno),
314 timeout);
315 else
316 ret = wait_event_timeout
317 (dev_priv->fence_queue,
318 vmw_seqno_passed(dev_priv, seqno),
319 timeout);
320
321 vmw_seqno_waiter_remove(dev_priv);
322
323 if (unlikely(ret == 0))
324 ret = -EBUSY;
325 else if (likely(ret > 0))
326 ret = 0;
327
328 return ret;
329 }
330
vmw_irq_preinstall(struct drm_device * dev)331 static void vmw_irq_preinstall(struct drm_device *dev)
332 {
333 struct vmw_private *dev_priv = vmw_priv(dev);
334 uint32_t status;
335
336 status = inl(dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
337 outl(status, dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
338 }
339
vmw_irq_uninstall(struct drm_device * dev)340 void vmw_irq_uninstall(struct drm_device *dev)
341 {
342 struct vmw_private *dev_priv = vmw_priv(dev);
343 uint32_t status;
344
345 if (!(dev_priv->capabilities & SVGA_CAP_IRQMASK))
346 return;
347
348 if (!dev->irq_enabled)
349 return;
350
351 vmw_write(dev_priv, SVGA_REG_IRQMASK, 0);
352
353 status = inl(dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
354 outl(status, dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
355
356 dev->irq_enabled = false;
357 free_irq(dev->irq, dev);
358 }
359
360 /**
361 * vmw_irq_install - Install the irq handlers
362 *
363 * @dev: Pointer to the drm device.
364 * @irq: The irq number.
365 * Return: Zero if successful. Negative number otherwise.
366 */
vmw_irq_install(struct drm_device * dev,int irq)367 int vmw_irq_install(struct drm_device *dev, int irq)
368 {
369 int ret;
370
371 if (dev->irq_enabled)
372 return -EBUSY;
373
374 vmw_irq_preinstall(dev);
375
376 ret = request_threaded_irq(irq, vmw_irq_handler, vmw_thread_fn,
377 IRQF_SHARED, VMWGFX_DRIVER_NAME, dev);
378 if (ret < 0)
379 return ret;
380
381 dev->irq_enabled = true;
382 dev->irq = irq;
383
384 return ret;
385 }
386