• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (c) 2012 Intel Corporation. All rights reserved.
3  * Copyright (c) 2007 - 2012 QLogic Corporation. All rights reserved.
4  *
5  * This software is available to you under a choice of one of two
6  * licenses.  You may choose to be licensed under the terms of the GNU
7  * General Public License (GPL) Version 2, available from the file
8  * COPYING in the main directory of this source tree, or the
9  * OpenIB.org BSD license below:
10  *
11  *     Redistribution and use in source and binary forms, with or
12  *     without modification, are permitted provided that the following
13  *     conditions are met:
14  *
15  *      - Redistributions of source code must retain the above
16  *        copyright notice, this list of conditions and the following
17  *        disclaimer.
18  *
19  *      - Redistributions in binary form must reproduce the above
20  *        copyright notice, this list of conditions and the following
21  *        disclaimer in the documentation and/or other materials
22  *        provided with the distribution.
23  *
24  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31  * SOFTWARE.
32  */
33 
34 #include <linux/spinlock.h>
35 #include <linux/netdevice.h>
36 #include <linux/moduleparam.h>
37 
38 #include "qib.h"
39 #include "qib_common.h"
40 
41 /* default pio off, sdma on */
42 static ushort sdma_descq_cnt = 256;
43 module_param_named(sdma_descq_cnt, sdma_descq_cnt, ushort, S_IRUGO);
44 MODULE_PARM_DESC(sdma_descq_cnt, "Number of SDMA descq entries");
45 
46 /*
47  * Bits defined in the send DMA descriptor.
48  */
49 #define SDMA_DESC_LAST          (1ULL << 11)
50 #define SDMA_DESC_FIRST         (1ULL << 12)
51 #define SDMA_DESC_DMA_HEAD      (1ULL << 13)
52 #define SDMA_DESC_USE_LARGE_BUF (1ULL << 14)
53 #define SDMA_DESC_INTR          (1ULL << 15)
54 #define SDMA_DESC_COUNT_LSB     16
55 #define SDMA_DESC_GEN_LSB       30
56 
57 char *qib_sdma_state_names[] = {
58 	[qib_sdma_state_s00_hw_down]          = "s00_HwDown",
59 	[qib_sdma_state_s10_hw_start_up_wait] = "s10_HwStartUpWait",
60 	[qib_sdma_state_s20_idle]             = "s20_Idle",
61 	[qib_sdma_state_s30_sw_clean_up_wait] = "s30_SwCleanUpWait",
62 	[qib_sdma_state_s40_hw_clean_up_wait] = "s40_HwCleanUpWait",
63 	[qib_sdma_state_s50_hw_halt_wait]     = "s50_HwHaltWait",
64 	[qib_sdma_state_s99_running]          = "s99_Running",
65 };
66 
67 char *qib_sdma_event_names[] = {
68 	[qib_sdma_event_e00_go_hw_down]   = "e00_GoHwDown",
69 	[qib_sdma_event_e10_go_hw_start]  = "e10_GoHwStart",
70 	[qib_sdma_event_e20_hw_started]   = "e20_HwStarted",
71 	[qib_sdma_event_e30_go_running]   = "e30_GoRunning",
72 	[qib_sdma_event_e40_sw_cleaned]   = "e40_SwCleaned",
73 	[qib_sdma_event_e50_hw_cleaned]   = "e50_HwCleaned",
74 	[qib_sdma_event_e60_hw_halted]    = "e60_HwHalted",
75 	[qib_sdma_event_e70_go_idle]      = "e70_GoIdle",
76 	[qib_sdma_event_e7220_err_halted] = "e7220_ErrHalted",
77 	[qib_sdma_event_e7322_err_halted] = "e7322_ErrHalted",
78 	[qib_sdma_event_e90_timer_tick]   = "e90_TimerTick",
79 };
80 
81 /* declare all statics here rather than keep sorting */
82 static int alloc_sdma(struct qib_pportdata *);
83 static void sdma_complete(struct kref *);
84 static void sdma_finalput(struct qib_sdma_state *);
85 static void sdma_get(struct qib_sdma_state *);
86 static void sdma_put(struct qib_sdma_state *);
87 static void sdma_set_state(struct qib_pportdata *, enum qib_sdma_states);
88 static void sdma_start_sw_clean_up(struct qib_pportdata *);
89 static void sdma_sw_clean_up_task(unsigned long);
90 static void unmap_desc(struct qib_pportdata *, unsigned);
91 
sdma_get(struct qib_sdma_state * ss)92 static void sdma_get(struct qib_sdma_state *ss)
93 {
94 	kref_get(&ss->kref);
95 }
96 
sdma_complete(struct kref * kref)97 static void sdma_complete(struct kref *kref)
98 {
99 	struct qib_sdma_state *ss =
100 		container_of(kref, struct qib_sdma_state, kref);
101 
102 	complete(&ss->comp);
103 }
104 
sdma_put(struct qib_sdma_state * ss)105 static void sdma_put(struct qib_sdma_state *ss)
106 {
107 	kref_put(&ss->kref, sdma_complete);
108 }
109 
sdma_finalput(struct qib_sdma_state * ss)110 static void sdma_finalput(struct qib_sdma_state *ss)
111 {
112 	sdma_put(ss);
113 	wait_for_completion(&ss->comp);
114 }
115 
116 /*
117  * Complete all the sdma requests on the active list, in the correct
118  * order, and with appropriate processing.   Called when cleaning up
119  * after sdma shutdown, and when new sdma requests are submitted for
120  * a link that is down.   This matches what is done for requests
121  * that complete normally, it's just the full list.
122  *
123  * Must be called with sdma_lock held
124  */
clear_sdma_activelist(struct qib_pportdata * ppd)125 static void clear_sdma_activelist(struct qib_pportdata *ppd)
126 {
127 	struct qib_sdma_txreq *txp, *txp_next;
128 
129 	list_for_each_entry_safe(txp, txp_next, &ppd->sdma_activelist, list) {
130 		list_del_init(&txp->list);
131 		if (txp->flags & QIB_SDMA_TXREQ_F_FREEDESC) {
132 			unsigned idx;
133 
134 			idx = txp->start_idx;
135 			while (idx != txp->next_descq_idx) {
136 				unmap_desc(ppd, idx);
137 				if (++idx == ppd->sdma_descq_cnt)
138 					idx = 0;
139 			}
140 		}
141 		if (txp->callback)
142 			(*txp->callback)(txp, QIB_SDMA_TXREQ_S_ABORTED);
143 	}
144 }
145 
sdma_sw_clean_up_task(unsigned long opaque)146 static void sdma_sw_clean_up_task(unsigned long opaque)
147 {
148 	struct qib_pportdata *ppd = (struct qib_pportdata *) opaque;
149 	unsigned long flags;
150 
151 	spin_lock_irqsave(&ppd->sdma_lock, flags);
152 
153 	/*
154 	 * At this point, the following should always be true:
155 	 * - We are halted, so no more descriptors are getting retired.
156 	 * - We are not running, so no one is submitting new work.
157 	 * - Only we can send the e40_sw_cleaned, so we can't start
158 	 *   running again until we say so.  So, the active list and
159 	 *   descq are ours to play with.
160 	 */
161 
162 	/* Process all retired requests. */
163 	qib_sdma_make_progress(ppd);
164 
165 	clear_sdma_activelist(ppd);
166 
167 	/*
168 	 * Resync count of added and removed.  It is VERY important that
169 	 * sdma_descq_removed NEVER decrement - user_sdma depends on it.
170 	 */
171 	ppd->sdma_descq_removed = ppd->sdma_descq_added;
172 
173 	/*
174 	 * Reset our notion of head and tail.
175 	 * Note that the HW registers will be reset when switching states
176 	 * due to calling __qib_sdma_process_event() below.
177 	 */
178 	ppd->sdma_descq_tail = 0;
179 	ppd->sdma_descq_head = 0;
180 	ppd->sdma_head_dma[0] = 0;
181 	ppd->sdma_generation = 0;
182 
183 	__qib_sdma_process_event(ppd, qib_sdma_event_e40_sw_cleaned);
184 
185 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
186 }
187 
188 /*
189  * This is called when changing to state qib_sdma_state_s10_hw_start_up_wait
190  * as a result of send buffer errors or send DMA descriptor errors.
191  * We want to disarm the buffers in these cases.
192  */
sdma_hw_start_up(struct qib_pportdata * ppd)193 static void sdma_hw_start_up(struct qib_pportdata *ppd)
194 {
195 	struct qib_sdma_state *ss = &ppd->sdma_state;
196 	unsigned bufno;
197 
198 	for (bufno = ss->first_sendbuf; bufno < ss->last_sendbuf; ++bufno)
199 		ppd->dd->f_sendctrl(ppd, QIB_SENDCTRL_DISARM_BUF(bufno));
200 
201 	ppd->dd->f_sdma_hw_start_up(ppd);
202 }
203 
sdma_sw_tear_down(struct qib_pportdata * ppd)204 static void sdma_sw_tear_down(struct qib_pportdata *ppd)
205 {
206 	struct qib_sdma_state *ss = &ppd->sdma_state;
207 
208 	/* Releasing this reference means the state machine has stopped. */
209 	sdma_put(ss);
210 }
211 
sdma_start_sw_clean_up(struct qib_pportdata * ppd)212 static void sdma_start_sw_clean_up(struct qib_pportdata *ppd)
213 {
214 	tasklet_hi_schedule(&ppd->sdma_sw_clean_up_task);
215 }
216 
sdma_set_state(struct qib_pportdata * ppd,enum qib_sdma_states next_state)217 static void sdma_set_state(struct qib_pportdata *ppd,
218 	enum qib_sdma_states next_state)
219 {
220 	struct qib_sdma_state *ss = &ppd->sdma_state;
221 	struct sdma_set_state_action *action = ss->set_state_action;
222 	unsigned op = 0;
223 
224 	/* debugging bookkeeping */
225 	ss->previous_state = ss->current_state;
226 	ss->previous_op = ss->current_op;
227 
228 	ss->current_state = next_state;
229 
230 	if (action[next_state].op_enable)
231 		op |= QIB_SDMA_SENDCTRL_OP_ENABLE;
232 
233 	if (action[next_state].op_intenable)
234 		op |= QIB_SDMA_SENDCTRL_OP_INTENABLE;
235 
236 	if (action[next_state].op_halt)
237 		op |= QIB_SDMA_SENDCTRL_OP_HALT;
238 
239 	if (action[next_state].op_drain)
240 		op |= QIB_SDMA_SENDCTRL_OP_DRAIN;
241 
242 	if (action[next_state].go_s99_running_tofalse)
243 		ss->go_s99_running = 0;
244 
245 	if (action[next_state].go_s99_running_totrue)
246 		ss->go_s99_running = 1;
247 
248 	ss->current_op = op;
249 
250 	ppd->dd->f_sdma_sendctrl(ppd, ss->current_op);
251 }
252 
unmap_desc(struct qib_pportdata * ppd,unsigned head)253 static void unmap_desc(struct qib_pportdata *ppd, unsigned head)
254 {
255 	__le64 *descqp = &ppd->sdma_descq[head].qw[0];
256 	u64 desc[2];
257 	dma_addr_t addr;
258 	size_t len;
259 
260 	desc[0] = le64_to_cpu(descqp[0]);
261 	desc[1] = le64_to_cpu(descqp[1]);
262 
263 	addr = (desc[1] << 32) | (desc[0] >> 32);
264 	len = (desc[0] >> 14) & (0x7ffULL << 2);
265 	dma_unmap_single(&ppd->dd->pcidev->dev, addr, len, DMA_TO_DEVICE);
266 }
267 
alloc_sdma(struct qib_pportdata * ppd)268 static int alloc_sdma(struct qib_pportdata *ppd)
269 {
270 	ppd->sdma_descq_cnt = sdma_descq_cnt;
271 	if (!ppd->sdma_descq_cnt)
272 		ppd->sdma_descq_cnt = 256;
273 
274 	/* Allocate memory for SendDMA descriptor FIFO */
275 	ppd->sdma_descq = dma_alloc_coherent(&ppd->dd->pcidev->dev,
276 		ppd->sdma_descq_cnt * sizeof(u64[2]), &ppd->sdma_descq_phys,
277 		GFP_KERNEL);
278 
279 	if (!ppd->sdma_descq) {
280 		qib_dev_err(ppd->dd,
281 			"failed to allocate SendDMA descriptor FIFO memory\n");
282 		goto bail;
283 	}
284 
285 	/* Allocate memory for DMA of head register to memory */
286 	ppd->sdma_head_dma = dma_alloc_coherent(&ppd->dd->pcidev->dev,
287 		PAGE_SIZE, &ppd->sdma_head_phys, GFP_KERNEL);
288 	if (!ppd->sdma_head_dma) {
289 		qib_dev_err(ppd->dd,
290 			"failed to allocate SendDMA head memory\n");
291 		goto cleanup_descq;
292 	}
293 	ppd->sdma_head_dma[0] = 0;
294 	return 0;
295 
296 cleanup_descq:
297 	dma_free_coherent(&ppd->dd->pcidev->dev,
298 		ppd->sdma_descq_cnt * sizeof(u64[2]), (void *)ppd->sdma_descq,
299 		ppd->sdma_descq_phys);
300 	ppd->sdma_descq = NULL;
301 	ppd->sdma_descq_phys = 0;
302 bail:
303 	ppd->sdma_descq_cnt = 0;
304 	return -ENOMEM;
305 }
306 
free_sdma(struct qib_pportdata * ppd)307 static void free_sdma(struct qib_pportdata *ppd)
308 {
309 	struct qib_devdata *dd = ppd->dd;
310 
311 	if (ppd->sdma_head_dma) {
312 		dma_free_coherent(&dd->pcidev->dev, PAGE_SIZE,
313 				  (void *)ppd->sdma_head_dma,
314 				  ppd->sdma_head_phys);
315 		ppd->sdma_head_dma = NULL;
316 		ppd->sdma_head_phys = 0;
317 	}
318 
319 	if (ppd->sdma_descq) {
320 		dma_free_coherent(&dd->pcidev->dev,
321 				  ppd->sdma_descq_cnt * sizeof(u64[2]),
322 				  ppd->sdma_descq, ppd->sdma_descq_phys);
323 		ppd->sdma_descq = NULL;
324 		ppd->sdma_descq_phys = 0;
325 	}
326 }
327 
make_sdma_desc(struct qib_pportdata * ppd,u64 * sdmadesc,u64 addr,u64 dwlen,u64 dwoffset)328 static inline void make_sdma_desc(struct qib_pportdata *ppd,
329 				  u64 *sdmadesc, u64 addr, u64 dwlen,
330 				  u64 dwoffset)
331 {
332 
333 	WARN_ON(addr & 3);
334 	/* SDmaPhyAddr[47:32] */
335 	sdmadesc[1] = addr >> 32;
336 	/* SDmaPhyAddr[31:0] */
337 	sdmadesc[0] = (addr & 0xfffffffcULL) << 32;
338 	/* SDmaGeneration[1:0] */
339 	sdmadesc[0] |= (ppd->sdma_generation & 3ULL) <<
340 		SDMA_DESC_GEN_LSB;
341 	/* SDmaDwordCount[10:0] */
342 	sdmadesc[0] |= (dwlen & 0x7ffULL) << SDMA_DESC_COUNT_LSB;
343 	/* SDmaBufOffset[12:2] */
344 	sdmadesc[0] |= dwoffset & 0x7ffULL;
345 }
346 
347 /* sdma_lock must be held */
qib_sdma_make_progress(struct qib_pportdata * ppd)348 int qib_sdma_make_progress(struct qib_pportdata *ppd)
349 {
350 	struct list_head *lp = NULL;
351 	struct qib_sdma_txreq *txp = NULL;
352 	struct qib_devdata *dd = ppd->dd;
353 	int progress = 0;
354 	u16 hwhead;
355 	u16 idx = 0;
356 
357 	hwhead = dd->f_sdma_gethead(ppd);
358 
359 	/* The reason for some of the complexity of this code is that
360 	 * not all descriptors have corresponding txps.  So, we have to
361 	 * be able to skip over descs until we wander into the range of
362 	 * the next txp on the list.
363 	 */
364 
365 	if (!list_empty(&ppd->sdma_activelist)) {
366 		lp = ppd->sdma_activelist.next;
367 		txp = list_entry(lp, struct qib_sdma_txreq, list);
368 		idx = txp->start_idx;
369 	}
370 
371 	while (ppd->sdma_descq_head != hwhead) {
372 		/* if desc is part of this txp, unmap if needed */
373 		if (txp && (txp->flags & QIB_SDMA_TXREQ_F_FREEDESC) &&
374 		    (idx == ppd->sdma_descq_head)) {
375 			unmap_desc(ppd, ppd->sdma_descq_head);
376 			if (++idx == ppd->sdma_descq_cnt)
377 				idx = 0;
378 		}
379 
380 		/* increment dequed desc count */
381 		ppd->sdma_descq_removed++;
382 
383 		/* advance head, wrap if needed */
384 		if (++ppd->sdma_descq_head == ppd->sdma_descq_cnt)
385 			ppd->sdma_descq_head = 0;
386 
387 		/* if now past this txp's descs, do the callback */
388 		if (txp && txp->next_descq_idx == ppd->sdma_descq_head) {
389 			/* remove from active list */
390 			list_del_init(&txp->list);
391 			if (txp->callback)
392 				(*txp->callback)(txp, QIB_SDMA_TXREQ_S_OK);
393 			/* see if there is another txp */
394 			if (list_empty(&ppd->sdma_activelist))
395 				txp = NULL;
396 			else {
397 				lp = ppd->sdma_activelist.next;
398 				txp = list_entry(lp, struct qib_sdma_txreq,
399 					list);
400 				idx = txp->start_idx;
401 			}
402 		}
403 		progress = 1;
404 	}
405 	if (progress)
406 		qib_verbs_sdma_desc_avail(ppd, qib_sdma_descq_freecnt(ppd));
407 	return progress;
408 }
409 
410 /*
411  * This is called from interrupt context.
412  */
qib_sdma_intr(struct qib_pportdata * ppd)413 void qib_sdma_intr(struct qib_pportdata *ppd)
414 {
415 	unsigned long flags;
416 
417 	spin_lock_irqsave(&ppd->sdma_lock, flags);
418 
419 	__qib_sdma_intr(ppd);
420 
421 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
422 }
423 
__qib_sdma_intr(struct qib_pportdata * ppd)424 void __qib_sdma_intr(struct qib_pportdata *ppd)
425 {
426 	if (__qib_sdma_running(ppd)) {
427 		qib_sdma_make_progress(ppd);
428 		if (!list_empty(&ppd->sdma_userpending))
429 			qib_user_sdma_send_desc(ppd, &ppd->sdma_userpending);
430 	}
431 }
432 
qib_setup_sdma(struct qib_pportdata * ppd)433 int qib_setup_sdma(struct qib_pportdata *ppd)
434 {
435 	struct qib_devdata *dd = ppd->dd;
436 	unsigned long flags;
437 	int ret = 0;
438 
439 	ret = alloc_sdma(ppd);
440 	if (ret)
441 		goto bail;
442 
443 	/* set consistent sdma state */
444 	ppd->dd->f_sdma_init_early(ppd);
445 	spin_lock_irqsave(&ppd->sdma_lock, flags);
446 	sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
447 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
448 
449 	/* set up reference counting */
450 	kref_init(&ppd->sdma_state.kref);
451 	init_completion(&ppd->sdma_state.comp);
452 
453 	ppd->sdma_generation = 0;
454 	ppd->sdma_descq_head = 0;
455 	ppd->sdma_descq_removed = 0;
456 	ppd->sdma_descq_added = 0;
457 
458 	ppd->sdma_intrequest = 0;
459 	INIT_LIST_HEAD(&ppd->sdma_userpending);
460 
461 	INIT_LIST_HEAD(&ppd->sdma_activelist);
462 
463 	tasklet_init(&ppd->sdma_sw_clean_up_task, sdma_sw_clean_up_task,
464 		(unsigned long)ppd);
465 
466 	ret = dd->f_init_sdma_regs(ppd);
467 	if (ret)
468 		goto bail_alloc;
469 
470 	qib_sdma_process_event(ppd, qib_sdma_event_e10_go_hw_start);
471 
472 	return 0;
473 
474 bail_alloc:
475 	qib_teardown_sdma(ppd);
476 bail:
477 	return ret;
478 }
479 
qib_teardown_sdma(struct qib_pportdata * ppd)480 void qib_teardown_sdma(struct qib_pportdata *ppd)
481 {
482 	qib_sdma_process_event(ppd, qib_sdma_event_e00_go_hw_down);
483 
484 	/*
485 	 * This waits for the state machine to exit so it is not
486 	 * necessary to kill the sdma_sw_clean_up_task to make sure
487 	 * it is not running.
488 	 */
489 	sdma_finalput(&ppd->sdma_state);
490 
491 	free_sdma(ppd);
492 }
493 
qib_sdma_running(struct qib_pportdata * ppd)494 int qib_sdma_running(struct qib_pportdata *ppd)
495 {
496 	unsigned long flags;
497 	int ret;
498 
499 	spin_lock_irqsave(&ppd->sdma_lock, flags);
500 	ret = __qib_sdma_running(ppd);
501 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
502 
503 	return ret;
504 }
505 
506 /*
507  * Complete a request when sdma not running; likely only request
508  * but to simplify the code, always queue it, then process the full
509  * activelist.  We process the entire list to ensure that this particular
510  * request does get it's callback, but in the correct order.
511  * Must be called with sdma_lock held
512  */
complete_sdma_err_req(struct qib_pportdata * ppd,struct qib_verbs_txreq * tx)513 static void complete_sdma_err_req(struct qib_pportdata *ppd,
514 				  struct qib_verbs_txreq *tx)
515 {
516 	atomic_inc(&tx->qp->s_dma_busy);
517 	/* no sdma descriptors, so no unmap_desc */
518 	tx->txreq.start_idx = 0;
519 	tx->txreq.next_descq_idx = 0;
520 	list_add_tail(&tx->txreq.list, &ppd->sdma_activelist);
521 	clear_sdma_activelist(ppd);
522 }
523 
524 /*
525  * This function queues one IB packet onto the send DMA queue per call.
526  * The caller is responsible for checking:
527  * 1) The number of send DMA descriptor entries is less than the size of
528  *    the descriptor queue.
529  * 2) The IB SGE addresses and lengths are 32-bit aligned
530  *    (except possibly the last SGE's length)
531  * 3) The SGE addresses are suitable for passing to dma_map_single().
532  */
qib_sdma_verbs_send(struct qib_pportdata * ppd,struct qib_sge_state * ss,u32 dwords,struct qib_verbs_txreq * tx)533 int qib_sdma_verbs_send(struct qib_pportdata *ppd,
534 			struct qib_sge_state *ss, u32 dwords,
535 			struct qib_verbs_txreq *tx)
536 {
537 	unsigned long flags;
538 	struct qib_sge *sge;
539 	struct qib_qp *qp;
540 	int ret = 0;
541 	u16 tail;
542 	__le64 *descqp;
543 	u64 sdmadesc[2];
544 	u32 dwoffset;
545 	dma_addr_t addr;
546 
547 	spin_lock_irqsave(&ppd->sdma_lock, flags);
548 
549 retry:
550 	if (unlikely(!__qib_sdma_running(ppd))) {
551 		complete_sdma_err_req(ppd, tx);
552 		goto unlock;
553 	}
554 
555 	if (tx->txreq.sg_count > qib_sdma_descq_freecnt(ppd)) {
556 		if (qib_sdma_make_progress(ppd))
557 			goto retry;
558 		if (ppd->dd->flags & QIB_HAS_SDMA_TIMEOUT)
559 			ppd->dd->f_sdma_set_desc_cnt(ppd,
560 					ppd->sdma_descq_cnt / 2);
561 		goto busy;
562 	}
563 
564 	dwoffset = tx->hdr_dwords;
565 	make_sdma_desc(ppd, sdmadesc, (u64) tx->txreq.addr, dwoffset, 0);
566 
567 	sdmadesc[0] |= SDMA_DESC_FIRST;
568 	if (tx->txreq.flags & QIB_SDMA_TXREQ_F_USELARGEBUF)
569 		sdmadesc[0] |= SDMA_DESC_USE_LARGE_BUF;
570 
571 	/* write to the descq */
572 	tail = ppd->sdma_descq_tail;
573 	descqp = &ppd->sdma_descq[tail].qw[0];
574 	*descqp++ = cpu_to_le64(sdmadesc[0]);
575 	*descqp++ = cpu_to_le64(sdmadesc[1]);
576 
577 	/* increment the tail */
578 	if (++tail == ppd->sdma_descq_cnt) {
579 		tail = 0;
580 		descqp = &ppd->sdma_descq[0].qw[0];
581 		++ppd->sdma_generation;
582 	}
583 
584 	tx->txreq.start_idx = tail;
585 
586 	sge = &ss->sge;
587 	while (dwords) {
588 		u32 dw;
589 		u32 len;
590 
591 		len = dwords << 2;
592 		if (len > sge->length)
593 			len = sge->length;
594 		if (len > sge->sge_length)
595 			len = sge->sge_length;
596 		BUG_ON(len == 0);
597 		dw = (len + 3) >> 2;
598 		addr = dma_map_single(&ppd->dd->pcidev->dev, sge->vaddr,
599 				      dw << 2, DMA_TO_DEVICE);
600 		if (dma_mapping_error(&ppd->dd->pcidev->dev, addr)) {
601 			ret = -ENOMEM;
602 			goto unmap;
603 		}
604 		sdmadesc[0] = 0;
605 		make_sdma_desc(ppd, sdmadesc, (u64) addr, dw, dwoffset);
606 		/* SDmaUseLargeBuf has to be set in every descriptor */
607 		if (tx->txreq.flags & QIB_SDMA_TXREQ_F_USELARGEBUF)
608 			sdmadesc[0] |= SDMA_DESC_USE_LARGE_BUF;
609 		/* write to the descq */
610 		*descqp++ = cpu_to_le64(sdmadesc[0]);
611 		*descqp++ = cpu_to_le64(sdmadesc[1]);
612 
613 		/* increment the tail */
614 		if (++tail == ppd->sdma_descq_cnt) {
615 			tail = 0;
616 			descqp = &ppd->sdma_descq[0].qw[0];
617 			++ppd->sdma_generation;
618 		}
619 		sge->vaddr += len;
620 		sge->length -= len;
621 		sge->sge_length -= len;
622 		if (sge->sge_length == 0) {
623 			if (--ss->num_sge)
624 				*sge = *ss->sg_list++;
625 		} else if (sge->length == 0 && sge->mr->lkey) {
626 			if (++sge->n >= QIB_SEGSZ) {
627 				if (++sge->m >= sge->mr->mapsz)
628 					break;
629 				sge->n = 0;
630 			}
631 			sge->vaddr =
632 				sge->mr->map[sge->m]->segs[sge->n].vaddr;
633 			sge->length =
634 				sge->mr->map[sge->m]->segs[sge->n].length;
635 		}
636 
637 		dwoffset += dw;
638 		dwords -= dw;
639 	}
640 
641 	if (!tail)
642 		descqp = &ppd->sdma_descq[ppd->sdma_descq_cnt].qw[0];
643 	descqp -= 2;
644 	descqp[0] |= cpu_to_le64(SDMA_DESC_LAST);
645 	if (tx->txreq.flags & QIB_SDMA_TXREQ_F_HEADTOHOST)
646 		descqp[0] |= cpu_to_le64(SDMA_DESC_DMA_HEAD);
647 	if (tx->txreq.flags & QIB_SDMA_TXREQ_F_INTREQ)
648 		descqp[0] |= cpu_to_le64(SDMA_DESC_INTR);
649 
650 	atomic_inc(&tx->qp->s_dma_busy);
651 	tx->txreq.next_descq_idx = tail;
652 	ppd->dd->f_sdma_update_tail(ppd, tail);
653 	ppd->sdma_descq_added += tx->txreq.sg_count;
654 	list_add_tail(&tx->txreq.list, &ppd->sdma_activelist);
655 	goto unlock;
656 
657 unmap:
658 	for (;;) {
659 		if (!tail)
660 			tail = ppd->sdma_descq_cnt - 1;
661 		else
662 			tail--;
663 		if (tail == ppd->sdma_descq_tail)
664 			break;
665 		unmap_desc(ppd, tail);
666 	}
667 	qp = tx->qp;
668 	qib_put_txreq(tx);
669 	spin_lock(&qp->r_lock);
670 	spin_lock(&qp->s_lock);
671 	if (qp->ibqp.qp_type == IB_QPT_RC) {
672 		/* XXX what about error sending RDMA read responses? */
673 		if (ib_qib_state_ops[qp->state] & QIB_PROCESS_RECV_OK)
674 			qib_error_qp(qp, IB_WC_GENERAL_ERR);
675 	} else if (qp->s_wqe)
676 		qib_send_complete(qp, qp->s_wqe, IB_WC_GENERAL_ERR);
677 	spin_unlock(&qp->s_lock);
678 	spin_unlock(&qp->r_lock);
679 	/* return zero to process the next send work request */
680 	goto unlock;
681 
682 busy:
683 	qp = tx->qp;
684 	spin_lock(&qp->s_lock);
685 	if (ib_qib_state_ops[qp->state] & QIB_PROCESS_RECV_OK) {
686 		struct qib_ibdev *dev;
687 
688 		/*
689 		 * If we couldn't queue the DMA request, save the info
690 		 * and try again later rather than destroying the
691 		 * buffer and undoing the side effects of the copy.
692 		 */
693 		tx->ss = ss;
694 		tx->dwords = dwords;
695 		qp->s_tx = tx;
696 		dev = &ppd->dd->verbs_dev;
697 		spin_lock(&dev->pending_lock);
698 		if (list_empty(&qp->iowait)) {
699 			struct qib_ibport *ibp;
700 
701 			ibp = &ppd->ibport_data;
702 			ibp->n_dmawait++;
703 			qp->s_flags |= QIB_S_WAIT_DMA_DESC;
704 			list_add_tail(&qp->iowait, &dev->dmawait);
705 		}
706 		spin_unlock(&dev->pending_lock);
707 		qp->s_flags &= ~QIB_S_BUSY;
708 		spin_unlock(&qp->s_lock);
709 		ret = -EBUSY;
710 	} else {
711 		spin_unlock(&qp->s_lock);
712 		qib_put_txreq(tx);
713 	}
714 unlock:
715 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
716 	return ret;
717 }
718 
719 /*
720  * sdma_lock should be acquired before calling this routine
721  */
dump_sdma_state(struct qib_pportdata * ppd)722 void dump_sdma_state(struct qib_pportdata *ppd)
723 {
724 	struct qib_sdma_desc *descq;
725 	struct qib_sdma_txreq *txp, *txpnext;
726 	__le64 *descqp;
727 	u64 desc[2];
728 	u64 addr;
729 	u16 gen, dwlen, dwoffset;
730 	u16 head, tail, cnt;
731 
732 	head = ppd->sdma_descq_head;
733 	tail = ppd->sdma_descq_tail;
734 	cnt = qib_sdma_descq_freecnt(ppd);
735 	descq = ppd->sdma_descq;
736 
737 	qib_dev_porterr(ppd->dd, ppd->port,
738 		"SDMA ppd->sdma_descq_head: %u\n", head);
739 	qib_dev_porterr(ppd->dd, ppd->port,
740 		"SDMA ppd->sdma_descq_tail: %u\n", tail);
741 	qib_dev_porterr(ppd->dd, ppd->port,
742 		"SDMA sdma_descq_freecnt: %u\n", cnt);
743 
744 	/* print info for each entry in the descriptor queue */
745 	while (head != tail) {
746 		char flags[6] = { 'x', 'x', 'x', 'x', 'x', 0 };
747 
748 		descqp = &descq[head].qw[0];
749 		desc[0] = le64_to_cpu(descqp[0]);
750 		desc[1] = le64_to_cpu(descqp[1]);
751 		flags[0] = (desc[0] & 1<<15) ? 'I' : '-';
752 		flags[1] = (desc[0] & 1<<14) ? 'L' : 'S';
753 		flags[2] = (desc[0] & 1<<13) ? 'H' : '-';
754 		flags[3] = (desc[0] & 1<<12) ? 'F' : '-';
755 		flags[4] = (desc[0] & 1<<11) ? 'L' : '-';
756 		addr = (desc[1] << 32) | ((desc[0] >> 32) & 0xfffffffcULL);
757 		gen = (desc[0] >> 30) & 3ULL;
758 		dwlen = (desc[0] >> 14) & (0x7ffULL << 2);
759 		dwoffset = (desc[0] & 0x7ffULL) << 2;
760 		qib_dev_porterr(ppd->dd, ppd->port,
761 			"SDMA sdmadesc[%u]: flags:%s addr:0x%016llx gen:%u len:%u bytes offset:%u bytes\n",
762 			 head, flags, addr, gen, dwlen, dwoffset);
763 		if (++head == ppd->sdma_descq_cnt)
764 			head = 0;
765 	}
766 
767 	/* print dma descriptor indices from the TX requests */
768 	list_for_each_entry_safe(txp, txpnext, &ppd->sdma_activelist,
769 				 list)
770 		qib_dev_porterr(ppd->dd, ppd->port,
771 			"SDMA txp->start_idx: %u txp->next_descq_idx: %u\n",
772 			txp->start_idx, txp->next_descq_idx);
773 }
774 
qib_sdma_process_event(struct qib_pportdata * ppd,enum qib_sdma_events event)775 void qib_sdma_process_event(struct qib_pportdata *ppd,
776 	enum qib_sdma_events event)
777 {
778 	unsigned long flags;
779 
780 	spin_lock_irqsave(&ppd->sdma_lock, flags);
781 
782 	__qib_sdma_process_event(ppd, event);
783 
784 	if (ppd->sdma_state.current_state == qib_sdma_state_s99_running)
785 		qib_verbs_sdma_desc_avail(ppd, qib_sdma_descq_freecnt(ppd));
786 
787 	spin_unlock_irqrestore(&ppd->sdma_lock, flags);
788 }
789 
__qib_sdma_process_event(struct qib_pportdata * ppd,enum qib_sdma_events event)790 void __qib_sdma_process_event(struct qib_pportdata *ppd,
791 	enum qib_sdma_events event)
792 {
793 	struct qib_sdma_state *ss = &ppd->sdma_state;
794 
795 	switch (ss->current_state) {
796 	case qib_sdma_state_s00_hw_down:
797 		switch (event) {
798 		case qib_sdma_event_e00_go_hw_down:
799 			break;
800 		case qib_sdma_event_e30_go_running:
801 			/*
802 			 * If down, but running requested (usually result
803 			 * of link up, then we need to start up.
804 			 * This can happen when hw down is requested while
805 			 * bringing the link up with traffic active on
806 			 * 7220, e.g. */
807 			ss->go_s99_running = 1;
808 			/* fall through and start dma engine */
809 		case qib_sdma_event_e10_go_hw_start:
810 			/* This reference means the state machine is started */
811 			sdma_get(&ppd->sdma_state);
812 			sdma_set_state(ppd,
813 				       qib_sdma_state_s10_hw_start_up_wait);
814 			break;
815 		case qib_sdma_event_e20_hw_started:
816 			break;
817 		case qib_sdma_event_e40_sw_cleaned:
818 			sdma_sw_tear_down(ppd);
819 			break;
820 		case qib_sdma_event_e50_hw_cleaned:
821 			break;
822 		case qib_sdma_event_e60_hw_halted:
823 			break;
824 		case qib_sdma_event_e70_go_idle:
825 			break;
826 		case qib_sdma_event_e7220_err_halted:
827 			break;
828 		case qib_sdma_event_e7322_err_halted:
829 			break;
830 		case qib_sdma_event_e90_timer_tick:
831 			break;
832 		}
833 		break;
834 
835 	case qib_sdma_state_s10_hw_start_up_wait:
836 		switch (event) {
837 		case qib_sdma_event_e00_go_hw_down:
838 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
839 			sdma_sw_tear_down(ppd);
840 			break;
841 		case qib_sdma_event_e10_go_hw_start:
842 			break;
843 		case qib_sdma_event_e20_hw_started:
844 			sdma_set_state(ppd, ss->go_s99_running ?
845 				       qib_sdma_state_s99_running :
846 				       qib_sdma_state_s20_idle);
847 			break;
848 		case qib_sdma_event_e30_go_running:
849 			ss->go_s99_running = 1;
850 			break;
851 		case qib_sdma_event_e40_sw_cleaned:
852 			break;
853 		case qib_sdma_event_e50_hw_cleaned:
854 			break;
855 		case qib_sdma_event_e60_hw_halted:
856 			break;
857 		case qib_sdma_event_e70_go_idle:
858 			ss->go_s99_running = 0;
859 			break;
860 		case qib_sdma_event_e7220_err_halted:
861 			break;
862 		case qib_sdma_event_e7322_err_halted:
863 			break;
864 		case qib_sdma_event_e90_timer_tick:
865 			break;
866 		}
867 		break;
868 
869 	case qib_sdma_state_s20_idle:
870 		switch (event) {
871 		case qib_sdma_event_e00_go_hw_down:
872 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
873 			sdma_sw_tear_down(ppd);
874 			break;
875 		case qib_sdma_event_e10_go_hw_start:
876 			break;
877 		case qib_sdma_event_e20_hw_started:
878 			break;
879 		case qib_sdma_event_e30_go_running:
880 			sdma_set_state(ppd, qib_sdma_state_s99_running);
881 			ss->go_s99_running = 1;
882 			break;
883 		case qib_sdma_event_e40_sw_cleaned:
884 			break;
885 		case qib_sdma_event_e50_hw_cleaned:
886 			break;
887 		case qib_sdma_event_e60_hw_halted:
888 			break;
889 		case qib_sdma_event_e70_go_idle:
890 			break;
891 		case qib_sdma_event_e7220_err_halted:
892 			break;
893 		case qib_sdma_event_e7322_err_halted:
894 			break;
895 		case qib_sdma_event_e90_timer_tick:
896 			break;
897 		}
898 		break;
899 
900 	case qib_sdma_state_s30_sw_clean_up_wait:
901 		switch (event) {
902 		case qib_sdma_event_e00_go_hw_down:
903 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
904 			break;
905 		case qib_sdma_event_e10_go_hw_start:
906 			break;
907 		case qib_sdma_event_e20_hw_started:
908 			break;
909 		case qib_sdma_event_e30_go_running:
910 			ss->go_s99_running = 1;
911 			break;
912 		case qib_sdma_event_e40_sw_cleaned:
913 			sdma_set_state(ppd,
914 				       qib_sdma_state_s10_hw_start_up_wait);
915 			sdma_hw_start_up(ppd);
916 			break;
917 		case qib_sdma_event_e50_hw_cleaned:
918 			break;
919 		case qib_sdma_event_e60_hw_halted:
920 			break;
921 		case qib_sdma_event_e70_go_idle:
922 			ss->go_s99_running = 0;
923 			break;
924 		case qib_sdma_event_e7220_err_halted:
925 			break;
926 		case qib_sdma_event_e7322_err_halted:
927 			break;
928 		case qib_sdma_event_e90_timer_tick:
929 			break;
930 		}
931 		break;
932 
933 	case qib_sdma_state_s40_hw_clean_up_wait:
934 		switch (event) {
935 		case qib_sdma_event_e00_go_hw_down:
936 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
937 			sdma_start_sw_clean_up(ppd);
938 			break;
939 		case qib_sdma_event_e10_go_hw_start:
940 			break;
941 		case qib_sdma_event_e20_hw_started:
942 			break;
943 		case qib_sdma_event_e30_go_running:
944 			ss->go_s99_running = 1;
945 			break;
946 		case qib_sdma_event_e40_sw_cleaned:
947 			break;
948 		case qib_sdma_event_e50_hw_cleaned:
949 			sdma_set_state(ppd,
950 				       qib_sdma_state_s30_sw_clean_up_wait);
951 			sdma_start_sw_clean_up(ppd);
952 			break;
953 		case qib_sdma_event_e60_hw_halted:
954 			break;
955 		case qib_sdma_event_e70_go_idle:
956 			ss->go_s99_running = 0;
957 			break;
958 		case qib_sdma_event_e7220_err_halted:
959 			break;
960 		case qib_sdma_event_e7322_err_halted:
961 			break;
962 		case qib_sdma_event_e90_timer_tick:
963 			break;
964 		}
965 		break;
966 
967 	case qib_sdma_state_s50_hw_halt_wait:
968 		switch (event) {
969 		case qib_sdma_event_e00_go_hw_down:
970 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
971 			sdma_start_sw_clean_up(ppd);
972 			break;
973 		case qib_sdma_event_e10_go_hw_start:
974 			break;
975 		case qib_sdma_event_e20_hw_started:
976 			break;
977 		case qib_sdma_event_e30_go_running:
978 			ss->go_s99_running = 1;
979 			break;
980 		case qib_sdma_event_e40_sw_cleaned:
981 			break;
982 		case qib_sdma_event_e50_hw_cleaned:
983 			break;
984 		case qib_sdma_event_e60_hw_halted:
985 			sdma_set_state(ppd,
986 				       qib_sdma_state_s40_hw_clean_up_wait);
987 			ppd->dd->f_sdma_hw_clean_up(ppd);
988 			break;
989 		case qib_sdma_event_e70_go_idle:
990 			ss->go_s99_running = 0;
991 			break;
992 		case qib_sdma_event_e7220_err_halted:
993 			break;
994 		case qib_sdma_event_e7322_err_halted:
995 			break;
996 		case qib_sdma_event_e90_timer_tick:
997 			break;
998 		}
999 		break;
1000 
1001 	case qib_sdma_state_s99_running:
1002 		switch (event) {
1003 		case qib_sdma_event_e00_go_hw_down:
1004 			sdma_set_state(ppd, qib_sdma_state_s00_hw_down);
1005 			sdma_start_sw_clean_up(ppd);
1006 			break;
1007 		case qib_sdma_event_e10_go_hw_start:
1008 			break;
1009 		case qib_sdma_event_e20_hw_started:
1010 			break;
1011 		case qib_sdma_event_e30_go_running:
1012 			break;
1013 		case qib_sdma_event_e40_sw_cleaned:
1014 			break;
1015 		case qib_sdma_event_e50_hw_cleaned:
1016 			break;
1017 		case qib_sdma_event_e60_hw_halted:
1018 			sdma_set_state(ppd,
1019 				       qib_sdma_state_s30_sw_clean_up_wait);
1020 			sdma_start_sw_clean_up(ppd);
1021 			break;
1022 		case qib_sdma_event_e70_go_idle:
1023 			sdma_set_state(ppd, qib_sdma_state_s50_hw_halt_wait);
1024 			ss->go_s99_running = 0;
1025 			break;
1026 		case qib_sdma_event_e7220_err_halted:
1027 			sdma_set_state(ppd,
1028 				       qib_sdma_state_s30_sw_clean_up_wait);
1029 			sdma_start_sw_clean_up(ppd);
1030 			break;
1031 		case qib_sdma_event_e7322_err_halted:
1032 			sdma_set_state(ppd, qib_sdma_state_s50_hw_halt_wait);
1033 			break;
1034 		case qib_sdma_event_e90_timer_tick:
1035 			break;
1036 		}
1037 		break;
1038 	}
1039 
1040 	ss->last_event = event;
1041 }
1042