1 /*
2 * linux/drivers/misc/xillybus_core.c
3 *
4 * Copyright 2011 Xillybus Ltd, http://xillybus.com
5 *
6 * Driver for the Xillybus FPGA/host framework.
7 *
8 * This driver interfaces with a special IP core in an FPGA, setting up
9 * a pipe between a hardware FIFO in the programmable logic and a device
10 * file in the host. The number of such pipes and their attributes are
11 * set up on the logic. This driver detects these automatically and
12 * creates the device files accordingly.
13 *
14 * This program is free software; you can redistribute it and/or modify
15 * it under the smems of the GNU General Public License as published by
16 * the Free Software Foundation; version 2 of the License.
17 */
18
19 #include <linux/list.h>
20 #include <linux/device.h>
21 #include <linux/module.h>
22 #include <linux/io.h>
23 #include <linux/dma-mapping.h>
24 #include <linux/interrupt.h>
25 #include <linux/sched.h>
26 #include <linux/fs.h>
27 #include <linux/cdev.h>
28 #include <linux/spinlock.h>
29 #include <linux/mutex.h>
30 #include <linux/crc32.h>
31 #include <linux/poll.h>
32 #include <linux/delay.h>
33 #include <linux/slab.h>
34 #include <linux/workqueue.h>
35 #include "xillybus.h"
36
37 MODULE_DESCRIPTION("Xillybus core functions");
38 MODULE_AUTHOR("Eli Billauer, Xillybus Ltd.");
39 MODULE_VERSION("1.07");
40 MODULE_ALIAS("xillybus_core");
41 MODULE_LICENSE("GPL v2");
42
43 /* General timeout is 100 ms, rx timeout is 10 ms */
44 #define XILLY_RX_TIMEOUT (10*HZ/1000)
45 #define XILLY_TIMEOUT (100*HZ/1000)
46
47 #define fpga_msg_ctrl_reg 0x0008
48 #define fpga_dma_control_reg 0x0020
49 #define fpga_dma_bufno_reg 0x0024
50 #define fpga_dma_bufaddr_lowaddr_reg 0x0028
51 #define fpga_dma_bufaddr_highaddr_reg 0x002c
52 #define fpga_buf_ctrl_reg 0x0030
53 #define fpga_buf_offset_reg 0x0034
54 #define fpga_endian_reg 0x0040
55
56 #define XILLYMSG_OPCODE_RELEASEBUF 1
57 #define XILLYMSG_OPCODE_QUIESCEACK 2
58 #define XILLYMSG_OPCODE_FIFOEOF 3
59 #define XILLYMSG_OPCODE_FATAL_ERROR 4
60 #define XILLYMSG_OPCODE_NONEMPTY 5
61
62 static const char xillyname[] = "xillybus";
63
64 static struct class *xillybus_class;
65
66 /*
67 * ep_list_lock is the last lock to be taken; No other lock requests are
68 * allowed while holding it. It merely protects list_of_endpoints, and not
69 * the endpoints listed in it.
70 */
71
72 static LIST_HEAD(list_of_endpoints);
73 static struct mutex ep_list_lock;
74 static struct workqueue_struct *xillybus_wq;
75
76 /*
77 * Locking scheme: Mutexes protect invocations of character device methods.
78 * If both locks are taken, wr_mutex is taken first, rd_mutex second.
79 *
80 * wr_spinlock protects wr_*_buf_idx, wr_empty, wr_sleepy, wr_ready and the
81 * buffers' end_offset fields against changes made by IRQ handler (and in
82 * theory, other file request handlers, but the mutex handles that). Nothing
83 * else.
84 * They are held for short direct memory manipulations. Needless to say,
85 * no mutex locking is allowed when a spinlock is held.
86 *
87 * rd_spinlock does the same with rd_*_buf_idx, rd_empty and end_offset.
88 *
89 * register_mutex is endpoint-specific, and is held when non-atomic
90 * register operations are performed. wr_mutex and rd_mutex may be
91 * held when register_mutex is taken, but none of the spinlocks. Note that
92 * register_mutex doesn't protect against sporadic buf_ctrl_reg writes
93 * which are unrelated to buf_offset_reg, since they are harmless.
94 *
95 * Blocking on the wait queues is allowed with mutexes held, but not with
96 * spinlocks.
97 *
98 * Only interruptible blocking is allowed on mutexes and wait queues.
99 *
100 * All in all, the locking order goes (with skips allowed, of course):
101 * wr_mutex -> rd_mutex -> register_mutex -> wr_spinlock -> rd_spinlock
102 */
103
malformed_message(struct xilly_endpoint * endpoint,u32 * buf)104 static void malformed_message(struct xilly_endpoint *endpoint, u32 *buf)
105 {
106 int opcode;
107 int msg_channel, msg_bufno, msg_data, msg_dir;
108
109 opcode = (buf[0] >> 24) & 0xff;
110 msg_dir = buf[0] & 1;
111 msg_channel = (buf[0] >> 1) & 0x7ff;
112 msg_bufno = (buf[0] >> 12) & 0x3ff;
113 msg_data = buf[1] & 0xfffffff;
114
115 dev_warn(endpoint->dev,
116 "Malformed message (skipping): opcode=%d, channel=%03x, dir=%d, bufno=%03x, data=%07x\n",
117 opcode, msg_channel, msg_dir, msg_bufno, msg_data);
118 }
119
120 /*
121 * xillybus_isr assumes the interrupt is allocated exclusively to it,
122 * which is the natural case MSI and several other hardware-oriented
123 * interrupts. Sharing is not allowed.
124 */
125
xillybus_isr(int irq,void * data)126 irqreturn_t xillybus_isr(int irq, void *data)
127 {
128 struct xilly_endpoint *ep = data;
129 u32 *buf;
130 unsigned int buf_size;
131 int i;
132 int opcode;
133 unsigned int msg_channel, msg_bufno, msg_data, msg_dir;
134 struct xilly_channel *channel;
135
136 buf = ep->msgbuf_addr;
137 buf_size = ep->msg_buf_size/sizeof(u32);
138
139 ep->ephw->hw_sync_sgl_for_cpu(ep,
140 ep->msgbuf_dma_addr,
141 ep->msg_buf_size,
142 DMA_FROM_DEVICE);
143
144 for (i = 0; i < buf_size; i += 2) {
145 if (((buf[i+1] >> 28) & 0xf) != ep->msg_counter) {
146 malformed_message(ep, &buf[i]);
147 dev_warn(ep->dev,
148 "Sending a NACK on counter %x (instead of %x) on entry %d\n",
149 ((buf[i+1] >> 28) & 0xf),
150 ep->msg_counter,
151 i/2);
152
153 if (++ep->failed_messages > 10) {
154 dev_err(ep->dev,
155 "Lost sync with interrupt messages. Stopping.\n");
156 } else {
157 ep->ephw->hw_sync_sgl_for_device(
158 ep,
159 ep->msgbuf_dma_addr,
160 ep->msg_buf_size,
161 DMA_FROM_DEVICE);
162
163 iowrite32(0x01, /* Message NACK */
164 ep->registers + fpga_msg_ctrl_reg);
165 }
166 return IRQ_HANDLED;
167 } else if (buf[i] & (1 << 22)) /* Last message */
168 break;
169 }
170
171 if (i >= buf_size) {
172 dev_err(ep->dev, "Bad interrupt message. Stopping.\n");
173 return IRQ_HANDLED;
174 }
175
176 buf_size = i + 2;
177
178 for (i = 0; i < buf_size; i += 2) { /* Scan through messages */
179 opcode = (buf[i] >> 24) & 0xff;
180
181 msg_dir = buf[i] & 1;
182 msg_channel = (buf[i] >> 1) & 0x7ff;
183 msg_bufno = (buf[i] >> 12) & 0x3ff;
184 msg_data = buf[i+1] & 0xfffffff;
185
186 switch (opcode) {
187 case XILLYMSG_OPCODE_RELEASEBUF:
188 if ((msg_channel > ep->num_channels) ||
189 (msg_channel == 0)) {
190 malformed_message(ep, &buf[i]);
191 break;
192 }
193
194 channel = ep->channels[msg_channel];
195
196 if (msg_dir) { /* Write channel */
197 if (msg_bufno >= channel->num_wr_buffers) {
198 malformed_message(ep, &buf[i]);
199 break;
200 }
201 spin_lock(&channel->wr_spinlock);
202 channel->wr_buffers[msg_bufno]->end_offset =
203 msg_data;
204 channel->wr_fpga_buf_idx = msg_bufno;
205 channel->wr_empty = 0;
206 channel->wr_sleepy = 0;
207 spin_unlock(&channel->wr_spinlock);
208
209 wake_up_interruptible(&channel->wr_wait);
210
211 } else {
212 /* Read channel */
213
214 if (msg_bufno >= channel->num_rd_buffers) {
215 malformed_message(ep, &buf[i]);
216 break;
217 }
218
219 spin_lock(&channel->rd_spinlock);
220 channel->rd_fpga_buf_idx = msg_bufno;
221 channel->rd_full = 0;
222 spin_unlock(&channel->rd_spinlock);
223
224 wake_up_interruptible(&channel->rd_wait);
225 if (!channel->rd_synchronous)
226 queue_delayed_work(
227 xillybus_wq,
228 &channel->rd_workitem,
229 XILLY_RX_TIMEOUT);
230 }
231
232 break;
233 case XILLYMSG_OPCODE_NONEMPTY:
234 if ((msg_channel > ep->num_channels) ||
235 (msg_channel == 0) || (!msg_dir) ||
236 !ep->channels[msg_channel]->wr_supports_nonempty) {
237 malformed_message(ep, &buf[i]);
238 break;
239 }
240
241 channel = ep->channels[msg_channel];
242
243 if (msg_bufno >= channel->num_wr_buffers) {
244 malformed_message(ep, &buf[i]);
245 break;
246 }
247 spin_lock(&channel->wr_spinlock);
248 if (msg_bufno == channel->wr_host_buf_idx)
249 channel->wr_ready = 1;
250 spin_unlock(&channel->wr_spinlock);
251
252 wake_up_interruptible(&channel->wr_ready_wait);
253
254 break;
255 case XILLYMSG_OPCODE_QUIESCEACK:
256 ep->idtlen = msg_data;
257 wake_up_interruptible(&ep->ep_wait);
258
259 break;
260 case XILLYMSG_OPCODE_FIFOEOF:
261 if ((msg_channel > ep->num_channels) ||
262 (msg_channel == 0) || (!msg_dir) ||
263 !ep->channels[msg_channel]->num_wr_buffers) {
264 malformed_message(ep, &buf[i]);
265 break;
266 }
267 channel = ep->channels[msg_channel];
268 spin_lock(&channel->wr_spinlock);
269 channel->wr_eof = msg_bufno;
270 channel->wr_sleepy = 0;
271
272 channel->wr_hangup = channel->wr_empty &&
273 (channel->wr_host_buf_idx == msg_bufno);
274
275 spin_unlock(&channel->wr_spinlock);
276
277 wake_up_interruptible(&channel->wr_wait);
278
279 break;
280 case XILLYMSG_OPCODE_FATAL_ERROR:
281 ep->fatal_error = 1;
282 wake_up_interruptible(&ep->ep_wait); /* For select() */
283 dev_err(ep->dev,
284 "FPGA reported a fatal error. This means that the low-level communication with the device has failed. This hardware problem is most likely unrelated to Xillybus (neither kernel module nor FPGA core), but reports are still welcome. All I/O is aborted.\n");
285 break;
286 default:
287 malformed_message(ep, &buf[i]);
288 break;
289 }
290 }
291
292 ep->ephw->hw_sync_sgl_for_device(ep,
293 ep->msgbuf_dma_addr,
294 ep->msg_buf_size,
295 DMA_FROM_DEVICE);
296
297 ep->msg_counter = (ep->msg_counter + 1) & 0xf;
298 ep->failed_messages = 0;
299 iowrite32(0x03, ep->registers + fpga_msg_ctrl_reg); /* Message ACK */
300
301 return IRQ_HANDLED;
302 }
303 EXPORT_SYMBOL(xillybus_isr);
304
305 /*
306 * A few trivial memory management functions.
307 * NOTE: These functions are used only on probe and remove, and therefore
308 * no locks are applied!
309 */
310
311 static void xillybus_autoflush(struct work_struct *work);
312
313 struct xilly_alloc_state {
314 void *salami;
315 int left_of_salami;
316 int nbuffer;
317 enum dma_data_direction direction;
318 u32 regdirection;
319 };
320
xilly_get_dma_buffers(struct xilly_endpoint * ep,struct xilly_alloc_state * s,struct xilly_buffer ** buffers,int bufnum,int bytebufsize)321 static int xilly_get_dma_buffers(struct xilly_endpoint *ep,
322 struct xilly_alloc_state *s,
323 struct xilly_buffer **buffers,
324 int bufnum, int bytebufsize)
325 {
326 int i, rc;
327 dma_addr_t dma_addr;
328 struct device *dev = ep->dev;
329 struct xilly_buffer *this_buffer = NULL; /* Init to silence warning */
330
331 if (buffers) { /* Not the message buffer */
332 this_buffer = devm_kcalloc(dev, bufnum,
333 sizeof(struct xilly_buffer),
334 GFP_KERNEL);
335 if (!this_buffer)
336 return -ENOMEM;
337 }
338
339 for (i = 0; i < bufnum; i++) {
340 /*
341 * Buffers are expected in descending size order, so there
342 * is either enough space for this buffer or none at all.
343 */
344
345 if ((s->left_of_salami < bytebufsize) &&
346 (s->left_of_salami > 0)) {
347 dev_err(ep->dev,
348 "Corrupt buffer allocation in IDT. Aborting.\n");
349 return -ENODEV;
350 }
351
352 if (s->left_of_salami == 0) {
353 int allocorder, allocsize;
354
355 allocsize = PAGE_SIZE;
356 allocorder = 0;
357 while (bytebufsize > allocsize) {
358 allocsize *= 2;
359 allocorder++;
360 }
361
362 s->salami = (void *) devm_get_free_pages(
363 dev,
364 GFP_KERNEL | __GFP_DMA32 | __GFP_ZERO,
365 allocorder);
366 if (!s->salami)
367 return -ENOMEM;
368
369 s->left_of_salami = allocsize;
370 }
371
372 rc = ep->ephw->map_single(ep, s->salami,
373 bytebufsize, s->direction,
374 &dma_addr);
375 if (rc)
376 return rc;
377
378 iowrite32((u32) (dma_addr & 0xffffffff),
379 ep->registers + fpga_dma_bufaddr_lowaddr_reg);
380 iowrite32(((u32) ((((u64) dma_addr) >> 32) & 0xffffffff)),
381 ep->registers + fpga_dma_bufaddr_highaddr_reg);
382
383 if (buffers) { /* Not the message buffer */
384 this_buffer->addr = s->salami;
385 this_buffer->dma_addr = dma_addr;
386 buffers[i] = this_buffer++;
387
388 iowrite32(s->regdirection | s->nbuffer++,
389 ep->registers + fpga_dma_bufno_reg);
390 } else {
391 ep->msgbuf_addr = s->salami;
392 ep->msgbuf_dma_addr = dma_addr;
393 ep->msg_buf_size = bytebufsize;
394
395 iowrite32(s->regdirection,
396 ep->registers + fpga_dma_bufno_reg);
397 }
398
399 s->left_of_salami -= bytebufsize;
400 s->salami += bytebufsize;
401 }
402 return 0;
403 }
404
xilly_setupchannels(struct xilly_endpoint * ep,unsigned char * chandesc,int entries)405 static int xilly_setupchannels(struct xilly_endpoint *ep,
406 unsigned char *chandesc,
407 int entries)
408 {
409 struct device *dev = ep->dev;
410 int i, entry, rc;
411 struct xilly_channel *channel;
412 int channelnum, bufnum, bufsize, format, is_writebuf;
413 int bytebufsize;
414 int synchronous, allowpartial, exclusive_open, seekable;
415 int supports_nonempty;
416 int msg_buf_done = 0;
417
418 struct xilly_alloc_state rd_alloc = {
419 .salami = NULL,
420 .left_of_salami = 0,
421 .nbuffer = 1,
422 .direction = DMA_TO_DEVICE,
423 .regdirection = 0,
424 };
425
426 struct xilly_alloc_state wr_alloc = {
427 .salami = NULL,
428 .left_of_salami = 0,
429 .nbuffer = 1,
430 .direction = DMA_FROM_DEVICE,
431 .regdirection = 0x80000000,
432 };
433
434 channel = devm_kcalloc(dev, ep->num_channels,
435 sizeof(struct xilly_channel), GFP_KERNEL);
436 if (!channel)
437 return -ENOMEM;
438
439 ep->channels = devm_kcalloc(dev, ep->num_channels + 1,
440 sizeof(struct xilly_channel *),
441 GFP_KERNEL);
442 if (!ep->channels)
443 return -ENOMEM;
444
445 ep->channels[0] = NULL; /* Channel 0 is message buf. */
446
447 /* Initialize all channels with defaults */
448
449 for (i = 1; i <= ep->num_channels; i++) {
450 channel->wr_buffers = NULL;
451 channel->rd_buffers = NULL;
452 channel->num_wr_buffers = 0;
453 channel->num_rd_buffers = 0;
454 channel->wr_fpga_buf_idx = -1;
455 channel->wr_host_buf_idx = 0;
456 channel->wr_host_buf_pos = 0;
457 channel->wr_empty = 1;
458 channel->wr_ready = 0;
459 channel->wr_sleepy = 1;
460 channel->rd_fpga_buf_idx = 0;
461 channel->rd_host_buf_idx = 0;
462 channel->rd_host_buf_pos = 0;
463 channel->rd_full = 0;
464 channel->wr_ref_count = 0;
465 channel->rd_ref_count = 0;
466
467 spin_lock_init(&channel->wr_spinlock);
468 spin_lock_init(&channel->rd_spinlock);
469 mutex_init(&channel->wr_mutex);
470 mutex_init(&channel->rd_mutex);
471 init_waitqueue_head(&channel->rd_wait);
472 init_waitqueue_head(&channel->wr_wait);
473 init_waitqueue_head(&channel->wr_ready_wait);
474
475 INIT_DELAYED_WORK(&channel->rd_workitem, xillybus_autoflush);
476
477 channel->endpoint = ep;
478 channel->chan_num = i;
479
480 channel->log2_element_size = 0;
481
482 ep->channels[i] = channel++;
483 }
484
485 for (entry = 0; entry < entries; entry++, chandesc += 4) {
486 struct xilly_buffer **buffers = NULL;
487
488 is_writebuf = chandesc[0] & 0x01;
489 channelnum = (chandesc[0] >> 1) | ((chandesc[1] & 0x0f) << 7);
490 format = (chandesc[1] >> 4) & 0x03;
491 allowpartial = (chandesc[1] >> 6) & 0x01;
492 synchronous = (chandesc[1] >> 7) & 0x01;
493 bufsize = 1 << (chandesc[2] & 0x1f);
494 bufnum = 1 << (chandesc[3] & 0x0f);
495 exclusive_open = (chandesc[2] >> 7) & 0x01;
496 seekable = (chandesc[2] >> 6) & 0x01;
497 supports_nonempty = (chandesc[2] >> 5) & 0x01;
498
499 if ((channelnum > ep->num_channels) ||
500 ((channelnum == 0) && !is_writebuf)) {
501 dev_err(ep->dev,
502 "IDT requests channel out of range. Aborting.\n");
503 return -ENODEV;
504 }
505
506 channel = ep->channels[channelnum]; /* NULL for msg channel */
507
508 if (!is_writebuf || channelnum > 0) {
509 channel->log2_element_size = ((format > 2) ?
510 2 : format);
511
512 bytebufsize = channel->rd_buf_size = bufsize *
513 (1 << channel->log2_element_size);
514
515 buffers = devm_kcalloc(dev, bufnum,
516 sizeof(struct xilly_buffer *),
517 GFP_KERNEL);
518 if (!buffers)
519 return -ENOMEM;
520 } else {
521 bytebufsize = bufsize << 2;
522 }
523
524 if (!is_writebuf) {
525 channel->num_rd_buffers = bufnum;
526 channel->rd_allow_partial = allowpartial;
527 channel->rd_synchronous = synchronous;
528 channel->rd_exclusive_open = exclusive_open;
529 channel->seekable = seekable;
530
531 channel->rd_buffers = buffers;
532 rc = xilly_get_dma_buffers(ep, &rd_alloc, buffers,
533 bufnum, bytebufsize);
534 } else if (channelnum > 0) {
535 channel->num_wr_buffers = bufnum;
536
537 channel->seekable = seekable;
538 channel->wr_supports_nonempty = supports_nonempty;
539
540 channel->wr_allow_partial = allowpartial;
541 channel->wr_synchronous = synchronous;
542 channel->wr_exclusive_open = exclusive_open;
543
544 channel->wr_buffers = buffers;
545 rc = xilly_get_dma_buffers(ep, &wr_alloc, buffers,
546 bufnum, bytebufsize);
547 } else {
548 rc = xilly_get_dma_buffers(ep, &wr_alloc, NULL,
549 bufnum, bytebufsize);
550 msg_buf_done++;
551 }
552
553 if (rc)
554 return -ENOMEM;
555 }
556
557 if (!msg_buf_done) {
558 dev_err(ep->dev,
559 "Corrupt IDT: No message buffer. Aborting.\n");
560 return -ENODEV;
561 }
562 return 0;
563 }
564
xilly_scan_idt(struct xilly_endpoint * endpoint,struct xilly_idt_handle * idt_handle)565 static int xilly_scan_idt(struct xilly_endpoint *endpoint,
566 struct xilly_idt_handle *idt_handle)
567 {
568 int count = 0;
569 unsigned char *idt = endpoint->channels[1]->wr_buffers[0]->addr;
570 unsigned char *end_of_idt = idt + endpoint->idtlen - 4;
571 unsigned char *scan;
572 int len;
573
574 scan = idt;
575 idt_handle->idt = idt;
576
577 scan++; /* Skip version number */
578
579 while ((scan <= end_of_idt) && *scan) {
580 while ((scan <= end_of_idt) && *scan++)
581 /* Do nothing, just scan thru string */;
582 count++;
583 }
584
585 scan++;
586
587 if (scan > end_of_idt) {
588 dev_err(endpoint->dev,
589 "IDT device name list overflow. Aborting.\n");
590 return -ENODEV;
591 }
592 idt_handle->chandesc = scan;
593
594 len = endpoint->idtlen - (3 + ((int) (scan - idt)));
595
596 if (len & 0x03) {
597 dev_err(endpoint->dev,
598 "Corrupt IDT device name list. Aborting.\n");
599 return -ENODEV;
600 }
601
602 idt_handle->entries = len >> 2;
603 endpoint->num_channels = count;
604
605 return 0;
606 }
607
xilly_obtain_idt(struct xilly_endpoint * endpoint)608 static int xilly_obtain_idt(struct xilly_endpoint *endpoint)
609 {
610 struct xilly_channel *channel;
611 unsigned char *version;
612 long t;
613
614 channel = endpoint->channels[1]; /* This should be generated ad-hoc */
615
616 channel->wr_sleepy = 1;
617
618 iowrite32(1 |
619 (3 << 24), /* Opcode 3 for channel 0 = Send IDT */
620 endpoint->registers + fpga_buf_ctrl_reg);
621
622 t = wait_event_interruptible_timeout(channel->wr_wait,
623 (!channel->wr_sleepy),
624 XILLY_TIMEOUT);
625
626 if (t <= 0) {
627 dev_err(endpoint->dev, "Failed to obtain IDT. Aborting.\n");
628
629 if (endpoint->fatal_error)
630 return -EIO;
631
632 return -ENODEV;
633 }
634
635 endpoint->ephw->hw_sync_sgl_for_cpu(
636 channel->endpoint,
637 channel->wr_buffers[0]->dma_addr,
638 channel->wr_buf_size,
639 DMA_FROM_DEVICE);
640
641 if (channel->wr_buffers[0]->end_offset != endpoint->idtlen) {
642 dev_err(endpoint->dev,
643 "IDT length mismatch (%d != %d). Aborting.\n",
644 channel->wr_buffers[0]->end_offset, endpoint->idtlen);
645 return -ENODEV;
646 }
647
648 if (crc32_le(~0, channel->wr_buffers[0]->addr,
649 endpoint->idtlen+1) != 0) {
650 dev_err(endpoint->dev, "IDT failed CRC check. Aborting.\n");
651 return -ENODEV;
652 }
653
654 version = channel->wr_buffers[0]->addr;
655
656 /* Check version number. Accept anything below 0x82 for now. */
657 if (*version > 0x82) {
658 dev_err(endpoint->dev,
659 "No support for IDT version 0x%02x. Maybe the xillybus driver needs an upgarde. Aborting.\n",
660 *version);
661 return -ENODEV;
662 }
663
664 return 0;
665 }
666
xillybus_read(struct file * filp,char __user * userbuf,size_t count,loff_t * f_pos)667 static ssize_t xillybus_read(struct file *filp, char __user *userbuf,
668 size_t count, loff_t *f_pos)
669 {
670 ssize_t rc;
671 unsigned long flags;
672 int bytes_done = 0;
673 int no_time_left = 0;
674 long deadline, left_to_sleep;
675 struct xilly_channel *channel = filp->private_data;
676
677 int empty, reached_eof, exhausted, ready;
678 /* Initializations are there only to silence warnings */
679
680 int howmany = 0, bufpos = 0, bufidx = 0, bufferdone = 0;
681 int waiting_bufidx;
682
683 if (channel->endpoint->fatal_error)
684 return -EIO;
685
686 deadline = jiffies + 1 + XILLY_RX_TIMEOUT;
687
688 rc = mutex_lock_interruptible(&channel->wr_mutex);
689 if (rc)
690 return rc;
691
692 while (1) { /* Note that we may drop mutex within this loop */
693 int bytes_to_do = count - bytes_done;
694
695 spin_lock_irqsave(&channel->wr_spinlock, flags);
696
697 empty = channel->wr_empty;
698 ready = !empty || channel->wr_ready;
699
700 if (!empty) {
701 bufidx = channel->wr_host_buf_idx;
702 bufpos = channel->wr_host_buf_pos;
703 howmany = ((channel->wr_buffers[bufidx]->end_offset
704 + 1) << channel->log2_element_size)
705 - bufpos;
706
707 /* Update wr_host_* to its post-operation state */
708 if (howmany > bytes_to_do) {
709 bufferdone = 0;
710
711 howmany = bytes_to_do;
712 channel->wr_host_buf_pos += howmany;
713 } else {
714 bufferdone = 1;
715
716 channel->wr_host_buf_pos = 0;
717
718 if (bufidx == channel->wr_fpga_buf_idx) {
719 channel->wr_empty = 1;
720 channel->wr_sleepy = 1;
721 channel->wr_ready = 0;
722 }
723
724 if (bufidx >= (channel->num_wr_buffers - 1))
725 channel->wr_host_buf_idx = 0;
726 else
727 channel->wr_host_buf_idx++;
728 }
729 }
730
731 /*
732 * Marking our situation after the possible changes above,
733 * for use after releasing the spinlock.
734 *
735 * empty = empty before change
736 * exhasted = empty after possible change
737 */
738
739 reached_eof = channel->wr_empty &&
740 (channel->wr_host_buf_idx == channel->wr_eof);
741 channel->wr_hangup = reached_eof;
742 exhausted = channel->wr_empty;
743 waiting_bufidx = channel->wr_host_buf_idx;
744
745 spin_unlock_irqrestore(&channel->wr_spinlock, flags);
746
747 if (!empty) { /* Go on, now without the spinlock */
748
749 if (bufpos == 0) /* Position zero means it's virgin */
750 channel->endpoint->ephw->hw_sync_sgl_for_cpu(
751 channel->endpoint,
752 channel->wr_buffers[bufidx]->dma_addr,
753 channel->wr_buf_size,
754 DMA_FROM_DEVICE);
755
756 if (copy_to_user(
757 userbuf,
758 channel->wr_buffers[bufidx]->addr
759 + bufpos, howmany))
760 rc = -EFAULT;
761
762 userbuf += howmany;
763 bytes_done += howmany;
764
765 if (bufferdone) {
766 channel->endpoint->ephw->hw_sync_sgl_for_device(
767 channel->endpoint,
768 channel->wr_buffers[bufidx]->dma_addr,
769 channel->wr_buf_size,
770 DMA_FROM_DEVICE);
771
772 /*
773 * Tell FPGA the buffer is done with. It's an
774 * atomic operation to the FPGA, so what
775 * happens with other channels doesn't matter,
776 * and the certain channel is protected with
777 * the channel-specific mutex.
778 */
779
780 iowrite32(1 | (channel->chan_num << 1) |
781 (bufidx << 12),
782 channel->endpoint->registers +
783 fpga_buf_ctrl_reg);
784 }
785
786 if (rc) {
787 mutex_unlock(&channel->wr_mutex);
788 return rc;
789 }
790 }
791
792 /* This includes a zero-count return = EOF */
793 if ((bytes_done >= count) || reached_eof)
794 break;
795
796 if (!exhausted)
797 continue; /* More in RAM buffer(s)? Just go on. */
798
799 if ((bytes_done > 0) &&
800 (no_time_left ||
801 (channel->wr_synchronous && channel->wr_allow_partial)))
802 break;
803
804 /*
805 * Nonblocking read: The "ready" flag tells us that the FPGA
806 * has data to send. In non-blocking mode, if it isn't on,
807 * just return. But if there is, we jump directly to the point
808 * where we ask for the FPGA to send all it has, and wait
809 * until that data arrives. So in a sense, we *do* block in
810 * nonblocking mode, but only for a very short time.
811 */
812
813 if (!no_time_left && (filp->f_flags & O_NONBLOCK)) {
814 if (bytes_done > 0)
815 break;
816
817 if (ready)
818 goto desperate;
819
820 rc = -EAGAIN;
821 break;
822 }
823
824 if (!no_time_left || (bytes_done > 0)) {
825 /*
826 * Note that in case of an element-misaligned read
827 * request, offsetlimit will include the last element,
828 * which will be partially read from.
829 */
830 int offsetlimit = ((count - bytes_done) - 1) >>
831 channel->log2_element_size;
832 int buf_elements = channel->wr_buf_size >>
833 channel->log2_element_size;
834
835 /*
836 * In synchronous mode, always send an offset limit.
837 * Just don't send a value too big.
838 */
839
840 if (channel->wr_synchronous) {
841 /* Don't request more than one buffer */
842 if (channel->wr_allow_partial &&
843 (offsetlimit >= buf_elements))
844 offsetlimit = buf_elements - 1;
845
846 /* Don't request more than all buffers */
847 if (!channel->wr_allow_partial &&
848 (offsetlimit >=
849 (buf_elements * channel->num_wr_buffers)))
850 offsetlimit = buf_elements *
851 channel->num_wr_buffers - 1;
852 }
853
854 /*
855 * In asynchronous mode, force early flush of a buffer
856 * only if that will allow returning a full count. The
857 * "offsetlimit < ( ... )" rather than "<=" excludes
858 * requesting a full buffer, which would obviously
859 * cause a buffer transmission anyhow
860 */
861
862 if (channel->wr_synchronous ||
863 (offsetlimit < (buf_elements - 1))) {
864 mutex_lock(&channel->endpoint->register_mutex);
865
866 iowrite32(offsetlimit,
867 channel->endpoint->registers +
868 fpga_buf_offset_reg);
869
870 iowrite32(1 | (channel->chan_num << 1) |
871 (2 << 24) | /* 2 = offset limit */
872 (waiting_bufidx << 12),
873 channel->endpoint->registers +
874 fpga_buf_ctrl_reg);
875
876 mutex_unlock(&channel->endpoint->
877 register_mutex);
878 }
879 }
880
881 /*
882 * If partial completion is disallowed, there is no point in
883 * timeout sleeping. Neither if no_time_left is set and
884 * there's no data.
885 */
886
887 if (!channel->wr_allow_partial ||
888 (no_time_left && (bytes_done == 0))) {
889 /*
890 * This do-loop will run more than once if another
891 * thread reasserted wr_sleepy before we got the mutex
892 * back, so we try again.
893 */
894
895 do {
896 mutex_unlock(&channel->wr_mutex);
897
898 if (wait_event_interruptible(
899 channel->wr_wait,
900 (!channel->wr_sleepy)))
901 goto interrupted;
902
903 if (mutex_lock_interruptible(
904 &channel->wr_mutex))
905 goto interrupted;
906 } while (channel->wr_sleepy);
907
908 continue;
909
910 interrupted: /* Mutex is not held if got here */
911 if (channel->endpoint->fatal_error)
912 return -EIO;
913 if (bytes_done)
914 return bytes_done;
915 if (filp->f_flags & O_NONBLOCK)
916 return -EAGAIN; /* Don't admit snoozing */
917 return -EINTR;
918 }
919
920 left_to_sleep = deadline - ((long) jiffies);
921
922 /*
923 * If our time is out, skip the waiting. We may miss wr_sleepy
924 * being deasserted but hey, almost missing the train is like
925 * missing it.
926 */
927
928 if (left_to_sleep > 0) {
929 left_to_sleep =
930 wait_event_interruptible_timeout(
931 channel->wr_wait,
932 (!channel->wr_sleepy),
933 left_to_sleep);
934
935 if (left_to_sleep > 0) /* wr_sleepy deasserted */
936 continue;
937
938 if (left_to_sleep < 0) { /* Interrupt */
939 mutex_unlock(&channel->wr_mutex);
940 if (channel->endpoint->fatal_error)
941 return -EIO;
942 if (bytes_done)
943 return bytes_done;
944 return -EINTR;
945 }
946 }
947
948 desperate:
949 no_time_left = 1; /* We're out of sleeping time. Desperate! */
950
951 if (bytes_done == 0) {
952 /*
953 * Reaching here means that we allow partial return,
954 * that we've run out of time, and that we have
955 * nothing to return.
956 * So tell the FPGA to send anything it has or gets.
957 */
958
959 iowrite32(1 | (channel->chan_num << 1) |
960 (3 << 24) | /* Opcode 3, flush it all! */
961 (waiting_bufidx << 12),
962 channel->endpoint->registers +
963 fpga_buf_ctrl_reg);
964 }
965
966 /*
967 * Reaching here means that we *do* have data in the buffer,
968 * but the "partial" flag disallows returning less than
969 * required. And we don't have as much. So loop again,
970 * which is likely to end up blocking indefinitely until
971 * enough data has arrived.
972 */
973 }
974
975 mutex_unlock(&channel->wr_mutex);
976
977 if (channel->endpoint->fatal_error)
978 return -EIO;
979
980 if (rc)
981 return rc;
982
983 return bytes_done;
984 }
985
986 /*
987 * The timeout argument takes values as follows:
988 * >0 : Flush with timeout
989 * ==0 : Flush, and wait idefinitely for the flush to complete
990 * <0 : Autoflush: Flush only if there's a single buffer occupied
991 */
992
xillybus_myflush(struct xilly_channel * channel,long timeout)993 static int xillybus_myflush(struct xilly_channel *channel, long timeout)
994 {
995 int rc;
996 unsigned long flags;
997
998 int end_offset_plus1;
999 int bufidx, bufidx_minus1;
1000 int i;
1001 int empty;
1002 int new_rd_host_buf_pos;
1003
1004 if (channel->endpoint->fatal_error)
1005 return -EIO;
1006 rc = mutex_lock_interruptible(&channel->rd_mutex);
1007 if (rc)
1008 return rc;
1009
1010 /*
1011 * Don't flush a closed channel. This can happen when the work queued
1012 * autoflush thread fires off after the file has closed. This is not
1013 * an error, just something to dismiss.
1014 */
1015
1016 if (!channel->rd_ref_count)
1017 goto done;
1018
1019 bufidx = channel->rd_host_buf_idx;
1020
1021 bufidx_minus1 = (bufidx == 0) ?
1022 channel->num_rd_buffers - 1 :
1023 bufidx - 1;
1024
1025 end_offset_plus1 = channel->rd_host_buf_pos >>
1026 channel->log2_element_size;
1027
1028 new_rd_host_buf_pos = channel->rd_host_buf_pos -
1029 (end_offset_plus1 << channel->log2_element_size);
1030
1031 /* Submit the current buffer if it's nonempty */
1032 if (end_offset_plus1) {
1033 unsigned char *tail = channel->rd_buffers[bufidx]->addr +
1034 (end_offset_plus1 << channel->log2_element_size);
1035
1036 /* Copy unflushed data, so we can put it in next buffer */
1037 for (i = 0; i < new_rd_host_buf_pos; i++)
1038 channel->rd_leftovers[i] = *tail++;
1039
1040 spin_lock_irqsave(&channel->rd_spinlock, flags);
1041
1042 /* Autoflush only if a single buffer is occupied */
1043
1044 if ((timeout < 0) &&
1045 (channel->rd_full ||
1046 (bufidx_minus1 != channel->rd_fpga_buf_idx))) {
1047 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1048 /*
1049 * A new work item may be queued by the ISR exactly
1050 * now, since the execution of a work item allows the
1051 * queuing of a new one while it's running.
1052 */
1053 goto done;
1054 }
1055
1056 /* The 4th element is never needed for data, so it's a flag */
1057 channel->rd_leftovers[3] = (new_rd_host_buf_pos != 0);
1058
1059 /* Set up rd_full to reflect a certain moment's state */
1060
1061 if (bufidx == channel->rd_fpga_buf_idx)
1062 channel->rd_full = 1;
1063 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1064
1065 if (bufidx >= (channel->num_rd_buffers - 1))
1066 channel->rd_host_buf_idx = 0;
1067 else
1068 channel->rd_host_buf_idx++;
1069
1070 channel->endpoint->ephw->hw_sync_sgl_for_device(
1071 channel->endpoint,
1072 channel->rd_buffers[bufidx]->dma_addr,
1073 channel->rd_buf_size,
1074 DMA_TO_DEVICE);
1075
1076 mutex_lock(&channel->endpoint->register_mutex);
1077
1078 iowrite32(end_offset_plus1 - 1,
1079 channel->endpoint->registers + fpga_buf_offset_reg);
1080
1081 iowrite32((channel->chan_num << 1) | /* Channel ID */
1082 (2 << 24) | /* Opcode 2, submit buffer */
1083 (bufidx << 12),
1084 channel->endpoint->registers + fpga_buf_ctrl_reg);
1085
1086 mutex_unlock(&channel->endpoint->register_mutex);
1087 } else if (bufidx == 0) {
1088 bufidx = channel->num_rd_buffers - 1;
1089 } else {
1090 bufidx--;
1091 }
1092
1093 channel->rd_host_buf_pos = new_rd_host_buf_pos;
1094
1095 if (timeout < 0)
1096 goto done; /* Autoflush */
1097
1098 /*
1099 * bufidx is now the last buffer written to (or equal to
1100 * rd_fpga_buf_idx if buffer was never written to), and
1101 * channel->rd_host_buf_idx the one after it.
1102 *
1103 * If bufidx == channel->rd_fpga_buf_idx we're either empty or full.
1104 */
1105
1106 while (1) { /* Loop waiting for draining of buffers */
1107 spin_lock_irqsave(&channel->rd_spinlock, flags);
1108
1109 if (bufidx != channel->rd_fpga_buf_idx)
1110 channel->rd_full = 1; /*
1111 * Not really full,
1112 * but needs waiting.
1113 */
1114
1115 empty = !channel->rd_full;
1116
1117 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1118
1119 if (empty)
1120 break;
1121
1122 /*
1123 * Indefinite sleep with mutex taken. With data waiting for
1124 * flushing user should not be surprised if open() for write
1125 * sleeps.
1126 */
1127 if (timeout == 0)
1128 wait_event_interruptible(channel->rd_wait,
1129 (!channel->rd_full));
1130
1131 else if (wait_event_interruptible_timeout(
1132 channel->rd_wait,
1133 (!channel->rd_full),
1134 timeout) == 0) {
1135 dev_warn(channel->endpoint->dev,
1136 "Timed out while flushing. Output data may be lost.\n");
1137
1138 rc = -ETIMEDOUT;
1139 break;
1140 }
1141
1142 if (channel->rd_full) {
1143 rc = -EINTR;
1144 break;
1145 }
1146 }
1147
1148 done:
1149 mutex_unlock(&channel->rd_mutex);
1150
1151 if (channel->endpoint->fatal_error)
1152 return -EIO;
1153
1154 return rc;
1155 }
1156
xillybus_flush(struct file * filp,fl_owner_t id)1157 static int xillybus_flush(struct file *filp, fl_owner_t id)
1158 {
1159 if (!(filp->f_mode & FMODE_WRITE))
1160 return 0;
1161
1162 return xillybus_myflush(filp->private_data, HZ); /* 1 second timeout */
1163 }
1164
xillybus_autoflush(struct work_struct * work)1165 static void xillybus_autoflush(struct work_struct *work)
1166 {
1167 struct delayed_work *workitem = container_of(
1168 work, struct delayed_work, work);
1169 struct xilly_channel *channel = container_of(
1170 workitem, struct xilly_channel, rd_workitem);
1171 int rc;
1172
1173 rc = xillybus_myflush(channel, -1);
1174 if (rc == -EINTR)
1175 dev_warn(channel->endpoint->dev,
1176 "Autoflush failed because work queue thread got a signal.\n");
1177 else if (rc)
1178 dev_err(channel->endpoint->dev,
1179 "Autoflush failed under weird circumstances.\n");
1180 }
1181
xillybus_write(struct file * filp,const char __user * userbuf,size_t count,loff_t * f_pos)1182 static ssize_t xillybus_write(struct file *filp, const char __user *userbuf,
1183 size_t count, loff_t *f_pos)
1184 {
1185 ssize_t rc;
1186 unsigned long flags;
1187 int bytes_done = 0;
1188 struct xilly_channel *channel = filp->private_data;
1189
1190 int full, exhausted;
1191 /* Initializations are there only to silence warnings */
1192
1193 int howmany = 0, bufpos = 0, bufidx = 0, bufferdone = 0;
1194 int end_offset_plus1 = 0;
1195
1196 if (channel->endpoint->fatal_error)
1197 return -EIO;
1198
1199 rc = mutex_lock_interruptible(&channel->rd_mutex);
1200 if (rc)
1201 return rc;
1202
1203 while (1) {
1204 int bytes_to_do = count - bytes_done;
1205
1206 spin_lock_irqsave(&channel->rd_spinlock, flags);
1207
1208 full = channel->rd_full;
1209
1210 if (!full) {
1211 bufidx = channel->rd_host_buf_idx;
1212 bufpos = channel->rd_host_buf_pos;
1213 howmany = channel->rd_buf_size - bufpos;
1214
1215 /*
1216 * Update rd_host_* to its state after this operation.
1217 * count=0 means committing the buffer immediately,
1218 * which is like flushing, but not necessarily block.
1219 */
1220
1221 if ((howmany > bytes_to_do) &&
1222 (count ||
1223 ((bufpos >> channel->log2_element_size) == 0))) {
1224 bufferdone = 0;
1225
1226 howmany = bytes_to_do;
1227 channel->rd_host_buf_pos += howmany;
1228 } else {
1229 bufferdone = 1;
1230
1231 if (count) {
1232 end_offset_plus1 =
1233 channel->rd_buf_size >>
1234 channel->log2_element_size;
1235 channel->rd_host_buf_pos = 0;
1236 } else {
1237 unsigned char *tail;
1238 int i;
1239
1240 howmany = 0;
1241
1242 end_offset_plus1 = bufpos >>
1243 channel->log2_element_size;
1244
1245 channel->rd_host_buf_pos -=
1246 end_offset_plus1 <<
1247 channel->log2_element_size;
1248
1249 tail = channel->
1250 rd_buffers[bufidx]->addr +
1251 (end_offset_plus1 <<
1252 channel->log2_element_size);
1253
1254 for (i = 0;
1255 i < channel->rd_host_buf_pos;
1256 i++)
1257 channel->rd_leftovers[i] =
1258 *tail++;
1259 }
1260
1261 if (bufidx == channel->rd_fpga_buf_idx)
1262 channel->rd_full = 1;
1263
1264 if (bufidx >= (channel->num_rd_buffers - 1))
1265 channel->rd_host_buf_idx = 0;
1266 else
1267 channel->rd_host_buf_idx++;
1268 }
1269 }
1270
1271 /*
1272 * Marking our situation after the possible changes above,
1273 * for use after releasing the spinlock.
1274 *
1275 * full = full before change
1276 * exhasted = full after possible change
1277 */
1278
1279 exhausted = channel->rd_full;
1280
1281 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1282
1283 if (!full) { /* Go on, now without the spinlock */
1284 unsigned char *head =
1285 channel->rd_buffers[bufidx]->addr;
1286 int i;
1287
1288 if ((bufpos == 0) || /* Zero means it's virgin */
1289 (channel->rd_leftovers[3] != 0)) {
1290 channel->endpoint->ephw->hw_sync_sgl_for_cpu(
1291 channel->endpoint,
1292 channel->rd_buffers[bufidx]->dma_addr,
1293 channel->rd_buf_size,
1294 DMA_TO_DEVICE);
1295
1296 /* Virgin, but leftovers are due */
1297 for (i = 0; i < bufpos; i++)
1298 *head++ = channel->rd_leftovers[i];
1299
1300 channel->rd_leftovers[3] = 0; /* Clear flag */
1301 }
1302
1303 if (copy_from_user(
1304 channel->rd_buffers[bufidx]->addr + bufpos,
1305 userbuf, howmany))
1306 rc = -EFAULT;
1307
1308 userbuf += howmany;
1309 bytes_done += howmany;
1310
1311 if (bufferdone) {
1312 channel->endpoint->ephw->hw_sync_sgl_for_device(
1313 channel->endpoint,
1314 channel->rd_buffers[bufidx]->dma_addr,
1315 channel->rd_buf_size,
1316 DMA_TO_DEVICE);
1317
1318 mutex_lock(&channel->endpoint->register_mutex);
1319
1320 iowrite32(end_offset_plus1 - 1,
1321 channel->endpoint->registers +
1322 fpga_buf_offset_reg);
1323
1324 iowrite32((channel->chan_num << 1) |
1325 (2 << 24) | /* 2 = submit buffer */
1326 (bufidx << 12),
1327 channel->endpoint->registers +
1328 fpga_buf_ctrl_reg);
1329
1330 mutex_unlock(&channel->endpoint->
1331 register_mutex);
1332
1333 channel->rd_leftovers[3] =
1334 (channel->rd_host_buf_pos != 0);
1335 }
1336
1337 if (rc) {
1338 mutex_unlock(&channel->rd_mutex);
1339
1340 if (channel->endpoint->fatal_error)
1341 return -EIO;
1342
1343 if (!channel->rd_synchronous)
1344 queue_delayed_work(
1345 xillybus_wq,
1346 &channel->rd_workitem,
1347 XILLY_RX_TIMEOUT);
1348
1349 return rc;
1350 }
1351 }
1352
1353 if (bytes_done >= count)
1354 break;
1355
1356 if (!exhausted)
1357 continue; /* If there's more space, just go on */
1358
1359 if ((bytes_done > 0) && channel->rd_allow_partial)
1360 break;
1361
1362 /*
1363 * Indefinite sleep with mutex taken. With data waiting for
1364 * flushing, user should not be surprised if open() for write
1365 * sleeps.
1366 */
1367
1368 if (filp->f_flags & O_NONBLOCK) {
1369 rc = -EAGAIN;
1370 break;
1371 }
1372
1373 if (wait_event_interruptible(channel->rd_wait,
1374 (!channel->rd_full))) {
1375 mutex_unlock(&channel->rd_mutex);
1376
1377 if (channel->endpoint->fatal_error)
1378 return -EIO;
1379
1380 if (bytes_done)
1381 return bytes_done;
1382 return -EINTR;
1383 }
1384 }
1385
1386 mutex_unlock(&channel->rd_mutex);
1387
1388 if (!channel->rd_synchronous)
1389 queue_delayed_work(xillybus_wq,
1390 &channel->rd_workitem,
1391 XILLY_RX_TIMEOUT);
1392
1393 if (channel->endpoint->fatal_error)
1394 return -EIO;
1395
1396 if (rc)
1397 return rc;
1398
1399 if ((channel->rd_synchronous) && (bytes_done > 0)) {
1400 rc = xillybus_myflush(filp->private_data, 0); /* No timeout */
1401
1402 if (rc && (rc != -EINTR))
1403 return rc;
1404 }
1405
1406 return bytes_done;
1407 }
1408
xillybus_open(struct inode * inode,struct file * filp)1409 static int xillybus_open(struct inode *inode, struct file *filp)
1410 {
1411 int rc = 0;
1412 unsigned long flags;
1413 int minor = iminor(inode);
1414 int major = imajor(inode);
1415 struct xilly_endpoint *ep_iter, *endpoint = NULL;
1416 struct xilly_channel *channel;
1417
1418 mutex_lock(&ep_list_lock);
1419
1420 list_for_each_entry(ep_iter, &list_of_endpoints, ep_list) {
1421 if ((ep_iter->major == major) &&
1422 (minor >= ep_iter->lowest_minor) &&
1423 (minor < (ep_iter->lowest_minor +
1424 ep_iter->num_channels))) {
1425 endpoint = ep_iter;
1426 break;
1427 }
1428 }
1429 mutex_unlock(&ep_list_lock);
1430
1431 if (!endpoint) {
1432 pr_err("xillybus: open() failed to find a device for major=%d and minor=%d\n",
1433 major, minor);
1434 return -ENODEV;
1435 }
1436
1437 if (endpoint->fatal_error)
1438 return -EIO;
1439
1440 channel = endpoint->channels[1 + minor - endpoint->lowest_minor];
1441 filp->private_data = channel;
1442
1443 /*
1444 * It gets complicated because:
1445 * 1. We don't want to take a mutex we don't have to
1446 * 2. We don't want to open one direction if the other will fail.
1447 */
1448
1449 if ((filp->f_mode & FMODE_READ) && (!channel->num_wr_buffers))
1450 return -ENODEV;
1451
1452 if ((filp->f_mode & FMODE_WRITE) && (!channel->num_rd_buffers))
1453 return -ENODEV;
1454
1455 if ((filp->f_mode & FMODE_READ) && (filp->f_flags & O_NONBLOCK) &&
1456 (channel->wr_synchronous || !channel->wr_allow_partial ||
1457 !channel->wr_supports_nonempty)) {
1458 dev_err(endpoint->dev,
1459 "open() failed: O_NONBLOCK not allowed for read on this device\n");
1460 return -ENODEV;
1461 }
1462
1463 if ((filp->f_mode & FMODE_WRITE) && (filp->f_flags & O_NONBLOCK) &&
1464 (channel->rd_synchronous || !channel->rd_allow_partial)) {
1465 dev_err(endpoint->dev,
1466 "open() failed: O_NONBLOCK not allowed for write on this device\n");
1467 return -ENODEV;
1468 }
1469
1470 /*
1471 * Note: open() may block on getting mutexes despite O_NONBLOCK.
1472 * This shouldn't occur normally, since multiple open of the same
1473 * file descriptor is almost always prohibited anyhow
1474 * (*_exclusive_open is normally set in real-life systems).
1475 */
1476
1477 if (filp->f_mode & FMODE_READ) {
1478 rc = mutex_lock_interruptible(&channel->wr_mutex);
1479 if (rc)
1480 return rc;
1481 }
1482
1483 if (filp->f_mode & FMODE_WRITE) {
1484 rc = mutex_lock_interruptible(&channel->rd_mutex);
1485 if (rc)
1486 goto unlock_wr;
1487 }
1488
1489 if ((filp->f_mode & FMODE_READ) &&
1490 (channel->wr_ref_count != 0) &&
1491 (channel->wr_exclusive_open)) {
1492 rc = -EBUSY;
1493 goto unlock;
1494 }
1495
1496 if ((filp->f_mode & FMODE_WRITE) &&
1497 (channel->rd_ref_count != 0) &&
1498 (channel->rd_exclusive_open)) {
1499 rc = -EBUSY;
1500 goto unlock;
1501 }
1502
1503 if (filp->f_mode & FMODE_READ) {
1504 if (channel->wr_ref_count == 0) { /* First open of file */
1505 /* Move the host to first buffer */
1506 spin_lock_irqsave(&channel->wr_spinlock, flags);
1507 channel->wr_host_buf_idx = 0;
1508 channel->wr_host_buf_pos = 0;
1509 channel->wr_fpga_buf_idx = -1;
1510 channel->wr_empty = 1;
1511 channel->wr_ready = 0;
1512 channel->wr_sleepy = 1;
1513 channel->wr_eof = -1;
1514 channel->wr_hangup = 0;
1515
1516 spin_unlock_irqrestore(&channel->wr_spinlock, flags);
1517
1518 iowrite32(1 | (channel->chan_num << 1) |
1519 (4 << 24) | /* Opcode 4, open channel */
1520 ((channel->wr_synchronous & 1) << 23),
1521 channel->endpoint->registers +
1522 fpga_buf_ctrl_reg);
1523 }
1524
1525 channel->wr_ref_count++;
1526 }
1527
1528 if (filp->f_mode & FMODE_WRITE) {
1529 if (channel->rd_ref_count == 0) { /* First open of file */
1530 /* Move the host to first buffer */
1531 spin_lock_irqsave(&channel->rd_spinlock, flags);
1532 channel->rd_host_buf_idx = 0;
1533 channel->rd_host_buf_pos = 0;
1534 channel->rd_leftovers[3] = 0; /* No leftovers. */
1535 channel->rd_fpga_buf_idx = channel->num_rd_buffers - 1;
1536 channel->rd_full = 0;
1537
1538 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1539
1540 iowrite32((channel->chan_num << 1) |
1541 (4 << 24), /* Opcode 4, open channel */
1542 channel->endpoint->registers +
1543 fpga_buf_ctrl_reg);
1544 }
1545
1546 channel->rd_ref_count++;
1547 }
1548
1549 unlock:
1550 if (filp->f_mode & FMODE_WRITE)
1551 mutex_unlock(&channel->rd_mutex);
1552 unlock_wr:
1553 if (filp->f_mode & FMODE_READ)
1554 mutex_unlock(&channel->wr_mutex);
1555
1556 if (!rc && (!channel->seekable))
1557 return nonseekable_open(inode, filp);
1558
1559 return rc;
1560 }
1561
xillybus_release(struct inode * inode,struct file * filp)1562 static int xillybus_release(struct inode *inode, struct file *filp)
1563 {
1564 unsigned long flags;
1565 struct xilly_channel *channel = filp->private_data;
1566
1567 int buf_idx;
1568 int eof;
1569
1570 if (channel->endpoint->fatal_error)
1571 return -EIO;
1572
1573 if (filp->f_mode & FMODE_WRITE) {
1574 mutex_lock(&channel->rd_mutex);
1575
1576 channel->rd_ref_count--;
1577
1578 if (channel->rd_ref_count == 0) {
1579 /*
1580 * We rely on the kernel calling flush()
1581 * before we get here.
1582 */
1583
1584 iowrite32((channel->chan_num << 1) | /* Channel ID */
1585 (5 << 24), /* Opcode 5, close channel */
1586 channel->endpoint->registers +
1587 fpga_buf_ctrl_reg);
1588 }
1589 mutex_unlock(&channel->rd_mutex);
1590 }
1591
1592 if (filp->f_mode & FMODE_READ) {
1593 mutex_lock(&channel->wr_mutex);
1594
1595 channel->wr_ref_count--;
1596
1597 if (channel->wr_ref_count == 0) {
1598 iowrite32(1 | (channel->chan_num << 1) |
1599 (5 << 24), /* Opcode 5, close channel */
1600 channel->endpoint->registers +
1601 fpga_buf_ctrl_reg);
1602
1603 /*
1604 * This is crazily cautious: We make sure that not
1605 * only that we got an EOF (be it because we closed
1606 * the channel or because of a user's EOF), but verify
1607 * that it's one beyond the last buffer arrived, so
1608 * we have no leftover buffers pending before wrapping
1609 * up (which can only happen in asynchronous channels,
1610 * BTW)
1611 */
1612
1613 while (1) {
1614 spin_lock_irqsave(&channel->wr_spinlock,
1615 flags);
1616 buf_idx = channel->wr_fpga_buf_idx;
1617 eof = channel->wr_eof;
1618 channel->wr_sleepy = 1;
1619 spin_unlock_irqrestore(&channel->wr_spinlock,
1620 flags);
1621
1622 /*
1623 * Check if eof points at the buffer after
1624 * the last one the FPGA submitted. Note that
1625 * no EOF is marked by negative eof.
1626 */
1627
1628 buf_idx++;
1629 if (buf_idx == channel->num_wr_buffers)
1630 buf_idx = 0;
1631
1632 if (buf_idx == eof)
1633 break;
1634
1635 /*
1636 * Steal extra 100 ms if awaken by interrupt.
1637 * This is a simple workaround for an
1638 * interrupt pending when entering, which would
1639 * otherwise result in declaring the hardware
1640 * non-responsive.
1641 */
1642
1643 if (wait_event_interruptible(
1644 channel->wr_wait,
1645 (!channel->wr_sleepy)))
1646 msleep(100);
1647
1648 if (channel->wr_sleepy) {
1649 mutex_unlock(&channel->wr_mutex);
1650 dev_warn(channel->endpoint->dev,
1651 "Hardware failed to respond to close command, therefore left in messy state.\n");
1652 return -EINTR;
1653 }
1654 }
1655 }
1656
1657 mutex_unlock(&channel->wr_mutex);
1658 }
1659
1660 return 0;
1661 }
1662
xillybus_llseek(struct file * filp,loff_t offset,int whence)1663 static loff_t xillybus_llseek(struct file *filp, loff_t offset, int whence)
1664 {
1665 struct xilly_channel *channel = filp->private_data;
1666 loff_t pos = filp->f_pos;
1667 int rc = 0;
1668
1669 /*
1670 * Take both mutexes not allowing interrupts, since it seems like
1671 * common applications don't expect an -EINTR here. Besides, multiple
1672 * access to a single file descriptor on seekable devices is a mess
1673 * anyhow.
1674 */
1675
1676 if (channel->endpoint->fatal_error)
1677 return -EIO;
1678
1679 mutex_lock(&channel->wr_mutex);
1680 mutex_lock(&channel->rd_mutex);
1681
1682 switch (whence) {
1683 case SEEK_SET:
1684 pos = offset;
1685 break;
1686 case SEEK_CUR:
1687 pos += offset;
1688 break;
1689 case SEEK_END:
1690 pos = offset; /* Going to the end => to the beginning */
1691 break;
1692 default:
1693 rc = -EINVAL;
1694 goto end;
1695 }
1696
1697 /* In any case, we must finish on an element boundary */
1698 if (pos & ((1 << channel->log2_element_size) - 1)) {
1699 rc = -EINVAL;
1700 goto end;
1701 }
1702
1703 mutex_lock(&channel->endpoint->register_mutex);
1704
1705 iowrite32(pos >> channel->log2_element_size,
1706 channel->endpoint->registers + fpga_buf_offset_reg);
1707
1708 iowrite32((channel->chan_num << 1) |
1709 (6 << 24), /* Opcode 6, set address */
1710 channel->endpoint->registers + fpga_buf_ctrl_reg);
1711
1712 mutex_unlock(&channel->endpoint->register_mutex);
1713
1714 end:
1715 mutex_unlock(&channel->rd_mutex);
1716 mutex_unlock(&channel->wr_mutex);
1717
1718 if (rc) /* Return error after releasing mutexes */
1719 return rc;
1720
1721 filp->f_pos = pos;
1722
1723 /*
1724 * Since seekable devices are allowed only when the channel is
1725 * synchronous, we assume that there is no data pending in either
1726 * direction (which holds true as long as no concurrent access on the
1727 * file descriptor takes place).
1728 * The only thing we may need to throw away is leftovers from partial
1729 * write() flush.
1730 */
1731
1732 channel->rd_leftovers[3] = 0;
1733
1734 return pos;
1735 }
1736
xillybus_poll(struct file * filp,poll_table * wait)1737 static unsigned int xillybus_poll(struct file *filp, poll_table *wait)
1738 {
1739 struct xilly_channel *channel = filp->private_data;
1740 unsigned int mask = 0;
1741 unsigned long flags;
1742
1743 poll_wait(filp, &channel->endpoint->ep_wait, wait);
1744
1745 /*
1746 * poll() won't play ball regarding read() channels which
1747 * aren't asynchronous and support the nonempty message. Allowing
1748 * that will create situations where data has been delivered at
1749 * the FPGA, and users expecting select() to wake up, which it may
1750 * not.
1751 */
1752
1753 if (!channel->wr_synchronous && channel->wr_supports_nonempty) {
1754 poll_wait(filp, &channel->wr_wait, wait);
1755 poll_wait(filp, &channel->wr_ready_wait, wait);
1756
1757 spin_lock_irqsave(&channel->wr_spinlock, flags);
1758 if (!channel->wr_empty || channel->wr_ready)
1759 mask |= POLLIN | POLLRDNORM;
1760
1761 if (channel->wr_hangup)
1762 /*
1763 * Not POLLHUP, because its behavior is in the
1764 * mist, and POLLIN does what we want: Wake up
1765 * the read file descriptor so it sees EOF.
1766 */
1767 mask |= POLLIN | POLLRDNORM;
1768 spin_unlock_irqrestore(&channel->wr_spinlock, flags);
1769 }
1770
1771 /*
1772 * If partial data write is disallowed on a write() channel,
1773 * it's pointless to ever signal OK to write, because is could
1774 * block despite some space being available.
1775 */
1776
1777 if (channel->rd_allow_partial) {
1778 poll_wait(filp, &channel->rd_wait, wait);
1779
1780 spin_lock_irqsave(&channel->rd_spinlock, flags);
1781 if (!channel->rd_full)
1782 mask |= POLLOUT | POLLWRNORM;
1783 spin_unlock_irqrestore(&channel->rd_spinlock, flags);
1784 }
1785
1786 if (channel->endpoint->fatal_error)
1787 mask |= POLLERR;
1788
1789 return mask;
1790 }
1791
1792 static const struct file_operations xillybus_fops = {
1793 .owner = THIS_MODULE,
1794 .read = xillybus_read,
1795 .write = xillybus_write,
1796 .open = xillybus_open,
1797 .flush = xillybus_flush,
1798 .release = xillybus_release,
1799 .llseek = xillybus_llseek,
1800 .poll = xillybus_poll,
1801 };
1802
xillybus_init_chrdev(struct xilly_endpoint * endpoint,const unsigned char * idt)1803 static int xillybus_init_chrdev(struct xilly_endpoint *endpoint,
1804 const unsigned char *idt)
1805 {
1806 int rc;
1807 dev_t dev;
1808 int devnum, i, minor, major;
1809 char devname[48];
1810 struct device *device;
1811
1812 rc = alloc_chrdev_region(&dev, 0, /* minor start */
1813 endpoint->num_channels,
1814 xillyname);
1815 if (rc) {
1816 dev_warn(endpoint->dev, "Failed to obtain major/minors");
1817 return rc;
1818 }
1819
1820 endpoint->major = major = MAJOR(dev);
1821 endpoint->lowest_minor = minor = MINOR(dev);
1822
1823 cdev_init(&endpoint->cdev, &xillybus_fops);
1824 endpoint->cdev.owner = endpoint->ephw->owner;
1825 rc = cdev_add(&endpoint->cdev, MKDEV(major, minor),
1826 endpoint->num_channels);
1827 if (rc) {
1828 dev_warn(endpoint->dev, "Failed to add cdev. Aborting.\n");
1829 goto unregister_chrdev;
1830 }
1831
1832 idt++;
1833
1834 for (i = minor, devnum = 0;
1835 devnum < endpoint->num_channels;
1836 devnum++, i++) {
1837 snprintf(devname, sizeof(devname)-1, "xillybus_%s", idt);
1838
1839 devname[sizeof(devname)-1] = 0; /* Should never matter */
1840
1841 while (*idt++)
1842 /* Skip to next */;
1843
1844 device = device_create(xillybus_class,
1845 NULL,
1846 MKDEV(major, i),
1847 NULL,
1848 "%s", devname);
1849
1850 if (IS_ERR(device)) {
1851 dev_warn(endpoint->dev,
1852 "Failed to create %s device. Aborting.\n",
1853 devname);
1854 rc = -ENODEV;
1855 goto unroll_device_create;
1856 }
1857 }
1858
1859 dev_info(endpoint->dev, "Created %d device files.\n",
1860 endpoint->num_channels);
1861 return 0; /* succeed */
1862
1863 unroll_device_create:
1864 devnum--; i--;
1865 for (; devnum >= 0; devnum--, i--)
1866 device_destroy(xillybus_class, MKDEV(major, i));
1867
1868 cdev_del(&endpoint->cdev);
1869 unregister_chrdev:
1870 unregister_chrdev_region(MKDEV(major, minor), endpoint->num_channels);
1871
1872 return rc;
1873 }
1874
xillybus_cleanup_chrdev(struct xilly_endpoint * endpoint)1875 static void xillybus_cleanup_chrdev(struct xilly_endpoint *endpoint)
1876 {
1877 int minor;
1878
1879 for (minor = endpoint->lowest_minor;
1880 minor < (endpoint->lowest_minor + endpoint->num_channels);
1881 minor++)
1882 device_destroy(xillybus_class, MKDEV(endpoint->major, minor));
1883 cdev_del(&endpoint->cdev);
1884 unregister_chrdev_region(MKDEV(endpoint->major,
1885 endpoint->lowest_minor),
1886 endpoint->num_channels);
1887
1888 dev_info(endpoint->dev, "Removed %d device files.\n",
1889 endpoint->num_channels);
1890 }
1891
xillybus_init_endpoint(struct pci_dev * pdev,struct device * dev,struct xilly_endpoint_hardware * ephw)1892 struct xilly_endpoint *xillybus_init_endpoint(struct pci_dev *pdev,
1893 struct device *dev,
1894 struct xilly_endpoint_hardware
1895 *ephw)
1896 {
1897 struct xilly_endpoint *endpoint;
1898
1899 endpoint = devm_kzalloc(dev, sizeof(*endpoint), GFP_KERNEL);
1900 if (!endpoint)
1901 return NULL;
1902
1903 endpoint->pdev = pdev;
1904 endpoint->dev = dev;
1905 endpoint->ephw = ephw;
1906 endpoint->msg_counter = 0x0b;
1907 endpoint->failed_messages = 0;
1908 endpoint->fatal_error = 0;
1909
1910 init_waitqueue_head(&endpoint->ep_wait);
1911 mutex_init(&endpoint->register_mutex);
1912
1913 return endpoint;
1914 }
1915 EXPORT_SYMBOL(xillybus_init_endpoint);
1916
xilly_quiesce(struct xilly_endpoint * endpoint)1917 static int xilly_quiesce(struct xilly_endpoint *endpoint)
1918 {
1919 long t;
1920
1921 endpoint->idtlen = -1;
1922
1923 iowrite32((u32) (endpoint->dma_using_dac & 0x0001),
1924 endpoint->registers + fpga_dma_control_reg);
1925
1926 t = wait_event_interruptible_timeout(endpoint->ep_wait,
1927 (endpoint->idtlen >= 0),
1928 XILLY_TIMEOUT);
1929 if (t <= 0) {
1930 dev_err(endpoint->dev,
1931 "Failed to quiesce the device on exit.\n");
1932 return -ENODEV;
1933 }
1934 return 0;
1935 }
1936
xillybus_endpoint_discovery(struct xilly_endpoint * endpoint)1937 int xillybus_endpoint_discovery(struct xilly_endpoint *endpoint)
1938 {
1939 int rc;
1940 long t;
1941
1942 void *bootstrap_resources;
1943 int idtbuffersize = (1 << PAGE_SHIFT);
1944 struct device *dev = endpoint->dev;
1945
1946 /*
1947 * The bogus IDT is used during bootstrap for allocating the initial
1948 * message buffer, and then the message buffer and space for the IDT
1949 * itself. The initial message buffer is of a single page's size, but
1950 * it's soon replaced with a more modest one (and memory is freed).
1951 */
1952
1953 unsigned char bogus_idt[8] = { 1, 224, (PAGE_SHIFT)-2, 0,
1954 3, 192, PAGE_SHIFT, 0 };
1955 struct xilly_idt_handle idt_handle;
1956
1957 /*
1958 * Writing the value 0x00000001 to Endianness register signals which
1959 * endianness this processor is using, so the FPGA can swap words as
1960 * necessary.
1961 */
1962
1963 iowrite32(1, endpoint->registers + fpga_endian_reg);
1964
1965 /* Bootstrap phase I: Allocate temporary message buffer */
1966
1967 bootstrap_resources = devres_open_group(dev, NULL, GFP_KERNEL);
1968 if (!bootstrap_resources)
1969 return -ENOMEM;
1970
1971 endpoint->num_channels = 0;
1972
1973 rc = xilly_setupchannels(endpoint, bogus_idt, 1);
1974 if (rc)
1975 return rc;
1976
1977 /* Clear the message subsystem (and counter in particular) */
1978 iowrite32(0x04, endpoint->registers + fpga_msg_ctrl_reg);
1979
1980 endpoint->idtlen = -1;
1981
1982 /*
1983 * Set DMA 32/64 bit mode, quiesce the device (?!) and get IDT
1984 * buffer size.
1985 */
1986 iowrite32((u32) (endpoint->dma_using_dac & 0x0001),
1987 endpoint->registers + fpga_dma_control_reg);
1988
1989 t = wait_event_interruptible_timeout(endpoint->ep_wait,
1990 (endpoint->idtlen >= 0),
1991 XILLY_TIMEOUT);
1992 if (t <= 0) {
1993 dev_err(endpoint->dev, "No response from FPGA. Aborting.\n");
1994 return -ENODEV;
1995 }
1996
1997 /* Enable DMA */
1998 iowrite32((u32) (0x0002 | (endpoint->dma_using_dac & 0x0001)),
1999 endpoint->registers + fpga_dma_control_reg);
2000
2001 /* Bootstrap phase II: Allocate buffer for IDT and obtain it */
2002 while (endpoint->idtlen >= idtbuffersize) {
2003 idtbuffersize *= 2;
2004 bogus_idt[6]++;
2005 }
2006
2007 endpoint->num_channels = 1;
2008
2009 rc = xilly_setupchannels(endpoint, bogus_idt, 2);
2010 if (rc)
2011 goto failed_idt;
2012
2013 rc = xilly_obtain_idt(endpoint);
2014 if (rc)
2015 goto failed_idt;
2016
2017 rc = xilly_scan_idt(endpoint, &idt_handle);
2018 if (rc)
2019 goto failed_idt;
2020
2021 devres_close_group(dev, bootstrap_resources);
2022
2023 /* Bootstrap phase III: Allocate buffers according to IDT */
2024
2025 rc = xilly_setupchannels(endpoint,
2026 idt_handle.chandesc,
2027 idt_handle.entries);
2028 if (rc)
2029 goto failed_idt;
2030
2031 /*
2032 * endpoint is now completely configured. We put it on the list
2033 * available to open() before registering the char device(s)
2034 */
2035
2036 mutex_lock(&ep_list_lock);
2037 list_add_tail(&endpoint->ep_list, &list_of_endpoints);
2038 mutex_unlock(&ep_list_lock);
2039
2040 rc = xillybus_init_chrdev(endpoint, idt_handle.idt);
2041 if (rc)
2042 goto failed_chrdevs;
2043
2044 devres_release_group(dev, bootstrap_resources);
2045
2046 return 0;
2047
2048 failed_chrdevs:
2049 mutex_lock(&ep_list_lock);
2050 list_del(&endpoint->ep_list);
2051 mutex_unlock(&ep_list_lock);
2052
2053 failed_idt:
2054 xilly_quiesce(endpoint);
2055 flush_workqueue(xillybus_wq);
2056
2057 return rc;
2058 }
2059 EXPORT_SYMBOL(xillybus_endpoint_discovery);
2060
xillybus_endpoint_remove(struct xilly_endpoint * endpoint)2061 void xillybus_endpoint_remove(struct xilly_endpoint *endpoint)
2062 {
2063 xillybus_cleanup_chrdev(endpoint);
2064
2065 mutex_lock(&ep_list_lock);
2066 list_del(&endpoint->ep_list);
2067 mutex_unlock(&ep_list_lock);
2068
2069 xilly_quiesce(endpoint);
2070
2071 /*
2072 * Flushing is done upon endpoint release to prevent access to memory
2073 * just about to be released. This makes the quiesce complete.
2074 */
2075 flush_workqueue(xillybus_wq);
2076 }
2077 EXPORT_SYMBOL(xillybus_endpoint_remove);
2078
xillybus_init(void)2079 static int __init xillybus_init(void)
2080 {
2081 mutex_init(&ep_list_lock);
2082
2083 xillybus_class = class_create(THIS_MODULE, xillyname);
2084 if (IS_ERR(xillybus_class))
2085 return PTR_ERR(xillybus_class);
2086
2087 xillybus_wq = alloc_workqueue(xillyname, 0, 0);
2088 if (!xillybus_wq) {
2089 class_destroy(xillybus_class);
2090 return -ENOMEM;
2091 }
2092
2093 return 0;
2094 }
2095
xillybus_exit(void)2096 static void __exit xillybus_exit(void)
2097 {
2098 /* flush_workqueue() was called for each endpoint released */
2099 destroy_workqueue(xillybus_wq);
2100
2101 class_destroy(xillybus_class);
2102 }
2103
2104 module_init(xillybus_init);
2105 module_exit(xillybus_exit);
2106