1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3 * Copyright 2015 IBM Corp.
4 */
5
6 #include <linux/spinlock.h>
7 #include <linux/uaccess.h>
8 #include <linux/delay.h>
9
10 #include "cxl.h"
11 #include "hcalls.h"
12 #include "trace.h"
13
14 #define CXL_ERROR_DETECTED_EVENT 1
15 #define CXL_SLOT_RESET_EVENT 2
16 #define CXL_RESUME_EVENT 3
17
/*
 * Forward an error-recovery event to the driver of every device sitting on
 * the AFU's virtual PHB bus.
 *
 * @afu:             AFU whose vPHB bus is walked; nothing happens when the
 *                   AFU has no PHB.
 * @bus_error_event: CXL_ERROR_DETECTED_EVENT, CXL_SLOT_RESET_EVENT or
 *                   CXL_RESUME_EVENT; any other value is ignored.
 * @state:           channel state stored in each device for the
 *                   error-detected and slot-reset events (not used for
 *                   resume).
 */
static void pci_error_handlers(struct cxl_afu *afu,
			       int bus_error_event,
			       pci_channel_state_t state)
{
	struct pci_dev *pdev;

	if (!afu->phb)
		return;

	list_for_each_entry(pdev, &afu->phb->bus->devices, bus_list) {
		const struct pci_error_handlers *eh;

		/* A device without a bound driver has nobody to notify. */
		if (!pdev->driver)
			continue;

		eh = pdev->driver->err_handler;

		if (bus_error_event == CXL_ERROR_DETECTED_EVENT) {
			/* The state is recorded even if no callback exists. */
			pdev->error_state = state;
			if (eh && eh->error_detected)
				eh->error_detected(pdev, state);
		} else if (bus_error_event == CXL_SLOT_RESET_EVENT) {
			pdev->error_state = state;
			if (eh && eh->slot_reset)
				eh->slot_reset(pdev);
		} else if (bus_error_event == CXL_RESUME_EVENT) {
			if (eh && eh->resume)
				eh->resume(pdev);
		}
	}
}
54
guest_handle_psl_slice_error(struct cxl_context * ctx,u64 dsisr,u64 errstat)55 static irqreturn_t guest_handle_psl_slice_error(struct cxl_context *ctx, u64 dsisr,
56 u64 errstat)
57 {
58 pr_devel("in %s\n", __func__);
59 dev_crit(&ctx->afu->dev, "PSL ERROR STATUS: 0x%.16llx\n", errstat);
60
61 return cxl_ops->ack_irq(ctx, 0, errstat);
62 }
63
guest_collect_vpd(struct cxl * adapter,struct cxl_afu * afu,void * buf,size_t len)64 static ssize_t guest_collect_vpd(struct cxl *adapter, struct cxl_afu *afu,
65 void *buf, size_t len)
66 {
67 unsigned int entries, mod;
68 unsigned long **vpd_buf = NULL;
69 struct sg_list *le;
70 int rc = 0, i, tocopy;
71 u64 out = 0;
72
73 if (buf == NULL)
74 return -EINVAL;
75
76 /* number of entries in the list */
77 entries = len / SG_BUFFER_SIZE;
78 mod = len % SG_BUFFER_SIZE;
79 if (mod)
80 entries++;
81
82 if (entries > SG_MAX_ENTRIES) {
83 entries = SG_MAX_ENTRIES;
84 len = SG_MAX_ENTRIES * SG_BUFFER_SIZE;
85 mod = 0;
86 }
87
88 vpd_buf = kcalloc(entries, sizeof(unsigned long *), GFP_KERNEL);
89 if (!vpd_buf)
90 return -ENOMEM;
91
92 le = (struct sg_list *)get_zeroed_page(GFP_KERNEL);
93 if (!le) {
94 rc = -ENOMEM;
95 goto err1;
96 }
97
98 for (i = 0; i < entries; i++) {
99 vpd_buf[i] = (unsigned long *)get_zeroed_page(GFP_KERNEL);
100 if (!vpd_buf[i]) {
101 rc = -ENOMEM;
102 goto err2;
103 }
104 le[i].phys_addr = cpu_to_be64(virt_to_phys(vpd_buf[i]));
105 le[i].len = cpu_to_be64(SG_BUFFER_SIZE);
106 if ((i == (entries - 1)) && mod)
107 le[i].len = cpu_to_be64(mod);
108 }
109
110 if (adapter)
111 rc = cxl_h_collect_vpd_adapter(adapter->guest->handle,
112 virt_to_phys(le), entries, &out);
113 else
114 rc = cxl_h_collect_vpd(afu->guest->handle, 0,
115 virt_to_phys(le), entries, &out);
116 pr_devel("length of available (entries: %i), vpd: %#llx\n",
117 entries, out);
118
119 if (!rc) {
120 /*
121 * hcall returns in 'out' the size of available VPDs.
122 * It fills the buffer with as much data as possible.
123 */
124 if (out < len)
125 len = out;
126 rc = len;
127 if (out) {
128 for (i = 0; i < entries; i++) {
129 if (len < SG_BUFFER_SIZE)
130 tocopy = len;
131 else
132 tocopy = SG_BUFFER_SIZE;
133 memcpy(buf, vpd_buf[i], tocopy);
134 buf += tocopy;
135 len -= tocopy;
136 }
137 }
138 }
139 err2:
140 for (i = 0; i < entries; i++) {
141 if (vpd_buf[i])
142 free_page((unsigned long) vpd_buf[i]);
143 }
144 free_page((unsigned long) le);
145 err1:
146 kfree(vpd_buf);
147 return rc;
148 }
149
guest_get_irq_info(struct cxl_context * ctx,struct cxl_irq_info * info)150 static int guest_get_irq_info(struct cxl_context *ctx, struct cxl_irq_info *info)
151 {
152 return cxl_h_collect_int_info(ctx->afu->guest->handle, ctx->process_token, info);
153 }
154
guest_psl_irq(int irq,void * data)155 static irqreturn_t guest_psl_irq(int irq, void *data)
156 {
157 struct cxl_context *ctx = data;
158 struct cxl_irq_info irq_info;
159 int rc;
160
161 pr_devel("%d: received PSL interrupt %i\n", ctx->pe, irq);
162 rc = guest_get_irq_info(ctx, &irq_info);
163 if (rc) {
164 WARN(1, "Unable to get IRQ info: %i\n", rc);
165 return IRQ_HANDLED;
166 }
167
168 rc = cxl_irq_psl8(irq, ctx, &irq_info);
169 return rc;
170 }
171
afu_read_error_state(struct cxl_afu * afu,int * state_out)172 static int afu_read_error_state(struct cxl_afu *afu, int *state_out)
173 {
174 u64 state;
175 int rc = 0;
176
177 if (!afu)
178 return -EIO;
179
180 rc = cxl_h_read_error_state(afu->guest->handle, &state);
181 if (!rc) {
182 WARN_ON(state != H_STATE_NORMAL &&
183 state != H_STATE_DISABLE &&
184 state != H_STATE_TEMP_UNAVAILABLE &&
185 state != H_STATE_PERM_UNAVAILABLE);
186 *state_out = state & 0xffffffff;
187 }
188 return rc;
189 }
190
guest_slice_irq_err(int irq,void * data)191 static irqreturn_t guest_slice_irq_err(int irq, void *data)
192 {
193 struct cxl_afu *afu = data;
194 int rc;
195 u64 serr, afu_error, dsisr;
196
197 rc = cxl_h_get_fn_error_interrupt(afu->guest->handle, &serr);
198 if (rc) {
199 dev_crit(&afu->dev, "Couldn't read PSL_SERR_An: %d\n", rc);
200 return IRQ_HANDLED;
201 }
202 afu_error = cxl_p2n_read(afu, CXL_AFU_ERR_An);
203 dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
204 cxl_afu_decode_psl_serr(afu, serr);
205 dev_crit(&afu->dev, "AFU_ERR_An: 0x%.16llx\n", afu_error);
206 dev_crit(&afu->dev, "PSL_DSISR_An: 0x%.16llx\n", dsisr);
207
208 rc = cxl_h_ack_fn_error_interrupt(afu->guest->handle, serr);
209 if (rc)
210 dev_crit(&afu->dev, "Couldn't ack slice error interrupt: %d\n",
211 rc);
212
213 return IRQ_HANDLED;
214 }
215
216
irq_alloc_range(struct cxl * adapter,int len,int * irq)217 static int irq_alloc_range(struct cxl *adapter, int len, int *irq)
218 {
219 int i, n;
220 struct irq_avail *cur;
221
222 for (i = 0; i < adapter->guest->irq_nranges; i++) {
223 cur = &adapter->guest->irq_avail[i];
224 n = bitmap_find_next_zero_area(cur->bitmap, cur->range,
225 0, len, 0);
226 if (n < cur->range) {
227 bitmap_set(cur->bitmap, n, len);
228 *irq = cur->offset + n;
229 pr_devel("guest: allocate IRQs %#x->%#x\n",
230 *irq, *irq + len - 1);
231
232 return 0;
233 }
234 }
235 return -ENOSPC;
236 }
237
irq_free_range(struct cxl * adapter,int irq,int len)238 static int irq_free_range(struct cxl *adapter, int irq, int len)
239 {
240 int i, n;
241 struct irq_avail *cur;
242
243 if (len == 0)
244 return -ENOENT;
245
246 for (i = 0; i < adapter->guest->irq_nranges; i++) {
247 cur = &adapter->guest->irq_avail[i];
248 if (irq >= cur->offset &&
249 (irq + len) <= (cur->offset + cur->range)) {
250 n = irq - cur->offset;
251 bitmap_clear(cur->bitmap, n, len);
252 pr_devel("guest: release IRQs %#x->%#x\n",
253 irq, irq + len - 1);
254 return 0;
255 }
256 }
257 return -ENOENT;
258 }
259
guest_reset(struct cxl * adapter)260 static int guest_reset(struct cxl *adapter)
261 {
262 struct cxl_afu *afu = NULL;
263 int i, rc;
264
265 pr_devel("Adapter reset request\n");
266 spin_lock(&adapter->afu_list_lock);
267 for (i = 0; i < adapter->slices; i++) {
268 if ((afu = adapter->afu[i])) {
269 pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
270 pci_channel_io_frozen);
271 cxl_context_detach_all(afu);
272 }
273 }
274
275 rc = cxl_h_reset_adapter(adapter->guest->handle);
276 for (i = 0; i < adapter->slices; i++) {
277 if (!rc && (afu = adapter->afu[i])) {
278 pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
279 pci_channel_io_normal);
280 pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
281 }
282 }
283 spin_unlock(&adapter->afu_list_lock);
284 return rc;
285 }
286
guest_alloc_one_irq(struct cxl * adapter)287 static int guest_alloc_one_irq(struct cxl *adapter)
288 {
289 int irq;
290
291 spin_lock(&adapter->guest->irq_alloc_lock);
292 if (irq_alloc_range(adapter, 1, &irq))
293 irq = -ENOSPC;
294 spin_unlock(&adapter->guest->irq_alloc_lock);
295 return irq;
296 }
297
guest_release_one_irq(struct cxl * adapter,int irq)298 static void guest_release_one_irq(struct cxl *adapter, int irq)
299 {
300 spin_lock(&adapter->guest->irq_alloc_lock);
301 irq_free_range(adapter, irq, 1);
302 spin_unlock(&adapter->guest->irq_alloc_lock);
303 }
304
guest_alloc_irq_ranges(struct cxl_irq_ranges * irqs,struct cxl * adapter,unsigned int num)305 static int guest_alloc_irq_ranges(struct cxl_irq_ranges *irqs,
306 struct cxl *adapter, unsigned int num)
307 {
308 int i, try, irq;
309
310 memset(irqs, 0, sizeof(struct cxl_irq_ranges));
311
312 spin_lock(&adapter->guest->irq_alloc_lock);
313 for (i = 0; i < CXL_IRQ_RANGES && num; i++) {
314 try = num;
315 while (try) {
316 if (irq_alloc_range(adapter, try, &irq) == 0)
317 break;
318 try /= 2;
319 }
320 if (!try)
321 goto error;
322 irqs->offset[i] = irq;
323 irqs->range[i] = try;
324 num -= try;
325 }
326 if (num)
327 goto error;
328 spin_unlock(&adapter->guest->irq_alloc_lock);
329 return 0;
330
331 error:
332 for (i = 0; i < CXL_IRQ_RANGES; i++)
333 irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
334 spin_unlock(&adapter->guest->irq_alloc_lock);
335 return -ENOSPC;
336 }
337
guest_release_irq_ranges(struct cxl_irq_ranges * irqs,struct cxl * adapter)338 static void guest_release_irq_ranges(struct cxl_irq_ranges *irqs,
339 struct cxl *adapter)
340 {
341 int i;
342
343 spin_lock(&adapter->guest->irq_alloc_lock);
344 for (i = 0; i < CXL_IRQ_RANGES; i++)
345 irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
346 spin_unlock(&adapter->guest->irq_alloc_lock);
347 }
348
guest_register_serr_irq(struct cxl_afu * afu)349 static int guest_register_serr_irq(struct cxl_afu *afu)
350 {
351 afu->err_irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
352 dev_name(&afu->dev));
353 if (!afu->err_irq_name)
354 return -ENOMEM;
355
356 if (!(afu->serr_virq = cxl_map_irq(afu->adapter, afu->serr_hwirq,
357 guest_slice_irq_err, afu, afu->err_irq_name))) {
358 kfree(afu->err_irq_name);
359 afu->err_irq_name = NULL;
360 return -ENOMEM;
361 }
362
363 return 0;
364 }
365
guest_release_serr_irq(struct cxl_afu * afu)366 static void guest_release_serr_irq(struct cxl_afu *afu)
367 {
368 cxl_unmap_irq(afu->serr_virq, afu);
369 cxl_ops->release_one_irq(afu->adapter, afu->serr_hwirq);
370 kfree(afu->err_irq_name);
371 }
372
/*
 * Acknowledge a translation fault through the hypervisor.
 *
 * Only the upper 32 bits of @tfc are passed on, and @psl_reset_mask is
 * reduced to a 0/1 flag. Returns the hcall result.
 */
static int guest_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
{
	u64 tfc_hi = tfc >> 32;
	int reset = (psl_reset_mask != 0);

	return cxl_h_control_faults(ctx->afu->guest->handle, ctx->process_token,
				    tfc_hi, reset);
}
378
disable_afu_irqs(struct cxl_context * ctx)379 static void disable_afu_irqs(struct cxl_context *ctx)
380 {
381 irq_hw_number_t hwirq;
382 unsigned int virq;
383 int r, i;
384
385 pr_devel("Disabling AFU(%d) interrupts\n", ctx->afu->slice);
386 for (r = 0; r < CXL_IRQ_RANGES; r++) {
387 hwirq = ctx->irqs.offset[r];
388 for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
389 virq = irq_find_mapping(NULL, hwirq);
390 disable_irq(virq);
391 }
392 }
393 }
394
enable_afu_irqs(struct cxl_context * ctx)395 static void enable_afu_irqs(struct cxl_context *ctx)
396 {
397 irq_hw_number_t hwirq;
398 unsigned int virq;
399 int r, i;
400
401 pr_devel("Enabling AFU(%d) interrupts\n", ctx->afu->slice);
402 for (r = 0; r < CXL_IRQ_RANGES; r++) {
403 hwirq = ctx->irqs.offset[r];
404 for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
405 virq = irq_find_mapping(NULL, hwirq);
406 enable_irq(virq);
407 }
408 }
409 }
410
/*
 * Read @sz bytes from an AFU configuration record through the hypervisor.
 *
 * @sz:     access size in bytes; 1, 2, 4 and 8 are supported
 * @afu:    AFU whose configuration record is read
 * @cr_idx: index of the configuration record
 * @offset: byte offset inside the record
 * @val:    receives the value, zero-extended to 64 bits; multi-byte values
 *          are converted with the in_le16/32/64 accessors
 *
 * The hypervisor fills a zeroed bounce page, from which the value is then
 * extracted.
 *
 * Returns 0 on success, -ENOENT if the record is shorter than @sz, -ERANGE
 * if @offset is past the record, -ENOMEM if no bounce page is available,
 * -EINVAL for an unsupported @sz (after a warning), or the non-zero hcall
 * result. @val is only written on success.
 */
static int _guest_afu_cr_readXX(int sz, struct cxl_afu *afu, int cr_idx,
			u64 offset, u64 *val)
{
	unsigned long cr;
	int rc = 0;

	if (afu->crs_len < sz)
		return -ENOENT;

	if (unlikely(offset >= afu->crs_len))
		return -ERANGE;

	cr = get_zeroed_page(GFP_KERNEL);
	if (!cr)
		return -ENOMEM;

	rc = cxl_h_get_config(afu->guest->handle, cr_idx, offset,
			virt_to_phys((void *)cr), sz);
	if (rc)
		goto err;

	switch (sz) {
	case 1:
		/*
		 * Read through u8 so the result never depends on whether
		 * plain char is signed on this build.
		 */
		*val = *((u8 *) cr);
		break;
	case 2:
		*val = in_le16((u16 *)cr);
		break;
	case 4:
		*val = in_le32((unsigned *)cr);
		break;
	case 8:
		*val = in_le64((u64 *)cr);
		break;
	default:
		/*
		 * Do not report success without having written *val: the
		 * callers would go on to use an uninitialised value.
		 */
		WARN_ON(1);
		rc = -EINVAL;
	}
err:
	free_page(cr);
	return rc;
}
454
/*
 * Read a 32-bit value from an AFU configuration record.
 * @out is written only on success; returns 0 or the error from
 * _guest_afu_cr_readXX().
 */
static int guest_afu_cr_read32(struct cxl_afu *afu, int cr_idx, u64 offset,
			       u32 *out)
{
	u64 raw;
	int rc = _guest_afu_cr_readXX(4, afu, cr_idx, offset, &raw);

	if (rc)
		return rc;

	*out = (u32) raw;
	return 0;
}
466
/*
 * Read a 16-bit value from an AFU configuration record.
 * @out is written only on success; returns 0 or the error from
 * _guest_afu_cr_readXX().
 */
static int guest_afu_cr_read16(struct cxl_afu *afu, int cr_idx, u64 offset,
			       u16 *out)
{
	u64 raw;
	int rc = _guest_afu_cr_readXX(2, afu, cr_idx, offset, &raw);

	if (rc)
		return rc;

	*out = (u16) raw;
	return 0;
}
478
/*
 * Read an 8-bit value from an AFU configuration record.
 * @out is written only on success; returns 0 or the error from
 * _guest_afu_cr_readXX().
 */
static int guest_afu_cr_read8(struct cxl_afu *afu, int cr_idx, u64 offset,
			      u8 *out)
{
	u64 raw;
	int rc = _guest_afu_cr_readXX(1, afu, cr_idx, offset, &raw);

	if (rc)
		return rc;

	*out = (u8) raw;
	return 0;
}
490
/*
 * Read a 64-bit value from an AFU configuration record. The value goes
 * straight into @out; the result of _guest_afu_cr_readXX() is returned.
 */
static int guest_afu_cr_read64(struct cxl_afu *afu, int cr_idx, u64 offset,
			       u64 *out)
{
	int rc = _guest_afu_cr_readXX(8, afu, cr_idx, offset, out);

	return rc;
}
496
/*
 * 32-bit configuration record write: always refused with -EPERM because
 * the config record is not writable from a guest. All arguments are
 * ignored.
 */
static int guest_afu_cr_write32(struct cxl_afu *afu, int cr, u64 off, u32 in)
{
	return -EPERM;
}
502
/*
 * 16-bit configuration record write: always refused with -EPERM because
 * the config record is not writable from a guest. All arguments are
 * ignored.
 */
static int guest_afu_cr_write16(struct cxl_afu *afu, int cr, u64 off, u16 in)
{
	return -EPERM;
}
508
/*
 * 8-bit configuration record write: always refused with -EPERM because
 * the config record is not writable from a guest. All arguments are
 * ignored.
 */
static int guest_afu_cr_write8(struct cxl_afu *afu, int cr, u64 off, u8 in)
{
	return -EPERM;
}
514
/*
 * Attach a context to an AFU running in directed mode.
 *
 * A process element is built in a zeroed page, filled with the context's
 * flags, segment table pointers and interrupt description, and handed to
 * the hypervisor with cxl_h_attach_process(). On H_SUCCESS the context's
 * problem state area, external PE number and pe_inserted flag are set and
 * the context's AFU interrupts are enabled again.
 *
 * @ctx: context to attach; ctx->kernel selects kernel or user-process flags
 * @wed: value stored in the element's wed field (also used for prefaulting)
 * @amr: value stored in the element's amr field
 *
 * Returns -ENOMEM if the element page cannot be allocated, the error from
 * afu_register_irqs() if the fallback interrupt cannot be set up, otherwise
 * the result of cxl_h_attach_process(). Note that when the hcall fails the
 * interrupts disabled just before it are left disabled.
 */
static int attach_afu_directed(struct cxl_context *ctx, u64 wed, u64 amr)
{
	struct cxl_process_element_hcall *elem;
	struct cxl *adapter = ctx->afu->adapter;
	const struct cred *cred;
	u32 pid, idx;
	int rc, r, i;
	u64 mmio_addr, mmio_size;
	/*
	 * Accumulated in CPU byte order and converted once with
	 * cpu_to_be64() below, so this must not carry a __be64 annotation.
	 */
	u64 flags = 0;

	/* Must be 8 byte aligned and cannot cross a 4096 byte boundary */
	if (!(elem = (struct cxl_process_element_hcall *)
			get_zeroed_page(GFP_KERNEL)))
		return -ENOMEM;

	elem->version = cpu_to_be64(CXL_PROCESS_ELEMENT_VERSION);
	if (ctx->kernel) {
		pid = 0;
		flags |= CXL_PE_TRANSLATION_ENABLED;
		flags |= CXL_PE_PRIVILEGED_PROCESS;
		if (mfmsr() & MSR_SF)
			flags |= CXL_PE_64_BIT;
	} else {
		pid = current->pid;
		flags |= CXL_PE_PROBLEM_STATE;
		flags |= CXL_PE_TRANSLATION_ENABLED;
		if (!test_tsk_thread_flag(current, TIF_32BIT))
			flags |= CXL_PE_64_BIT;
		/* A process running as root is flagged as privileged. */
		cred = get_current_cred();
		if (uid_eq(cred->euid, GLOBAL_ROOT_UID))
			flags |= CXL_PE_PRIVILEGED_PROCESS;
		put_cred(cred);
	}
	elem->flags = cpu_to_be64(flags);
	elem->common.tid = cpu_to_be32(0); /* Unused */
	elem->common.pid = cpu_to_be32(pid);
	elem->common.csrp = cpu_to_be64(0); /* disable */
	elem->common.u.psl8.aurp0 = cpu_to_be64(0); /* disable */
	elem->common.u.psl8.aurp1 = cpu_to_be64(0); /* disable */

	cxl_prefault(ctx, wed);

	elem->common.u.psl8.sstp0 = cpu_to_be64(ctx->sstp0);
	elem->common.u.psl8.sstp1 = cpu_to_be64(ctx->sstp1);

	/*
	 * Ensure we have at least one interrupt allocated to take faults for
	 * kernel contexts that may not have allocated any AFU IRQs at all:
	 */
	if (ctx->irqs.range[0] == 0) {
		rc = afu_register_irqs(ctx, 0);
		if (rc)
			goto out_free;
	}

	/*
	 * The very first interrupt becomes the PSL interrupt; every other
	 * one is flagged in the application interrupt bitmap, indexed
	 * relative to the adapter's interrupt base, MSB first in each byte.
	 */
	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		for (i = 0; i < ctx->irqs.range[r]; i++) {
			if (r == 0 && i == 0) {
				elem->pslVirtualIsn = cpu_to_be32(ctx->irqs.offset[0]);
			} else {
				idx = ctx->irqs.offset[r] + i - adapter->guest->irq_base_offset;
				elem->applicationVirtualIsnBitmap[idx / 8] |= 0x80 >> (idx % 8);
			}
		}
	}
	elem->common.amr = cpu_to_be64(amr);
	elem->common.wed = cpu_to_be64(wed);

	disable_afu_irqs(ctx);

	rc = cxl_h_attach_process(ctx->afu->guest->handle, elem,
				&ctx->process_token, &mmio_addr, &mmio_size);
	if (rc == H_SUCCESS) {
		if (ctx->master || !ctx->afu->pp_psa) {
			ctx->psn_phys = ctx->afu->psn_phys;
			ctx->psn_size = ctx->afu->adapter->ps_size;
		} else {
			ctx->psn_phys = mmio_addr;
			ctx->psn_size = mmio_size;
		}
		if (ctx->afu->pp_psa && mmio_size &&
			ctx->afu->pp_size == 0) {
			/*
			 * There's no property in the device tree to read the
			 * pp_size. We only find out at the 1st attach.
			 * Compared to bare-metal, it is too late and we
			 * should really lock here. However, on powerVM,
			 * pp_size is really only used to display in /sys.
			 * Being discussed with pHyp for their next release.
			 */
			ctx->afu->pp_size = mmio_size;
		}
		/* from PAPR: process element is bytes 4-7 of process token */
		ctx->external_pe = ctx->process_token & 0xFFFFFFFF;
		pr_devel("CXL pe=%i is known as %i for pHyp, mmio_size=%#llx\n",
			ctx->pe, ctx->external_pe, ctx->psn_size);
		ctx->pe_inserted = true;
		enable_afu_irqs(ctx);
	}

out_free:
	free_page((u64)elem);
	return rc;
}
619
/*
 * Backend attach hook: record whether this is a kernel context and attach
 * it. Only directed mode is handled; any other AFU mode yields -EINVAL.
 */
static int guest_attach_process(struct cxl_context *ctx, bool kernel, u64 wed, u64 amr)
{
	pr_devel("in %s\n", __func__);

	ctx->kernel = kernel;

	if (ctx->afu->current_mode != CXL_MODE_DIRECTED) {
		/* dedicated mode not supported on FW840 */
		return -EINVAL;
	}

	return attach_afu_directed(ctx, wed, amr);
}
632
detach_afu_directed(struct cxl_context * ctx)633 static int detach_afu_directed(struct cxl_context *ctx)
634 {
635 if (!ctx->pe_inserted)
636 return 0;
637 if (cxl_h_detach_process(ctx->afu->guest->handle, ctx->process_token))
638 return -1;
639 return 0;
640 }
641
guest_detach_process(struct cxl_context * ctx)642 static int guest_detach_process(struct cxl_context *ctx)
643 {
644 pr_devel("in %s\n", __func__);
645 trace_cxl_detach(ctx);
646
647 if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
648 return -EIO;
649
650 if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
651 return detach_afu_directed(ctx);
652
653 return -EINVAL;
654 }
655
guest_release_afu(struct device * dev)656 static void guest_release_afu(struct device *dev)
657 {
658 struct cxl_afu *afu = to_cxl_afu(dev);
659
660 pr_devel("%s\n", __func__);
661
662 idr_destroy(&afu->contexts_idr);
663
664 kfree(afu->guest);
665 kfree(afu);
666 }
667
cxl_guest_read_afu_vpd(struct cxl_afu * afu,void * buf,size_t len)668 ssize_t cxl_guest_read_afu_vpd(struct cxl_afu *afu, void *buf, size_t len)
669 {
670 return guest_collect_vpd(NULL, afu, buf, len);
671 }
672
673 #define ERR_BUFF_MAX_COPY_SIZE PAGE_SIZE
guest_afu_read_err_buffer(struct cxl_afu * afu,char * buf,loff_t off,size_t count)674 static ssize_t guest_afu_read_err_buffer(struct cxl_afu *afu, char *buf,
675 loff_t off, size_t count)
676 {
677 void *tbuf = NULL;
678 int rc = 0;
679
680 tbuf = (void *) get_zeroed_page(GFP_KERNEL);
681 if (!tbuf)
682 return -ENOMEM;
683
684 rc = cxl_h_get_afu_err(afu->guest->handle,
685 off & 0x7,
686 virt_to_phys(tbuf),
687 count);
688 if (rc)
689 goto err;
690
691 if (count > ERR_BUFF_MAX_COPY_SIZE)
692 count = ERR_BUFF_MAX_COPY_SIZE - (off & 0x7);
693 memcpy(buf, tbuf, count);
694 err:
695 free_page((u64)tbuf);
696
697 return rc;
698 }
699
/*
 * Backend "check and enable" hook. The guest backend does nothing here:
 * @afu is ignored and 0 is always returned.
 */
static int guest_afu_check_and_enable(struct cxl_afu *afu)
{
	return 0;
}
704
guest_support_attributes(const char * attr_name,enum cxl_attrs type)705 static bool guest_support_attributes(const char *attr_name,
706 enum cxl_attrs type)
707 {
708 switch (type) {
709 case CXL_ADAPTER_ATTRS:
710 if ((strcmp(attr_name, "base_image") == 0) ||
711 (strcmp(attr_name, "load_image_on_perst") == 0) ||
712 (strcmp(attr_name, "perst_reloads_same_image") == 0) ||
713 (strcmp(attr_name, "image_loaded") == 0))
714 return false;
715 break;
716 case CXL_AFU_MASTER_ATTRS:
717 if ((strcmp(attr_name, "pp_mmio_off") == 0))
718 return false;
719 break;
720 case CXL_AFU_ATTRS:
721 break;
722 default:
723 break;
724 }
725
726 return true;
727 }
728
activate_afu_directed(struct cxl_afu * afu)729 static int activate_afu_directed(struct cxl_afu *afu)
730 {
731 int rc;
732
733 dev_info(&afu->dev, "Activating AFU(%d) directed mode\n", afu->slice);
734
735 afu->current_mode = CXL_MODE_DIRECTED;
736
737 afu->num_procs = afu->max_procs_virtualised;
738
739 if ((rc = cxl_chardev_m_afu_add(afu)))
740 return rc;
741
742 if ((rc = cxl_sysfs_afu_m_add(afu)))
743 goto err;
744
745 if ((rc = cxl_chardev_s_afu_add(afu)))
746 goto err1;
747
748 return 0;
749 err1:
750 cxl_sysfs_afu_m_remove(afu);
751 err:
752 cxl_chardev_afu_remove(afu);
753 return rc;
754 }
755
guest_afu_activate_mode(struct cxl_afu * afu,int mode)756 static int guest_afu_activate_mode(struct cxl_afu *afu, int mode)
757 {
758 if (!mode)
759 return 0;
760 if (!(mode & afu->modes_supported))
761 return -EINVAL;
762
763 if (mode == CXL_MODE_DIRECTED)
764 return activate_afu_directed(afu);
765
766 if (mode == CXL_MODE_DEDICATED)
767 dev_err(&afu->dev, "Dedicated mode not supported\n");
768
769 return -EINVAL;
770 }
771
deactivate_afu_directed(struct cxl_afu * afu)772 static int deactivate_afu_directed(struct cxl_afu *afu)
773 {
774 dev_info(&afu->dev, "Deactivating AFU(%d) directed mode\n", afu->slice);
775
776 afu->current_mode = 0;
777 afu->num_procs = 0;
778
779 cxl_sysfs_afu_m_remove(afu);
780 cxl_chardev_afu_remove(afu);
781
782 cxl_ops->afu_reset(afu);
783
784 return 0;
785 }
786
guest_afu_deactivate_mode(struct cxl_afu * afu,int mode)787 static int guest_afu_deactivate_mode(struct cxl_afu *afu, int mode)
788 {
789 if (!mode)
790 return 0;
791 if (!(mode & afu->modes_supported))
792 return -EINVAL;
793
794 if (mode == CXL_MODE_DIRECTED)
795 return deactivate_afu_directed(afu);
796 return 0;
797 }
798
guest_afu_reset(struct cxl_afu * afu)799 static int guest_afu_reset(struct cxl_afu *afu)
800 {
801 pr_devel("AFU(%d) reset request\n", afu->slice);
802 return cxl_h_reset_afu(afu->guest->handle);
803 }
804
guest_map_slice_regs(struct cxl_afu * afu)805 static int guest_map_slice_regs(struct cxl_afu *afu)
806 {
807 if (!(afu->p2n_mmio = ioremap(afu->guest->p2n_phys, afu->guest->p2n_size))) {
808 dev_err(&afu->dev, "Error mapping AFU(%d) MMIO regions\n",
809 afu->slice);
810 return -ENOMEM;
811 }
812 return 0;
813 }
814
guest_unmap_slice_regs(struct cxl_afu * afu)815 static void guest_unmap_slice_regs(struct cxl_afu *afu)
816 {
817 if (afu->p2n_mmio)
818 iounmap(afu->p2n_mmio);
819 }
820
afu_update_state(struct cxl_afu * afu)821 static int afu_update_state(struct cxl_afu *afu)
822 {
823 int rc, cur_state;
824
825 rc = afu_read_error_state(afu, &cur_state);
826 if (rc)
827 return rc;
828
829 if (afu->guest->previous_state == cur_state)
830 return 0;
831
832 pr_devel("AFU(%d) update state to %#x\n", afu->slice, cur_state);
833
834 switch (cur_state) {
835 case H_STATE_NORMAL:
836 afu->guest->previous_state = cur_state;
837 break;
838
839 case H_STATE_DISABLE:
840 pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
841 pci_channel_io_frozen);
842
843 cxl_context_detach_all(afu);
844 if ((rc = cxl_ops->afu_reset(afu)))
845 pr_devel("reset hcall failed %d\n", rc);
846
847 rc = afu_read_error_state(afu, &cur_state);
848 if (!rc && cur_state == H_STATE_NORMAL) {
849 pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
850 pci_channel_io_normal);
851 pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
852 }
853 afu->guest->previous_state = 0;
854 break;
855
856 case H_STATE_TEMP_UNAVAILABLE:
857 afu->guest->previous_state = cur_state;
858 break;
859
860 case H_STATE_PERM_UNAVAILABLE:
861 dev_err(&afu->dev, "AFU is in permanent error state\n");
862 pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
863 pci_channel_io_perm_failure);
864 afu->guest->previous_state = cur_state;
865 break;
866
867 default:
868 pr_err("Unexpected AFU(%d) error state: %#x\n",
869 afu->slice, cur_state);
870 return -EINVAL;
871 }
872
873 return rc;
874 }
875
afu_handle_errstate(struct work_struct * work)876 static void afu_handle_errstate(struct work_struct *work)
877 {
878 struct cxl_afu_guest *afu_guest =
879 container_of(to_delayed_work(work), struct cxl_afu_guest, work_err);
880
881 if (!afu_update_state(afu_guest->parent) &&
882 afu_guest->previous_state == H_STATE_PERM_UNAVAILABLE)
883 return;
884
885 if (afu_guest->handle_err)
886 schedule_delayed_work(&afu_guest->work_err,
887 msecs_to_jiffies(3000));
888 }
889
guest_link_ok(struct cxl * cxl,struct cxl_afu * afu)890 static bool guest_link_ok(struct cxl *cxl, struct cxl_afu *afu)
891 {
892 int state;
893
894 if (afu && (!afu_read_error_state(afu, &state))) {
895 if (state == H_STATE_NORMAL)
896 return true;
897 }
898
899 return false;
900 }
901
afu_properties_look_ok(struct cxl_afu * afu)902 static int afu_properties_look_ok(struct cxl_afu *afu)
903 {
904 if (afu->pp_irqs < 0) {
905 dev_err(&afu->dev, "Unexpected per-process minimum interrupt value\n");
906 return -EINVAL;
907 }
908
909 if (afu->max_procs_virtualised < 1) {
910 dev_err(&afu->dev, "Unexpected max number of processes virtualised value\n");
911 return -EINVAL;
912 }
913
914 return 0;
915 }
916
cxl_guest_init_afu(struct cxl * adapter,int slice,struct device_node * afu_np)917 int cxl_guest_init_afu(struct cxl *adapter, int slice, struct device_node *afu_np)
918 {
919 struct cxl_afu *afu;
920 bool free = true;
921 int rc;
922
923 pr_devel("in %s - AFU(%d)\n", __func__, slice);
924 if (!(afu = cxl_alloc_afu(adapter, slice)))
925 return -ENOMEM;
926
927 if (!(afu->guest = kzalloc(sizeof(struct cxl_afu_guest), GFP_KERNEL))) {
928 kfree(afu);
929 return -ENOMEM;
930 }
931
932 if ((rc = dev_set_name(&afu->dev, "afu%i.%i",
933 adapter->adapter_num,
934 slice)))
935 goto err1;
936
937 adapter->slices++;
938
939 if ((rc = cxl_of_read_afu_handle(afu, afu_np)))
940 goto err1;
941
942 if ((rc = cxl_ops->afu_reset(afu)))
943 goto err1;
944
945 if ((rc = cxl_of_read_afu_properties(afu, afu_np)))
946 goto err1;
947
948 if ((rc = afu_properties_look_ok(afu)))
949 goto err1;
950
951 if ((rc = guest_map_slice_regs(afu)))
952 goto err1;
953
954 if ((rc = guest_register_serr_irq(afu)))
955 goto err2;
956
957 /*
958 * After we call this function we must not free the afu directly, even
959 * if it returns an error!
960 */
961 if ((rc = cxl_register_afu(afu)))
962 goto err_put_dev;
963
964 if ((rc = cxl_sysfs_afu_add(afu)))
965 goto err_del_dev;
966
967 /*
968 * pHyp doesn't expose the programming models supported by the
969 * AFU. pHyp currently only supports directed mode. If it adds
970 * dedicated mode later, this version of cxl has no way to
971 * detect it. So we'll initialize the driver, but the first
972 * attach will fail.
973 * Being discussed with pHyp to do better (likely new property)
974 */
975 if (afu->max_procs_virtualised == 1)
976 afu->modes_supported = CXL_MODE_DEDICATED;
977 else
978 afu->modes_supported = CXL_MODE_DIRECTED;
979
980 if ((rc = cxl_afu_select_best_mode(afu)))
981 goto err_remove_sysfs;
982
983 adapter->afu[afu->slice] = afu;
984
985 afu->enabled = true;
986
987 /*
988 * wake up the cpu periodically to check the state
989 * of the AFU using "afu" stored in the guest structure.
990 */
991 afu->guest->parent = afu;
992 afu->guest->handle_err = true;
993 INIT_DELAYED_WORK(&afu->guest->work_err, afu_handle_errstate);
994 schedule_delayed_work(&afu->guest->work_err, msecs_to_jiffies(1000));
995
996 if ((rc = cxl_pci_vphb_add(afu)))
997 dev_info(&afu->dev, "Can't register vPHB\n");
998
999 return 0;
1000
1001 err_remove_sysfs:
1002 cxl_sysfs_afu_remove(afu);
1003 err_del_dev:
1004 device_del(&afu->dev);
1005 err_put_dev:
1006 put_device(&afu->dev);
1007 free = false;
1008 guest_release_serr_irq(afu);
1009 err2:
1010 guest_unmap_slice_regs(afu);
1011 err1:
1012 if (free) {
1013 kfree(afu->guest);
1014 kfree(afu);
1015 }
1016 return rc;
1017 }
1018
cxl_guest_remove_afu(struct cxl_afu * afu)1019 void cxl_guest_remove_afu(struct cxl_afu *afu)
1020 {
1021 if (!afu)
1022 return;
1023
1024 /* flush and stop pending job */
1025 afu->guest->handle_err = false;
1026 flush_delayed_work(&afu->guest->work_err);
1027
1028 cxl_pci_vphb_remove(afu);
1029 cxl_sysfs_afu_remove(afu);
1030
1031 spin_lock(&afu->adapter->afu_list_lock);
1032 afu->adapter->afu[afu->slice] = NULL;
1033 spin_unlock(&afu->adapter->afu_list_lock);
1034
1035 cxl_context_detach_all(afu);
1036 cxl_ops->afu_deactivate_mode(afu, afu->current_mode);
1037 guest_release_serr_irq(afu);
1038 guest_unmap_slice_regs(afu);
1039
1040 device_unregister(&afu->dev);
1041 }
1042
free_adapter(struct cxl * adapter)1043 static void free_adapter(struct cxl *adapter)
1044 {
1045 struct irq_avail *cur;
1046 int i;
1047
1048 if (adapter->guest) {
1049 if (adapter->guest->irq_avail) {
1050 for (i = 0; i < adapter->guest->irq_nranges; i++) {
1051 cur = &adapter->guest->irq_avail[i];
1052 kfree(cur->bitmap);
1053 }
1054 kfree(adapter->guest->irq_avail);
1055 }
1056 kfree(adapter->guest->status);
1057 kfree(adapter->guest);
1058 }
1059 cxl_remove_adapter_nr(adapter);
1060 kfree(adapter);
1061 }
1062
properties_look_ok(struct cxl * adapter)1063 static int properties_look_ok(struct cxl *adapter)
1064 {
1065 /* The absence of this property means that the operational
1066 * status is unknown or okay
1067 */
1068 if (strlen(adapter->guest->status) &&
1069 strcmp(adapter->guest->status, "okay")) {
1070 pr_err("ABORTING:Bad operational status of the device\n");
1071 return -EINVAL;
1072 }
1073
1074 return 0;
1075 }
1076
cxl_guest_read_adapter_vpd(struct cxl * adapter,void * buf,size_t len)1077 ssize_t cxl_guest_read_adapter_vpd(struct cxl *adapter, void *buf, size_t len)
1078 {
1079 return guest_collect_vpd(adapter, NULL, buf, len);
1080 }
1081
cxl_guest_remove_adapter(struct cxl * adapter)1082 void cxl_guest_remove_adapter(struct cxl *adapter)
1083 {
1084 pr_devel("in %s\n", __func__);
1085
1086 cxl_sysfs_adapter_remove(adapter);
1087
1088 cxl_guest_remove_chardev(adapter);
1089 device_unregister(&adapter->dev);
1090 }
1091
/*
 * Device release callback for a guest adapter: frees the adapter that
 * embeds @dev.
 */
static void release_adapter(struct device *dev)
{
	struct cxl *adapter = to_cxl_adapter(dev);

	free_adapter(adapter);
}
1096
cxl_guest_init_adapter(struct device_node * np,struct platform_device * pdev)1097 struct cxl *cxl_guest_init_adapter(struct device_node *np, struct platform_device *pdev)
1098 {
1099 struct cxl *adapter;
1100 bool free = true;
1101 int rc;
1102
1103 if (!(adapter = cxl_alloc_adapter()))
1104 return ERR_PTR(-ENOMEM);
1105
1106 if (!(adapter->guest = kzalloc(sizeof(struct cxl_guest), GFP_KERNEL))) {
1107 free_adapter(adapter);
1108 return ERR_PTR(-ENOMEM);
1109 }
1110
1111 adapter->slices = 0;
1112 adapter->guest->pdev = pdev;
1113 adapter->dev.parent = &pdev->dev;
1114 adapter->dev.release = release_adapter;
1115 dev_set_drvdata(&pdev->dev, adapter);
1116
1117 /*
1118 * Hypervisor controls PSL timebase initialization (p1 register).
1119 * On FW840, PSL is initialized.
1120 */
1121 adapter->psl_timebase_synced = true;
1122
1123 if ((rc = cxl_of_read_adapter_handle(adapter, np)))
1124 goto err1;
1125
1126 if ((rc = cxl_of_read_adapter_properties(adapter, np)))
1127 goto err1;
1128
1129 if ((rc = properties_look_ok(adapter)))
1130 goto err1;
1131
1132 if ((rc = cxl_guest_add_chardev(adapter)))
1133 goto err1;
1134
1135 /*
1136 * After we call this function we must not free the adapter directly,
1137 * even if it returns an error!
1138 */
1139 if ((rc = cxl_register_adapter(adapter)))
1140 goto err_put_dev;
1141
1142 if ((rc = cxl_sysfs_adapter_add(adapter)))
1143 goto err_del_dev;
1144
1145 /* release the context lock as the adapter is configured */
1146 cxl_adapter_context_unlock(adapter);
1147
1148 return adapter;
1149
1150 err_del_dev:
1151 device_del(&adapter->dev);
1152 err_put_dev:
1153 put_device(&adapter->dev);
1154 free = false;
1155 cxl_guest_remove_chardev(adapter);
1156 err1:
1157 if (free)
1158 free_adapter(adapter);
1159 return ERR_PTR(rc);
1160 }
1161
cxl_guest_reload_module(struct cxl * adapter)1162 void cxl_guest_reload_module(struct cxl *adapter)
1163 {
1164 struct platform_device *pdev;
1165
1166 pdev = adapter->guest->pdev;
1167 cxl_guest_remove_adapter(adapter);
1168
1169 cxl_of_probe(pdev);
1170 }
1171
1172 const struct cxl_backend_ops cxl_guest_ops = {
1173 .module = THIS_MODULE,
1174 .adapter_reset = guest_reset,
1175 .alloc_one_irq = guest_alloc_one_irq,
1176 .release_one_irq = guest_release_one_irq,
1177 .alloc_irq_ranges = guest_alloc_irq_ranges,
1178 .release_irq_ranges = guest_release_irq_ranges,
1179 .setup_irq = NULL,
1180 .handle_psl_slice_error = guest_handle_psl_slice_error,
1181 .psl_interrupt = guest_psl_irq,
1182 .ack_irq = guest_ack_irq,
1183 .attach_process = guest_attach_process,
1184 .detach_process = guest_detach_process,
1185 .update_ivtes = NULL,
1186 .support_attributes = guest_support_attributes,
1187 .link_ok = guest_link_ok,
1188 .release_afu = guest_release_afu,
1189 .afu_read_err_buffer = guest_afu_read_err_buffer,
1190 .afu_check_and_enable = guest_afu_check_and_enable,
1191 .afu_activate_mode = guest_afu_activate_mode,
1192 .afu_deactivate_mode = guest_afu_deactivate_mode,
1193 .afu_reset = guest_afu_reset,
1194 .afu_cr_read8 = guest_afu_cr_read8,
1195 .afu_cr_read16 = guest_afu_cr_read16,
1196 .afu_cr_read32 = guest_afu_cr_read32,
1197 .afu_cr_read64 = guest_afu_cr_read64,
1198 .afu_cr_write8 = guest_afu_cr_write8,
1199 .afu_cr_write16 = guest_afu_cr_write16,
1200 .afu_cr_write32 = guest_afu_cr_write32,
1201 .read_adapter_vpd = cxl_guest_read_adapter_vpd,
1202 };
1203