xref: /kernel/linux/linux-5.10/drivers/misc/cxl/guest.c (revision 8c2ecf20)
1// SPDX-License-Identifier: GPL-2.0-or-later
2/*
3 * Copyright 2015 IBM Corp.
4 */
5
6#include <linux/spinlock.h>
7#include <linux/uaccess.h>
8#include <linux/delay.h>
9
10#include "cxl.h"
11#include "hcalls.h"
12#include "trace.h"
13
14#define CXL_ERROR_DETECTED_EVENT	1
15#define CXL_SLOT_RESET_EVENT		2
16#define CXL_RESUME_EVENT		3
17
18static void pci_error_handlers(struct cxl_afu *afu,
19				int bus_error_event,
20				pci_channel_state_t state)
21{
22	struct pci_dev *afu_dev;
23
24	if (afu->phb == NULL)
25		return;
26
27	list_for_each_entry(afu_dev, &afu->phb->bus->devices, bus_list) {
28		if (!afu_dev->driver)
29			continue;
30
31		switch (bus_error_event) {
32		case CXL_ERROR_DETECTED_EVENT:
33			afu_dev->error_state = state;
34
35			if (afu_dev->driver->err_handler &&
36			    afu_dev->driver->err_handler->error_detected)
37				afu_dev->driver->err_handler->error_detected(afu_dev, state);
38		break;
39		case CXL_SLOT_RESET_EVENT:
40			afu_dev->error_state = state;
41
42			if (afu_dev->driver->err_handler &&
43			    afu_dev->driver->err_handler->slot_reset)
44				afu_dev->driver->err_handler->slot_reset(afu_dev);
45		break;
46		case CXL_RESUME_EVENT:
47			if (afu_dev->driver->err_handler &&
48			    afu_dev->driver->err_handler->resume)
49				afu_dev->driver->err_handler->resume(afu_dev);
50		break;
51		}
52	}
53}
54
55static irqreturn_t guest_handle_psl_slice_error(struct cxl_context *ctx, u64 dsisr,
56					u64 errstat)
57{
58	pr_devel("in %s\n", __func__);
59	dev_crit(&ctx->afu->dev, "PSL ERROR STATUS: 0x%.16llx\n", errstat);
60
61	return cxl_ops->ack_irq(ctx, 0, errstat);
62}
63
64static ssize_t guest_collect_vpd(struct cxl *adapter, struct cxl_afu *afu,
65			void *buf, size_t len)
66{
67	unsigned int entries, mod;
68	unsigned long **vpd_buf = NULL;
69	struct sg_list *le;
70	int rc = 0, i, tocopy;
71	u64 out = 0;
72
73	if (buf == NULL)
74		return -EINVAL;
75
76	/* number of entries in the list */
77	entries = len / SG_BUFFER_SIZE;
78	mod = len % SG_BUFFER_SIZE;
79	if (mod)
80		entries++;
81
82	if (entries > SG_MAX_ENTRIES) {
83		entries = SG_MAX_ENTRIES;
84		len = SG_MAX_ENTRIES * SG_BUFFER_SIZE;
85		mod = 0;
86	}
87
88	vpd_buf = kcalloc(entries, sizeof(unsigned long *), GFP_KERNEL);
89	if (!vpd_buf)
90		return -ENOMEM;
91
92	le = (struct sg_list *)get_zeroed_page(GFP_KERNEL);
93	if (!le) {
94		rc = -ENOMEM;
95		goto err1;
96	}
97
98	for (i = 0; i < entries; i++) {
99		vpd_buf[i] = (unsigned long *)get_zeroed_page(GFP_KERNEL);
100		if (!vpd_buf[i]) {
101			rc = -ENOMEM;
102			goto err2;
103		}
104		le[i].phys_addr = cpu_to_be64(virt_to_phys(vpd_buf[i]));
105		le[i].len = cpu_to_be64(SG_BUFFER_SIZE);
106		if ((i == (entries - 1)) && mod)
107			le[i].len = cpu_to_be64(mod);
108	}
109
110	if (adapter)
111		rc = cxl_h_collect_vpd_adapter(adapter->guest->handle,
112					virt_to_phys(le), entries, &out);
113	else
114		rc = cxl_h_collect_vpd(afu->guest->handle, 0,
115				virt_to_phys(le), entries, &out);
116	pr_devel("length of available (entries: %i), vpd: %#llx\n",
117		entries, out);
118
119	if (!rc) {
120		/*
121		 * hcall returns in 'out' the size of available VPDs.
122		 * It fills the buffer with as much data as possible.
123		 */
124		if (out < len)
125			len = out;
126		rc = len;
127		if (out) {
128			for (i = 0; i < entries; i++) {
129				if (len < SG_BUFFER_SIZE)
130					tocopy = len;
131				else
132					tocopy = SG_BUFFER_SIZE;
133				memcpy(buf, vpd_buf[i], tocopy);
134				buf += tocopy;
135				len -= tocopy;
136			}
137		}
138	}
139err2:
140	for (i = 0; i < entries; i++) {
141		if (vpd_buf[i])
142			free_page((unsigned long) vpd_buf[i]);
143	}
144	free_page((unsigned long) le);
145err1:
146	kfree(vpd_buf);
147	return rc;
148}
149
150static int guest_get_irq_info(struct cxl_context *ctx, struct cxl_irq_info *info)
151{
152	return cxl_h_collect_int_info(ctx->afu->guest->handle, ctx->process_token, info);
153}
154
155static irqreturn_t guest_psl_irq(int irq, void *data)
156{
157	struct cxl_context *ctx = data;
158	struct cxl_irq_info irq_info;
159	int rc;
160
161	pr_devel("%d: received PSL interrupt %i\n", ctx->pe, irq);
162	rc = guest_get_irq_info(ctx, &irq_info);
163	if (rc) {
164		WARN(1, "Unable to get IRQ info: %i\n", rc);
165		return IRQ_HANDLED;
166	}
167
168	rc = cxl_irq_psl8(irq, ctx, &irq_info);
169	return rc;
170}
171
172static int afu_read_error_state(struct cxl_afu *afu, int *state_out)
173{
174	u64 state;
175	int rc = 0;
176
177	if (!afu)
178		return -EIO;
179
180	rc = cxl_h_read_error_state(afu->guest->handle, &state);
181	if (!rc) {
182		WARN_ON(state != H_STATE_NORMAL &&
183			state != H_STATE_DISABLE &&
184			state != H_STATE_TEMP_UNAVAILABLE &&
185			state != H_STATE_PERM_UNAVAILABLE);
186		*state_out = state & 0xffffffff;
187	}
188	return rc;
189}
190
191static irqreturn_t guest_slice_irq_err(int irq, void *data)
192{
193	struct cxl_afu *afu = data;
194	int rc;
195	u64 serr, afu_error, dsisr;
196
197	rc = cxl_h_get_fn_error_interrupt(afu->guest->handle, &serr);
198	if (rc) {
199		dev_crit(&afu->dev, "Couldn't read PSL_SERR_An: %d\n", rc);
200		return IRQ_HANDLED;
201	}
202	afu_error = cxl_p2n_read(afu, CXL_AFU_ERR_An);
203	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
204	cxl_afu_decode_psl_serr(afu, serr);
205	dev_crit(&afu->dev, "AFU_ERR_An: 0x%.16llx\n", afu_error);
206	dev_crit(&afu->dev, "PSL_DSISR_An: 0x%.16llx\n", dsisr);
207
208	rc = cxl_h_ack_fn_error_interrupt(afu->guest->handle, serr);
209	if (rc)
210		dev_crit(&afu->dev, "Couldn't ack slice error interrupt: %d\n",
211			rc);
212
213	return IRQ_HANDLED;
214}
215
216
217static int irq_alloc_range(struct cxl *adapter, int len, int *irq)
218{
219	int i, n;
220	struct irq_avail *cur;
221
222	for (i = 0; i < adapter->guest->irq_nranges; i++) {
223		cur = &adapter->guest->irq_avail[i];
224		n = bitmap_find_next_zero_area(cur->bitmap, cur->range,
225					0, len, 0);
226		if (n < cur->range) {
227			bitmap_set(cur->bitmap, n, len);
228			*irq = cur->offset + n;
229			pr_devel("guest: allocate IRQs %#x->%#x\n",
230				*irq, *irq + len - 1);
231
232			return 0;
233		}
234	}
235	return -ENOSPC;
236}
237
238static int irq_free_range(struct cxl *adapter, int irq, int len)
239{
240	int i, n;
241	struct irq_avail *cur;
242
243	if (len == 0)
244		return -ENOENT;
245
246	for (i = 0; i < adapter->guest->irq_nranges; i++) {
247		cur = &adapter->guest->irq_avail[i];
248		if (irq >= cur->offset &&
249			(irq + len) <= (cur->offset + cur->range)) {
250			n = irq - cur->offset;
251			bitmap_clear(cur->bitmap, n, len);
252			pr_devel("guest: release IRQs %#x->%#x\n",
253				irq, irq + len - 1);
254			return 0;
255		}
256	}
257	return -ENOENT;
258}
259
260static int guest_reset(struct cxl *adapter)
261{
262	struct cxl_afu *afu = NULL;
263	int i, rc;
264
265	pr_devel("Adapter reset request\n");
266	spin_lock(&adapter->afu_list_lock);
267	for (i = 0; i < adapter->slices; i++) {
268		if ((afu = adapter->afu[i])) {
269			pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
270					pci_channel_io_frozen);
271			cxl_context_detach_all(afu);
272		}
273	}
274
275	rc = cxl_h_reset_adapter(adapter->guest->handle);
276	for (i = 0; i < adapter->slices; i++) {
277		if (!rc && (afu = adapter->afu[i])) {
278			pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
279					pci_channel_io_normal);
280			pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
281		}
282	}
283	spin_unlock(&adapter->afu_list_lock);
284	return rc;
285}
286
287static int guest_alloc_one_irq(struct cxl *adapter)
288{
289	int irq;
290
291	spin_lock(&adapter->guest->irq_alloc_lock);
292	if (irq_alloc_range(adapter, 1, &irq))
293		irq = -ENOSPC;
294	spin_unlock(&adapter->guest->irq_alloc_lock);
295	return irq;
296}
297
298static void guest_release_one_irq(struct cxl *adapter, int irq)
299{
300	spin_lock(&adapter->guest->irq_alloc_lock);
301	irq_free_range(adapter, irq, 1);
302	spin_unlock(&adapter->guest->irq_alloc_lock);
303}
304
305static int guest_alloc_irq_ranges(struct cxl_irq_ranges *irqs,
306				struct cxl *adapter, unsigned int num)
307{
308	int i, try, irq;
309
310	memset(irqs, 0, sizeof(struct cxl_irq_ranges));
311
312	spin_lock(&adapter->guest->irq_alloc_lock);
313	for (i = 0; i < CXL_IRQ_RANGES && num; i++) {
314		try = num;
315		while (try) {
316			if (irq_alloc_range(adapter, try, &irq) == 0)
317				break;
318			try /= 2;
319		}
320		if (!try)
321			goto error;
322		irqs->offset[i] = irq;
323		irqs->range[i] = try;
324		num -= try;
325	}
326	if (num)
327		goto error;
328	spin_unlock(&adapter->guest->irq_alloc_lock);
329	return 0;
330
331error:
332	for (i = 0; i < CXL_IRQ_RANGES; i++)
333		irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
334	spin_unlock(&adapter->guest->irq_alloc_lock);
335	return -ENOSPC;
336}
337
338static void guest_release_irq_ranges(struct cxl_irq_ranges *irqs,
339				struct cxl *adapter)
340{
341	int i;
342
343	spin_lock(&adapter->guest->irq_alloc_lock);
344	for (i = 0; i < CXL_IRQ_RANGES; i++)
345		irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
346	spin_unlock(&adapter->guest->irq_alloc_lock);
347}
348
349static int guest_register_serr_irq(struct cxl_afu *afu)
350{
351	afu->err_irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
352				      dev_name(&afu->dev));
353	if (!afu->err_irq_name)
354		return -ENOMEM;
355
356	if (!(afu->serr_virq = cxl_map_irq(afu->adapter, afu->serr_hwirq,
357				 guest_slice_irq_err, afu, afu->err_irq_name))) {
358		kfree(afu->err_irq_name);
359		afu->err_irq_name = NULL;
360		return -ENOMEM;
361	}
362
363	return 0;
364}
365
366static void guest_release_serr_irq(struct cxl_afu *afu)
367{
368	cxl_unmap_irq(afu->serr_virq, afu);
369	cxl_ops->release_one_irq(afu->adapter, afu->serr_hwirq);
370	kfree(afu->err_irq_name);
371}
372
373static int guest_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
374{
375	return cxl_h_control_faults(ctx->afu->guest->handle, ctx->process_token,
376				tfc >> 32, (psl_reset_mask != 0));
377}
378
379static void disable_afu_irqs(struct cxl_context *ctx)
380{
381	irq_hw_number_t hwirq;
382	unsigned int virq;
383	int r, i;
384
385	pr_devel("Disabling AFU(%d) interrupts\n", ctx->afu->slice);
386	for (r = 0; r < CXL_IRQ_RANGES; r++) {
387		hwirq = ctx->irqs.offset[r];
388		for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
389			virq = irq_find_mapping(NULL, hwirq);
390			disable_irq(virq);
391		}
392	}
393}
394
395static void enable_afu_irqs(struct cxl_context *ctx)
396{
397	irq_hw_number_t hwirq;
398	unsigned int virq;
399	int r, i;
400
401	pr_devel("Enabling AFU(%d) interrupts\n", ctx->afu->slice);
402	for (r = 0; r < CXL_IRQ_RANGES; r++) {
403		hwirq = ctx->irqs.offset[r];
404		for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
405			virq = irq_find_mapping(NULL, hwirq);
406			enable_irq(virq);
407		}
408	}
409}
410
411static int _guest_afu_cr_readXX(int sz, struct cxl_afu *afu, int cr_idx,
412			u64 offset, u64 *val)
413{
414	unsigned long cr;
415	char c;
416	int rc = 0;
417
418	if (afu->crs_len < sz)
419		return -ENOENT;
420
421	if (unlikely(offset >= afu->crs_len))
422		return -ERANGE;
423
424	cr = get_zeroed_page(GFP_KERNEL);
425	if (!cr)
426		return -ENOMEM;
427
428	rc = cxl_h_get_config(afu->guest->handle, cr_idx, offset,
429			virt_to_phys((void *)cr), sz);
430	if (rc)
431		goto err;
432
433	switch (sz) {
434	case 1:
435		c = *((char *) cr);
436		*val = c;
437		break;
438	case 2:
439		*val = in_le16((u16 *)cr);
440		break;
441	case 4:
442		*val = in_le32((unsigned *)cr);
443		break;
444	case 8:
445		*val = in_le64((u64 *)cr);
446		break;
447	default:
448		WARN_ON(1);
449	}
450err:
451	free_page(cr);
452	return rc;
453}
454
455static int guest_afu_cr_read32(struct cxl_afu *afu, int cr_idx, u64 offset,
456			u32 *out)
457{
458	int rc;
459	u64 val;
460
461	rc = _guest_afu_cr_readXX(4, afu, cr_idx, offset, &val);
462	if (!rc)
463		*out = (u32) val;
464	return rc;
465}
466
467static int guest_afu_cr_read16(struct cxl_afu *afu, int cr_idx, u64 offset,
468			u16 *out)
469{
470	int rc;
471	u64 val;
472
473	rc = _guest_afu_cr_readXX(2, afu, cr_idx, offset, &val);
474	if (!rc)
475		*out = (u16) val;
476	return rc;
477}
478
479static int guest_afu_cr_read8(struct cxl_afu *afu, int cr_idx, u64 offset,
480			u8 *out)
481{
482	int rc;
483	u64 val;
484
485	rc = _guest_afu_cr_readXX(1, afu, cr_idx, offset, &val);
486	if (!rc)
487		*out = (u8) val;
488	return rc;
489}
490
491static int guest_afu_cr_read64(struct cxl_afu *afu, int cr_idx, u64 offset,
492			u64 *out)
493{
494	return _guest_afu_cr_readXX(8, afu, cr_idx, offset, out);
495}
496
497static int guest_afu_cr_write32(struct cxl_afu *afu, int cr, u64 off, u32 in)
498{
499	/* config record is not writable from guest */
500	return -EPERM;
501}
502
503static int guest_afu_cr_write16(struct cxl_afu *afu, int cr, u64 off, u16 in)
504{
505	/* config record is not writable from guest */
506	return -EPERM;
507}
508
509static int guest_afu_cr_write8(struct cxl_afu *afu, int cr, u64 off, u8 in)
510{
511	/* config record is not writable from guest */
512	return -EPERM;
513}
514
515static int attach_afu_directed(struct cxl_context *ctx, u64 wed, u64 amr)
516{
517	struct cxl_process_element_hcall *elem;
518	struct cxl *adapter = ctx->afu->adapter;
519	const struct cred *cred;
520	u32 pid, idx;
521	int rc, r, i;
522	u64 mmio_addr, mmio_size;
523	__be64 flags = 0;
524
525	/* Must be 8 byte aligned and cannot cross a 4096 byte boundary */
526	if (!(elem = (struct cxl_process_element_hcall *)
527			get_zeroed_page(GFP_KERNEL)))
528		return -ENOMEM;
529
530	elem->version = cpu_to_be64(CXL_PROCESS_ELEMENT_VERSION);
531	if (ctx->kernel) {
532		pid = 0;
533		flags |= CXL_PE_TRANSLATION_ENABLED;
534		flags |= CXL_PE_PRIVILEGED_PROCESS;
535		if (mfmsr() & MSR_SF)
536			flags |= CXL_PE_64_BIT;
537	} else {
538		pid = current->pid;
539		flags |= CXL_PE_PROBLEM_STATE;
540		flags |= CXL_PE_TRANSLATION_ENABLED;
541		if (!test_tsk_thread_flag(current, TIF_32BIT))
542			flags |= CXL_PE_64_BIT;
543		cred = get_current_cred();
544		if (uid_eq(cred->euid, GLOBAL_ROOT_UID))
545			flags |= CXL_PE_PRIVILEGED_PROCESS;
546		put_cred(cred);
547	}
548	elem->flags         = cpu_to_be64(flags);
549	elem->common.tid    = cpu_to_be32(0); /* Unused */
550	elem->common.pid    = cpu_to_be32(pid);
551	elem->common.csrp   = cpu_to_be64(0); /* disable */
552	elem->common.u.psl8.aurp0  = cpu_to_be64(0); /* disable */
553	elem->common.u.psl8.aurp1  = cpu_to_be64(0); /* disable */
554
555	cxl_prefault(ctx, wed);
556
557	elem->common.u.psl8.sstp0  = cpu_to_be64(ctx->sstp0);
558	elem->common.u.psl8.sstp1  = cpu_to_be64(ctx->sstp1);
559
560	/*
561	 * Ensure we have at least one interrupt allocated to take faults for
562	 * kernel contexts that may not have allocated any AFU IRQs at all:
563	 */
564	if (ctx->irqs.range[0] == 0) {
565		rc = afu_register_irqs(ctx, 0);
566		if (rc)
567			goto out_free;
568	}
569
570	for (r = 0; r < CXL_IRQ_RANGES; r++) {
571		for (i = 0; i < ctx->irqs.range[r]; i++) {
572			if (r == 0 && i == 0) {
573				elem->pslVirtualIsn = cpu_to_be32(ctx->irqs.offset[0]);
574			} else {
575				idx = ctx->irqs.offset[r] + i - adapter->guest->irq_base_offset;
576				elem->applicationVirtualIsnBitmap[idx / 8] |= 0x80 >> (idx % 8);
577			}
578		}
579	}
580	elem->common.amr = cpu_to_be64(amr);
581	elem->common.wed = cpu_to_be64(wed);
582
583	disable_afu_irqs(ctx);
584
585	rc = cxl_h_attach_process(ctx->afu->guest->handle, elem,
586				&ctx->process_token, &mmio_addr, &mmio_size);
587	if (rc == H_SUCCESS) {
588		if (ctx->master || !ctx->afu->pp_psa) {
589			ctx->psn_phys = ctx->afu->psn_phys;
590			ctx->psn_size = ctx->afu->adapter->ps_size;
591		} else {
592			ctx->psn_phys = mmio_addr;
593			ctx->psn_size = mmio_size;
594		}
595		if (ctx->afu->pp_psa && mmio_size &&
596			ctx->afu->pp_size == 0) {
597			/*
598			 * There's no property in the device tree to read the
599			 * pp_size. We only find out at the 1st attach.
600			 * Compared to bare-metal, it is too late and we
601			 * should really lock here. However, on powerVM,
602			 * pp_size is really only used to display in /sys.
603			 * Being discussed with pHyp for their next release.
604			 */
605			ctx->afu->pp_size = mmio_size;
606		}
607		/* from PAPR: process element is bytes 4-7 of process token */
608		ctx->external_pe = ctx->process_token & 0xFFFFFFFF;
609		pr_devel("CXL pe=%i is known as %i for pHyp, mmio_size=%#llx",
610			ctx->pe, ctx->external_pe, ctx->psn_size);
611		ctx->pe_inserted = true;
612		enable_afu_irqs(ctx);
613	}
614
615out_free:
616	free_page((u64)elem);
617	return rc;
618}
619
620static int guest_attach_process(struct cxl_context *ctx, bool kernel, u64 wed, u64 amr)
621{
622	pr_devel("in %s\n", __func__);
623
624	ctx->kernel = kernel;
625	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
626		return attach_afu_directed(ctx, wed, amr);
627
628	/* dedicated mode not supported on FW840 */
629
630	return -EINVAL;
631}
632
633static int detach_afu_directed(struct cxl_context *ctx)
634{
635	if (!ctx->pe_inserted)
636		return 0;
637	if (cxl_h_detach_process(ctx->afu->guest->handle, ctx->process_token))
638		return -1;
639	return 0;
640}
641
642static int guest_detach_process(struct cxl_context *ctx)
643{
644	pr_devel("in %s\n", __func__);
645	trace_cxl_detach(ctx);
646
647	if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
648		return -EIO;
649
650	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
651		return detach_afu_directed(ctx);
652
653	return -EINVAL;
654}
655
656static void guest_release_afu(struct device *dev)
657{
658	struct cxl_afu *afu = to_cxl_afu(dev);
659
660	pr_devel("%s\n", __func__);
661
662	idr_destroy(&afu->contexts_idr);
663
664	kfree(afu->guest);
665	kfree(afu);
666}
667
668ssize_t cxl_guest_read_afu_vpd(struct cxl_afu *afu, void *buf, size_t len)
669{
670	return guest_collect_vpd(NULL, afu, buf, len);
671}
672
673#define ERR_BUFF_MAX_COPY_SIZE PAGE_SIZE
674static ssize_t guest_afu_read_err_buffer(struct cxl_afu *afu, char *buf,
675					loff_t off, size_t count)
676{
677	void *tbuf = NULL;
678	int rc = 0;
679
680	tbuf = (void *) get_zeroed_page(GFP_KERNEL);
681	if (!tbuf)
682		return -ENOMEM;
683
684	rc = cxl_h_get_afu_err(afu->guest->handle,
685			       off & 0x7,
686			       virt_to_phys(tbuf),
687			       count);
688	if (rc)
689		goto err;
690
691	if (count > ERR_BUFF_MAX_COPY_SIZE)
692		count = ERR_BUFF_MAX_COPY_SIZE - (off & 0x7);
693	memcpy(buf, tbuf, count);
694err:
695	free_page((u64)tbuf);
696
697	return rc;
698}
699
700static int guest_afu_check_and_enable(struct cxl_afu *afu)
701{
702	return 0;
703}
704
705static bool guest_support_attributes(const char *attr_name,
706				     enum cxl_attrs type)
707{
708	switch (type) {
709	case CXL_ADAPTER_ATTRS:
710		if ((strcmp(attr_name, "base_image") == 0) ||
711			(strcmp(attr_name, "load_image_on_perst") == 0) ||
712			(strcmp(attr_name, "perst_reloads_same_image") == 0) ||
713			(strcmp(attr_name, "image_loaded") == 0))
714			return false;
715		break;
716	case CXL_AFU_MASTER_ATTRS:
717		if ((strcmp(attr_name, "pp_mmio_off") == 0))
718			return false;
719		break;
720	case CXL_AFU_ATTRS:
721		break;
722	default:
723		break;
724	}
725
726	return true;
727}
728
729static int activate_afu_directed(struct cxl_afu *afu)
730{
731	int rc;
732
733	dev_info(&afu->dev, "Activating AFU(%d) directed mode\n", afu->slice);
734
735	afu->current_mode = CXL_MODE_DIRECTED;
736
737	afu->num_procs = afu->max_procs_virtualised;
738
739	if ((rc = cxl_chardev_m_afu_add(afu)))
740		return rc;
741
742	if ((rc = cxl_sysfs_afu_m_add(afu)))
743		goto err;
744
745	if ((rc = cxl_chardev_s_afu_add(afu)))
746		goto err1;
747
748	return 0;
749err1:
750	cxl_sysfs_afu_m_remove(afu);
751err:
752	cxl_chardev_afu_remove(afu);
753	return rc;
754}
755
756static int guest_afu_activate_mode(struct cxl_afu *afu, int mode)
757{
758	if (!mode)
759		return 0;
760	if (!(mode & afu->modes_supported))
761		return -EINVAL;
762
763	if (mode == CXL_MODE_DIRECTED)
764		return activate_afu_directed(afu);
765
766	if (mode == CXL_MODE_DEDICATED)
767		dev_err(&afu->dev, "Dedicated mode not supported\n");
768
769	return -EINVAL;
770}
771
772static int deactivate_afu_directed(struct cxl_afu *afu)
773{
774	dev_info(&afu->dev, "Deactivating AFU(%d) directed mode\n", afu->slice);
775
776	afu->current_mode = 0;
777	afu->num_procs = 0;
778
779	cxl_sysfs_afu_m_remove(afu);
780	cxl_chardev_afu_remove(afu);
781
782	cxl_ops->afu_reset(afu);
783
784	return 0;
785}
786
787static int guest_afu_deactivate_mode(struct cxl_afu *afu, int mode)
788{
789	if (!mode)
790		return 0;
791	if (!(mode & afu->modes_supported))
792		return -EINVAL;
793
794	if (mode == CXL_MODE_DIRECTED)
795		return deactivate_afu_directed(afu);
796	return 0;
797}
798
799static int guest_afu_reset(struct cxl_afu *afu)
800{
801	pr_devel("AFU(%d) reset request\n", afu->slice);
802	return cxl_h_reset_afu(afu->guest->handle);
803}
804
805static int guest_map_slice_regs(struct cxl_afu *afu)
806{
807	if (!(afu->p2n_mmio = ioremap(afu->guest->p2n_phys, afu->guest->p2n_size))) {
808		dev_err(&afu->dev, "Error mapping AFU(%d) MMIO regions\n",
809			afu->slice);
810		return -ENOMEM;
811	}
812	return 0;
813}
814
815static void guest_unmap_slice_regs(struct cxl_afu *afu)
816{
817	if (afu->p2n_mmio)
818		iounmap(afu->p2n_mmio);
819}
820
821static int afu_update_state(struct cxl_afu *afu)
822{
823	int rc, cur_state;
824
825	rc = afu_read_error_state(afu, &cur_state);
826	if (rc)
827		return rc;
828
829	if (afu->guest->previous_state == cur_state)
830		return 0;
831
832	pr_devel("AFU(%d) update state to %#x\n", afu->slice, cur_state);
833
834	switch (cur_state) {
835	case H_STATE_NORMAL:
836		afu->guest->previous_state = cur_state;
837		break;
838
839	case H_STATE_DISABLE:
840		pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
841				pci_channel_io_frozen);
842
843		cxl_context_detach_all(afu);
844		if ((rc = cxl_ops->afu_reset(afu)))
845			pr_devel("reset hcall failed %d\n", rc);
846
847		rc = afu_read_error_state(afu, &cur_state);
848		if (!rc && cur_state == H_STATE_NORMAL) {
849			pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
850					pci_channel_io_normal);
851			pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
852		}
853		afu->guest->previous_state = 0;
854		break;
855
856	case H_STATE_TEMP_UNAVAILABLE:
857		afu->guest->previous_state = cur_state;
858		break;
859
860	case H_STATE_PERM_UNAVAILABLE:
861		dev_err(&afu->dev, "AFU is in permanent error state\n");
862		pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
863				pci_channel_io_perm_failure);
864		afu->guest->previous_state = cur_state;
865		break;
866
867	default:
868		pr_err("Unexpected AFU(%d) error state: %#x\n",
869		       afu->slice, cur_state);
870		return -EINVAL;
871	}
872
873	return rc;
874}
875
876static void afu_handle_errstate(struct work_struct *work)
877{
878	struct cxl_afu_guest *afu_guest =
879		container_of(to_delayed_work(work), struct cxl_afu_guest, work_err);
880
881	if (!afu_update_state(afu_guest->parent) &&
882	    afu_guest->previous_state == H_STATE_PERM_UNAVAILABLE)
883		return;
884
885	if (afu_guest->handle_err)
886		schedule_delayed_work(&afu_guest->work_err,
887				      msecs_to_jiffies(3000));
888}
889
890static bool guest_link_ok(struct cxl *cxl, struct cxl_afu *afu)
891{
892	int state;
893
894	if (afu && (!afu_read_error_state(afu, &state))) {
895		if (state == H_STATE_NORMAL)
896			return true;
897	}
898
899	return false;
900}
901
902static int afu_properties_look_ok(struct cxl_afu *afu)
903{
904	if (afu->pp_irqs < 0) {
905		dev_err(&afu->dev, "Unexpected per-process minimum interrupt value\n");
906		return -EINVAL;
907	}
908
909	if (afu->max_procs_virtualised < 1) {
910		dev_err(&afu->dev, "Unexpected max number of processes virtualised value\n");
911		return -EINVAL;
912	}
913
914	return 0;
915}
916
917int cxl_guest_init_afu(struct cxl *adapter, int slice, struct device_node *afu_np)
918{
919	struct cxl_afu *afu;
920	bool free = true;
921	int rc;
922
923	pr_devel("in %s - AFU(%d)\n", __func__, slice);
924	if (!(afu = cxl_alloc_afu(adapter, slice)))
925		return -ENOMEM;
926
927	if (!(afu->guest = kzalloc(sizeof(struct cxl_afu_guest), GFP_KERNEL))) {
928		kfree(afu);
929		return -ENOMEM;
930	}
931
932	if ((rc = dev_set_name(&afu->dev, "afu%i.%i",
933					  adapter->adapter_num,
934					  slice)))
935		goto err1;
936
937	adapter->slices++;
938
939	if ((rc = cxl_of_read_afu_handle(afu, afu_np)))
940		goto err1;
941
942	if ((rc = cxl_ops->afu_reset(afu)))
943		goto err1;
944
945	if ((rc = cxl_of_read_afu_properties(afu, afu_np)))
946		goto err1;
947
948	if ((rc = afu_properties_look_ok(afu)))
949		goto err1;
950
951	if ((rc = guest_map_slice_regs(afu)))
952		goto err1;
953
954	if ((rc = guest_register_serr_irq(afu)))
955		goto err2;
956
957	/*
958	 * After we call this function we must not free the afu directly, even
959	 * if it returns an error!
960	 */
961	if ((rc = cxl_register_afu(afu)))
962		goto err_put_dev;
963
964	if ((rc = cxl_sysfs_afu_add(afu)))
965		goto err_del_dev;
966
967	/*
968	 * pHyp doesn't expose the programming models supported by the
969	 * AFU. pHyp currently only supports directed mode. If it adds
970	 * dedicated mode later, this version of cxl has no way to
971	 * detect it. So we'll initialize the driver, but the first
972	 * attach will fail.
973	 * Being discussed with pHyp to do better (likely new property)
974	 */
975	if (afu->max_procs_virtualised == 1)
976		afu->modes_supported = CXL_MODE_DEDICATED;
977	else
978		afu->modes_supported = CXL_MODE_DIRECTED;
979
980	if ((rc = cxl_afu_select_best_mode(afu)))
981		goto err_remove_sysfs;
982
983	adapter->afu[afu->slice] = afu;
984
985	afu->enabled = true;
986
987	/*
988	 * wake up the cpu periodically to check the state
989	 * of the AFU using "afu" stored in the guest structure.
990	 */
991	afu->guest->parent = afu;
992	afu->guest->handle_err = true;
993	INIT_DELAYED_WORK(&afu->guest->work_err, afu_handle_errstate);
994	schedule_delayed_work(&afu->guest->work_err, msecs_to_jiffies(1000));
995
996	if ((rc = cxl_pci_vphb_add(afu)))
997		dev_info(&afu->dev, "Can't register vPHB\n");
998
999	return 0;
1000
1001err_remove_sysfs:
1002	cxl_sysfs_afu_remove(afu);
1003err_del_dev:
1004	device_del(&afu->dev);
1005err_put_dev:
1006	put_device(&afu->dev);
1007	free = false;
1008	guest_release_serr_irq(afu);
1009err2:
1010	guest_unmap_slice_regs(afu);
1011err1:
1012	if (free) {
1013		kfree(afu->guest);
1014		kfree(afu);
1015	}
1016	return rc;
1017}
1018
1019void cxl_guest_remove_afu(struct cxl_afu *afu)
1020{
1021	if (!afu)
1022		return;
1023
1024	/* flush and stop pending job */
1025	afu->guest->handle_err = false;
1026	flush_delayed_work(&afu->guest->work_err);
1027
1028	cxl_pci_vphb_remove(afu);
1029	cxl_sysfs_afu_remove(afu);
1030
1031	spin_lock(&afu->adapter->afu_list_lock);
1032	afu->adapter->afu[afu->slice] = NULL;
1033	spin_unlock(&afu->adapter->afu_list_lock);
1034
1035	cxl_context_detach_all(afu);
1036	cxl_ops->afu_deactivate_mode(afu, afu->current_mode);
1037	guest_release_serr_irq(afu);
1038	guest_unmap_slice_regs(afu);
1039
1040	device_unregister(&afu->dev);
1041}
1042
1043static void free_adapter(struct cxl *adapter)
1044{
1045	struct irq_avail *cur;
1046	int i;
1047
1048	if (adapter->guest) {
1049		if (adapter->guest->irq_avail) {
1050			for (i = 0; i < adapter->guest->irq_nranges; i++) {
1051				cur = &adapter->guest->irq_avail[i];
1052				kfree(cur->bitmap);
1053			}
1054			kfree(adapter->guest->irq_avail);
1055		}
1056		kfree(adapter->guest->status);
1057		kfree(adapter->guest);
1058	}
1059	cxl_remove_adapter_nr(adapter);
1060	kfree(adapter);
1061}
1062
1063static int properties_look_ok(struct cxl *adapter)
1064{
1065	/* The absence of this property means that the operational
1066	 * status is unknown or okay
1067	 */
1068	if (strlen(adapter->guest->status) &&
1069	    strcmp(adapter->guest->status, "okay")) {
1070		pr_err("ABORTING:Bad operational status of the device\n");
1071		return -EINVAL;
1072	}
1073
1074	return 0;
1075}
1076
1077ssize_t cxl_guest_read_adapter_vpd(struct cxl *adapter, void *buf, size_t len)
1078{
1079	return guest_collect_vpd(adapter, NULL, buf, len);
1080}
1081
1082void cxl_guest_remove_adapter(struct cxl *adapter)
1083{
1084	pr_devel("in %s\n", __func__);
1085
1086	cxl_sysfs_adapter_remove(adapter);
1087
1088	cxl_guest_remove_chardev(adapter);
1089	device_unregister(&adapter->dev);
1090}
1091
1092static void release_adapter(struct device *dev)
1093{
1094	free_adapter(to_cxl_adapter(dev));
1095}
1096
1097struct cxl *cxl_guest_init_adapter(struct device_node *np, struct platform_device *pdev)
1098{
1099	struct cxl *adapter;
1100	bool free = true;
1101	int rc;
1102
1103	if (!(adapter = cxl_alloc_adapter()))
1104		return ERR_PTR(-ENOMEM);
1105
1106	if (!(adapter->guest = kzalloc(sizeof(struct cxl_guest), GFP_KERNEL))) {
1107		free_adapter(adapter);
1108		return ERR_PTR(-ENOMEM);
1109	}
1110
1111	adapter->slices = 0;
1112	adapter->guest->pdev = pdev;
1113	adapter->dev.parent = &pdev->dev;
1114	adapter->dev.release = release_adapter;
1115	dev_set_drvdata(&pdev->dev, adapter);
1116
1117	/*
1118	 * Hypervisor controls PSL timebase initialization (p1 register).
1119	 * On FW840, PSL is initialized.
1120	 */
1121	adapter->psl_timebase_synced = true;
1122
1123	if ((rc = cxl_of_read_adapter_handle(adapter, np)))
1124		goto err1;
1125
1126	if ((rc = cxl_of_read_adapter_properties(adapter, np)))
1127		goto err1;
1128
1129	if ((rc = properties_look_ok(adapter)))
1130		goto err1;
1131
1132	if ((rc = cxl_guest_add_chardev(adapter)))
1133		goto err1;
1134
1135	/*
1136	 * After we call this function we must not free the adapter directly,
1137	 * even if it returns an error!
1138	 */
1139	if ((rc = cxl_register_adapter(adapter)))
1140		goto err_put_dev;
1141
1142	if ((rc = cxl_sysfs_adapter_add(adapter)))
1143		goto err_del_dev;
1144
1145	/* release the context lock as the adapter is configured */
1146	cxl_adapter_context_unlock(adapter);
1147
1148	return adapter;
1149
1150err_del_dev:
1151	device_del(&adapter->dev);
1152err_put_dev:
1153	put_device(&adapter->dev);
1154	free = false;
1155	cxl_guest_remove_chardev(adapter);
1156err1:
1157	if (free)
1158		free_adapter(adapter);
1159	return ERR_PTR(rc);
1160}
1161
1162void cxl_guest_reload_module(struct cxl *adapter)
1163{
1164	struct platform_device *pdev;
1165
1166	pdev = adapter->guest->pdev;
1167	cxl_guest_remove_adapter(adapter);
1168
1169	cxl_of_probe(pdev);
1170}
1171
1172const struct cxl_backend_ops cxl_guest_ops = {
1173	.module = THIS_MODULE,
1174	.adapter_reset = guest_reset,
1175	.alloc_one_irq = guest_alloc_one_irq,
1176	.release_one_irq = guest_release_one_irq,
1177	.alloc_irq_ranges = guest_alloc_irq_ranges,
1178	.release_irq_ranges = guest_release_irq_ranges,
1179	.setup_irq = NULL,
1180	.handle_psl_slice_error = guest_handle_psl_slice_error,
1181	.psl_interrupt = guest_psl_irq,
1182	.ack_irq = guest_ack_irq,
1183	.attach_process = guest_attach_process,
1184	.detach_process = guest_detach_process,
1185	.update_ivtes = NULL,
1186	.support_attributes = guest_support_attributes,
1187	.link_ok = guest_link_ok,
1188	.release_afu = guest_release_afu,
1189	.afu_read_err_buffer = guest_afu_read_err_buffer,
1190	.afu_check_and_enable = guest_afu_check_and_enable,
1191	.afu_activate_mode = guest_afu_activate_mode,
1192	.afu_deactivate_mode = guest_afu_deactivate_mode,
1193	.afu_reset = guest_afu_reset,
1194	.afu_cr_read8 = guest_afu_cr_read8,
1195	.afu_cr_read16 = guest_afu_cr_read16,
1196	.afu_cr_read32 = guest_afu_cr_read32,
1197	.afu_cr_read64 = guest_afu_cr_read64,
1198	.afu_cr_write8 = guest_afu_cr_write8,
1199	.afu_cr_write16 = guest_afu_cr_write16,
1200	.afu_cr_write32 = guest_afu_cr_write32,
1201	.read_adapter_vpd = cxl_guest_read_adapter_vpd,
1202};
1203