xref: /kernel/linux/linux-5.10/drivers/dma/idxd/dma.c (revision 8c2ecf20)
1// SPDX-License-Identifier: GPL-2.0
2/* Copyright(c) 2019 Intel Corporation. All rights rsvd. */
3#include <linux/init.h>
4#include <linux/kernel.h>
5#include <linux/module.h>
6#include <linux/pci.h>
7#include <linux/device.h>
8#include <linux/io-64-nonatomic-lo-hi.h>
9#include <linux/dmaengine.h>
10#include <uapi/linux/idxd.h>
11#include "../dmaengine.h"
12#include "registers.h"
13#include "idxd.h"
14
15static inline struct idxd_wq *to_idxd_wq(struct dma_chan *c)
16{
17	struct idxd_dma_chan *idxd_chan;
18
19	idxd_chan = container_of(c, struct idxd_dma_chan, chan);
20	return idxd_chan->wq;
21}
22
23void idxd_dma_complete_txd(struct idxd_desc *desc,
24			   enum idxd_complete_type comp_type)
25{
26	struct dma_async_tx_descriptor *tx;
27	struct dmaengine_result res;
28	int complete = 1;
29
30	if (desc->completion->status == DSA_COMP_SUCCESS)
31		res.result = DMA_TRANS_NOERROR;
32	else if (desc->completion->status)
33		res.result = DMA_TRANS_WRITE_FAILED;
34	else if (comp_type == IDXD_COMPLETE_ABORT)
35		res.result = DMA_TRANS_ABORTED;
36	else
37		complete = 0;
38
39	tx = &desc->txd;
40	if (complete && tx->cookie) {
41		dma_cookie_complete(tx);
42		dma_descriptor_unmap(tx);
43		dmaengine_desc_get_callback_invoke(tx, &res);
44		tx->callback = NULL;
45		tx->callback_result = NULL;
46	}
47}
48
49static void op_flag_setup(unsigned long flags, u32 *desc_flags)
50{
51	*desc_flags = IDXD_OP_FLAG_CRAV | IDXD_OP_FLAG_RCR;
52	if (flags & DMA_PREP_INTERRUPT)
53		*desc_flags |= IDXD_OP_FLAG_RCI;
54}
55
56static inline void set_completion_address(struct idxd_desc *desc,
57					  u64 *compl_addr)
58{
59		*compl_addr = desc->compl_dma;
60}
61
62static inline void idxd_prep_desc_common(struct idxd_wq *wq,
63					 struct dsa_hw_desc *hw, char opcode,
64					 u64 addr_f1, u64 addr_f2, u64 len,
65					 u64 compl, u32 flags)
66{
67	struct idxd_device *idxd = wq->idxd;
68
69	hw->flags = flags;
70	hw->opcode = opcode;
71	hw->src_addr = addr_f1;
72	hw->dst_addr = addr_f2;
73	hw->xfer_size = len;
74	hw->priv = !!(wq->type == IDXD_WQT_KERNEL);
75	hw->completion_addr = compl;
76
77	/*
78	 * Descriptor completion vectors are 1-8 for MSIX. We will round
79	 * robin through the 8 vectors.
80	 */
81	wq->vec_ptr = (wq->vec_ptr % idxd->num_wq_irqs) + 1;
82	hw->int_handle =  wq->vec_ptr;
83}
84
85static struct dma_async_tx_descriptor *
86idxd_dma_prep_interrupt(struct dma_chan *c, unsigned long flags)
87{
88	struct idxd_wq *wq = to_idxd_wq(c);
89	u32 desc_flags;
90	struct idxd_desc *desc;
91
92	if (wq->state != IDXD_WQ_ENABLED)
93		return NULL;
94
95	op_flag_setup(flags, &desc_flags);
96	desc = idxd_alloc_desc(wq, IDXD_OP_BLOCK);
97	if (IS_ERR(desc))
98		return NULL;
99
100	idxd_prep_desc_common(wq, desc->hw, DSA_OPCODE_NOOP,
101			      0, 0, 0, desc->compl_dma, desc_flags);
102	desc->txd.flags = flags;
103	return &desc->txd;
104}
105
106static struct dma_async_tx_descriptor *
107idxd_dma_submit_memcpy(struct dma_chan *c, dma_addr_t dma_dest,
108		       dma_addr_t dma_src, size_t len, unsigned long flags)
109{
110	struct idxd_wq *wq = to_idxd_wq(c);
111	u32 desc_flags;
112	struct idxd_device *idxd = wq->idxd;
113	struct idxd_desc *desc;
114
115	if (wq->state != IDXD_WQ_ENABLED)
116		return NULL;
117
118	if (len > idxd->max_xfer_bytes)
119		return NULL;
120
121	op_flag_setup(flags, &desc_flags);
122	desc = idxd_alloc_desc(wq, IDXD_OP_BLOCK);
123	if (IS_ERR(desc))
124		return NULL;
125
126	idxd_prep_desc_common(wq, desc->hw, DSA_OPCODE_MEMMOVE,
127			      dma_src, dma_dest, len, desc->compl_dma,
128			      desc_flags);
129
130	desc->txd.flags = flags;
131
132	return &desc->txd;
133}
134
135static int idxd_dma_alloc_chan_resources(struct dma_chan *chan)
136{
137	struct idxd_wq *wq = to_idxd_wq(chan);
138	struct device *dev = &wq->idxd->pdev->dev;
139
140	idxd_wq_get(wq);
141	dev_dbg(dev, "%s: client_count: %d\n", __func__,
142		idxd_wq_refcount(wq));
143	return 0;
144}
145
146static void idxd_dma_free_chan_resources(struct dma_chan *chan)
147{
148	struct idxd_wq *wq = to_idxd_wq(chan);
149	struct device *dev = &wq->idxd->pdev->dev;
150
151	idxd_wq_put(wq);
152	dev_dbg(dev, "%s: client_count: %d\n", __func__,
153		idxd_wq_refcount(wq));
154}
155
156static enum dma_status idxd_dma_tx_status(struct dma_chan *dma_chan,
157					  dma_cookie_t cookie,
158					  struct dma_tx_state *txstate)
159{
160	return DMA_OUT_OF_ORDER;
161}
162
163/*
164 * issue_pending() does not need to do anything since tx_submit() does the job
165 * already.
166 */
167static void idxd_dma_issue_pending(struct dma_chan *dma_chan)
168{
169}
170
171static dma_cookie_t idxd_dma_tx_submit(struct dma_async_tx_descriptor *tx)
172{
173	struct dma_chan *c = tx->chan;
174	struct idxd_wq *wq = to_idxd_wq(c);
175	dma_cookie_t cookie;
176	int rc;
177	struct idxd_desc *desc = container_of(tx, struct idxd_desc, txd);
178
179	cookie = dma_cookie_assign(tx);
180
181	rc = idxd_submit_desc(wq, desc);
182	if (rc < 0) {
183		idxd_free_desc(wq, desc);
184		return rc;
185	}
186
187	return cookie;
188}
189
190static void idxd_dma_release(struct dma_device *device)
191{
192	struct idxd_dma_dev *idxd_dma = container_of(device, struct idxd_dma_dev, dma);
193
194	kfree(idxd_dma);
195}
196
197int idxd_register_dma_device(struct idxd_device *idxd)
198{
199	struct idxd_dma_dev *idxd_dma;
200	struct dma_device *dma;
201	struct device *dev = &idxd->pdev->dev;
202	int rc;
203
204	idxd_dma = kzalloc_node(sizeof(*idxd_dma), GFP_KERNEL, dev_to_node(dev));
205	if (!idxd_dma)
206		return -ENOMEM;
207
208	dma = &idxd_dma->dma;
209	INIT_LIST_HEAD(&dma->channels);
210	dma->dev = dev;
211
212	dma_cap_set(DMA_INTERRUPT, dma->cap_mask);
213	dma_cap_set(DMA_PRIVATE, dma->cap_mask);
214	dma_cap_set(DMA_COMPLETION_NO_ORDER, dma->cap_mask);
215	dma->device_release = idxd_dma_release;
216
217	dma->device_prep_dma_interrupt = idxd_dma_prep_interrupt;
218	if (idxd->hw.opcap.bits[0] & IDXD_OPCAP_MEMMOVE) {
219		dma_cap_set(DMA_MEMCPY, dma->cap_mask);
220		dma->device_prep_dma_memcpy = idxd_dma_submit_memcpy;
221	}
222
223	dma->device_tx_status = idxd_dma_tx_status;
224	dma->device_issue_pending = idxd_dma_issue_pending;
225	dma->device_alloc_chan_resources = idxd_dma_alloc_chan_resources;
226	dma->device_free_chan_resources = idxd_dma_free_chan_resources;
227
228	rc = dma_async_device_register(dma);
229	if (rc < 0) {
230		kfree(idxd_dma);
231		return rc;
232	}
233
234	idxd_dma->idxd = idxd;
235	/*
236	 * This pointer is protected by the refs taken by the dma_chan. It will remain valid
237	 * as long as there are outstanding channels.
238	 */
239	idxd->idxd_dma = idxd_dma;
240	return 0;
241}
242
243void idxd_unregister_dma_device(struct idxd_device *idxd)
244{
245	dma_async_device_unregister(&idxd->idxd_dma->dma);
246}
247
248int idxd_register_dma_channel(struct idxd_wq *wq)
249{
250	struct idxd_device *idxd = wq->idxd;
251	struct dma_device *dma = &idxd->idxd_dma->dma;
252	struct device *dev = &idxd->pdev->dev;
253	struct idxd_dma_chan *idxd_chan;
254	struct dma_chan *chan;
255	int rc, i;
256
257	idxd_chan = kzalloc_node(sizeof(*idxd_chan), GFP_KERNEL, dev_to_node(dev));
258	if (!idxd_chan)
259		return -ENOMEM;
260
261	chan = &idxd_chan->chan;
262	chan->device = dma;
263	list_add_tail(&chan->device_node, &dma->channels);
264
265	for (i = 0; i < wq->num_descs; i++) {
266		struct idxd_desc *desc = wq->descs[i];
267
268		dma_async_tx_descriptor_init(&desc->txd, chan);
269		desc->txd.tx_submit = idxd_dma_tx_submit;
270	}
271
272	rc = dma_async_device_channel_register(dma, chan);
273	if (rc < 0) {
274		kfree(idxd_chan);
275		return rc;
276	}
277
278	wq->idxd_chan = idxd_chan;
279	idxd_chan->wq = wq;
280	get_device(&wq->conf_dev);
281
282	return 0;
283}
284
285void idxd_unregister_dma_channel(struct idxd_wq *wq)
286{
287	struct idxd_dma_chan *idxd_chan = wq->idxd_chan;
288	struct dma_chan *chan = &idxd_chan->chan;
289	struct idxd_dma_dev *idxd_dma = wq->idxd->idxd_dma;
290
291	dma_async_device_channel_unregister(&idxd_dma->dma, chan);
292	list_del(&chan->device_node);
293	kfree(wq->idxd_chan);
294	wq->idxd_chan = NULL;
295	put_device(&wq->conf_dev);
296}
297