/*
 * Copyright (C) 2017 Broadcom
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation version 2.
 *
 * This program is distributed "as is" WITHOUT ANY WARRANTY of any
 * kind, whether express or implied; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 */

/*
 * Broadcom SBA RAID Driver
 *
 * The Broadcom stream buffer accelerator (SBA) provides offloading
 * capabilities for RAID operations. The SBA offload engine is accessible
 * via the Broadcom SoC specific ring manager. Two or more offload engines
 * can share the same ring manager; for this reason, the Broadcom SoC
 * specific ring manager driver is implemented as a mailbox controller
 * driver and the offload engine drivers are implemented as mailbox
 * clients.
 *
 * Typically, a Broadcom SoC specific ring manager implements a large
 * number of hardware rings over one or more SBA hardware devices. By
 * design, the internal buffer size of an SBA hardware device is limited,
 * but all offload operations supported by SBA can be broken down into
 * multiple small-size requests and executed in parallel on multiple SBA
 * hardware devices to achieve high throughput.
 *
 * The Broadcom SBA RAID driver does not require any register programming
 * except submitting requests to the SBA hardware device via mailbox
 * channels. This driver implements a DMA device with one DMA channel
 * using a single mailbox channel provided by the Broadcom SoC specific
 * ring manager driver. To have more SBA DMA channels, we can create more
 * SBA device nodes in the Broadcom SoC specific DTS based on the number
 * of hardware rings supported by the Broadcom SoC ring manager.
 */
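/*
 * For illustration only: a minimal sketch of what an SBA device node in
 * the SoC DTS might look like. The node name, the ring manager phandle
 * ("&ring_mgr") and the mailbox specifier cell are assumptions; only the
 * "compatible" strings and the "mboxes" property are taken from this
 * driver.
 *
 *	raid_dma: raid@0 {
 *		compatible = "brcm,iproc-sba-v2";
 *		mboxes = <&ring_mgr 0>;
 *	};
 */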

#include <linux/bitops.h>
#include <linux/debugfs.h>
#include <linux/dma-mapping.h>
#include <linux/dmaengine.h>
#include <linux/list.h>
#include <linux/mailbox_client.h>
#include <linux/mailbox/brcm-message.h>
#include <linux/module.h>
#include <linux/of_device.h>
#include <linux/slab.h>
#include <linux/raid/pq.h>

#include "dmaengine.h"

/* ====== Driver macros and defines ===== */

#define SBA_TYPE_SHIFT					48
#define SBA_TYPE_MASK					GENMASK(1, 0)
#define SBA_TYPE_A					0x0
#define SBA_TYPE_B					0x2
#define SBA_TYPE_C					0x3
#define SBA_USER_DEF_SHIFT				32
#define SBA_USER_DEF_MASK				GENMASK(15, 0)
#define SBA_R_MDATA_SHIFT				24
#define SBA_R_MDATA_MASK				GENMASK(7, 0)
#define SBA_C_MDATA_MS_SHIFT				18
#define SBA_C_MDATA_MS_MASK				GENMASK(1, 0)
#define SBA_INT_SHIFT					17
#define SBA_INT_MASK					BIT(0)
#define SBA_RESP_SHIFT					16
#define SBA_RESP_MASK					BIT(0)
#define SBA_C_MDATA_SHIFT				8
#define SBA_C_MDATA_MASK				GENMASK(7, 0)
#define SBA_C_MDATA_BNUMx_SHIFT(__bnum)			(2 * (__bnum))
#define SBA_C_MDATA_BNUMx_MASK				GENMASK(1, 0)
#define SBA_C_MDATA_DNUM_SHIFT				5
#define SBA_C_MDATA_DNUM_MASK				GENMASK(4, 0)
#define SBA_C_MDATA_LS(__v)				((__v) & 0xff)
#define SBA_C_MDATA_MS(__v)				(((__v) >> 8) & 0x3)
#define SBA_CMD_SHIFT					0
#define SBA_CMD_MASK					GENMASK(3, 0)
#define SBA_CMD_ZERO_BUFFER				0x4
#define SBA_CMD_ZERO_ALL_BUFFERS			0x8
#define SBA_CMD_LOAD_BUFFER				0x9
#define SBA_CMD_XOR					0xa
#define SBA_CMD_GALOIS_XOR				0xb
#define SBA_CMD_WRITE_BUFFER				0xc
#define SBA_CMD_GALOIS					0xe
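
/*
 * A rough sketch of the 64-bit SBA command word, as implied by the
 * SHIFT/MASK macros above (field widths follow the GENMASK values;
 * bits not covered by these macros are not described here):
 *
 *	[49:48] TYPE      [47:32] USER_DEF   [31:24] R_MDATA
 *	[19:18] C_MDATA_MS   [17] INT   [16] RESP   [15:8] C_MDATA
 *	[3:0]   CMD
 */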

#define SBA_MAX_REQ_PER_MBOX_CHANNEL			8192
#define SBA_MAX_MSG_SEND_PER_MBOX_CHANNEL		8

/* Driver helper macros */
#define to_sba_request(tx)		\
	container_of(tx, struct sba_request, tx)
#define to_sba_device(dchan)		\
	container_of(dchan, struct sba_device, dma_chan)

/* ===== Driver data structures ===== */

enum sba_request_flags {
	SBA_REQUEST_STATE_FREE		= 0x001,
	SBA_REQUEST_STATE_ALLOCED	= 0x002,
	SBA_REQUEST_STATE_PENDING	= 0x004,
	SBA_REQUEST_STATE_ACTIVE	= 0x008,
	SBA_REQUEST_STATE_ABORTED	= 0x010,
	SBA_REQUEST_STATE_MASK		= 0x0ff,
	SBA_REQUEST_FENCE		= 0x100,
};
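
/*
 * Request life cycle, as implemented by the _sba_*_request() helpers
 * below (each state corresponds to one of the sba_device request lists):
 *
 *	FREE ---> ALLOCED ---> PENDING ---> ACTIVE ---> FREE
 *	                                      |
 *	                                      +--> ABORTED ---> FREE
 *
 * ABORTED is entered only when a client frees channel resources while
 * requests are still in flight; such requests are freed once their
 * mailbox completion arrives via sba_receive_message().
 */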

struct sba_request {
	/* Global state */
	struct list_head node;
	struct sba_device *sba;
	u32 flags;
	/* Chained requests management */
	struct sba_request *first;
	struct list_head next;
	atomic_t next_pending_count;
	/* BRCM message data */
	struct brcm_message msg;
	struct dma_async_tx_descriptor tx;
	/* SBA commands */
	struct brcm_sba_command cmds[];
};

enum sba_version {
	SBA_VER_1 = 0,
	SBA_VER_2
};

struct sba_device {
	/* Underlying device */
	struct device *dev;
	/* DT configuration parameters */
	enum sba_version ver;
	/* Derived configuration parameters */
	u32 max_req;
	u32 hw_buf_size;
	u32 hw_resp_size;
	u32 max_pq_coefs;
	u32 max_pq_srcs;
	u32 max_cmd_per_req;
	u32 max_xor_srcs;
	u32 max_resp_pool_size;
	u32 max_cmds_pool_size;
	/* Mailbox client and Mailbox channels */
	struct mbox_client client;
	struct mbox_chan *mchan;
	struct device *mbox_dev;
	/* DMA device and DMA channel */
	struct dma_device dma_dev;
	struct dma_chan dma_chan;
	/* DMA channel resources */
	void *resp_base;
	dma_addr_t resp_dma_base;
	void *cmds_base;
	dma_addr_t cmds_dma_base;
	spinlock_t reqs_lock;
	bool reqs_fence;
	struct list_head reqs_alloc_list;
	struct list_head reqs_pending_list;
	struct list_head reqs_active_list;
	struct list_head reqs_aborted_list;
	struct list_head reqs_free_list;
	/* DebugFS directory entries */
	struct dentry *root;
};

/* ====== Command helper routines ===== */

static inline u64 __pure sba_cmd_enc(u64 cmd, u32 val, u32 shift, u32 mask)
{
	cmd &= ~((u64)mask << shift);
	cmd |= ((u64)(val & mask) << shift);
	return cmd;
}
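
/*
 * For illustration: encoding a field with the helper above first clears
 * the field and then inserts the masked value, leaving all other bits of
 * "cmd" untouched. For example, setting the command opcode field:
 *
 *	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
 *			  SBA_CMD_SHIFT, SBA_CMD_MASK);
 *
 * only modifies bits [3:0] of "cmd".
 */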

static inline u32 __pure sba_cmd_load_c_mdata(u32 b0)
{
	return b0 & SBA_C_MDATA_BNUMx_MASK;
}

static inline u32 __pure sba_cmd_write_c_mdata(u32 b0)
{
	return b0 & SBA_C_MDATA_BNUMx_MASK;
}

static inline u32 __pure sba_cmd_xor_c_mdata(u32 b1, u32 b0)
{
	return (b0 & SBA_C_MDATA_BNUMx_MASK) |
	       ((b1 & SBA_C_MDATA_BNUMx_MASK) << SBA_C_MDATA_BNUMx_SHIFT(1));
}

static inline u32 __pure sba_cmd_pq_c_mdata(u32 d, u32 b1, u32 b0)
{
	return (b0 & SBA_C_MDATA_BNUMx_MASK) |
	       ((b1 & SBA_C_MDATA_BNUMx_MASK) << SBA_C_MDATA_BNUMx_SHIFT(1)) |
	       ((d & SBA_C_MDATA_DNUM_MASK) << SBA_C_MDATA_DNUM_SHIFT);
}

/* ====== General helper routines ===== */

static struct sba_request *sba_alloc_request(struct sba_device *sba)
{
	bool found = false;
	unsigned long flags;
	struct sba_request *req = NULL;

	spin_lock_irqsave(&sba->reqs_lock, flags);
	list_for_each_entry(req, &sba->reqs_free_list, node) {
		if (async_tx_test_ack(&req->tx)) {
			list_move_tail(&req->node, &sba->reqs_alloc_list);
			found = true;
			break;
		}
	}
	spin_unlock_irqrestore(&sba->reqs_lock, flags);

	if (!found) {
		/*
		 * We have no more free requests, so we peek the
		 * mailbox channel hoping that a few active requests
		 * have completed, which would create more room for
		 * new requests.
		 */
		mbox_client_peek_data(sba->mchan);
		return NULL;
	}

	req->flags = SBA_REQUEST_STATE_ALLOCED;
	req->first = req;
	INIT_LIST_HEAD(&req->next);
	atomic_set(&req->next_pending_count, 1);

	dma_async_tx_descriptor_init(&req->tx, &sba->dma_chan);
	async_tx_ack(&req->tx);

	return req;
}

/* Note: Must be called with sba->reqs_lock held */
static void _sba_pending_request(struct sba_device *sba,
				 struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->flags &= ~SBA_REQUEST_STATE_MASK;
	req->flags |= SBA_REQUEST_STATE_PENDING;
	list_move_tail(&req->node, &sba->reqs_pending_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
}

/* Note: Must be called with sba->reqs_lock held */
static bool _sba_active_request(struct sba_device *sba,
				struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
	if (sba->reqs_fence)
		return false;
	req->flags &= ~SBA_REQUEST_STATE_MASK;
	req->flags |= SBA_REQUEST_STATE_ACTIVE;
	list_move_tail(&req->node, &sba->reqs_active_list);
	if (req->flags & SBA_REQUEST_FENCE)
		sba->reqs_fence = true;
	return true;
}
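
/*
 * Fence semantics, as implemented above: once a request carrying
 * SBA_REQUEST_FENCE becomes active, sba->reqs_fence stays true and
 * blocks further pending-to-active transitions until the active list
 * drains, at which point the fence is cleared again.
 */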

/* Note: Must be called with sba->reqs_lock held */
static void _sba_abort_request(struct sba_device *sba,
			       struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->flags &= ~SBA_REQUEST_STATE_MASK;
	req->flags |= SBA_REQUEST_STATE_ABORTED;
	list_move_tail(&req->node, &sba->reqs_aborted_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
}

/* Note: Must be called with sba->reqs_lock held */
static void _sba_free_request(struct sba_device *sba,
			      struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->flags &= ~SBA_REQUEST_STATE_MASK;
	req->flags |= SBA_REQUEST_STATE_FREE;
	list_move_tail(&req->node, &sba->reqs_free_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
}

static void sba_free_chained_requests(struct sba_request *req)
{
	unsigned long flags;
	struct sba_request *nreq;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	_sba_free_request(sba, req);
	list_for_each_entry(nreq, &req->next, next)
		_sba_free_request(sba, nreq);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_chain_request(struct sba_request *first,
			      struct sba_request *req)
{
	unsigned long flags;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	list_add_tail(&req->next, &first->next);
	req->first = first;
	atomic_inc(&first->next_pending_count);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}
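
/*
 * Chained requests share a single async_tx descriptor: only the first
 * request's tx is returned to the client, first->next links the
 * remaining requests, and first->next_pending_count (initialized to 1
 * in sba_alloc_request() and incremented here per chained request)
 * lets sba_process_received_request() complete the cookie only after
 * every request of the chain has come back from the mailbox.
 */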

static void sba_cleanup_nonpending_requests(struct sba_device *sba)
{
	unsigned long flags;
	struct sba_request *req, *req1;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Free up all allocated requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_alloc_list, node)
		_sba_free_request(sba, req);

	/* Set all active requests as aborted */
	list_for_each_entry_safe(req, req1, &sba->reqs_active_list, node)
		_sba_abort_request(sba, req);

	/*
	 * Note: We expect that aborted requests will eventually be
	 * freed by sba_receive_message()
	 */

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_cleanup_pending_requests(struct sba_device *sba)
{
	unsigned long flags;
	struct sba_request *req, *req1;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Free up all pending requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_pending_list, node)
		_sba_free_request(sba, req);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static int sba_send_mbox_request(struct sba_device *sba,
				 struct sba_request *req)
{
	int ret = 0;

	/* Send message for the request */
	req->msg.error = 0;
	ret = mbox_send_message(sba->mchan, &req->msg);
	if (ret < 0) {
		dev_err(sba->dev, "send message failed with error %d", ret);
		return ret;
	}

	/* Check error returned by mailbox controller */
	ret = req->msg.error;
	if (ret < 0)
		dev_err(sba->dev, "message error %d", ret);

	/* Signal txdone for mailbox channel */
	mbox_client_txdone(sba->mchan, ret);

	return ret;
}
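
/*
 * Note: the mailbox client is configured in sba_probe() with
 * tx_block == false and knows_txdone == true, which is why this driver
 * signals transmit completion itself via mbox_client_txdone() right
 * after mbox_send_message() instead of waiting on the controller.
 */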

/* Note: Must be called with sba->reqs_lock held */
static void _sba_process_pending_requests(struct sba_device *sba)
{
	int ret;
	u32 count;
	struct sba_request *req;

	/* Process a few pending requests */
	count = SBA_MAX_MSG_SEND_PER_MBOX_CHANNEL;
	while (!list_empty(&sba->reqs_pending_list) && count) {
		/* Get the first pending request */
		req = list_first_entry(&sba->reqs_pending_list,
				       struct sba_request, node);

		/* Try to make request active */
		if (!_sba_active_request(sba, req))
			break;

		/* Send request to mailbox channel */
		ret = sba_send_mbox_request(sba, req);
		if (ret < 0) {
			_sba_pending_request(sba, req);
			break;
		}

		count--;
	}
}

static void sba_process_received_request(struct sba_device *sba,
					 struct sba_request *req)
{
	unsigned long flags;
	struct dma_async_tx_descriptor *tx;
	struct sba_request *nreq, *first = req->first;

	/* Process only after all chained requests are received */
	if (!atomic_dec_return(&first->next_pending_count)) {
		tx = &first->tx;

		WARN_ON(tx->cookie < 0);
		if (tx->cookie > 0) {
			spin_lock_irqsave(&sba->reqs_lock, flags);
			dma_cookie_complete(tx);
			spin_unlock_irqrestore(&sba->reqs_lock, flags);
			dmaengine_desc_get_callback_invoke(tx, NULL);
			dma_descriptor_unmap(tx);
			tx->callback = NULL;
			tx->callback_result = NULL;
		}

		dma_run_dependencies(tx);

		spin_lock_irqsave(&sba->reqs_lock, flags);

		/* Free all requests chained to first request */
		list_for_each_entry(nreq, &first->next, next)
			_sba_free_request(sba, nreq);
		INIT_LIST_HEAD(&first->next);

		/* Free the first request */
		_sba_free_request(sba, first);

		/* Process pending requests */
		_sba_process_pending_requests(sba);

		spin_unlock_irqrestore(&sba->reqs_lock, flags);
	}
}

static void sba_write_stats_in_seqfile(struct sba_device *sba,
				       struct seq_file *file)
{
	unsigned long flags;
	struct sba_request *req;
	u32 free_count = 0, alloced_count = 0;
	u32 pending_count = 0, active_count = 0, aborted_count = 0;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	list_for_each_entry(req, &sba->reqs_free_list, node)
		if (async_tx_test_ack(&req->tx))
			free_count++;

	list_for_each_entry(req, &sba->reqs_alloc_list, node)
		alloced_count++;

	list_for_each_entry(req, &sba->reqs_pending_list, node)
		pending_count++;

	list_for_each_entry(req, &sba->reqs_active_list, node)
		active_count++;

	list_for_each_entry(req, &sba->reqs_aborted_list, node)
		aborted_count++;

	spin_unlock_irqrestore(&sba->reqs_lock, flags);

	seq_printf(file, "maximum requests   = %d\n", sba->max_req);
	seq_printf(file, "free requests      = %d\n", free_count);
	seq_printf(file, "alloced requests   = %d\n", alloced_count);
	seq_printf(file, "pending requests   = %d\n", pending_count);
	seq_printf(file, "active requests    = %d\n", active_count);
	seq_printf(file, "aborted requests   = %d\n", aborted_count);
}

/* ====== DMAENGINE callbacks ===== */

static void sba_free_chan_resources(struct dma_chan *dchan)
{
	/*
	 * Channel resources are pre-allocated, so we just free up
	 * whatever we can so that we can reuse the pre-allocated
	 * channel resources next time.
	 */
	sba_cleanup_nonpending_requests(to_sba_device(dchan));
}

static int sba_device_terminate_all(struct dma_chan *dchan)
{
	/* Cleanup all pending requests */
	sba_cleanup_pending_requests(to_sba_device(dchan));

	return 0;
}

static void sba_issue_pending(struct dma_chan *dchan)
{
	unsigned long flags;
	struct sba_device *sba = to_sba_device(dchan);

	/* Process pending requests */
	spin_lock_irqsave(&sba->reqs_lock, flags);
	_sba_process_pending_requests(sba);
	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static dma_cookie_t sba_tx_submit(struct dma_async_tx_descriptor *tx)
{
	unsigned long flags;
	dma_cookie_t cookie;
	struct sba_device *sba;
	struct sba_request *req, *nreq;

	if (unlikely(!tx))
		return -EINVAL;

	sba = to_sba_device(tx->chan);
	req = to_sba_request(tx);

	/* Assign cookie and mark all chained requests pending */
	spin_lock_irqsave(&sba->reqs_lock, flags);
	cookie = dma_cookie_assign(tx);
	_sba_pending_request(sba, req);
	list_for_each_entry(nreq, &req->next, next)
		_sba_pending_request(sba, nreq);
	spin_unlock_irqrestore(&sba->reqs_lock, flags);

	return cookie;
}

static enum dma_status sba_tx_status(struct dma_chan *dchan,
				     dma_cookie_t cookie,
				     struct dma_tx_state *txstate)
{
	enum dma_status ret;
	struct sba_device *sba = to_sba_device(dchan);

	ret = dma_cookie_status(dchan, cookie, txstate);
	if (ret == DMA_COMPLETE)
		return ret;

	mbox_client_peek_data(sba->mchan);

	return dma_cookie_status(dchan, cookie, txstate);
}

static void sba_fillup_interrupt_msg(struct sba_request *req,
				     struct brcm_sba_command *cmds,
				     struct brcm_message *msg)
{
	u64 cmd;
	u32 c_mdata;
	dma_addr_t resp_dma = req->tx.phys;
	struct brcm_sba_command *cmdsp = cmds;

	/* Type-B command to load dummy data into buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, req->sba->hw_resp_size,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	c_mdata = sba_cmd_load_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
	cmdsp->data = resp_dma;
	cmdsp->data_len = req->sba->hw_resp_size;
	cmdsp++;

	/* Type-A command to write buf0 to dummy location */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, req->sba->hw_resp_size,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = resp_dma;
	cmdsp->data_len = req->sba->hw_resp_size;
	cmdsp++;

	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_interrupt(struct dma_chan *dchan, unsigned long flags)
{
	struct sba_request *req = NULL;
	struct sba_device *sba = to_sba_device(dchan);

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;

	/*
	 * Force fence so that no requests are submitted
	 * until DMA callback for this request is invoked.
	 */
	req->flags |= SBA_REQUEST_FENCE;

	/* Fillup request message */
	sba_fillup_interrupt_msg(req, req->cmds, &req->msg);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return &req->tx;
}

static void sba_fillup_memcpy_msg(struct sba_request *req,
				  struct brcm_sba_command *cmds,
				  struct brcm_message *msg,
				  dma_addr_t msg_offset, size_t msg_len,
				  dma_addr_t dst, dma_addr_t src)
{
	u64 cmd;
	u32 c_mdata;
	dma_addr_t resp_dma = req->tx.phys;
	struct brcm_sba_command *cmdsp = cmds;

	/* Type-B command to load data into buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	c_mdata = sba_cmd_load_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
	cmdsp->data = src + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

	/* Type-A command to write buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = dst + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}

static struct sba_request *
sba_prep_dma_memcpy_req(struct sba_device *sba,
			dma_addr_t off, dma_addr_t dst, dma_addr_t src,
			size_t len, unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	if (flags & DMA_PREP_FENCE)
		req->flags |= SBA_REQUEST_FENCE;

	/* Fillup request message */
	sba_fillup_memcpy_msg(req, req->cmds, &req->msg,
			      off, len, dst, src);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_memcpy(struct dma_chan *dchan, dma_addr_t dst, dma_addr_t src,
		    size_t len, unsigned long flags)
{
	size_t req_len;
	dma_addr_t off = 0;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		req = sba_prep_dma_memcpy_req(sba, off, dst, src,
					      req_len, flags);
		if (!req) {
			if (first)
				sba_free_chained_requests(first);
			return NULL;
		}

		if (first)
			sba_chain_request(first, req);
		else
			first = req;

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;
}
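
/*
 * For example, with hw_buf_size == 4096 (as set in sba_probe() for both
 * SBA versions), a 10000 byte memcpy is split into three chained
 * requests of 4096, 4096 and 1808 bytes, each fitting within the SBA
 * internal buffer.
 */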

static void sba_fillup_xor_msg(struct sba_request *req,
				struct brcm_sba_command *cmds,
				struct brcm_message *msg,
				dma_addr_t msg_offset, size_t msg_len,
				dma_addr_t dst, dma_addr_t *src, u32 src_cnt)
{
	u64 cmd;
	u32 c_mdata;
	unsigned int i;
	dma_addr_t resp_dma = req->tx.phys;
	struct brcm_sba_command *cmdsp = cmds;

	/* Type-B command to load data into buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	c_mdata = sba_cmd_load_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
	cmdsp->data = src[0] + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

	/* Type-B commands to xor data with buf0 and put it back in buf0 */
	for (i = 1; i < src_cnt; i++) {
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_xor_c_mdata(0, 0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_XOR,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = src[i] + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Type-A command to write buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = dst + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}

static struct sba_request *
sba_prep_dma_xor_req(struct sba_device *sba,
		     dma_addr_t off, dma_addr_t dst, dma_addr_t *src,
		     u32 src_cnt, size_t len, unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	if (flags & DMA_PREP_FENCE)
		req->flags |= SBA_REQUEST_FENCE;

	/* Fillup request message */
	sba_fillup_xor_msg(req, req->cmds, &req->msg,
			   off, len, dst, src, src_cnt);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_xor(struct dma_chan *dchan, dma_addr_t dst, dma_addr_t *src,
		 u32 src_cnt, size_t len, unsigned long flags)
{
	size_t req_len;
	dma_addr_t off = 0;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Sanity checks */
	if (unlikely(src_cnt > sba->max_xor_srcs))
		return NULL;

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		req = sba_prep_dma_xor_req(sba, off, dst, src, src_cnt,
					   req_len, flags);
		if (!req) {
			if (first)
				sba_free_chained_requests(first);
			return NULL;
		}

		if (first)
			sba_chain_request(first, req);
		else
			first = req;

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;
}
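
/*
 * An XOR request with src_cnt sources uses src_cnt + 1 SBA commands
 * (one load, src_cnt - 1 xors, one write), which is why sba_probe()
 * derives max_xor_srcs as max_cmd_per_req - 1.
 */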

static void sba_fillup_pq_msg(struct sba_request *req,
				bool pq_continue,
				struct brcm_sba_command *cmds,
				struct brcm_message *msg,
				dma_addr_t msg_offset, size_t msg_len,
				dma_addr_t *dst_p, dma_addr_t *dst_q,
				const u8 *scf, dma_addr_t *src, u32 src_cnt)
{
	u64 cmd;
	u32 c_mdata;
	unsigned int i;
	dma_addr_t resp_dma = req->tx.phys;
	struct brcm_sba_command *cmdsp = cmds;

	if (pq_continue) {
		/* Type-B command to load old P into buf0 */
		if (dst_p) {
			cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				SBA_TYPE_SHIFT, SBA_TYPE_MASK);
			cmd = sba_cmd_enc(cmd, msg_len,
				SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
			c_mdata = sba_cmd_load_c_mdata(0);
			cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
			cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
				SBA_CMD_SHIFT, SBA_CMD_MASK);
			cmdsp->cmd = cmd;
			*cmdsp->cmd_dma = cpu_to_le64(cmd);
			cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
			cmdsp->data = *dst_p + msg_offset;
			cmdsp->data_len = msg_len;
			cmdsp++;
		}

		/* Type-B command to load old Q into buf1 */
		if (dst_q) {
			cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				SBA_TYPE_SHIFT, SBA_TYPE_MASK);
			cmd = sba_cmd_enc(cmd, msg_len,
				SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
			c_mdata = sba_cmd_load_c_mdata(1);
			cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
			cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
				SBA_CMD_SHIFT, SBA_CMD_MASK);
			cmdsp->cmd = cmd;
			*cmdsp->cmd_dma = cpu_to_le64(cmd);
			cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
			cmdsp->data = *dst_q + msg_offset;
			cmdsp->data_len = msg_len;
			cmdsp++;
		}
	} else {
		/* Type-A command to zero all buffers */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_ZERO_ALL_BUFFERS,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
		cmdsp++;
	}

	/* Type-B commands to generate P into buf0 and Q into buf1 */
	for (i = 0; i < src_cnt; i++) {
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_pq_c_mdata(raid6_gflog[scf[i]], 1, 0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_MS(c_mdata),
				  SBA_C_MDATA_MS_SHIFT, SBA_C_MDATA_MS_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_GALOIS_XOR,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = src[i] + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Type-A command to write buf0 */
	if (dst_p) {
		cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		cmd = sba_cmd_enc(cmd, 0x1,
				  SBA_RESP_SHIFT, SBA_RESP_MASK);
		c_mdata = sba_cmd_write_c_mdata(0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
		if (req->sba->hw_resp_size) {
			cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
			cmdsp->resp = resp_dma;
			cmdsp->resp_len = req->sba->hw_resp_size;
		}
		cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
		cmdsp->data = *dst_p + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Type-A command to write buf1 */
	if (dst_q) {
		cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		cmd = sba_cmd_enc(cmd, 0x1,
				  SBA_RESP_SHIFT, SBA_RESP_MASK);
		c_mdata = sba_cmd_write_c_mdata(1);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
		if (req->sba->hw_resp_size) {
			cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
			cmdsp->resp = resp_dma;
			cmdsp->resp_len = req->sba->hw_resp_size;
		}
		cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
		cmdsp->data = *dst_q + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}

static struct sba_request *
sba_prep_dma_pq_req(struct sba_device *sba, dma_addr_t off,
		    dma_addr_t *dst_p, dma_addr_t *dst_q, dma_addr_t *src,
		    u32 src_cnt, const u8 *scf, size_t len, unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	if (flags & DMA_PREP_FENCE)
		req->flags |= SBA_REQUEST_FENCE;

	/* Fillup request messages */
	sba_fillup_pq_msg(req, dmaf_continue(flags),
			  req->cmds, &req->msg,
			  off, len, dst_p, dst_q, scf, src, src_cnt);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static void sba_fillup_pq_single_msg(struct sba_request *req,
				bool pq_continue,
				struct brcm_sba_command *cmds,
				struct brcm_message *msg,
				dma_addr_t msg_offset, size_t msg_len,
				dma_addr_t *dst_p, dma_addr_t *dst_q,
				dma_addr_t src, u8 scf)
{
	u64 cmd;
	u32 c_mdata;
	u8 pos, dpos = raid6_gflog[scf];
	dma_addr_t resp_dma = req->tx.phys;
	struct brcm_sba_command *cmdsp = cmds;

	if (!dst_p)
		goto skip_p;

	if (pq_continue) {
		/* Type-B command to load old P into buf0 */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_load_c_mdata(0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = *dst_p + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;

		/*
		 * Type-B command to xor data with buf0 and put it
		 * back in buf0
		 */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_xor_c_mdata(0, 0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_XOR,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = src + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	} else {
		/* Type-B command to load data into buf0 */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_load_c_mdata(0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = src + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Type-A command to write buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = *dst_p + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

skip_p:
	if (!dst_q)
		goto skip_q;

	/* Type-A command to zero all buffers */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_ZERO_ALL_BUFFERS,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	cmdsp++;

	if (dpos == 255)
		goto skip_q_computation;
	pos = (dpos < req->sba->max_pq_coefs) ?
		dpos : (req->sba->max_pq_coefs - 1);

	/*
	 * Type-B command to generate initial Q from data
	 * and store output into buf0
	 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	c_mdata = sba_cmd_pq_c_mdata(pos, 0, 0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_MS(c_mdata),
			  SBA_C_MDATA_MS_SHIFT, SBA_C_MDATA_MS_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_GALOIS,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
	cmdsp->data = src + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

	dpos -= pos;

	/* Multiple Type-A commands to generate final Q */
	while (dpos) {
		pos = (dpos < req->sba->max_pq_coefs) ?
			dpos : (req->sba->max_pq_coefs - 1);

		/*
		 * Type-A command to generate Q from buf0 and
		 * buf1 and store the result in buf0
		 */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_pq_c_mdata(pos, 0, 1);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_MS(c_mdata),
				  SBA_C_MDATA_MS_SHIFT, SBA_C_MDATA_MS_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_GALOIS,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
		cmdsp++;

		dpos -= pos;
	}

skip_q_computation:
	if (pq_continue) {
		/*
		 * Type-B command to XOR previous output with
		 * buf0 and write it into buf0
		 */
		cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
				  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
		cmd = sba_cmd_enc(cmd, msg_len,
				  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
		c_mdata = sba_cmd_xor_c_mdata(0, 0);
		cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
				  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
		cmd = sba_cmd_enc(cmd, SBA_CMD_XOR,
				  SBA_CMD_SHIFT, SBA_CMD_MASK);
		cmdsp->cmd = cmd;
		*cmdsp->cmd_dma = cpu_to_le64(cmd);
		cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
		cmdsp->data = *dst_q + msg_offset;
		cmdsp->data_len = msg_len;
		cmdsp++;
	}

	/* Type-A command to write buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, msg_len,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = *dst_q + msg_offset;
	cmdsp->data_len = msg_len;
	cmdsp++;

skip_q:
	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}
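
/*
 * Worked example for the Q computation above: multiplication by the
 * coefficient scf is done in log space, so dpos = raid6_gflog[scf] is
 * consumed in chunks of at most max_pq_coefs - 1. With
 * max_pq_coefs == 30 (SBA_VER_2) and raid6_gflog[scf] == 70, one
 * Type-B GALOIS command is issued with exponent 29, followed by
 * Type-A GALOIS commands with exponents 29 and 12, since
 * 29 + 29 + 12 == 70.
 */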

static struct sba_request *
sba_prep_dma_pq_single_req(struct sba_device *sba, dma_addr_t off,
			   dma_addr_t *dst_p, dma_addr_t *dst_q,
			   dma_addr_t src, u8 scf, size_t len,
			   unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	if (flags & DMA_PREP_FENCE)
		req->flags |= SBA_REQUEST_FENCE;

	/* Fillup request messages */
	sba_fillup_pq_single_msg(req, dmaf_continue(flags),
				 req->cmds, &req->msg, off, len,
				 dst_p, dst_q, src, scf);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_pq(struct dma_chan *dchan, dma_addr_t *dst, dma_addr_t *src,
		u32 src_cnt, const u8 *scf, size_t len, unsigned long flags)
{
	u32 i, dst_q_index;
	size_t req_len;
	bool slow = false;
	dma_addr_t off = 0;
	dma_addr_t *dst_p = NULL, *dst_q = NULL;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Sanity checks */
	if (unlikely(src_cnt > sba->max_pq_srcs))
		return NULL;
	for (i = 0; i < src_cnt; i++)
		if (sba->max_pq_coefs <= raid6_gflog[scf[i]])
			slow = true;

	/* Figure-out P and Q destination addresses */
	if (!(flags & DMA_PREP_PQ_DISABLE_P))
		dst_p = &dst[0];
	if (!(flags & DMA_PREP_PQ_DISABLE_Q))
		dst_q = &dst[1];

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		if (slow) {
			dst_q_index = src_cnt;

			if (dst_q) {
				for (i = 0; i < src_cnt; i++) {
					if (*dst_q == src[i]) {
						dst_q_index = i;
						break;
					}
				}
			}

			if (dst_q_index < src_cnt) {
				i = dst_q_index;
				req = sba_prep_dma_pq_single_req(sba,
					off, dst_p, dst_q, src[i], scf[i],
					req_len, flags | DMA_PREP_FENCE);
				if (!req)
					goto fail;

				if (first)
					sba_chain_request(first, req);
				else
					first = req;

				flags |= DMA_PREP_CONTINUE;
			}

			for (i = 0; i < src_cnt; i++) {
				if (dst_q_index == i)
					continue;

				req = sba_prep_dma_pq_single_req(sba,
					off, dst_p, dst_q, src[i], scf[i],
					req_len, flags | DMA_PREP_FENCE);
				if (!req)
					goto fail;

				if (first)
					sba_chain_request(first, req);
				else
					first = req;

				flags |= DMA_PREP_CONTINUE;
			}
		} else {
			req = sba_prep_dma_pq_req(sba, off,
						  dst_p, dst_q, src, src_cnt,
						  scf, req_len, flags);
			if (!req)
				goto fail;

			if (first)
				sba_chain_request(first, req);
			else
				first = req;
		}

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;

fail:
	if (first)
		sba_free_chained_requests(first);
	return NULL;
}
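
/*
 * Note on the "slow" path above: when any coefficient's discrete log
 * (raid6_gflog[scf[i]]) does not fit in max_pq_coefs, the driver falls
 * back to one single-source PQ request per source, forcing
 * DMA_PREP_FENCE so the partial P/Q results accumulate in order, and
 * setting DMA_PREP_CONTINUE so that each later request reloads the
 * previously written P/Q output.
 */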

/* ====== Mailbox callbacks ===== */

static void sba_receive_message(struct mbox_client *cl, void *msg)
{
	struct brcm_message *m = msg;
	struct sba_request *req = m->ctx;
	struct sba_device *sba = req->sba;

	/* Report an error if the message failed */
	if (m->error < 0)
		dev_err(sba->dev, "%s got message with error %d",
			dma_chan_name(&sba->dma_chan), m->error);

	/* Process received request */
	sba_process_received_request(sba, req);
}

/* ====== Debugfs callbacks ====== */

static int sba_debugfs_stats_show(struct seq_file *file, void *offset)
{
	struct sba_device *sba = dev_get_drvdata(file->private);

	/* Write stats in file */
	sba_write_stats_in_seqfile(sba, file);

	return 0;
}

/* ====== Platform driver routines ===== */

static int sba_prealloc_channel_resources(struct sba_device *sba)
{
	int i, j, ret = 0;
	struct sba_request *req = NULL;

	sba->resp_base = dma_alloc_coherent(sba->mbox_dev,
					    sba->max_resp_pool_size,
					    &sba->resp_dma_base, GFP_KERNEL);
	if (!sba->resp_base)
		return -ENOMEM;

	sba->cmds_base = dma_alloc_coherent(sba->mbox_dev,
					    sba->max_cmds_pool_size,
					    &sba->cmds_dma_base, GFP_KERNEL);
	if (!sba->cmds_base) {
		ret = -ENOMEM;
		goto fail_free_resp_pool;
	}

	spin_lock_init(&sba->reqs_lock);
	sba->reqs_fence = false;
	INIT_LIST_HEAD(&sba->reqs_alloc_list);
	INIT_LIST_HEAD(&sba->reqs_pending_list);
	INIT_LIST_HEAD(&sba->reqs_active_list);
	INIT_LIST_HEAD(&sba->reqs_aborted_list);
	INIT_LIST_HEAD(&sba->reqs_free_list);

	for (i = 0; i < sba->max_req; i++) {
		req = devm_kzalloc(sba->dev,
				   struct_size(req, cmds, sba->max_cmd_per_req),
				   GFP_KERNEL);
		if (!req) {
			ret = -ENOMEM;
			goto fail_free_cmds_pool;
		}
		INIT_LIST_HEAD(&req->node);
		req->sba = sba;
		req->flags = SBA_REQUEST_STATE_FREE;
		INIT_LIST_HEAD(&req->next);
		atomic_set(&req->next_pending_count, 0);
		for (j = 0; j < sba->max_cmd_per_req; j++) {
			req->cmds[j].cmd = 0;
			req->cmds[j].cmd_dma = sba->cmds_base +
				(i * sba->max_cmd_per_req + j) * sizeof(u64);
			req->cmds[j].cmd_dma_addr = sba->cmds_dma_base +
				(i * sba->max_cmd_per_req + j) * sizeof(u64);
			req->cmds[j].flags = 0;
		}
		memset(&req->msg, 0, sizeof(req->msg));
		dma_async_tx_descriptor_init(&req->tx, &sba->dma_chan);
		async_tx_ack(&req->tx);
		req->tx.tx_submit = sba_tx_submit;
		req->tx.phys = sba->resp_dma_base + i * sba->hw_resp_size;
		list_add_tail(&req->node, &sba->reqs_free_list);
	}

	return 0;

fail_free_cmds_pool:
	dma_free_coherent(sba->mbox_dev,
			  sba->max_cmds_pool_size,
			  sba->cmds_base, sba->cmds_dma_base);
fail_free_resp_pool:
	dma_free_coherent(sba->mbox_dev,
			  sba->max_resp_pool_size,
			  sba->resp_base, sba->resp_dma_base);
	return ret;
}

static void sba_freeup_channel_resources(struct sba_device *sba)
{
	dmaengine_terminate_all(&sba->dma_chan);
	dma_free_coherent(sba->mbox_dev, sba->max_cmds_pool_size,
			  sba->cmds_base, sba->cmds_dma_base);
	dma_free_coherent(sba->mbox_dev, sba->max_resp_pool_size,
			  sba->resp_base, sba->resp_dma_base);
	sba->resp_base = NULL;
	sba->resp_dma_base = 0;
}

static int sba_async_register(struct sba_device *sba)
{
	int ret;
	struct dma_device *dma_dev = &sba->dma_dev;

	/* Initialize DMA channel cookie */
	sba->dma_chan.device = dma_dev;
	dma_cookie_init(&sba->dma_chan);

	/* Initialize DMA device capability mask */
	dma_cap_zero(dma_dev->cap_mask);
	dma_cap_set(DMA_INTERRUPT, dma_dev->cap_mask);
	dma_cap_set(DMA_MEMCPY, dma_dev->cap_mask);
	dma_cap_set(DMA_XOR, dma_dev->cap_mask);
	dma_cap_set(DMA_PQ, dma_dev->cap_mask);

	/*
	 * Set mailbox channel device as the base device of
	 * our dma_device because the actual memory accesses
	 * will be done by mailbox controller
	 */
	dma_dev->dev = sba->mbox_dev;

	/* Set base prep routines */
	dma_dev->device_free_chan_resources = sba_free_chan_resources;
	dma_dev->device_terminate_all = sba_device_terminate_all;
	dma_dev->device_issue_pending = sba_issue_pending;
	dma_dev->device_tx_status = sba_tx_status;

	/* Set interrupt routine */
	if (dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask))
		dma_dev->device_prep_dma_interrupt = sba_prep_dma_interrupt;

	/* Set memcpy routine */
	if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask))
		dma_dev->device_prep_dma_memcpy = sba_prep_dma_memcpy;

	/* Set xor routine and capability */
	if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
		dma_dev->device_prep_dma_xor = sba_prep_dma_xor;
		dma_dev->max_xor = sba->max_xor_srcs;
	}

	/* Set pq routine and capability */
	if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
		dma_dev->device_prep_dma_pq = sba_prep_dma_pq;
		dma_set_maxpq(dma_dev, sba->max_pq_srcs, 0);
	}

	/* Initialize DMA device channel list */
	INIT_LIST_HEAD(&dma_dev->channels);
	list_add_tail(&sba->dma_chan.device_node, &dma_dev->channels);

	/* Register with Linux async DMA framework */
	ret = dma_async_device_register(dma_dev);
	if (ret) {
		dev_err(sba->dev, "async device register error %d", ret);
		return ret;
	}

	dev_info(sba->dev, "%s capabilities: %s%s%s%s\n",
		 dma_chan_name(&sba->dma_chan),
		 dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask) ? "interrupt " : "",
		 dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask) ? "memcpy " : "",
		 dma_has_cap(DMA_XOR, dma_dev->cap_mask) ? "xor " : "",
		 dma_has_cap(DMA_PQ, dma_dev->cap_mask) ? "pq " : "");

	return 0;
}

static int sba_probe(struct platform_device *pdev)
{
	int ret = 0;
	struct sba_device *sba;
	struct platform_device *mbox_pdev;
	struct of_phandle_args args;

	/* Allocate main SBA struct */
	sba = devm_kzalloc(&pdev->dev, sizeof(*sba), GFP_KERNEL);
	if (!sba)
		return -ENOMEM;

	sba->dev = &pdev->dev;
	platform_set_drvdata(pdev, sba);

	/* Number of mailbox channels should be at least 1 */
	ret = of_count_phandle_with_args(pdev->dev.of_node,
					 "mboxes", "#mbox-cells");
	if (ret <= 0)
		return -ENODEV;

	/* Determine SBA version from DT compatible string */
	if (of_device_is_compatible(sba->dev->of_node, "brcm,iproc-sba"))
		sba->ver = SBA_VER_1;
	else if (of_device_is_compatible(sba->dev->of_node,
					 "brcm,iproc-sba-v2"))
		sba->ver = SBA_VER_2;
	else
		return -ENODEV;

	/* Derived configuration parameters */
	switch (sba->ver) {
	case SBA_VER_1:
		sba->hw_buf_size = 4096;
		sba->hw_resp_size = 8;
		sba->max_pq_coefs = 6;
		sba->max_pq_srcs = 6;
		break;
	case SBA_VER_2:
		sba->hw_buf_size = 4096;
		sba->hw_resp_size = 8;
		sba->max_pq_coefs = 30;
		/*
		 * Note: max_pq_srcs is kept smaller than max_pq_coefs
		 * because we are limited by the number of SBA commands
		 * that we can fit in one message for the underlying
		 * ring manager HW.
		 */
		sba->max_pq_srcs = 12;
		break;
	default:
		return -EINVAL;
	}
	sba->max_req = SBA_MAX_REQ_PER_MBOX_CHANNEL;
	sba->max_cmd_per_req = sba->max_pq_srcs + 3;
	sba->max_xor_srcs = sba->max_cmd_per_req - 1;
	sba->max_resp_pool_size = sba->max_req * sba->hw_resp_size;
	sba->max_cmds_pool_size = sba->max_req *
				  sba->max_cmd_per_req * sizeof(u64);
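
	/*
	 * For SBA_VER_2 the derived values above work out to:
	 * max_cmd_per_req = 12 + 3 = 15, max_xor_srcs = 14,
	 * max_resp_pool_size = 8192 * 8 bytes = 64 KiB, and
	 * max_cmds_pool_size = 8192 * 15 * 8 bytes = 960 KiB.
	 */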

	/* Setup mailbox client */
	sba->client.dev			= &pdev->dev;
	sba->client.rx_callback		= sba_receive_message;
	sba->client.tx_block		= false;
	sba->client.knows_txdone	= true;
	sba->client.tx_tout		= 0;

	/* Request mailbox channel */
	sba->mchan = mbox_request_channel(&sba->client, 0);
	if (IS_ERR(sba->mchan))
		return PTR_ERR(sba->mchan);

	/* Find-out underlying mailbox device */
	ret = of_parse_phandle_with_args(pdev->dev.of_node,
					 "mboxes", "#mbox-cells", 0, &args);
	if (ret)
		goto fail_free_mchan;
	mbox_pdev = of_find_device_by_node(args.np);
	of_node_put(args.np);
	if (!mbox_pdev) {
		ret = -ENODEV;
		goto fail_free_mchan;
	}
	sba->mbox_dev = &mbox_pdev->dev;

	/* Prealloc channel resource */
	ret = sba_prealloc_channel_resources(sba);
	if (ret)
		goto fail_free_mchan;

	/* Check availability of debugfs */
	if (!debugfs_initialized())
		goto skip_debugfs;

	/* Create debugfs root entry */
	sba->root = debugfs_create_dir(dev_name(sba->dev), NULL);

	/* Create debugfs stats entry */
	debugfs_create_devm_seqfile(sba->dev, "stats", sba->root,
				    sba_debugfs_stats_show);

skip_debugfs:

	/* Register DMA device with Linux async framework */
	ret = sba_async_register(sba);
	if (ret)
		goto fail_free_resources;

	/* Print device info */
	dev_info(sba->dev, "%s using SBAv%d mailbox channel from %s",
		 dma_chan_name(&sba->dma_chan), sba->ver + 1,
		 dev_name(sba->mbox_dev));

	return 0;

fail_free_resources:
	debugfs_remove_recursive(sba->root);
	sba_freeup_channel_resources(sba);
fail_free_mchan:
	mbox_free_channel(sba->mchan);
	return ret;
}

static int sba_remove(struct platform_device *pdev)
{
	struct sba_device *sba = platform_get_drvdata(pdev);

	dma_async_device_unregister(&sba->dma_dev);

	debugfs_remove_recursive(sba->root);

	sba_freeup_channel_resources(sba);

	mbox_free_channel(sba->mchan);

	return 0;
}

static const struct of_device_id sba_of_match[] = {
	{ .compatible = "brcm,iproc-sba", },
	{ .compatible = "brcm,iproc-sba-v2", },
	{},
};
MODULE_DEVICE_TABLE(of, sba_of_match);

static struct platform_driver sba_driver = {
	.probe = sba_probe,
	.remove = sba_remove,
	.driver = {
		.name = "bcm-sba-raid",
		.of_match_table = sba_of_match,
	},
};
module_platform_driver(sba_driver);

MODULE_DESCRIPTION("Broadcom SBA RAID driver");
MODULE_AUTHOR("Anup Patel <anup.patel@broadcom.com>");
MODULE_LICENSE("GPL v2");