/**********************************************************************
 * Author: Cavium, Inc.
 *
 * Contact: support@cavium.com
 *          Please include "LiquidIO" in the subject.
 *
 * Copyright (c) 2003-2016 Cavium, Inc.
 *
 * This file is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, Version 2, as
 * published by the Free Software Foundation.
 *
 * This file is distributed in the hope that it will be useful, but
 * AS-IS and WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, TITLE, or
 * NONINFRINGEMENT.  See the GNU General Public License for more
 * details.
 **********************************************************************/
#include <linux/pci.h>
#include <linux/netdevice.h>
#include <linux/vmalloc.h>
#include "liquidio_common.h"
#include "octeon_droq.h"
#include "octeon_iq.h"
#include "response_manager.h"
#include "octeon_device.h"
#include "octeon_main.h"
#include "octeon_network.h"
#include "cn66xx_device.h"
#include "cn23xx_pf_device.h"
#include "cn23xx_vf_device.h"

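/* Result of posting a single command: an IQ_SEND_* status code and the
 * descriptor ring index the command was written to (-1 on failure).
 */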
struct iq_post_status {
	int status;
	int index;
};

static void check_db_timeout(struct work_struct *work);
static void __check_db_timeout(struct octeon_device *oct, u64 iq_no);

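/* Per-device table of "free" callbacks, indexed by request type.  Entries are
 * registered via octeon_register_reqtype_free_fn() and are invoked from
 * lio_process_iq_request_list() to release buffers once Octeon has fetched
 * the corresponding instructions.
 */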
static void (*reqtype_free_fn[MAX_OCTEON_DEVICES][REQTYPE_LAST + 1]) (void *);

/* Define this to return the request status compatible with old code */
/*#define OCTEON_USE_OLD_REQ_STATUS*/

/* Return 0 on success, 1 on failure */
int octeon_init_instr_queue(struct octeon_device *oct,
			    union oct_txpciq txpciq,
			    u32 num_descs)
{
	struct octeon_instr_queue *iq;
	struct octeon_iq_config *conf = NULL;
	u32 iq_no = (u32)txpciq.s.q_no;
	u32 q_size;
	struct cavium_wq *db_wq;
	int numa_node = dev_to_node(&oct->pci_dev->dev);

	if (OCTEON_CN6XXX(oct))
		conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn6xxx)));
	else if (OCTEON_CN23XX_PF(oct))
		conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn23xx_pf)));
	else if (OCTEON_CN23XX_VF(oct))
		conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn23xx_vf)));

	if (!conf) {
		dev_err(&oct->pci_dev->dev, "Unsupported Chip %x\n",
			oct->chip_id);
		return 1;
	}

	q_size = (u32)conf->instr_type * num_descs;

	iq = oct->instr_queue[iq_no];

	iq->oct_dev = oct;

	iq->base_addr = lio_dma_alloc(oct, q_size, &iq->base_addr_dma);
	if (!iq->base_addr) {
		dev_err(&oct->pci_dev->dev, "Cannot allocate memory for instr queue %d\n",
			iq_no);
		return 1;
	}

	iq->max_count = num_descs;

	/* Initialize a list to hold requests that have been posted to Octeon
	 * but have not yet been fetched by Octeon.
	 */
	iq->request_list = vzalloc_node(array_size(num_descs, sizeof(*iq->request_list)),
					numa_node);
	if (!iq->request_list)
		iq->request_list = vzalloc(array_size(num_descs, sizeof(*iq->request_list)));
	if (!iq->request_list) {
		lio_dma_free(oct, q_size, iq->base_addr, iq->base_addr_dma);
		dev_err(&oct->pci_dev->dev, "Alloc failed for IQ[%d] nr free list\n",
			iq_no);
		return 1;
	}

	dev_dbg(&oct->pci_dev->dev, "IQ[%d]: base: %p basedma: %pad count: %d\n",
		iq_no, iq->base_addr, &iq->base_addr_dma, iq->max_count);

	iq->txpciq.u64 = txpciq.u64;
	iq->fill_threshold = (u32)conf->db_min;
	iq->fill_cnt = 0;
	iq->host_write_index = 0;
	iq->octeon_read_index = 0;
	iq->flush_index = 0;
	iq->last_db_time = 0;
	iq->do_auto_flush = 1;
	iq->db_timeout = (u32)conf->db_timeout;
	atomic_set(&iq->instr_pending, 0);
	iq->pkts_processed = 0;

	/* Initialize the spinlock for this instruction queue */
	spin_lock_init(&iq->lock);
	if (iq_no == 0) {
		iq->allow_soft_cmds = true;
		spin_lock_init(&iq->post_lock);
	} else {
		iq->allow_soft_cmds = false;
	}

	spin_lock_init(&iq->iq_flush_running_lock);

	oct->io_qmask.iq |= BIT_ULL(iq_no);

	/* Set the 32B/64B mode for each input queue */
	oct->io_qmask.iq64B |= ((conf->instr_type == 64) << iq_no);
	iq->iqcmd_64B = (conf->instr_type == 64);

	oct->fn_list.setup_iq_regs(oct, iq_no);

	oct->check_db_wq[iq_no].wq = alloc_workqueue("check_iq_db",
						     WQ_MEM_RECLAIM,
						     0);
	if (!oct->check_db_wq[iq_no].wq) {
		vfree(iq->request_list);
		iq->request_list = NULL;
		lio_dma_free(oct, q_size, iq->base_addr, iq->base_addr_dma);
		dev_err(&oct->pci_dev->dev, "check db wq create failed for iq %d\n",
			iq_no);
		return 1;
	}

	db_wq = &oct->check_db_wq[iq_no];

	INIT_DELAYED_WORK(&db_wq->wk.work, check_db_timeout);
	db_wq->wk.ctxptr = oct;
	db_wq->wk.ctxul = iq_no;
	queue_delayed_work(db_wq->wq, &db_wq->wk.work, msecs_to_jiffies(1));

	return 0;
}

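/* Undo octeon_init_instr_queue(): stop the doorbell-check work, free the
 * request list and the descriptor ring, clear the queue from io_qmask and
 * release the queue structure.  Returns 0 on success, 1 if the descriptor
 * ring was never allocated.
 */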
int octeon_delete_instr_queue(struct octeon_device *oct, u32 iq_no)
{
	u64 desc_size = 0, q_size;
	struct octeon_instr_queue *iq = oct->instr_queue[iq_no];

	cancel_delayed_work_sync(&oct->check_db_wq[iq_no].wk.work);
	destroy_workqueue(oct->check_db_wq[iq_no].wq);

	if (OCTEON_CN6XXX(oct))
		desc_size =
		    CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn6xxx));
	else if (OCTEON_CN23XX_PF(oct))
		desc_size =
		    CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn23xx_pf));
	else if (OCTEON_CN23XX_VF(oct))
		desc_size =
		    CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn23xx_vf));

	vfree(iq->request_list);

	if (iq->base_addr) {
		q_size = iq->max_count * desc_size;
		lio_dma_free(oct, (u32)q_size, iq->base_addr,
			     iq->base_addr_dma);
		oct->io_qmask.iq &= ~(1ULL << iq_no);
		vfree(oct->instr_queue[iq_no]);
		oct->instr_queue[iq_no] = NULL;
		oct->num_iqs--;
		return 0;
	}
	return 1;
}
EXPORT_SYMBOL_GPL(octeon_delete_instr_queue);

/* Return 0 on success, 1 on failure */
int octeon_setup_iq(struct octeon_device *oct,
		    int ifidx,
		    int q_index,
		    union oct_txpciq txpciq,
		    u32 num_descs,
		    void *app_ctx)
{
	u32 iq_no = (u32)txpciq.s.q_no;
	int numa_node = dev_to_node(&oct->pci_dev->dev);

	if (oct->instr_queue[iq_no]) {
		dev_dbg(&oct->pci_dev->dev, "IQ is in use. Cannot create the IQ: %d again\n",
			iq_no);
		oct->instr_queue[iq_no]->txpciq.u64 = txpciq.u64;
		oct->instr_queue[iq_no]->app_ctx = app_ctx;
		return 0;
	}
	oct->instr_queue[iq_no] =
	    vzalloc_node(sizeof(struct octeon_instr_queue), numa_node);
	if (!oct->instr_queue[iq_no])
		oct->instr_queue[iq_no] =
		    vzalloc(sizeof(struct octeon_instr_queue));
	if (!oct->instr_queue[iq_no])
		return 1;

	oct->instr_queue[iq_no]->q_index = q_index;
	oct->instr_queue[iq_no]->app_ctx = app_ctx;
	oct->instr_queue[iq_no]->ifidx = ifidx;

	if (octeon_init_instr_queue(oct, txpciq, num_descs)) {
		vfree(oct->instr_queue[iq_no]);
		oct->instr_queue[iq_no] = NULL;
		return 1;
	}

	oct->num_iqs++;
	if (oct->fn_list.enable_io_queues(oct)) {
		octeon_delete_instr_queue(oct, iq_no);
		return 1;
	}

	return 0;
}

int lio_wait_for_instr_fetch(struct octeon_device *oct)
{
	int i, retry = 1000, pending, instr_cnt = 0;

	do {
		instr_cnt = 0;

		for (i = 0; i < MAX_OCTEON_INSTR_QUEUES(oct); i++) {
			if (!(oct->io_qmask.iq & BIT_ULL(i)))
				continue;
			pending =
			    atomic_read(&oct->instr_queue[i]->instr_pending);
			if (pending)
				__check_db_timeout(oct, i);
			instr_cnt += pending;
		}

		if (instr_cnt == 0)
			break;

		schedule_timeout_uninterruptible(1);

	} while (retry-- && instr_cnt);

	return instr_cnt;
}
EXPORT_SYMBOL_GPL(lio_wait_for_instr_fetch);

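/* Write the number of commands accumulated in fill_cnt to the queue's
 * doorbell register so Octeon starts fetching them, then reset fill_cnt and
 * record the time of the ring.  The doorbell is only rung while the device
 * is in the RUNNING state.
 */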
static inline void
ring_doorbell(struct octeon_device *oct, struct octeon_instr_queue *iq)
{
	if (atomic_read(&oct->status) == OCT_DEV_RUNNING) {
		writel(iq->fill_cnt, iq->doorbell_reg);
		/* make sure doorbell write goes through */
		iq->fill_cnt = 0;
		iq->last_db_time = jiffies;
		return;
	}
}

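/* Ring the doorbell for iq_no under post_lock if commands have accumulated
 * since the last doorbell ring.
 */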
void
octeon_ring_doorbell_locked(struct octeon_device *oct, u32 iq_no)
{
	struct octeon_instr_queue *iq;

	iq = oct->instr_queue[iq_no];
	spin_lock(&iq->post_lock);
	if (iq->fill_cnt)
		ring_doorbell(oct, iq);
	spin_unlock(&iq->post_lock);
}
EXPORT_SYMBOL_GPL(octeon_ring_doorbell_locked);

static inline void __copy_cmd_into_iq(struct octeon_instr_queue *iq,
				      u8 *cmd)
{
	u8 *iqptr, cmdsize;

	cmdsize = ((iq->iqcmd_64B) ? 64 : 32);
	iqptr = iq->base_addr + (cmdsize * iq->host_write_index);

	memcpy(iqptr, cmd, cmdsize);
}

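/* Copy a command into the descriptor ring at host_write_index, advance the
 * write index and fill_cnt, and account for the pending instruction.
 * Returns IQ_SEND_OK, IQ_SEND_STOP if the command was posted but the queue
 * is now almost full, or IQ_SEND_FAILED (with index -1) when no descriptor
 * is available.
 */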
static inline struct iq_post_status
__post_command2(struct octeon_instr_queue *iq, u8 *cmd)
{
	struct iq_post_status st;

	st.status = IQ_SEND_OK;

	/* This ensures that the read index does not wrap around to the same
	 * position if the queue fills up before Octeon can fetch any
	 * instructions.
	 */
	if (atomic_read(&iq->instr_pending) >= (s32)(iq->max_count - 1)) {
		st.status = IQ_SEND_FAILED;
		st.index = -1;
		return st;
	}

	if (atomic_read(&iq->instr_pending) >= (s32)(iq->max_count - 2))
		st.status = IQ_SEND_STOP;

	__copy_cmd_into_iq(iq, cmd);

	/* "index" is returned, host_write_index is modified. */
	st.index = iq->host_write_index;
	iq->host_write_index = incr_index(iq->host_write_index, 1,
					  iq->max_count);
	iq->fill_cnt++;

	/* Flush the command into memory. We need to be sure the data is in
	 * memory before indicating that the instruction is pending.
	 */
	wmb();

	atomic_inc(&iq->instr_pending);

	return st;
}

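/* Register the callback used to free buffers of the given request type once
 * their instructions have been fetched by Octeon.  Returns 0 on success or
 * -EINVAL for an out-of-range reqtype.
 */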
int
octeon_register_reqtype_free_fn(struct octeon_device *oct, int reqtype,
				void (*fn)(void *))
{
	if (reqtype > REQTYPE_LAST) {
		dev_err(&oct->pci_dev->dev, "%s: Invalid reqtype: %d\n",
			__func__, reqtype);
		return -EINVAL;
	}

	reqtype_free_fn[oct->octeon_id][reqtype] = fn;

	return 0;
}
EXPORT_SYMBOL_GPL(octeon_register_reqtype_free_fn);

static inline void
__add_to_request_list(struct octeon_instr_queue *iq,
		      int idx, void *buf, int reqtype)
{
	iq->request_list[idx].buf = buf;
	iq->request_list[idx].reqtype = reqtype;
}

/* Can only run in process context */
int
lio_process_iq_request_list(struct octeon_device *oct,
			    struct octeon_instr_queue *iq, u32 napi_budget)
{
	struct cavium_wq *cwq = &oct->dma_comp_wq;
	int reqtype;
	void *buf;
	u32 old = iq->flush_index;
	u32 inst_count = 0;
	unsigned int pkts_compl = 0, bytes_compl = 0;
	struct octeon_soft_command *sc;
	unsigned long flags;

	while (old != iq->octeon_read_index) {
		reqtype = iq->request_list[old].reqtype;
		buf     = iq->request_list[old].buf;

		if (reqtype == REQTYPE_NONE)
			goto skip_this;

		octeon_update_tx_completion_counters(buf, reqtype, &pkts_compl,
						     &bytes_compl);

		switch (reqtype) {
		case REQTYPE_NORESP_NET:
		case REQTYPE_NORESP_NET_SG:
		case REQTYPE_RESP_NET_SG:
			reqtype_free_fn[oct->octeon_id][reqtype](buf);
			break;
		case REQTYPE_RESP_NET:
		case REQTYPE_SOFT_COMMAND:
			sc = buf;
			/* We're expecting a response from Octeon.  Add sc to
			 * the ordered soft command response list;
			 * lio_process_ordered_list() will process it once the
			 * response arrives.
			 */
			spin_lock_irqsave(&oct->response_list
					  [OCTEON_ORDERED_SC_LIST].lock, flags);
			atomic_inc(&oct->response_list
				   [OCTEON_ORDERED_SC_LIST].pending_req_count);
			list_add_tail(&sc->node, &oct->response_list
				[OCTEON_ORDERED_SC_LIST].head);
			spin_unlock_irqrestore(&oct->response_list
					       [OCTEON_ORDERED_SC_LIST].lock,
					       flags);
			break;
		default:
			dev_err(&oct->pci_dev->dev,
				"%s Unknown reqtype: %d buf: %p at idx %d\n",
				__func__, reqtype, buf, old);
		}

		iq->request_list[old].buf = NULL;
		iq->request_list[old].reqtype = 0;

 skip_this:
		inst_count++;
		old = incr_index(old, 1, iq->max_count);

		if ((napi_budget) && (inst_count >= napi_budget))
			break;
	}
	if (bytes_compl)
		octeon_report_tx_completion_to_bql(iq->app_ctx, pkts_compl,
						   bytes_compl);
	iq->flush_index = old;

	if (atomic_read(&oct->response_list
			[OCTEON_ORDERED_SC_LIST].pending_req_count))
		queue_work(cwq->wq, &cwq->wk.work.work);

	return inst_count;
}
EXPORT_SYMBOL_GPL(lio_process_iq_request_list);

/* Can only be called from process context */
int
octeon_flush_iq(struct octeon_device *oct, struct octeon_instr_queue *iq,
		u32 napi_budget)
{
	u32 inst_processed = 0;
	u32 tot_inst_processed = 0;
	int tx_done = 1;

	if (!spin_trylock(&iq->iq_flush_running_lock))
		return tx_done;

	spin_lock_bh(&iq->lock);

	iq->octeon_read_index = oct->fn_list.update_iq_read_idx(iq);

	do {
		/* Process any outstanding IQ packets. */
		if (iq->flush_index == iq->octeon_read_index)
			break;

		if (napi_budget)
			inst_processed =
				lio_process_iq_request_list(oct, iq,
							    napi_budget -
							    tot_inst_processed);
		else
			inst_processed =
				lio_process_iq_request_list(oct, iq, 0);

		if (inst_processed) {
			iq->pkts_processed += inst_processed;
			atomic_sub(inst_processed, &iq->instr_pending);
			iq->stats.instr_processed += inst_processed;
		}

		tot_inst_processed += inst_processed;
	} while (tot_inst_processed < napi_budget);

	if (napi_budget && (tot_inst_processed >= napi_budget))
		tx_done = 0;

	iq->last_db_time = jiffies;

	spin_unlock_bh(&iq->lock);

	spin_unlock(&iq->iq_flush_running_lock);

	return tx_done;
}

/* Process instruction queue after timeout.
 * This routine gets called from a workqueue or when removing the module.
 */
static void __check_db_timeout(struct octeon_device *oct, u64 iq_no)
{
	struct octeon_instr_queue *iq;
	u64 next_time;

	if (!oct)
		return;

	iq = oct->instr_queue[iq_no];
	if (!iq)
		return;

	/* return immediately, if no work pending */
	if (!atomic_read(&iq->instr_pending))
		return;
	/* If jiffies - last_db_time < db_timeout do nothing  */
	next_time = iq->last_db_time + iq->db_timeout;
	if (!time_after(jiffies, (unsigned long)next_time))
		return;
	iq->last_db_time = jiffies;

	/* Flush the instruction queue */
	octeon_flush_iq(oct, iq, 0);

	lio_enable_irq(NULL, iq);
}

/* Delayed-work handler that runs at regular intervals to check the
 * instruction queue for pending commands and to flush commands that were
 * already fetched by Octeon.
 */
static void check_db_timeout(struct work_struct *work)
{
	struct cavium_wk *wk = (struct cavium_wk *)work;
	struct octeon_device *oct = (struct octeon_device *)wk->ctxptr;
	u64 iq_no = wk->ctxul;
	struct cavium_wq *db_wq = &oct->check_db_wq[iq_no];
	u32 delay = 10;

	__check_db_timeout(oct, iq_no);
	queue_delayed_work(db_wq->wq, &db_wq->wk.work, msecs_to_jiffies(delay));
}

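/* Post a single command to instruction queue iq_no and ring the doorbell when
 * needed.  @cmd is the 32/64-byte instruction, @buf the buffer to be released
 * (or completed) when Octeon fetches the instruction, @datasize the payload
 * size used for statistics, and @reqtype one of the REQTYPE_* values.
 * Returns the IQ_SEND_* status from the post attempt.
 */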
int
octeon_send_command(struct octeon_device *oct, u32 iq_no,
		    u32 force_db, void *cmd, void *buf,
		    u32 datasize, u32 reqtype)
{
	int xmit_stopped;
	struct iq_post_status st;
	struct octeon_instr_queue *iq = oct->instr_queue[iq_no];

	/* Get the lock and prevent other tasks and tx interrupt handler from
	 * running.
	 */
	if (iq->allow_soft_cmds)
		spin_lock_bh(&iq->post_lock);

	st = __post_command2(iq, cmd);

	if (st.status != IQ_SEND_FAILED) {
		xmit_stopped = octeon_report_sent_bytes_to_bql(buf, reqtype);
		__add_to_request_list(iq, st.index, buf, reqtype);
		INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, bytes_sent, datasize);
		INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, instr_posted, 1);

		if (iq->fill_cnt >= MAX_OCTEON_FILL_COUNT || force_db ||
		    xmit_stopped || st.status == IQ_SEND_STOP)
			ring_doorbell(oct, iq);
	} else {
		INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, instr_dropped, 1);
	}

	if (iq->allow_soft_cmds)
		spin_unlock_bh(&iq->post_lock);

	/* This is only done here to expedite packets being flushed
	 * for cases where there are no IQ completion interrupts.
	 */

	return st.status;
}
EXPORT_SYMBOL_GPL(octeon_send_command);

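/* Fill in the instruction headers of a soft command (ih3/pki_ih3 on CN23XX
 * PF/VF, ih2 otherwise), the input request header and, when a response is
 * expected (rdatasize != 0), the response descriptor.  opcode must fit in
 * 4 bits and subcode in 7 bits.
 */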
void
octeon_prepare_soft_command(struct octeon_device *oct,
			    struct octeon_soft_command *sc,
			    u8 opcode,
			    u8 subcode,
			    u32 irh_ossp,
			    u64 ossp0,
			    u64 ossp1)
{
	struct octeon_config *oct_cfg;
	struct octeon_instr_ih2 *ih2;
	struct octeon_instr_ih3 *ih3;
	struct octeon_instr_pki_ih3 *pki_ih3;
	struct octeon_instr_irh *irh;
	struct octeon_instr_rdp *rdp;

	WARN_ON(opcode > 15);
	WARN_ON(subcode > 127);

	oct_cfg = octeon_get_conf(oct);

	if (OCTEON_CN23XX_PF(oct) || OCTEON_CN23XX_VF(oct)) {
		ih3 = (struct octeon_instr_ih3 *)&sc->cmd.cmd3.ih3;

		ih3->pkind = oct->instr_queue[sc->iq_no]->txpciq.s.pkind;

		pki_ih3 = (struct octeon_instr_pki_ih3 *)&sc->cmd.cmd3.pki_ih3;

		pki_ih3->w           = 1;
		pki_ih3->raw         = 1;
		pki_ih3->utag        = 1;
		pki_ih3->uqpg        =
			oct->instr_queue[sc->iq_no]->txpciq.s.use_qpg;
		pki_ih3->utt         = 1;
		pki_ih3->tag     = LIO_CONTROL;
		pki_ih3->tagtype = ATOMIC_TAG;
		pki_ih3->qpg         =
			oct->instr_queue[sc->iq_no]->txpciq.s.ctrl_qpg;

		pki_ih3->pm          = 0x7;
		pki_ih3->sl          = 8;

		if (sc->datasize)
			ih3->dlengsz = sc->datasize;

		irh            = (struct octeon_instr_irh *)&sc->cmd.cmd3.irh;
		irh->opcode    = opcode;
		irh->subcode   = subcode;

		/* opcode/subcode specific parameters (ossp) */
		irh->ossp       = irh_ossp;
		sc->cmd.cmd3.ossp[0] = ossp0;
		sc->cmd.cmd3.ossp[1] = ossp1;

		if (sc->rdatasize) {
			rdp = (struct octeon_instr_rdp *)&sc->cmd.cmd3.rdp;
			rdp->pcie_port = oct->pcie_port;
			rdp->rlen      = sc->rdatasize;

			irh->rflag =  1;
			/*PKI IH3*/
			/* pki_ih3 irh+ossp[0]+ossp[1]+rdp+rptr = 48 bytes */
			ih3->fsz    = LIO_SOFTCMDRESP_IH3;
		} else {
			irh->rflag =  0;
			/*PKI IH3*/
			/* pki_ih3 + irh + ossp[0] + ossp[1] = 32 bytes */
			ih3->fsz    = LIO_PCICMD_O3;
		}

	} else {
		ih2          = (struct octeon_instr_ih2 *)&sc->cmd.cmd2.ih2;
		ih2->tagtype = ATOMIC_TAG;
		ih2->tag     = LIO_CONTROL;
		ih2->raw     = 1;
		ih2->grp     = CFG_GET_CTRL_Q_GRP(oct_cfg);

		if (sc->datasize) {
			ih2->dlengsz = sc->datasize;
			ih2->rs = 1;
		}

		irh            = (struct octeon_instr_irh *)&sc->cmd.cmd2.irh;
		irh->opcode    = opcode;
		irh->subcode   = subcode;

		/* opcode/subcode specific parameters (ossp) */
		irh->ossp       = irh_ossp;
		sc->cmd.cmd2.ossp[0] = ossp0;
		sc->cmd.cmd2.ossp[1] = ossp1;

		if (sc->rdatasize) {
			rdp = (struct octeon_instr_rdp *)&sc->cmd.cmd2.rdp;
			rdp->pcie_port = oct->pcie_port;
			rdp->rlen      = sc->rdatasize;

			irh->rflag =  1;
			/* irh+ossp[0]+ossp[1]+rdp+rptr = 40 bytes */
			ih2->fsz   = LIO_SOFTCMDRESP_IH2;
		} else {
			irh->rflag =  0;
			/* irh + ossp[0] + ossp[1] = 24 bytes */
			ih2->fsz   = LIO_PCICMD_O2;
		}
	}
}
EXPORT_SYMBOL_GPL(octeon_prepare_soft_command);

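/* Fill in the DMA data/response pointers prepared by
 * octeon_alloc_soft_command(), stamp the expiry time and post the soft
 * command on its instruction queue.  Returns an IQ_SEND_* status;
 * IQ_SEND_FAILED is returned without posting if the queue does not allow
 * soft commands.
 *
 * Typical flow (an illustrative sketch based only on the helpers in this
 * file; opcode, subcode and the ossp words are placeholders):
 *
 *	sc = octeon_alloc_soft_command(oct, datasize, rdatasize, 0);
 *	if (!sc)
 *		return -ENOMEM;
 *	octeon_prepare_soft_command(oct, sc, opcode, subcode, irh_ossp,
 *				    ossp0, ossp1);
 *	if (octeon_send_soft_command(oct, sc) == IQ_SEND_FAILED) {
 *		octeon_free_soft_command(oct, sc);
 *		return -EIO;
 *	}
 *
 * When a response is expected, the status word at the end of the response
 * buffer is initialized to COMPLETION_WORD_INIT and overwritten by the
 * response; completed commands are later reaped via
 * octeon_free_sc_done_list() once the caller sets sc->caller_is_done.
 */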
int octeon_send_soft_command(struct octeon_device *oct,
			     struct octeon_soft_command *sc)
{
	struct octeon_instr_queue *iq;
	struct octeon_instr_ih2 *ih2;
	struct octeon_instr_ih3 *ih3;
	struct octeon_instr_irh *irh;
	u32 len;

	iq = oct->instr_queue[sc->iq_no];
	if (!iq->allow_soft_cmds) {
		dev_err(&oct->pci_dev->dev, "Soft commands are not allowed on Queue %d\n",
			sc->iq_no);
		INCR_INSTRQUEUE_PKT_COUNT(oct, sc->iq_no, instr_dropped, 1);
		return IQ_SEND_FAILED;
	}

	if (OCTEON_CN23XX_PF(oct) || OCTEON_CN23XX_VF(oct)) {
		ih3 = (struct octeon_instr_ih3 *)&sc->cmd.cmd3.ih3;
		if (ih3->dlengsz) {
			WARN_ON(!sc->dmadptr);
			sc->cmd.cmd3.dptr = sc->dmadptr;
		}
		irh = (struct octeon_instr_irh *)&sc->cmd.cmd3.irh;
		if (irh->rflag) {
			WARN_ON(!sc->dmarptr);
			WARN_ON(!sc->status_word);
			*sc->status_word = COMPLETION_WORD_INIT;
			sc->cmd.cmd3.rptr = sc->dmarptr;
		}
		len = (u32)ih3->dlengsz;
	} else {
		ih2 = (struct octeon_instr_ih2 *)&sc->cmd.cmd2.ih2;
		if (ih2->dlengsz) {
			WARN_ON(!sc->dmadptr);
			sc->cmd.cmd2.dptr = sc->dmadptr;
		}
		irh = (struct octeon_instr_irh *)&sc->cmd.cmd2.irh;
		if (irh->rflag) {
			WARN_ON(!sc->dmarptr);
			WARN_ON(!sc->status_word);
			*sc->status_word = COMPLETION_WORD_INIT;
			sc->cmd.cmd2.rptr = sc->dmarptr;
		}
		len = (u32)ih2->dlengsz;
	}

	sc->expiry_time = jiffies + msecs_to_jiffies(LIO_SC_MAX_TMO_MS);

	return (octeon_send_command(oct, sc->iq_no, 1, &sc->cmd, sc,
				    len, REQTYPE_SOFT_COMMAND));
}
EXPORT_SYMBOL_GPL(octeon_send_soft_command);

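/* Pre-allocate MAX_SOFT_COMMAND_BUFFERS DMA-coherent buffers of
 * SOFT_COMMAND_BUFFER_SIZE bytes each and place them on sc_buf_pool, from
 * which octeon_alloc_soft_command() hands them out.  Returns 0 on success,
 * 1 if an allocation fails (anything already allocated is freed).
 */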
int octeon_setup_sc_buffer_pool(struct octeon_device *oct)
{
	int i;
	u64 dma_addr;
	struct octeon_soft_command *sc;

	INIT_LIST_HEAD(&oct->sc_buf_pool.head);
	spin_lock_init(&oct->sc_buf_pool.lock);
	atomic_set(&oct->sc_buf_pool.alloc_buf_count, 0);

	for (i = 0; i < MAX_SOFT_COMMAND_BUFFERS; i++) {
		sc = (struct octeon_soft_command *)
			lio_dma_alloc(oct,
				      SOFT_COMMAND_BUFFER_SIZE,
				      (dma_addr_t *)&dma_addr);
		if (!sc) {
			octeon_free_sc_buffer_pool(oct);
			return 1;
		}

		sc->dma_addr = dma_addr;
		sc->size = SOFT_COMMAND_BUFFER_SIZE;

		list_add_tail(&sc->node, &oct->sc_buf_pool.head);
	}

	return 0;
}
EXPORT_SYMBOL_GPL(octeon_setup_sc_buffer_pool);

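/* Reap soft commands on the DONE list: for each entry whose caller has marked
 * it done, either return the buffer to the pool or, if the status word still
 * holds COMPLETION_WORD_INIT (no response arrived), move it to the zombie
 * list instead of freeing it.
 */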
int octeon_free_sc_done_list(struct octeon_device *oct)
{
	struct octeon_response_list *done_sc_list, *zombie_sc_list;
	struct octeon_soft_command *sc;
	struct list_head *tmp, *tmp2;
	spinlock_t *sc_lists_lock; /* lock for response_list */

	done_sc_list = &oct->response_list[OCTEON_DONE_SC_LIST];
	zombie_sc_list = &oct->response_list[OCTEON_ZOMBIE_SC_LIST];

	if (!atomic_read(&done_sc_list->pending_req_count))
		return 0;

	sc_lists_lock = &oct->response_list[OCTEON_ORDERED_SC_LIST].lock;

	spin_lock_bh(sc_lists_lock);

	list_for_each_safe(tmp, tmp2, &done_sc_list->head) {
		sc = list_entry(tmp, struct octeon_soft_command, node);

		if (READ_ONCE(sc->caller_is_done)) {
			list_del(&sc->node);
			atomic_dec(&done_sc_list->pending_req_count);

			if (*sc->status_word == COMPLETION_WORD_INIT) {
				/* timeout; move sc to zombie list */
				list_add_tail(&sc->node, &zombie_sc_list->head);
				atomic_inc(&zombie_sc_list->pending_req_count);
			} else {
				octeon_free_soft_command(oct, sc);
			}
		}
	}

	spin_unlock_bh(sc_lists_lock);

	return 0;
}
EXPORT_SYMBOL_GPL(octeon_free_sc_done_list);

int octeon_free_sc_zombie_list(struct octeon_device *oct)
{
	struct octeon_response_list *zombie_sc_list;
	struct octeon_soft_command *sc;
	struct list_head *tmp, *tmp2;
	spinlock_t *sc_lists_lock; /* lock for response_list */

	zombie_sc_list = &oct->response_list[OCTEON_ZOMBIE_SC_LIST];
	sc_lists_lock = &oct->response_list[OCTEON_ORDERED_SC_LIST].lock;

	spin_lock_bh(sc_lists_lock);

	list_for_each_safe(tmp, tmp2, &zombie_sc_list->head) {
		list_del(tmp);
		atomic_dec(&zombie_sc_list->pending_req_count);
		sc = list_entry(tmp, struct octeon_soft_command, node);
		octeon_free_soft_command(oct, sc);
	}

	spin_unlock_bh(sc_lists_lock);

	return 0;
}
EXPORT_SYMBOL_GPL(octeon_free_sc_zombie_list);

int octeon_free_sc_buffer_pool(struct octeon_device *oct)
{
	struct list_head *tmp, *tmp2;
	struct octeon_soft_command *sc;

	octeon_free_sc_zombie_list(oct);

	spin_lock_bh(&oct->sc_buf_pool.lock);

	list_for_each_safe(tmp, tmp2, &oct->sc_buf_pool.head) {
		list_del(tmp);

		sc = (struct octeon_soft_command *)tmp;

		lio_dma_free(oct, sc->size, sc, sc->dma_addr);
	}

	INIT_LIST_HEAD(&oct->sc_buf_pool.head);

	spin_unlock_bh(&oct->sc_buf_pool.lock);

	return 0;
}
EXPORT_SYMBOL_GPL(octeon_free_sc_buffer_pool);

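/* Take a buffer from sc_buf_pool and carve it up: the octeon_soft_command
 * header comes first, followed by an optional context area of ctxsize bytes,
 * then the data area (datasize bytes) and the response area (rdatasize bytes,
 * at least 16), each starting on a 128-byte boundary.  The 64-bit status word
 * occupies the last 8 bytes of the response area.  Returns NULL if the pool
 * is empty.
 */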
struct octeon_soft_command *octeon_alloc_soft_command(struct octeon_device *oct,
						      u32 datasize,
						      u32 rdatasize,
						      u32 ctxsize)
{
	u64 dma_addr;
	u32 size;
	u32 offset = sizeof(struct octeon_soft_command);
	struct octeon_soft_command *sc = NULL;
	struct list_head *tmp;

	if (!rdatasize)
		rdatasize = 16;

	WARN_ON((offset + datasize + rdatasize + ctxsize) >
		SOFT_COMMAND_BUFFER_SIZE);

	spin_lock_bh(&oct->sc_buf_pool.lock);

	if (list_empty(&oct->sc_buf_pool.head)) {
		spin_unlock_bh(&oct->sc_buf_pool.lock);
		return NULL;
	}

	list_for_each(tmp, &oct->sc_buf_pool.head)
		break;

	list_del(tmp);

	atomic_inc(&oct->sc_buf_pool.alloc_buf_count);

	spin_unlock_bh(&oct->sc_buf_pool.lock);

	sc = (struct octeon_soft_command *)tmp;

	dma_addr = sc->dma_addr;
	size = sc->size;

	memset(sc, 0, sc->size);

	sc->dma_addr = dma_addr;
	sc->size = size;

	if (ctxsize) {
		sc->ctxptr = (u8 *)sc + offset;
		sc->ctxsize = ctxsize;
	}

	/* Start data at 128 byte boundary */
	offset = (offset + ctxsize + 127) & 0xffffff80;

	if (datasize) {
		sc->virtdptr = (u8 *)sc + offset;
		sc->dmadptr = dma_addr + offset;
		sc->datasize = datasize;
	}

	/* Start rdata at 128 byte boundary */
	offset = (offset + datasize + 127) & 0xffffff80;

	if (rdatasize) {
		WARN_ON(rdatasize < 16);
		sc->virtrptr = (u8 *)sc + offset;
		sc->dmarptr = dma_addr + offset;
		sc->rdatasize = rdatasize;
		sc->status_word = (u64 *)((u8 *)(sc->virtrptr) + rdatasize - 8);
	}

	return sc;
}
EXPORT_SYMBOL_GPL(octeon_alloc_soft_command);

void octeon_free_soft_command(struct octeon_device *oct,
			      struct octeon_soft_command *sc)
{
	spin_lock_bh(&oct->sc_buf_pool.lock);

	list_add_tail(&sc->node, &oct->sc_buf_pool.head);

	atomic_dec(&oct->sc_buf_pool.alloc_buf_count);

	spin_unlock_bh(&oct->sc_buf_pool.lock);
}
EXPORT_SYMBOL_GPL(octeon_free_soft_command);