162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci 362306a36Sopenharmony_ci/* 462306a36Sopenharmony_ci * Copyright 2016-2022 HabanaLabs, Ltd. 562306a36Sopenharmony_ci * All Rights Reserved. 662306a36Sopenharmony_ci */ 762306a36Sopenharmony_ci 862306a36Sopenharmony_ci#include "habanalabs.h" 962306a36Sopenharmony_ci 1062306a36Sopenharmony_ci#include <linux/slab.h> 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci/** 1362306a36Sopenharmony_ci * struct hl_eqe_work - This structure is used to schedule work of EQ 1462306a36Sopenharmony_ci * entry and cpucp_reset event 1562306a36Sopenharmony_ci * 1662306a36Sopenharmony_ci * @eq_work: workqueue object to run when EQ entry is received 1762306a36Sopenharmony_ci * @hdev: pointer to device structure 1862306a36Sopenharmony_ci * @eq_entry: copy of the EQ entry 1962306a36Sopenharmony_ci */ 2062306a36Sopenharmony_cistruct hl_eqe_work { 2162306a36Sopenharmony_ci struct work_struct eq_work; 2262306a36Sopenharmony_ci struct hl_device *hdev; 2362306a36Sopenharmony_ci struct hl_eq_entry eq_entry; 2462306a36Sopenharmony_ci}; 2562306a36Sopenharmony_ci 2662306a36Sopenharmony_ci/** 2762306a36Sopenharmony_ci * hl_cq_inc_ptr - increment ci or pi of cq 2862306a36Sopenharmony_ci * 2962306a36Sopenharmony_ci * @ptr: the current ci or pi value of the completion queue 3062306a36Sopenharmony_ci * 3162306a36Sopenharmony_ci * Increment ptr by 1. If it reaches the number of completion queue 3262306a36Sopenharmony_ci * entries, set it to 0 3362306a36Sopenharmony_ci */ 3462306a36Sopenharmony_ciinline u32 hl_cq_inc_ptr(u32 ptr) 3562306a36Sopenharmony_ci{ 3662306a36Sopenharmony_ci ptr++; 3762306a36Sopenharmony_ci if (unlikely(ptr == HL_CQ_LENGTH)) 3862306a36Sopenharmony_ci ptr = 0; 3962306a36Sopenharmony_ci return ptr; 4062306a36Sopenharmony_ci} 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_ci/** 4362306a36Sopenharmony_ci * hl_eq_inc_ptr - increment ci of eq 4462306a36Sopenharmony_ci * 4562306a36Sopenharmony_ci * @ptr: the current ci value of the event queue 4662306a36Sopenharmony_ci * 4762306a36Sopenharmony_ci * Increment ptr by 1. If it reaches the number of event queue 4862306a36Sopenharmony_ci * entries, set it to 0 4962306a36Sopenharmony_ci */ 5062306a36Sopenharmony_cistatic inline u32 hl_eq_inc_ptr(u32 ptr) 5162306a36Sopenharmony_ci{ 5262306a36Sopenharmony_ci ptr++; 5362306a36Sopenharmony_ci if (unlikely(ptr == HL_EQ_LENGTH)) 5462306a36Sopenharmony_ci ptr = 0; 5562306a36Sopenharmony_ci return ptr; 5662306a36Sopenharmony_ci} 5762306a36Sopenharmony_ci 5862306a36Sopenharmony_cistatic void irq_handle_eqe(struct work_struct *work) 5962306a36Sopenharmony_ci{ 6062306a36Sopenharmony_ci struct hl_eqe_work *eqe_work = container_of(work, struct hl_eqe_work, 6162306a36Sopenharmony_ci eq_work); 6262306a36Sopenharmony_ci struct hl_device *hdev = eqe_work->hdev; 6362306a36Sopenharmony_ci 6462306a36Sopenharmony_ci hdev->asic_funcs->handle_eqe(hdev, &eqe_work->eq_entry); 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_ci kfree(eqe_work); 6762306a36Sopenharmony_ci} 6862306a36Sopenharmony_ci 6962306a36Sopenharmony_ci/** 7062306a36Sopenharmony_ci * job_finish - queue job finish work 7162306a36Sopenharmony_ci * 7262306a36Sopenharmony_ci * @hdev: pointer to device structure 7362306a36Sopenharmony_ci * @cs_seq: command submission sequence 7462306a36Sopenharmony_ci * @cq: completion queue 7562306a36Sopenharmony_ci * @timestamp: interrupt timestamp 7662306a36Sopenharmony_ci * 7762306a36Sopenharmony_ci */ 7862306a36Sopenharmony_cistatic void job_finish(struct hl_device *hdev, u32 cs_seq, struct hl_cq *cq, ktime_t timestamp) 7962306a36Sopenharmony_ci{ 8062306a36Sopenharmony_ci struct hl_hw_queue *queue; 8162306a36Sopenharmony_ci struct hl_cs_job *job; 8262306a36Sopenharmony_ci 8362306a36Sopenharmony_ci queue = &hdev->kernel_queues[cq->hw_queue_id]; 8462306a36Sopenharmony_ci job = queue->shadow_queue[hl_pi_2_offset(cs_seq)]; 8562306a36Sopenharmony_ci job->timestamp = timestamp; 8662306a36Sopenharmony_ci queue_work(hdev->cq_wq[cq->cq_idx], &job->finish_work); 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci atomic_inc(&queue->ci); 8962306a36Sopenharmony_ci} 9062306a36Sopenharmony_ci 9162306a36Sopenharmony_ci/** 9262306a36Sopenharmony_ci * cs_finish - queue all cs jobs finish work 9362306a36Sopenharmony_ci * 9462306a36Sopenharmony_ci * @hdev: pointer to device structure 9562306a36Sopenharmony_ci * @cs_seq: command submission sequence 9662306a36Sopenharmony_ci * @timestamp: interrupt timestamp 9762306a36Sopenharmony_ci * 9862306a36Sopenharmony_ci */ 9962306a36Sopenharmony_cistatic void cs_finish(struct hl_device *hdev, u16 cs_seq, ktime_t timestamp) 10062306a36Sopenharmony_ci{ 10162306a36Sopenharmony_ci struct asic_fixed_properties *prop = &hdev->asic_prop; 10262306a36Sopenharmony_ci struct hl_hw_queue *queue; 10362306a36Sopenharmony_ci struct hl_cs *cs; 10462306a36Sopenharmony_ci struct hl_cs_job *job; 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_ci cs = hdev->shadow_cs_queue[cs_seq & (prop->max_pending_cs - 1)]; 10762306a36Sopenharmony_ci if (!cs) { 10862306a36Sopenharmony_ci dev_warn(hdev->dev, 10962306a36Sopenharmony_ci "No pointer to CS in shadow array at index %d\n", 11062306a36Sopenharmony_ci cs_seq); 11162306a36Sopenharmony_ci return; 11262306a36Sopenharmony_ci } 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_ci list_for_each_entry(job, &cs->job_list, cs_node) { 11562306a36Sopenharmony_ci queue = &hdev->kernel_queues[job->hw_queue_id]; 11662306a36Sopenharmony_ci atomic_inc(&queue->ci); 11762306a36Sopenharmony_ci } 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci cs->completion_timestamp = timestamp; 12062306a36Sopenharmony_ci queue_work(hdev->cs_cmplt_wq, &cs->finish_work); 12162306a36Sopenharmony_ci} 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_ci/** 12462306a36Sopenharmony_ci * hl_irq_handler_cq - irq handler for completion queue 12562306a36Sopenharmony_ci * 12662306a36Sopenharmony_ci * @irq: irq number 12762306a36Sopenharmony_ci * @arg: pointer to completion queue structure 12862306a36Sopenharmony_ci * 12962306a36Sopenharmony_ci */ 13062306a36Sopenharmony_ciirqreturn_t hl_irq_handler_cq(int irq, void *arg) 13162306a36Sopenharmony_ci{ 13262306a36Sopenharmony_ci struct hl_cq *cq = arg; 13362306a36Sopenharmony_ci struct hl_device *hdev = cq->hdev; 13462306a36Sopenharmony_ci bool shadow_index_valid, entry_ready; 13562306a36Sopenharmony_ci u16 shadow_index; 13662306a36Sopenharmony_ci struct hl_cq_entry *cq_entry, *cq_base; 13762306a36Sopenharmony_ci ktime_t timestamp = ktime_get(); 13862306a36Sopenharmony_ci 13962306a36Sopenharmony_ci if (hdev->disabled) { 14062306a36Sopenharmony_ci dev_dbg(hdev->dev, 14162306a36Sopenharmony_ci "Device disabled but received IRQ %d for CQ %d\n", 14262306a36Sopenharmony_ci irq, cq->hw_queue_id); 14362306a36Sopenharmony_ci return IRQ_HANDLED; 14462306a36Sopenharmony_ci } 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci cq_base = cq->kernel_address; 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_ci while (1) { 14962306a36Sopenharmony_ci cq_entry = (struct hl_cq_entry *) &cq_base[cq->ci]; 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci entry_ready = !!FIELD_GET(CQ_ENTRY_READY_MASK, 15262306a36Sopenharmony_ci le32_to_cpu(cq_entry->data)); 15362306a36Sopenharmony_ci if (!entry_ready) 15462306a36Sopenharmony_ci break; 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_ci /* Make sure we read CQ entry contents after we've 15762306a36Sopenharmony_ci * checked the ownership bit. 15862306a36Sopenharmony_ci */ 15962306a36Sopenharmony_ci dma_rmb(); 16062306a36Sopenharmony_ci 16162306a36Sopenharmony_ci shadow_index_valid = 16262306a36Sopenharmony_ci !!FIELD_GET(CQ_ENTRY_SHADOW_INDEX_VALID_MASK, 16362306a36Sopenharmony_ci le32_to_cpu(cq_entry->data)); 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci shadow_index = FIELD_GET(CQ_ENTRY_SHADOW_INDEX_MASK, 16662306a36Sopenharmony_ci le32_to_cpu(cq_entry->data)); 16762306a36Sopenharmony_ci 16862306a36Sopenharmony_ci /* 16962306a36Sopenharmony_ci * CQ interrupt handler has 2 modes of operation: 17062306a36Sopenharmony_ci * 1. Interrupt per CS completion: (Single CQ for all queues) 17162306a36Sopenharmony_ci * CQ entry represents a completed CS 17262306a36Sopenharmony_ci * 17362306a36Sopenharmony_ci * 2. Interrupt per CS job completion in queue: (CQ per queue) 17462306a36Sopenharmony_ci * CQ entry represents a completed job in a certain queue 17562306a36Sopenharmony_ci */ 17662306a36Sopenharmony_ci if (shadow_index_valid && !hdev->disabled) { 17762306a36Sopenharmony_ci if (hdev->asic_prop.completion_mode == 17862306a36Sopenharmony_ci HL_COMPLETION_MODE_CS) 17962306a36Sopenharmony_ci cs_finish(hdev, shadow_index, timestamp); 18062306a36Sopenharmony_ci else 18162306a36Sopenharmony_ci job_finish(hdev, shadow_index, cq, timestamp); 18262306a36Sopenharmony_ci } 18362306a36Sopenharmony_ci 18462306a36Sopenharmony_ci /* Clear CQ entry ready bit */ 18562306a36Sopenharmony_ci cq_entry->data = cpu_to_le32(le32_to_cpu(cq_entry->data) & 18662306a36Sopenharmony_ci ~CQ_ENTRY_READY_MASK); 18762306a36Sopenharmony_ci 18862306a36Sopenharmony_ci cq->ci = hl_cq_inc_ptr(cq->ci); 18962306a36Sopenharmony_ci 19062306a36Sopenharmony_ci /* Increment free slots */ 19162306a36Sopenharmony_ci atomic_inc(&cq->free_slots_cnt); 19262306a36Sopenharmony_ci } 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci return IRQ_HANDLED; 19562306a36Sopenharmony_ci} 19662306a36Sopenharmony_ci 19762306a36Sopenharmony_ci/* 19862306a36Sopenharmony_ci * hl_ts_free_objects - handler of the free objects workqueue. 19962306a36Sopenharmony_ci * This function should put refcount to objects that the registration node 20062306a36Sopenharmony_ci * took refcount to them. 20162306a36Sopenharmony_ci * @work: workqueue object pointer 20262306a36Sopenharmony_ci */ 20362306a36Sopenharmony_cistatic void hl_ts_free_objects(struct work_struct *work) 20462306a36Sopenharmony_ci{ 20562306a36Sopenharmony_ci struct timestamp_reg_work_obj *job = 20662306a36Sopenharmony_ci container_of(work, struct timestamp_reg_work_obj, free_obj); 20762306a36Sopenharmony_ci struct timestamp_reg_free_node *free_obj, *temp_free_obj; 20862306a36Sopenharmony_ci struct list_head *free_list_head = job->free_obj_head; 20962306a36Sopenharmony_ci struct hl_device *hdev = job->hdev; 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci list_for_each_entry_safe(free_obj, temp_free_obj, free_list_head, free_objects_node) { 21262306a36Sopenharmony_ci dev_dbg(hdev->dev, "About to put refcount to buf (%p) cq_cb(%p)\n", 21362306a36Sopenharmony_ci free_obj->buf, 21462306a36Sopenharmony_ci free_obj->cq_cb); 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_ci hl_mmap_mem_buf_put(free_obj->buf); 21762306a36Sopenharmony_ci hl_cb_put(free_obj->cq_cb); 21862306a36Sopenharmony_ci kfree(free_obj); 21962306a36Sopenharmony_ci } 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci kfree(free_list_head); 22262306a36Sopenharmony_ci kfree(job); 22362306a36Sopenharmony_ci} 22462306a36Sopenharmony_ci 22562306a36Sopenharmony_ci/* 22662306a36Sopenharmony_ci * This function called with spin_lock of wait_list_lock taken 22762306a36Sopenharmony_ci * This function will set timestamp and delete the registration node from the 22862306a36Sopenharmony_ci * wait_list_lock. 22962306a36Sopenharmony_ci * and since we're protected with spin_lock here, so we cannot just put the refcount 23062306a36Sopenharmony_ci * for the objects here, since the release function may be called and it's also a long 23162306a36Sopenharmony_ci * logic (which might sleep also) that cannot be handled in irq context. 23262306a36Sopenharmony_ci * so here we'll be filling a list with nodes of "put" jobs and then will send this 23362306a36Sopenharmony_ci * list to a dedicated workqueue to do the actual put. 23462306a36Sopenharmony_ci */ 23562306a36Sopenharmony_cistatic int handle_registration_node(struct hl_device *hdev, struct hl_user_pending_interrupt *pend, 23662306a36Sopenharmony_ci struct list_head **free_list, ktime_t now) 23762306a36Sopenharmony_ci{ 23862306a36Sopenharmony_ci struct timestamp_reg_free_node *free_node; 23962306a36Sopenharmony_ci u64 timestamp; 24062306a36Sopenharmony_ci 24162306a36Sopenharmony_ci if (!(*free_list)) { 24262306a36Sopenharmony_ci /* Alloc/Init the timestamp registration free objects list */ 24362306a36Sopenharmony_ci *free_list = kmalloc(sizeof(struct list_head), GFP_ATOMIC); 24462306a36Sopenharmony_ci if (!(*free_list)) 24562306a36Sopenharmony_ci return -ENOMEM; 24662306a36Sopenharmony_ci 24762306a36Sopenharmony_ci INIT_LIST_HEAD(*free_list); 24862306a36Sopenharmony_ci } 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_ci free_node = kmalloc(sizeof(*free_node), GFP_ATOMIC); 25162306a36Sopenharmony_ci if (!free_node) 25262306a36Sopenharmony_ci return -ENOMEM; 25362306a36Sopenharmony_ci 25462306a36Sopenharmony_ci timestamp = ktime_to_ns(now); 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci *pend->ts_reg_info.timestamp_kernel_addr = timestamp; 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_ci dev_dbg(hdev->dev, "Timestamp is set to ts cb address (%p), ts: 0x%llx\n", 25962306a36Sopenharmony_ci pend->ts_reg_info.timestamp_kernel_addr, 26062306a36Sopenharmony_ci *(u64 *)pend->ts_reg_info.timestamp_kernel_addr); 26162306a36Sopenharmony_ci 26262306a36Sopenharmony_ci list_del(&pend->wait_list_node); 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci /* Mark kernel CB node as free */ 26562306a36Sopenharmony_ci pend->ts_reg_info.in_use = 0; 26662306a36Sopenharmony_ci 26762306a36Sopenharmony_ci /* Putting the refcount for ts_buff and cq_cb objects will be handled 26862306a36Sopenharmony_ci * in workqueue context, just add job to free_list. 26962306a36Sopenharmony_ci */ 27062306a36Sopenharmony_ci free_node->buf = pend->ts_reg_info.buf; 27162306a36Sopenharmony_ci free_node->cq_cb = pend->ts_reg_info.cq_cb; 27262306a36Sopenharmony_ci list_add(&free_node->free_objects_node, *free_list); 27362306a36Sopenharmony_ci 27462306a36Sopenharmony_ci return 0; 27562306a36Sopenharmony_ci} 27662306a36Sopenharmony_ci 27762306a36Sopenharmony_cistatic void handle_user_interrupt(struct hl_device *hdev, struct hl_user_interrupt *intr) 27862306a36Sopenharmony_ci{ 27962306a36Sopenharmony_ci struct hl_user_pending_interrupt *pend, *temp_pend; 28062306a36Sopenharmony_ci struct list_head *ts_reg_free_list_head = NULL; 28162306a36Sopenharmony_ci struct timestamp_reg_work_obj *job; 28262306a36Sopenharmony_ci bool reg_node_handle_fail = false; 28362306a36Sopenharmony_ci int rc; 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci /* For registration nodes: 28662306a36Sopenharmony_ci * As part of handling the registration nodes, we should put refcount to 28762306a36Sopenharmony_ci * some objects. the problem is that we cannot do that under spinlock 28862306a36Sopenharmony_ci * or in irq handler context at all (since release functions are long and 28962306a36Sopenharmony_ci * might sleep), so we will need to handle that part in workqueue context. 29062306a36Sopenharmony_ci * To avoid handling kmalloc failure which compels us rolling back actions 29162306a36Sopenharmony_ci * and move nodes hanged on the free list back to the interrupt wait list 29262306a36Sopenharmony_ci * we always alloc the job of the WQ at the beginning. 29362306a36Sopenharmony_ci */ 29462306a36Sopenharmony_ci job = kmalloc(sizeof(*job), GFP_ATOMIC); 29562306a36Sopenharmony_ci if (!job) 29662306a36Sopenharmony_ci return; 29762306a36Sopenharmony_ci 29862306a36Sopenharmony_ci spin_lock(&intr->wait_list_lock); 29962306a36Sopenharmony_ci list_for_each_entry_safe(pend, temp_pend, &intr->wait_list_head, wait_list_node) { 30062306a36Sopenharmony_ci if ((pend->cq_kernel_addr && *(pend->cq_kernel_addr) >= pend->cq_target_value) || 30162306a36Sopenharmony_ci !pend->cq_kernel_addr) { 30262306a36Sopenharmony_ci if (pend->ts_reg_info.buf) { 30362306a36Sopenharmony_ci if (!reg_node_handle_fail) { 30462306a36Sopenharmony_ci rc = handle_registration_node(hdev, pend, 30562306a36Sopenharmony_ci &ts_reg_free_list_head, intr->timestamp); 30662306a36Sopenharmony_ci if (rc) 30762306a36Sopenharmony_ci reg_node_handle_fail = true; 30862306a36Sopenharmony_ci } 30962306a36Sopenharmony_ci } else { 31062306a36Sopenharmony_ci /* Handle wait target value node */ 31162306a36Sopenharmony_ci pend->fence.timestamp = intr->timestamp; 31262306a36Sopenharmony_ci complete_all(&pend->fence.completion); 31362306a36Sopenharmony_ci } 31462306a36Sopenharmony_ci } 31562306a36Sopenharmony_ci } 31662306a36Sopenharmony_ci spin_unlock(&intr->wait_list_lock); 31762306a36Sopenharmony_ci 31862306a36Sopenharmony_ci if (ts_reg_free_list_head) { 31962306a36Sopenharmony_ci INIT_WORK(&job->free_obj, hl_ts_free_objects); 32062306a36Sopenharmony_ci job->free_obj_head = ts_reg_free_list_head; 32162306a36Sopenharmony_ci job->hdev = hdev; 32262306a36Sopenharmony_ci queue_work(hdev->ts_free_obj_wq, &job->free_obj); 32362306a36Sopenharmony_ci } else { 32462306a36Sopenharmony_ci kfree(job); 32562306a36Sopenharmony_ci } 32662306a36Sopenharmony_ci} 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_cistatic void handle_tpc_interrupt(struct hl_device *hdev) 32962306a36Sopenharmony_ci{ 33062306a36Sopenharmony_ci u64 event_mask; 33162306a36Sopenharmony_ci u32 flags; 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_ci event_mask = HL_NOTIFIER_EVENT_TPC_ASSERT | 33462306a36Sopenharmony_ci HL_NOTIFIER_EVENT_USER_ENGINE_ERR | 33562306a36Sopenharmony_ci HL_NOTIFIER_EVENT_DEVICE_RESET; 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_ci flags = HL_DRV_RESET_DELAY; 33862306a36Sopenharmony_ci 33962306a36Sopenharmony_ci dev_err_ratelimited(hdev->dev, "Received TPC assert\n"); 34062306a36Sopenharmony_ci hl_device_cond_reset(hdev, flags, event_mask); 34162306a36Sopenharmony_ci} 34262306a36Sopenharmony_ci 34362306a36Sopenharmony_cistatic void handle_unexpected_user_interrupt(struct hl_device *hdev) 34462306a36Sopenharmony_ci{ 34562306a36Sopenharmony_ci dev_err_ratelimited(hdev->dev, "Received unexpected user error interrupt\n"); 34662306a36Sopenharmony_ci} 34762306a36Sopenharmony_ci 34862306a36Sopenharmony_ci/** 34962306a36Sopenharmony_ci * hl_irq_handler_user_interrupt - irq handler for user interrupts 35062306a36Sopenharmony_ci * 35162306a36Sopenharmony_ci * @irq: irq number 35262306a36Sopenharmony_ci * @arg: pointer to user interrupt structure 35362306a36Sopenharmony_ci * 35462306a36Sopenharmony_ci */ 35562306a36Sopenharmony_ciirqreturn_t hl_irq_handler_user_interrupt(int irq, void *arg) 35662306a36Sopenharmony_ci{ 35762306a36Sopenharmony_ci struct hl_user_interrupt *user_int = arg; 35862306a36Sopenharmony_ci 35962306a36Sopenharmony_ci user_int->timestamp = ktime_get(); 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci return IRQ_WAKE_THREAD; 36262306a36Sopenharmony_ci} 36362306a36Sopenharmony_ci 36462306a36Sopenharmony_ci/** 36562306a36Sopenharmony_ci * hl_irq_user_interrupt_thread_handler - irq thread handler for user interrupts. 36662306a36Sopenharmony_ci * This function is invoked by threaded irq mechanism 36762306a36Sopenharmony_ci * 36862306a36Sopenharmony_ci * @irq: irq number 36962306a36Sopenharmony_ci * @arg: pointer to user interrupt structure 37062306a36Sopenharmony_ci * 37162306a36Sopenharmony_ci */ 37262306a36Sopenharmony_ciirqreturn_t hl_irq_user_interrupt_thread_handler(int irq, void *arg) 37362306a36Sopenharmony_ci{ 37462306a36Sopenharmony_ci struct hl_user_interrupt *user_int = arg; 37562306a36Sopenharmony_ci struct hl_device *hdev = user_int->hdev; 37662306a36Sopenharmony_ci 37762306a36Sopenharmony_ci switch (user_int->type) { 37862306a36Sopenharmony_ci case HL_USR_INTERRUPT_CQ: 37962306a36Sopenharmony_ci handle_user_interrupt(hdev, &hdev->common_user_cq_interrupt); 38062306a36Sopenharmony_ci 38162306a36Sopenharmony_ci /* Handle user cq interrupt registered on this specific irq */ 38262306a36Sopenharmony_ci handle_user_interrupt(hdev, user_int); 38362306a36Sopenharmony_ci break; 38462306a36Sopenharmony_ci case HL_USR_INTERRUPT_DECODER: 38562306a36Sopenharmony_ci handle_user_interrupt(hdev, &hdev->common_decoder_interrupt); 38662306a36Sopenharmony_ci 38762306a36Sopenharmony_ci /* Handle decoder interrupt registered on this specific irq */ 38862306a36Sopenharmony_ci handle_user_interrupt(hdev, user_int); 38962306a36Sopenharmony_ci break; 39062306a36Sopenharmony_ci case HL_USR_INTERRUPT_TPC: 39162306a36Sopenharmony_ci handle_tpc_interrupt(hdev); 39262306a36Sopenharmony_ci break; 39362306a36Sopenharmony_ci case HL_USR_INTERRUPT_UNEXPECTED: 39462306a36Sopenharmony_ci handle_unexpected_user_interrupt(hdev); 39562306a36Sopenharmony_ci break; 39662306a36Sopenharmony_ci default: 39762306a36Sopenharmony_ci break; 39862306a36Sopenharmony_ci } 39962306a36Sopenharmony_ci 40062306a36Sopenharmony_ci return IRQ_HANDLED; 40162306a36Sopenharmony_ci} 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci/** 40462306a36Sopenharmony_ci * hl_irq_handler_eq - irq handler for event queue 40562306a36Sopenharmony_ci * 40662306a36Sopenharmony_ci * @irq: irq number 40762306a36Sopenharmony_ci * @arg: pointer to event queue structure 40862306a36Sopenharmony_ci * 40962306a36Sopenharmony_ci */ 41062306a36Sopenharmony_ciirqreturn_t hl_irq_handler_eq(int irq, void *arg) 41162306a36Sopenharmony_ci{ 41262306a36Sopenharmony_ci struct hl_eq *eq = arg; 41362306a36Sopenharmony_ci struct hl_device *hdev = eq->hdev; 41462306a36Sopenharmony_ci struct hl_eq_entry *eq_entry; 41562306a36Sopenharmony_ci struct hl_eq_entry *eq_base; 41662306a36Sopenharmony_ci struct hl_eqe_work *handle_eqe_work; 41762306a36Sopenharmony_ci bool entry_ready; 41862306a36Sopenharmony_ci u32 cur_eqe, ctl; 41962306a36Sopenharmony_ci u16 cur_eqe_index, event_type; 42062306a36Sopenharmony_ci 42162306a36Sopenharmony_ci eq_base = eq->kernel_address; 42262306a36Sopenharmony_ci 42362306a36Sopenharmony_ci while (1) { 42462306a36Sopenharmony_ci cur_eqe = le32_to_cpu(eq_base[eq->ci].hdr.ctl); 42562306a36Sopenharmony_ci entry_ready = !!FIELD_GET(EQ_CTL_READY_MASK, cur_eqe); 42662306a36Sopenharmony_ci 42762306a36Sopenharmony_ci if (!entry_ready) 42862306a36Sopenharmony_ci break; 42962306a36Sopenharmony_ci 43062306a36Sopenharmony_ci cur_eqe_index = FIELD_GET(EQ_CTL_INDEX_MASK, cur_eqe); 43162306a36Sopenharmony_ci if ((hdev->event_queue.check_eqe_index) && 43262306a36Sopenharmony_ci (((eq->prev_eqe_index + 1) & EQ_CTL_INDEX_MASK) != cur_eqe_index)) { 43362306a36Sopenharmony_ci dev_err(hdev->dev, 43462306a36Sopenharmony_ci "EQE %#x in queue is ready but index does not match %d!=%d", 43562306a36Sopenharmony_ci cur_eqe, 43662306a36Sopenharmony_ci ((eq->prev_eqe_index + 1) & EQ_CTL_INDEX_MASK), 43762306a36Sopenharmony_ci cur_eqe_index); 43862306a36Sopenharmony_ci break; 43962306a36Sopenharmony_ci } 44062306a36Sopenharmony_ci 44162306a36Sopenharmony_ci eq->prev_eqe_index++; 44262306a36Sopenharmony_ci 44362306a36Sopenharmony_ci eq_entry = &eq_base[eq->ci]; 44462306a36Sopenharmony_ci 44562306a36Sopenharmony_ci /* 44662306a36Sopenharmony_ci * Make sure we read EQ entry contents after we've 44762306a36Sopenharmony_ci * checked the ownership bit. 44862306a36Sopenharmony_ci */ 44962306a36Sopenharmony_ci dma_rmb(); 45062306a36Sopenharmony_ci 45162306a36Sopenharmony_ci if (hdev->disabled && !hdev->reset_info.in_compute_reset) { 45262306a36Sopenharmony_ci ctl = le32_to_cpu(eq_entry->hdr.ctl); 45362306a36Sopenharmony_ci event_type = ((ctl & EQ_CTL_EVENT_TYPE_MASK) >> EQ_CTL_EVENT_TYPE_SHIFT); 45462306a36Sopenharmony_ci dev_warn(hdev->dev, 45562306a36Sopenharmony_ci "Device disabled but received an EQ event (%u)\n", event_type); 45662306a36Sopenharmony_ci goto skip_irq; 45762306a36Sopenharmony_ci } 45862306a36Sopenharmony_ci 45962306a36Sopenharmony_ci handle_eqe_work = kmalloc(sizeof(*handle_eqe_work), GFP_ATOMIC); 46062306a36Sopenharmony_ci if (handle_eqe_work) { 46162306a36Sopenharmony_ci INIT_WORK(&handle_eqe_work->eq_work, irq_handle_eqe); 46262306a36Sopenharmony_ci handle_eqe_work->hdev = hdev; 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_ci memcpy(&handle_eqe_work->eq_entry, eq_entry, 46562306a36Sopenharmony_ci sizeof(*eq_entry)); 46662306a36Sopenharmony_ci 46762306a36Sopenharmony_ci queue_work(hdev->eq_wq, &handle_eqe_work->eq_work); 46862306a36Sopenharmony_ci } 46962306a36Sopenharmony_ciskip_irq: 47062306a36Sopenharmony_ci /* Clear EQ entry ready bit */ 47162306a36Sopenharmony_ci eq_entry->hdr.ctl = 47262306a36Sopenharmony_ci cpu_to_le32(le32_to_cpu(eq_entry->hdr.ctl) & 47362306a36Sopenharmony_ci ~EQ_CTL_READY_MASK); 47462306a36Sopenharmony_ci 47562306a36Sopenharmony_ci eq->ci = hl_eq_inc_ptr(eq->ci); 47662306a36Sopenharmony_ci 47762306a36Sopenharmony_ci hdev->asic_funcs->update_eq_ci(hdev, eq->ci); 47862306a36Sopenharmony_ci } 47962306a36Sopenharmony_ci 48062306a36Sopenharmony_ci return IRQ_HANDLED; 48162306a36Sopenharmony_ci} 48262306a36Sopenharmony_ci 48362306a36Sopenharmony_ci/** 48462306a36Sopenharmony_ci * hl_irq_handler_dec_abnrm - Decoder error interrupt handler 48562306a36Sopenharmony_ci * @irq: IRQ number 48662306a36Sopenharmony_ci * @arg: pointer to decoder structure. 48762306a36Sopenharmony_ci */ 48862306a36Sopenharmony_ciirqreturn_t hl_irq_handler_dec_abnrm(int irq, void *arg) 48962306a36Sopenharmony_ci{ 49062306a36Sopenharmony_ci struct hl_dec *dec = arg; 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci schedule_work(&dec->abnrm_intr_work); 49362306a36Sopenharmony_ci 49462306a36Sopenharmony_ci return IRQ_HANDLED; 49562306a36Sopenharmony_ci} 49662306a36Sopenharmony_ci 49762306a36Sopenharmony_ci/** 49862306a36Sopenharmony_ci * hl_cq_init - main initialization function for an cq object 49962306a36Sopenharmony_ci * 50062306a36Sopenharmony_ci * @hdev: pointer to device structure 50162306a36Sopenharmony_ci * @q: pointer to cq structure 50262306a36Sopenharmony_ci * @hw_queue_id: The H/W queue ID this completion queue belongs to 50362306a36Sopenharmony_ci * HL_INVALID_QUEUE if cq is not attached to any specific queue 50462306a36Sopenharmony_ci * 50562306a36Sopenharmony_ci * Allocate dma-able memory for the completion queue and initialize fields 50662306a36Sopenharmony_ci * Returns 0 on success 50762306a36Sopenharmony_ci */ 50862306a36Sopenharmony_ciint hl_cq_init(struct hl_device *hdev, struct hl_cq *q, u32 hw_queue_id) 50962306a36Sopenharmony_ci{ 51062306a36Sopenharmony_ci void *p; 51162306a36Sopenharmony_ci 51262306a36Sopenharmony_ci p = hl_asic_dma_alloc_coherent(hdev, HL_CQ_SIZE_IN_BYTES, &q->bus_address, 51362306a36Sopenharmony_ci GFP_KERNEL | __GFP_ZERO); 51462306a36Sopenharmony_ci if (!p) 51562306a36Sopenharmony_ci return -ENOMEM; 51662306a36Sopenharmony_ci 51762306a36Sopenharmony_ci q->hdev = hdev; 51862306a36Sopenharmony_ci q->kernel_address = p; 51962306a36Sopenharmony_ci q->hw_queue_id = hw_queue_id; 52062306a36Sopenharmony_ci q->ci = 0; 52162306a36Sopenharmony_ci q->pi = 0; 52262306a36Sopenharmony_ci 52362306a36Sopenharmony_ci atomic_set(&q->free_slots_cnt, HL_CQ_LENGTH); 52462306a36Sopenharmony_ci 52562306a36Sopenharmony_ci return 0; 52662306a36Sopenharmony_ci} 52762306a36Sopenharmony_ci 52862306a36Sopenharmony_ci/** 52962306a36Sopenharmony_ci * hl_cq_fini - destroy completion queue 53062306a36Sopenharmony_ci * 53162306a36Sopenharmony_ci * @hdev: pointer to device structure 53262306a36Sopenharmony_ci * @q: pointer to cq structure 53362306a36Sopenharmony_ci * 53462306a36Sopenharmony_ci * Free the completion queue memory 53562306a36Sopenharmony_ci */ 53662306a36Sopenharmony_civoid hl_cq_fini(struct hl_device *hdev, struct hl_cq *q) 53762306a36Sopenharmony_ci{ 53862306a36Sopenharmony_ci hl_asic_dma_free_coherent(hdev, HL_CQ_SIZE_IN_BYTES, q->kernel_address, q->bus_address); 53962306a36Sopenharmony_ci} 54062306a36Sopenharmony_ci 54162306a36Sopenharmony_civoid hl_cq_reset(struct hl_device *hdev, struct hl_cq *q) 54262306a36Sopenharmony_ci{ 54362306a36Sopenharmony_ci q->ci = 0; 54462306a36Sopenharmony_ci q->pi = 0; 54562306a36Sopenharmony_ci 54662306a36Sopenharmony_ci atomic_set(&q->free_slots_cnt, HL_CQ_LENGTH); 54762306a36Sopenharmony_ci 54862306a36Sopenharmony_ci /* 54962306a36Sopenharmony_ci * It's not enough to just reset the PI/CI because the H/W may have 55062306a36Sopenharmony_ci * written valid completion entries before it was halted and therefore 55162306a36Sopenharmony_ci * we need to clean the actual queues so we won't process old entries 55262306a36Sopenharmony_ci * when the device is operational again 55362306a36Sopenharmony_ci */ 55462306a36Sopenharmony_ci 55562306a36Sopenharmony_ci memset(q->kernel_address, 0, HL_CQ_SIZE_IN_BYTES); 55662306a36Sopenharmony_ci} 55762306a36Sopenharmony_ci 55862306a36Sopenharmony_ci/** 55962306a36Sopenharmony_ci * hl_eq_init - main initialization function for an event queue object 56062306a36Sopenharmony_ci * 56162306a36Sopenharmony_ci * @hdev: pointer to device structure 56262306a36Sopenharmony_ci * @q: pointer to eq structure 56362306a36Sopenharmony_ci * 56462306a36Sopenharmony_ci * Allocate dma-able memory for the event queue and initialize fields 56562306a36Sopenharmony_ci * Returns 0 on success 56662306a36Sopenharmony_ci */ 56762306a36Sopenharmony_ciint hl_eq_init(struct hl_device *hdev, struct hl_eq *q) 56862306a36Sopenharmony_ci{ 56962306a36Sopenharmony_ci void *p; 57062306a36Sopenharmony_ci 57162306a36Sopenharmony_ci p = hl_cpu_accessible_dma_pool_alloc(hdev, HL_EQ_SIZE_IN_BYTES, &q->bus_address); 57262306a36Sopenharmony_ci if (!p) 57362306a36Sopenharmony_ci return -ENOMEM; 57462306a36Sopenharmony_ci 57562306a36Sopenharmony_ci q->hdev = hdev; 57662306a36Sopenharmony_ci q->kernel_address = p; 57762306a36Sopenharmony_ci q->ci = 0; 57862306a36Sopenharmony_ci q->prev_eqe_index = 0; 57962306a36Sopenharmony_ci 58062306a36Sopenharmony_ci return 0; 58162306a36Sopenharmony_ci} 58262306a36Sopenharmony_ci 58362306a36Sopenharmony_ci/** 58462306a36Sopenharmony_ci * hl_eq_fini - destroy event queue 58562306a36Sopenharmony_ci * 58662306a36Sopenharmony_ci * @hdev: pointer to device structure 58762306a36Sopenharmony_ci * @q: pointer to eq structure 58862306a36Sopenharmony_ci * 58962306a36Sopenharmony_ci * Free the event queue memory 59062306a36Sopenharmony_ci */ 59162306a36Sopenharmony_civoid hl_eq_fini(struct hl_device *hdev, struct hl_eq *q) 59262306a36Sopenharmony_ci{ 59362306a36Sopenharmony_ci flush_workqueue(hdev->eq_wq); 59462306a36Sopenharmony_ci 59562306a36Sopenharmony_ci hl_cpu_accessible_dma_pool_free(hdev, HL_EQ_SIZE_IN_BYTES, q->kernel_address); 59662306a36Sopenharmony_ci} 59762306a36Sopenharmony_ci 59862306a36Sopenharmony_civoid hl_eq_reset(struct hl_device *hdev, struct hl_eq *q) 59962306a36Sopenharmony_ci{ 60062306a36Sopenharmony_ci q->ci = 0; 60162306a36Sopenharmony_ci q->prev_eqe_index = 0; 60262306a36Sopenharmony_ci 60362306a36Sopenharmony_ci /* 60462306a36Sopenharmony_ci * It's not enough to just reset the PI/CI because the H/W may have 60562306a36Sopenharmony_ci * written valid completion entries before it was halted and therefore 60662306a36Sopenharmony_ci * we need to clean the actual queues so we won't process old entries 60762306a36Sopenharmony_ci * when the device is operational again 60862306a36Sopenharmony_ci */ 60962306a36Sopenharmony_ci 61062306a36Sopenharmony_ci memset(q->kernel_address, 0, HL_EQ_SIZE_IN_BYTES); 61162306a36Sopenharmony_ci} 612