162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved. 362306a36Sopenharmony_ci * Copyright (c) 2005 Mellanox Technologies. All rights reserved. 462306a36Sopenharmony_ci * Copyright (c) 2006, 2007 Cisco Systems, Inc. All rights reserved. 562306a36Sopenharmony_ci * 662306a36Sopenharmony_ci * This software is available to you under a choice of one of two 762306a36Sopenharmony_ci * licenses. You may choose to be licensed under the terms of the GNU 862306a36Sopenharmony_ci * General Public License (GPL) Version 2, available from the file 962306a36Sopenharmony_ci * COPYING in the main directory of this source tree, or the 1062306a36Sopenharmony_ci * OpenIB.org BSD license below: 1162306a36Sopenharmony_ci * 1262306a36Sopenharmony_ci * Redistribution and use in source and binary forms, with or 1362306a36Sopenharmony_ci * without modification, are permitted provided that the following 1462306a36Sopenharmony_ci * conditions are met: 1562306a36Sopenharmony_ci * 1662306a36Sopenharmony_ci * - Redistributions of source code must retain the above 1762306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 1862306a36Sopenharmony_ci * disclaimer. 1962306a36Sopenharmony_ci * 2062306a36Sopenharmony_ci * - Redistributions in binary form must reproduce the above 2162306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 2262306a36Sopenharmony_ci * disclaimer in the documentation and/or other materials 2362306a36Sopenharmony_ci * provided with the distribution. 2462306a36Sopenharmony_ci * 2562306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 2662306a36Sopenharmony_ci * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 2762306a36Sopenharmony_ci * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 2862306a36Sopenharmony_ci * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 2962306a36Sopenharmony_ci * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 3062306a36Sopenharmony_ci * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 3162306a36Sopenharmony_ci * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 3262306a36Sopenharmony_ci * SOFTWARE. 3362306a36Sopenharmony_ci */ 3462306a36Sopenharmony_ci 3562306a36Sopenharmony_ci#include <linux/slab.h> 3662306a36Sopenharmony_ci 3762306a36Sopenharmony_ci#include "mlx4.h" 3862306a36Sopenharmony_ci#include "fw.h" 3962306a36Sopenharmony_ci 4062306a36Sopenharmony_cienum { 4162306a36Sopenharmony_ci MLX4_RES_QP, 4262306a36Sopenharmony_ci MLX4_RES_RDMARC, 4362306a36Sopenharmony_ci MLX4_RES_ALTC, 4462306a36Sopenharmony_ci MLX4_RES_AUXC, 4562306a36Sopenharmony_ci MLX4_RES_SRQ, 4662306a36Sopenharmony_ci MLX4_RES_CQ, 4762306a36Sopenharmony_ci MLX4_RES_EQ, 4862306a36Sopenharmony_ci MLX4_RES_DMPT, 4962306a36Sopenharmony_ci MLX4_RES_CMPT, 5062306a36Sopenharmony_ci MLX4_RES_MTT, 5162306a36Sopenharmony_ci MLX4_RES_MCG, 5262306a36Sopenharmony_ci MLX4_RES_NUM 5362306a36Sopenharmony_ci}; 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_cistatic const char *res_name[] = { 5662306a36Sopenharmony_ci [MLX4_RES_QP] = "QP", 5762306a36Sopenharmony_ci [MLX4_RES_RDMARC] = "RDMARC", 5862306a36Sopenharmony_ci [MLX4_RES_ALTC] = "ALTC", 5962306a36Sopenharmony_ci [MLX4_RES_AUXC] = "AUXC", 6062306a36Sopenharmony_ci [MLX4_RES_SRQ] = "SRQ", 6162306a36Sopenharmony_ci [MLX4_RES_CQ] = "CQ", 6262306a36Sopenharmony_ci [MLX4_RES_EQ] = "EQ", 6362306a36Sopenharmony_ci [MLX4_RES_DMPT] = "DMPT", 6462306a36Sopenharmony_ci [MLX4_RES_CMPT] = "CMPT", 6562306a36Sopenharmony_ci [MLX4_RES_MTT] = "MTT", 6662306a36Sopenharmony_ci [MLX4_RES_MCG] = "MCG", 6762306a36Sopenharmony_ci}; 6862306a36Sopenharmony_ci 6962306a36Sopenharmony_ciu64 mlx4_make_profile(struct mlx4_dev *dev, 7062306a36Sopenharmony_ci struct mlx4_profile *request, 7162306a36Sopenharmony_ci struct mlx4_dev_cap *dev_cap, 7262306a36Sopenharmony_ci struct mlx4_init_hca_param *init_hca) 7362306a36Sopenharmony_ci{ 7462306a36Sopenharmony_ci struct mlx4_priv *priv = mlx4_priv(dev); 7562306a36Sopenharmony_ci struct mlx4_resource { 7662306a36Sopenharmony_ci u64 size; 7762306a36Sopenharmony_ci u64 start; 7862306a36Sopenharmony_ci int type; 7962306a36Sopenharmony_ci u32 num; 8062306a36Sopenharmony_ci int log_num; 8162306a36Sopenharmony_ci }; 8262306a36Sopenharmony_ci 8362306a36Sopenharmony_ci u64 total_size = 0; 8462306a36Sopenharmony_ci struct mlx4_resource *profile; 8562306a36Sopenharmony_ci struct sysinfo si; 8662306a36Sopenharmony_ci int i, j; 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci profile = kcalloc(MLX4_RES_NUM, sizeof(*profile), GFP_KERNEL); 8962306a36Sopenharmony_ci if (!profile) 9062306a36Sopenharmony_ci return -ENOMEM; 9162306a36Sopenharmony_ci 9262306a36Sopenharmony_ci /* 9362306a36Sopenharmony_ci * We want to scale the number of MTTs with the size of the 9462306a36Sopenharmony_ci * system memory, since it makes sense to register a lot of 9562306a36Sopenharmony_ci * memory on a system with a lot of memory. As a heuristic, 9662306a36Sopenharmony_ci * make sure we have enough MTTs to cover twice the system 9762306a36Sopenharmony_ci * memory (with PAGE_SIZE entries). 9862306a36Sopenharmony_ci * 9962306a36Sopenharmony_ci * This number has to be a power of two and fit into 32 bits 10062306a36Sopenharmony_ci * due to device limitations, so cap this at 2^31 as well. 10162306a36Sopenharmony_ci * That limits us to 8TB of memory registration per HCA with 10262306a36Sopenharmony_ci * 4KB pages, which is probably OK for the next few months. 10362306a36Sopenharmony_ci */ 10462306a36Sopenharmony_ci si_meminfo(&si); 10562306a36Sopenharmony_ci request->num_mtt = 10662306a36Sopenharmony_ci roundup_pow_of_two(max_t(unsigned, request->num_mtt, 10762306a36Sopenharmony_ci min(1UL << (31 - log_mtts_per_seg), 10862306a36Sopenharmony_ci (si.totalram << 1) >> log_mtts_per_seg))); 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci 11162306a36Sopenharmony_ci profile[MLX4_RES_QP].size = dev_cap->qpc_entry_sz; 11262306a36Sopenharmony_ci profile[MLX4_RES_RDMARC].size = dev_cap->rdmarc_entry_sz; 11362306a36Sopenharmony_ci profile[MLX4_RES_ALTC].size = dev_cap->altc_entry_sz; 11462306a36Sopenharmony_ci profile[MLX4_RES_AUXC].size = dev_cap->aux_entry_sz; 11562306a36Sopenharmony_ci profile[MLX4_RES_SRQ].size = dev_cap->srq_entry_sz; 11662306a36Sopenharmony_ci profile[MLX4_RES_CQ].size = dev_cap->cqc_entry_sz; 11762306a36Sopenharmony_ci profile[MLX4_RES_EQ].size = dev_cap->eqc_entry_sz; 11862306a36Sopenharmony_ci profile[MLX4_RES_DMPT].size = dev_cap->dmpt_entry_sz; 11962306a36Sopenharmony_ci profile[MLX4_RES_CMPT].size = dev_cap->cmpt_entry_sz; 12062306a36Sopenharmony_ci profile[MLX4_RES_MTT].size = dev_cap->mtt_entry_sz; 12162306a36Sopenharmony_ci profile[MLX4_RES_MCG].size = mlx4_get_mgm_entry_size(dev); 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_ci profile[MLX4_RES_QP].num = request->num_qp; 12462306a36Sopenharmony_ci profile[MLX4_RES_RDMARC].num = request->num_qp * request->rdmarc_per_qp; 12562306a36Sopenharmony_ci profile[MLX4_RES_ALTC].num = request->num_qp; 12662306a36Sopenharmony_ci profile[MLX4_RES_AUXC].num = request->num_qp; 12762306a36Sopenharmony_ci profile[MLX4_RES_SRQ].num = request->num_srq; 12862306a36Sopenharmony_ci profile[MLX4_RES_CQ].num = request->num_cq; 12962306a36Sopenharmony_ci profile[MLX4_RES_EQ].num = mlx4_is_mfunc(dev) ? dev->phys_caps.num_phys_eqs : 13062306a36Sopenharmony_ci min_t(unsigned, dev_cap->max_eqs, MAX_MSIX); 13162306a36Sopenharmony_ci profile[MLX4_RES_DMPT].num = request->num_mpt; 13262306a36Sopenharmony_ci profile[MLX4_RES_CMPT].num = MLX4_NUM_CMPTS; 13362306a36Sopenharmony_ci profile[MLX4_RES_MTT].num = request->num_mtt * (1 << log_mtts_per_seg); 13462306a36Sopenharmony_ci profile[MLX4_RES_MCG].num = request->num_mcg; 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci for (i = 0; i < MLX4_RES_NUM; ++i) { 13762306a36Sopenharmony_ci profile[i].type = i; 13862306a36Sopenharmony_ci profile[i].num = roundup_pow_of_two(profile[i].num); 13962306a36Sopenharmony_ci profile[i].log_num = ilog2(profile[i].num); 14062306a36Sopenharmony_ci profile[i].size *= profile[i].num; 14162306a36Sopenharmony_ci profile[i].size = max(profile[i].size, (u64) PAGE_SIZE); 14262306a36Sopenharmony_ci } 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_ci /* 14562306a36Sopenharmony_ci * Sort the resources in decreasing order of size. Since they 14662306a36Sopenharmony_ci * all have sizes that are powers of 2, we'll be able to keep 14762306a36Sopenharmony_ci * resources aligned to their size and pack them without gaps 14862306a36Sopenharmony_ci * using the sorted order. 14962306a36Sopenharmony_ci */ 15062306a36Sopenharmony_ci for (i = MLX4_RES_NUM; i > 0; --i) 15162306a36Sopenharmony_ci for (j = 1; j < i; ++j) { 15262306a36Sopenharmony_ci if (profile[j].size > profile[j - 1].size) 15362306a36Sopenharmony_ci swap(profile[j], profile[j - 1]); 15462306a36Sopenharmony_ci } 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_ci for (i = 0; i < MLX4_RES_NUM; ++i) { 15762306a36Sopenharmony_ci if (profile[i].size) { 15862306a36Sopenharmony_ci profile[i].start = total_size; 15962306a36Sopenharmony_ci total_size += profile[i].size; 16062306a36Sopenharmony_ci } 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci if (total_size > dev_cap->max_icm_sz) { 16362306a36Sopenharmony_ci mlx4_err(dev, "Profile requires 0x%llx bytes; won't fit in 0x%llx bytes of context memory\n", 16462306a36Sopenharmony_ci (unsigned long long) total_size, 16562306a36Sopenharmony_ci (unsigned long long) dev_cap->max_icm_sz); 16662306a36Sopenharmony_ci kfree(profile); 16762306a36Sopenharmony_ci return -ENOMEM; 16862306a36Sopenharmony_ci } 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci if (profile[i].size) 17162306a36Sopenharmony_ci mlx4_dbg(dev, " profile[%2d] (%6s): 2^%02d entries @ 0x%10llx, size 0x%10llx\n", 17262306a36Sopenharmony_ci i, res_name[profile[i].type], 17362306a36Sopenharmony_ci profile[i].log_num, 17462306a36Sopenharmony_ci (unsigned long long) profile[i].start, 17562306a36Sopenharmony_ci (unsigned long long) profile[i].size); 17662306a36Sopenharmony_ci } 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci mlx4_dbg(dev, "HCA context memory: reserving %d KB\n", 17962306a36Sopenharmony_ci (int) (total_size >> 10)); 18062306a36Sopenharmony_ci 18162306a36Sopenharmony_ci for (i = 0; i < MLX4_RES_NUM; ++i) { 18262306a36Sopenharmony_ci switch (profile[i].type) { 18362306a36Sopenharmony_ci case MLX4_RES_QP: 18462306a36Sopenharmony_ci dev->caps.num_qps = profile[i].num; 18562306a36Sopenharmony_ci init_hca->qpc_base = profile[i].start; 18662306a36Sopenharmony_ci init_hca->log_num_qps = profile[i].log_num; 18762306a36Sopenharmony_ci break; 18862306a36Sopenharmony_ci case MLX4_RES_RDMARC: 18962306a36Sopenharmony_ci for (priv->qp_table.rdmarc_shift = 0; 19062306a36Sopenharmony_ci request->num_qp << priv->qp_table.rdmarc_shift < profile[i].num; 19162306a36Sopenharmony_ci ++priv->qp_table.rdmarc_shift) 19262306a36Sopenharmony_ci ; /* nothing */ 19362306a36Sopenharmony_ci dev->caps.max_qp_dest_rdma = 1 << priv->qp_table.rdmarc_shift; 19462306a36Sopenharmony_ci priv->qp_table.rdmarc_base = (u32) profile[i].start; 19562306a36Sopenharmony_ci init_hca->rdmarc_base = profile[i].start; 19662306a36Sopenharmony_ci init_hca->log_rd_per_qp = priv->qp_table.rdmarc_shift; 19762306a36Sopenharmony_ci break; 19862306a36Sopenharmony_ci case MLX4_RES_ALTC: 19962306a36Sopenharmony_ci init_hca->altc_base = profile[i].start; 20062306a36Sopenharmony_ci break; 20162306a36Sopenharmony_ci case MLX4_RES_AUXC: 20262306a36Sopenharmony_ci init_hca->auxc_base = profile[i].start; 20362306a36Sopenharmony_ci break; 20462306a36Sopenharmony_ci case MLX4_RES_SRQ: 20562306a36Sopenharmony_ci dev->caps.num_srqs = profile[i].num; 20662306a36Sopenharmony_ci init_hca->srqc_base = profile[i].start; 20762306a36Sopenharmony_ci init_hca->log_num_srqs = profile[i].log_num; 20862306a36Sopenharmony_ci break; 20962306a36Sopenharmony_ci case MLX4_RES_CQ: 21062306a36Sopenharmony_ci dev->caps.num_cqs = profile[i].num; 21162306a36Sopenharmony_ci init_hca->cqc_base = profile[i].start; 21262306a36Sopenharmony_ci init_hca->log_num_cqs = profile[i].log_num; 21362306a36Sopenharmony_ci break; 21462306a36Sopenharmony_ci case MLX4_RES_EQ: 21562306a36Sopenharmony_ci if (dev_cap->flags2 & MLX4_DEV_CAP_FLAG2_SYS_EQS) { 21662306a36Sopenharmony_ci init_hca->log_num_eqs = 0x1f; 21762306a36Sopenharmony_ci init_hca->eqc_base = profile[i].start; 21862306a36Sopenharmony_ci init_hca->num_sys_eqs = dev_cap->num_sys_eqs; 21962306a36Sopenharmony_ci } else { 22062306a36Sopenharmony_ci dev->caps.num_eqs = roundup_pow_of_two( 22162306a36Sopenharmony_ci min_t(unsigned, 22262306a36Sopenharmony_ci dev_cap->max_eqs, 22362306a36Sopenharmony_ci MAX_MSIX)); 22462306a36Sopenharmony_ci init_hca->eqc_base = profile[i].start; 22562306a36Sopenharmony_ci init_hca->log_num_eqs = ilog2(dev->caps.num_eqs); 22662306a36Sopenharmony_ci } 22762306a36Sopenharmony_ci break; 22862306a36Sopenharmony_ci case MLX4_RES_DMPT: 22962306a36Sopenharmony_ci dev->caps.num_mpts = profile[i].num; 23062306a36Sopenharmony_ci priv->mr_table.mpt_base = profile[i].start; 23162306a36Sopenharmony_ci init_hca->dmpt_base = profile[i].start; 23262306a36Sopenharmony_ci init_hca->log_mpt_sz = profile[i].log_num; 23362306a36Sopenharmony_ci break; 23462306a36Sopenharmony_ci case MLX4_RES_CMPT: 23562306a36Sopenharmony_ci init_hca->cmpt_base = profile[i].start; 23662306a36Sopenharmony_ci break; 23762306a36Sopenharmony_ci case MLX4_RES_MTT: 23862306a36Sopenharmony_ci dev->caps.num_mtts = profile[i].num; 23962306a36Sopenharmony_ci priv->mr_table.mtt_base = profile[i].start; 24062306a36Sopenharmony_ci init_hca->mtt_base = profile[i].start; 24162306a36Sopenharmony_ci break; 24262306a36Sopenharmony_ci case MLX4_RES_MCG: 24362306a36Sopenharmony_ci init_hca->mc_base = profile[i].start; 24462306a36Sopenharmony_ci init_hca->log_mc_entry_sz = 24562306a36Sopenharmony_ci ilog2(mlx4_get_mgm_entry_size(dev)); 24662306a36Sopenharmony_ci init_hca->log_mc_table_sz = profile[i].log_num; 24762306a36Sopenharmony_ci if (dev->caps.steering_mode == 24862306a36Sopenharmony_ci MLX4_STEERING_MODE_DEVICE_MANAGED) { 24962306a36Sopenharmony_ci dev->caps.num_mgms = profile[i].num; 25062306a36Sopenharmony_ci } else { 25162306a36Sopenharmony_ci init_hca->log_mc_hash_sz = 25262306a36Sopenharmony_ci profile[i].log_num - 1; 25362306a36Sopenharmony_ci dev->caps.num_mgms = profile[i].num >> 1; 25462306a36Sopenharmony_ci dev->caps.num_amgms = profile[i].num >> 1; 25562306a36Sopenharmony_ci } 25662306a36Sopenharmony_ci break; 25762306a36Sopenharmony_ci default: 25862306a36Sopenharmony_ci break; 25962306a36Sopenharmony_ci } 26062306a36Sopenharmony_ci } 26162306a36Sopenharmony_ci 26262306a36Sopenharmony_ci /* 26362306a36Sopenharmony_ci * PDs don't take any HCA memory, but we assign them as part 26462306a36Sopenharmony_ci * of the HCA profile anyway. 26562306a36Sopenharmony_ci */ 26662306a36Sopenharmony_ci dev->caps.num_pds = MLX4_NUM_PDS; 26762306a36Sopenharmony_ci 26862306a36Sopenharmony_ci kfree(profile); 26962306a36Sopenharmony_ci return total_size; 27062306a36Sopenharmony_ci} 271