Back to home page

OSCL-LXR

 
 

    


0001 // SPDX-License-Identifier: GPL-2.0-only
0002 /*
0003  *  Copyright (C) 2017 Chelsio Communications.  All rights reserved.
0004  */
0005 
0006 #include <linux/sort.h>
0007 #include <linux/string.h>
0008 
0009 #include "t4_regs.h"
0010 #include "cxgb4.h"
0011 #include "cxgb4_cudbg.h"
0012 #include "cudbg_if.h"
0013 #include "cudbg_lib_common.h"
0014 #include "cudbg_entity.h"
0015 #include "cudbg_lib.h"
0016 #include "cudbg_zlib.h"
0017 #include "cxgb4_tc_mqprio.h"
0018 
0019 static const u32 t6_tp_pio_array[][IREG_NUM_ELEM] = {
0020     {0x7e40, 0x7e44, 0x020, 28}, /* t6_tp_pio_regs_20_to_3b */
0021     {0x7e40, 0x7e44, 0x040, 10}, /* t6_tp_pio_regs_40_to_49 */
0022     {0x7e40, 0x7e44, 0x050, 10}, /* t6_tp_pio_regs_50_to_59 */
0023     {0x7e40, 0x7e44, 0x060, 14}, /* t6_tp_pio_regs_60_to_6d */
0024     {0x7e40, 0x7e44, 0x06F, 1}, /* t6_tp_pio_regs_6f */
0025     {0x7e40, 0x7e44, 0x070, 6}, /* t6_tp_pio_regs_70_to_75 */
0026     {0x7e40, 0x7e44, 0x130, 18}, /* t6_tp_pio_regs_130_to_141 */
0027     {0x7e40, 0x7e44, 0x145, 19}, /* t6_tp_pio_regs_145_to_157 */
0028     {0x7e40, 0x7e44, 0x160, 1}, /* t6_tp_pio_regs_160 */
0029     {0x7e40, 0x7e44, 0x230, 25}, /* t6_tp_pio_regs_230_to_248 */
0030     {0x7e40, 0x7e44, 0x24a, 3}, /* t6_tp_pio_regs_24c */
0031     {0x7e40, 0x7e44, 0x8C0, 1} /* t6_tp_pio_regs_8c0 */
0032 };
0033 
0034 static const u32 t5_tp_pio_array[][IREG_NUM_ELEM] = {
0035     {0x7e40, 0x7e44, 0x020, 28}, /* t5_tp_pio_regs_20_to_3b */
0036     {0x7e40, 0x7e44, 0x040, 19}, /* t5_tp_pio_regs_40_to_52 */
0037     {0x7e40, 0x7e44, 0x054, 2}, /* t5_tp_pio_regs_54_to_55 */
0038     {0x7e40, 0x7e44, 0x060, 13}, /* t5_tp_pio_regs_60_to_6c */
0039     {0x7e40, 0x7e44, 0x06F, 1}, /* t5_tp_pio_regs_6f */
0040     {0x7e40, 0x7e44, 0x120, 4}, /* t5_tp_pio_regs_120_to_123 */
0041     {0x7e40, 0x7e44, 0x12b, 2}, /* t5_tp_pio_regs_12b_to_12c */
0042     {0x7e40, 0x7e44, 0x12f, 21}, /* t5_tp_pio_regs_12f_to_143 */
0043     {0x7e40, 0x7e44, 0x145, 19}, /* t5_tp_pio_regs_145_to_157 */
0044     {0x7e40, 0x7e44, 0x230, 25}, /* t5_tp_pio_regs_230_to_248 */
0045     {0x7e40, 0x7e44, 0x8C0, 1} /* t5_tp_pio_regs_8c0 */
0046 };
0047 
0048 static const u32 t6_tp_tm_pio_array[][IREG_NUM_ELEM] = {
0049     {0x7e18, 0x7e1c, 0x0, 12}
0050 };
0051 
0052 static const u32 t5_tp_tm_pio_array[][IREG_NUM_ELEM] = {
0053     {0x7e18, 0x7e1c, 0x0, 12}
0054 };
0055 
0056 static const u32 t6_tp_mib_index_array[6][IREG_NUM_ELEM] = {
0057     {0x7e50, 0x7e54, 0x0, 13},
0058     {0x7e50, 0x7e54, 0x10, 6},
0059     {0x7e50, 0x7e54, 0x18, 21},
0060     {0x7e50, 0x7e54, 0x30, 32},
0061     {0x7e50, 0x7e54, 0x50, 22},
0062     {0x7e50, 0x7e54, 0x68, 12}
0063 };
0064 
0065 static const u32 t5_tp_mib_index_array[9][IREG_NUM_ELEM] = {
0066     {0x7e50, 0x7e54, 0x0, 13},
0067     {0x7e50, 0x7e54, 0x10, 6},
0068     {0x7e50, 0x7e54, 0x18, 8},
0069     {0x7e50, 0x7e54, 0x20, 13},
0070     {0x7e50, 0x7e54, 0x30, 16},
0071     {0x7e50, 0x7e54, 0x40, 16},
0072     {0x7e50, 0x7e54, 0x50, 16},
0073     {0x7e50, 0x7e54, 0x60, 6},
0074     {0x7e50, 0x7e54, 0x68, 4}
0075 };
0076 
0077 static const u32 t5_sge_dbg_index_array[2][IREG_NUM_ELEM] = {
0078     {0x10cc, 0x10d0, 0x0, 16},
0079     {0x10cc, 0x10d4, 0x0, 16},
0080 };
0081 
0082 static const u32 t6_sge_qbase_index_array[] = {
0083     /* 1 addr reg SGE_QBASE_INDEX and 4 data reg SGE_QBASE_MAP[0-3] */
0084     0x1250, 0x1240, 0x1244, 0x1248, 0x124c,
0085 };
0086 
0087 static const u32 t5_pcie_pdbg_array[][IREG_NUM_ELEM] = {
0088     {0x5a04, 0x5a0c, 0x00, 0x20}, /* t5_pcie_pdbg_regs_00_to_20 */
0089     {0x5a04, 0x5a0c, 0x21, 0x20}, /* t5_pcie_pdbg_regs_21_to_40 */
0090     {0x5a04, 0x5a0c, 0x41, 0x10}, /* t5_pcie_pdbg_regs_41_to_50 */
0091 };
0092 
0093 static const u32 t5_pcie_cdbg_array[][IREG_NUM_ELEM] = {
0094     {0x5a10, 0x5a18, 0x00, 0x20}, /* t5_pcie_cdbg_regs_00_to_20 */
0095     {0x5a10, 0x5a18, 0x21, 0x18}, /* t5_pcie_cdbg_regs_21_to_37 */
0096 };
0097 
0098 static const u32 t5_pm_rx_array[][IREG_NUM_ELEM] = {
0099     {0x8FD0, 0x8FD4, 0x10000, 0x20}, /* t5_pm_rx_regs_10000_to_10020 */
0100     {0x8FD0, 0x8FD4, 0x10021, 0x0D}, /* t5_pm_rx_regs_10021_to_1002c */
0101 };
0102 
0103 static const u32 t5_pm_tx_array[][IREG_NUM_ELEM] = {
0104     {0x8FF0, 0x8FF4, 0x10000, 0x20}, /* t5_pm_tx_regs_10000_to_10020 */
0105     {0x8FF0, 0x8FF4, 0x10021, 0x1D}, /* t5_pm_tx_regs_10021_to_1003c */
0106 };
0107 
0108 static const u32 t5_pcie_config_array[][2] = {
0109     {0x0, 0x34},
0110     {0x3c, 0x40},
0111     {0x50, 0x64},
0112     {0x70, 0x80},
0113     {0x94, 0xa0},
0114     {0xb0, 0xb8},
0115     {0xd0, 0xd4},
0116     {0x100, 0x128},
0117     {0x140, 0x148},
0118     {0x150, 0x164},
0119     {0x170, 0x178},
0120     {0x180, 0x194},
0121     {0x1a0, 0x1b8},
0122     {0x1c0, 0x208},
0123 };
0124 
0125 static const u32 t6_ma_ireg_array[][IREG_NUM_ELEM] = {
0126     {0x78f8, 0x78fc, 0xa000, 23}, /* t6_ma_regs_a000_to_a016 */
0127     {0x78f8, 0x78fc, 0xa400, 30}, /* t6_ma_regs_a400_to_a41e */
0128     {0x78f8, 0x78fc, 0xa800, 20} /* t6_ma_regs_a800_to_a813 */
0129 };
0130 
0131 static const u32 t6_ma_ireg_array2[][IREG_NUM_ELEM] = {
0132     {0x78f8, 0x78fc, 0xe400, 17}, /* t6_ma_regs_e400_to_e600 */
0133     {0x78f8, 0x78fc, 0xe640, 13} /* t6_ma_regs_e640_to_e7c0 */
0134 };
0135 
0136 static const u32 t6_up_cim_reg_array[][IREG_NUM_ELEM + 1] = {
0137     {0x7b50, 0x7b54, 0x2000, 0x20, 0}, /* up_cim_2000_to_207c */
0138     {0x7b50, 0x7b54, 0x2080, 0x1d, 0}, /* up_cim_2080_to_20fc */
0139     {0x7b50, 0x7b54, 0x00, 0x20, 0}, /* up_cim_00_to_7c */
0140     {0x7b50, 0x7b54, 0x80, 0x20, 0}, /* up_cim_80_to_fc */
0141     {0x7b50, 0x7b54, 0x100, 0x11, 0}, /* up_cim_100_to_14c */
0142     {0x7b50, 0x7b54, 0x200, 0x10, 0}, /* up_cim_200_to_23c */
0143     {0x7b50, 0x7b54, 0x240, 0x2, 0}, /* up_cim_240_to_244 */
0144     {0x7b50, 0x7b54, 0x250, 0x2, 0}, /* up_cim_250_to_254 */
0145     {0x7b50, 0x7b54, 0x260, 0x2, 0}, /* up_cim_260_to_264 */
0146     {0x7b50, 0x7b54, 0x270, 0x2, 0}, /* up_cim_270_to_274 */
0147     {0x7b50, 0x7b54, 0x280, 0x20, 0}, /* up_cim_280_to_2fc */
0148     {0x7b50, 0x7b54, 0x300, 0x20, 0}, /* up_cim_300_to_37c */
0149     {0x7b50, 0x7b54, 0x380, 0x14, 0}, /* up_cim_380_to_3cc */
0150     {0x7b50, 0x7b54, 0x4900, 0x4, 0x4}, /* up_cim_4900_to_4c60 */
0151     {0x7b50, 0x7b54, 0x4904, 0x4, 0x4}, /* up_cim_4904_to_4c64 */
0152     {0x7b50, 0x7b54, 0x4908, 0x4, 0x4}, /* up_cim_4908_to_4c68 */
0153     {0x7b50, 0x7b54, 0x4910, 0x4, 0x4}, /* up_cim_4910_to_4c70 */
0154     {0x7b50, 0x7b54, 0x4914, 0x4, 0x4}, /* up_cim_4914_to_4c74 */
0155     {0x7b50, 0x7b54, 0x4920, 0x10, 0x10}, /* up_cim_4920_to_4a10 */
0156     {0x7b50, 0x7b54, 0x4924, 0x10, 0x10}, /* up_cim_4924_to_4a14 */
0157     {0x7b50, 0x7b54, 0x4928, 0x10, 0x10}, /* up_cim_4928_to_4a18 */
0158     {0x7b50, 0x7b54, 0x492c, 0x10, 0x10}, /* up_cim_492c_to_4a1c */
0159 };
0160 
0161 static const u32 t5_up_cim_reg_array[][IREG_NUM_ELEM + 1] = {
0162     {0x7b50, 0x7b54, 0x2000, 0x20, 0}, /* up_cim_2000_to_207c */
0163     {0x7b50, 0x7b54, 0x2080, 0x19, 0}, /* up_cim_2080_to_20ec */
0164     {0x7b50, 0x7b54, 0x00, 0x20, 0}, /* up_cim_00_to_7c */
0165     {0x7b50, 0x7b54, 0x80, 0x20, 0}, /* up_cim_80_to_fc */
0166     {0x7b50, 0x7b54, 0x100, 0x11, 0}, /* up_cim_100_to_14c */
0167     {0x7b50, 0x7b54, 0x200, 0x10, 0}, /* up_cim_200_to_23c */
0168     {0x7b50, 0x7b54, 0x240, 0x2, 0}, /* up_cim_240_to_244 */
0169     {0x7b50, 0x7b54, 0x250, 0x2, 0}, /* up_cim_250_to_254 */
0170     {0x7b50, 0x7b54, 0x260, 0x2, 0}, /* up_cim_260_to_264 */
0171     {0x7b50, 0x7b54, 0x270, 0x2, 0}, /* up_cim_270_to_274 */
0172     {0x7b50, 0x7b54, 0x280, 0x20, 0}, /* up_cim_280_to_2fc */
0173     {0x7b50, 0x7b54, 0x300, 0x20, 0}, /* up_cim_300_to_37c */
0174     {0x7b50, 0x7b54, 0x380, 0x14, 0}, /* up_cim_380_to_3cc */
0175 };
0176 
0177 static const u32 t6_hma_ireg_array[][IREG_NUM_ELEM] = {
0178     {0x51320, 0x51324, 0xa000, 32} /* t6_hma_regs_a000_to_a01f */
0179 };
0180 
0181 u32 cudbg_get_entity_length(struct adapter *adap, u32 entity)
0182 {
0183     struct cudbg_tcam tcam_region = { 0 };
0184     u32 value, n = 0, len = 0;
0185 
0186     switch (entity) {
0187     case CUDBG_REG_DUMP:
0188         switch (CHELSIO_CHIP_VERSION(adap->params.chip)) {
0189         case CHELSIO_T4:
0190             len = T4_REGMAP_SIZE;
0191             break;
0192         case CHELSIO_T5:
0193         case CHELSIO_T6:
0194             len = T5_REGMAP_SIZE;
0195             break;
0196         default:
0197             break;
0198         }
0199         break;
0200     case CUDBG_DEV_LOG:
0201         len = adap->params.devlog.size;
0202         break;
0203     case CUDBG_CIM_LA:
0204         if (is_t6(adap->params.chip)) {
0205             len = adap->params.cim_la_size / 10 + 1;
0206             len *= 10 * sizeof(u32);
0207         } else {
0208             len = adap->params.cim_la_size / 8;
0209             len *= 8 * sizeof(u32);
0210         }
0211         len += sizeof(u32); /* for reading CIM LA configuration */
0212         break;
0213     case CUDBG_CIM_MA_LA:
0214         len = 2 * CIM_MALA_SIZE * 5 * sizeof(u32);
0215         break;
0216     case CUDBG_CIM_QCFG:
0217         len = sizeof(struct cudbg_cim_qcfg);
0218         break;
0219     case CUDBG_CIM_IBQ_TP0:
0220     case CUDBG_CIM_IBQ_TP1:
0221     case CUDBG_CIM_IBQ_ULP:
0222     case CUDBG_CIM_IBQ_SGE0:
0223     case CUDBG_CIM_IBQ_SGE1:
0224     case CUDBG_CIM_IBQ_NCSI:
0225         len = CIM_IBQ_SIZE * 4 * sizeof(u32);
0226         break;
0227     case CUDBG_CIM_OBQ_ULP0:
0228         len = cudbg_cim_obq_size(adap, 0);
0229         break;
0230     case CUDBG_CIM_OBQ_ULP1:
0231         len = cudbg_cim_obq_size(adap, 1);
0232         break;
0233     case CUDBG_CIM_OBQ_ULP2:
0234         len = cudbg_cim_obq_size(adap, 2);
0235         break;
0236     case CUDBG_CIM_OBQ_ULP3:
0237         len = cudbg_cim_obq_size(adap, 3);
0238         break;
0239     case CUDBG_CIM_OBQ_SGE:
0240         len = cudbg_cim_obq_size(adap, 4);
0241         break;
0242     case CUDBG_CIM_OBQ_NCSI:
0243         len = cudbg_cim_obq_size(adap, 5);
0244         break;
0245     case CUDBG_CIM_OBQ_RXQ0:
0246         len = cudbg_cim_obq_size(adap, 6);
0247         break;
0248     case CUDBG_CIM_OBQ_RXQ1:
0249         len = cudbg_cim_obq_size(adap, 7);
0250         break;
0251     case CUDBG_EDC0:
0252         value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
0253         if (value & EDRAM0_ENABLE_F) {
0254             value = t4_read_reg(adap, MA_EDRAM0_BAR_A);
0255             len = EDRAM0_SIZE_G(value);
0256         }
0257         len = cudbg_mbytes_to_bytes(len);
0258         break;
0259     case CUDBG_EDC1:
0260         value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
0261         if (value & EDRAM1_ENABLE_F) {
0262             value = t4_read_reg(adap, MA_EDRAM1_BAR_A);
0263             len = EDRAM1_SIZE_G(value);
0264         }
0265         len = cudbg_mbytes_to_bytes(len);
0266         break;
0267     case CUDBG_MC0:
0268         value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
0269         if (value & EXT_MEM0_ENABLE_F) {
0270             value = t4_read_reg(adap, MA_EXT_MEMORY0_BAR_A);
0271             len = EXT_MEM0_SIZE_G(value);
0272         }
0273         len = cudbg_mbytes_to_bytes(len);
0274         break;
0275     case CUDBG_MC1:
0276         value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
0277         if (value & EXT_MEM1_ENABLE_F) {
0278             value = t4_read_reg(adap, MA_EXT_MEMORY1_BAR_A);
0279             len = EXT_MEM1_SIZE_G(value);
0280         }
0281         len = cudbg_mbytes_to_bytes(len);
0282         break;
0283     case CUDBG_RSS:
0284         len = t4_chip_rss_size(adap) * sizeof(u16);
0285         break;
0286     case CUDBG_RSS_VF_CONF:
0287         len = adap->params.arch.vfcount *
0288               sizeof(struct cudbg_rss_vf_conf);
0289         break;
0290     case CUDBG_PATH_MTU:
0291         len = NMTUS * sizeof(u16);
0292         break;
0293     case CUDBG_PM_STATS:
0294         len = sizeof(struct cudbg_pm_stats);
0295         break;
0296     case CUDBG_HW_SCHED:
0297         len = sizeof(struct cudbg_hw_sched);
0298         break;
0299     case CUDBG_TP_INDIRECT:
0300         switch (CHELSIO_CHIP_VERSION(adap->params.chip)) {
0301         case CHELSIO_T5:
0302             n = sizeof(t5_tp_pio_array) +
0303                 sizeof(t5_tp_tm_pio_array) +
0304                 sizeof(t5_tp_mib_index_array);
0305             break;
0306         case CHELSIO_T6:
0307             n = sizeof(t6_tp_pio_array) +
0308                 sizeof(t6_tp_tm_pio_array) +
0309                 sizeof(t6_tp_mib_index_array);
0310             break;
0311         default:
0312             break;
0313         }
0314         n = n / (IREG_NUM_ELEM * sizeof(u32));
0315         len = sizeof(struct ireg_buf) * n;
0316         break;
0317     case CUDBG_SGE_INDIRECT:
0318         len = sizeof(struct ireg_buf) * 2 +
0319               sizeof(struct sge_qbase_reg_field);
0320         break;
0321     case CUDBG_ULPRX_LA:
0322         len = sizeof(struct cudbg_ulprx_la);
0323         break;
0324     case CUDBG_TP_LA:
0325         len = sizeof(struct cudbg_tp_la) + TPLA_SIZE * sizeof(u64);
0326         break;
0327     case CUDBG_MEMINFO:
0328         len = sizeof(struct cudbg_ver_hdr) +
0329               sizeof(struct cudbg_meminfo);
0330         break;
0331     case CUDBG_CIM_PIF_LA:
0332         len = sizeof(struct cudbg_cim_pif_la);
0333         len += 2 * CIM_PIFLA_SIZE * 6 * sizeof(u32);
0334         break;
0335     case CUDBG_CLK:
0336         len = sizeof(struct cudbg_clk_info);
0337         break;
0338     case CUDBG_PCIE_INDIRECT:
0339         n = sizeof(t5_pcie_pdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
0340         len = sizeof(struct ireg_buf) * n * 2;
0341         break;
0342     case CUDBG_PM_INDIRECT:
0343         n = sizeof(t5_pm_rx_array) / (IREG_NUM_ELEM * sizeof(u32));
0344         len = sizeof(struct ireg_buf) * n * 2;
0345         break;
0346     case CUDBG_TID_INFO:
0347         len = sizeof(struct cudbg_tid_info_region_rev1);
0348         break;
0349     case CUDBG_PCIE_CONFIG:
0350         len = sizeof(u32) * CUDBG_NUM_PCIE_CONFIG_REGS;
0351         break;
0352     case CUDBG_DUMP_CONTEXT:
0353         len = cudbg_dump_context_size(adap);
0354         break;
0355     case CUDBG_MPS_TCAM:
0356         len = sizeof(struct cudbg_mps_tcam) *
0357               adap->params.arch.mps_tcam_size;
0358         break;
0359     case CUDBG_VPD_DATA:
0360         len = sizeof(struct cudbg_vpd_data);
0361         break;
0362     case CUDBG_LE_TCAM:
0363         cudbg_fill_le_tcam_info(adap, &tcam_region);
0364         len = sizeof(struct cudbg_tcam) +
0365               sizeof(struct cudbg_tid_data) * tcam_region.max_tid;
0366         break;
0367     case CUDBG_CCTRL:
0368         len = sizeof(u16) * NMTUS * NCCTRL_WIN;
0369         break;
0370     case CUDBG_MA_INDIRECT:
0371         if (CHELSIO_CHIP_VERSION(adap->params.chip) > CHELSIO_T5) {
0372             n = sizeof(t6_ma_ireg_array) /
0373                 (IREG_NUM_ELEM * sizeof(u32));
0374             len = sizeof(struct ireg_buf) * n * 2;
0375         }
0376         break;
0377     case CUDBG_ULPTX_LA:
0378         len = sizeof(struct cudbg_ver_hdr) +
0379               sizeof(struct cudbg_ulptx_la);
0380         break;
0381     case CUDBG_UP_CIM_INDIRECT:
0382         n = 0;
0383         if (is_t5(adap->params.chip))
0384             n = sizeof(t5_up_cim_reg_array) /
0385                 ((IREG_NUM_ELEM + 1) * sizeof(u32));
0386         else if (is_t6(adap->params.chip))
0387             n = sizeof(t6_up_cim_reg_array) /
0388                 ((IREG_NUM_ELEM + 1) * sizeof(u32));
0389         len = sizeof(struct ireg_buf) * n;
0390         break;
0391     case CUDBG_PBT_TABLE:
0392         len = sizeof(struct cudbg_pbt_tables);
0393         break;
0394     case CUDBG_MBOX_LOG:
0395         len = sizeof(struct cudbg_mbox_log) * adap->mbox_log->size;
0396         break;
0397     case CUDBG_HMA_INDIRECT:
0398         if (CHELSIO_CHIP_VERSION(adap->params.chip) > CHELSIO_T5) {
0399             n = sizeof(t6_hma_ireg_array) /
0400                 (IREG_NUM_ELEM * sizeof(u32));
0401             len = sizeof(struct ireg_buf) * n;
0402         }
0403         break;
0404     case CUDBG_HMA:
0405         value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
0406         if (value & HMA_MUX_F) {
0407             /* In T6, there's no MC1.  So, HMA shares MC1
0408              * address space.
0409              */
0410             value = t4_read_reg(adap, MA_EXT_MEMORY1_BAR_A);
0411             len = EXT_MEM1_SIZE_G(value);
0412         }
0413         len = cudbg_mbytes_to_bytes(len);
0414         break;
0415     case CUDBG_QDESC:
0416         cudbg_fill_qdesc_num_and_size(adap, NULL, &len);
0417         break;
0418     default:
0419         break;
0420     }
0421 
0422     return len;
0423 }
0424 
0425 static int cudbg_do_compression(struct cudbg_init *pdbg_init,
0426                 struct cudbg_buffer *pin_buff,
0427                 struct cudbg_buffer *dbg_buff)
0428 {
0429     struct cudbg_buffer temp_in_buff = { 0 };
0430     int bytes_left, bytes_read, bytes;
0431     u32 offset = dbg_buff->offset;
0432     int rc;
0433 
0434     temp_in_buff.offset = pin_buff->offset;
0435     temp_in_buff.data = pin_buff->data;
0436     temp_in_buff.size = pin_buff->size;
0437 
0438     bytes_left = pin_buff->size;
0439     bytes_read = 0;
0440     while (bytes_left > 0) {
0441         /* Do compression in smaller chunks */
0442         bytes = min_t(unsigned long, bytes_left,
0443                   (unsigned long)CUDBG_CHUNK_SIZE);
0444         temp_in_buff.data = (char *)pin_buff->data + bytes_read;
0445         temp_in_buff.size = bytes;
0446         rc = cudbg_compress_buff(pdbg_init, &temp_in_buff, dbg_buff);
0447         if (rc)
0448             return rc;
0449         bytes_left -= bytes;
0450         bytes_read += bytes;
0451     }
0452 
0453     pin_buff->size = dbg_buff->offset - offset;
0454     return 0;
0455 }
0456 
0457 static int cudbg_write_and_release_buff(struct cudbg_init *pdbg_init,
0458                     struct cudbg_buffer *pin_buff,
0459                     struct cudbg_buffer *dbg_buff)
0460 {
0461     int rc = 0;
0462 
0463     if (pdbg_init->compress_type == CUDBG_COMPRESSION_NONE) {
0464         cudbg_update_buff(pin_buff, dbg_buff);
0465     } else {
0466         rc = cudbg_do_compression(pdbg_init, pin_buff, dbg_buff);
0467         if (rc)
0468             goto out;
0469     }
0470 
0471 out:
0472     cudbg_put_buff(pdbg_init, pin_buff);
0473     return rc;
0474 }
0475 
0476 static int is_fw_attached(struct cudbg_init *pdbg_init)
0477 {
0478     struct adapter *padap = pdbg_init->adap;
0479 
0480     if (!(padap->flags & CXGB4_FW_OK) || padap->use_bd)
0481         return 0;
0482 
0483     return 1;
0484 }
0485 
0486 /* This function will add additional padding bytes into debug_buffer to make it
0487  * 4 byte aligned.
0488  */
0489 void cudbg_align_debug_buffer(struct cudbg_buffer *dbg_buff,
0490                   struct cudbg_entity_hdr *entity_hdr)
0491 {
0492     u8 zero_buf[4] = {0};
0493     u8 padding, remain;
0494 
0495     remain = (dbg_buff->offset - entity_hdr->start_offset) % 4;
0496     padding = 4 - remain;
0497     if (remain) {
0498         memcpy(((u8 *)dbg_buff->data) + dbg_buff->offset, &zero_buf,
0499                padding);
0500         dbg_buff->offset += padding;
0501         entity_hdr->num_pad = padding;
0502     }
0503     entity_hdr->size = dbg_buff->offset - entity_hdr->start_offset;
0504 }
0505 
0506 struct cudbg_entity_hdr *cudbg_get_entity_hdr(void *outbuf, int i)
0507 {
0508     struct cudbg_hdr *cudbg_hdr = (struct cudbg_hdr *)outbuf;
0509 
0510     return (struct cudbg_entity_hdr *)
0511            ((char *)outbuf + cudbg_hdr->hdr_len +
0512         (sizeof(struct cudbg_entity_hdr) * (i - 1)));
0513 }
0514 
0515 static int cudbg_read_vpd_reg(struct adapter *padap, u32 addr, u32 len,
0516                   void *dest)
0517 {
0518     int vaddr, rc;
0519 
0520     vaddr = t4_eeprom_ptov(addr, padap->pf, EEPROMPFSIZE);
0521     if (vaddr < 0)
0522         return vaddr;
0523 
0524     rc = pci_read_vpd(padap->pdev, vaddr, len, dest);
0525     if (rc < 0)
0526         return rc;
0527 
0528     return 0;
0529 }
0530 
0531 static int cudbg_mem_desc_cmp(const void *a, const void *b)
0532 {
0533     return ((const struct cudbg_mem_desc *)a)->base -
0534            ((const struct cudbg_mem_desc *)b)->base;
0535 }
0536 
0537 int cudbg_fill_meminfo(struct adapter *padap,
0538                struct cudbg_meminfo *meminfo_buff)
0539 {
0540     struct cudbg_mem_desc *md;
0541     u32 lo, hi, used, alloc;
0542     int n, i;
0543 
0544     memset(meminfo_buff->avail, 0,
0545            ARRAY_SIZE(meminfo_buff->avail) *
0546            sizeof(struct cudbg_mem_desc));
0547     memset(meminfo_buff->mem, 0,
0548            (ARRAY_SIZE(cudbg_region) + 3) * sizeof(struct cudbg_mem_desc));
0549     md  = meminfo_buff->mem;
0550 
0551     for (i = 0; i < ARRAY_SIZE(meminfo_buff->mem); i++) {
0552         meminfo_buff->mem[i].limit = 0;
0553         meminfo_buff->mem[i].idx = i;
0554     }
0555 
0556     /* Find and sort the populated memory ranges */
0557     i = 0;
0558     lo = t4_read_reg(padap, MA_TARGET_MEM_ENABLE_A);
0559     if (lo & EDRAM0_ENABLE_F) {
0560         hi = t4_read_reg(padap, MA_EDRAM0_BAR_A);
0561         meminfo_buff->avail[i].base =
0562             cudbg_mbytes_to_bytes(EDRAM0_BASE_G(hi));
0563         meminfo_buff->avail[i].limit =
0564             meminfo_buff->avail[i].base +
0565             cudbg_mbytes_to_bytes(EDRAM0_SIZE_G(hi));
0566         meminfo_buff->avail[i].idx = 0;
0567         i++;
0568     }
0569 
0570     if (lo & EDRAM1_ENABLE_F) {
0571         hi =  t4_read_reg(padap, MA_EDRAM1_BAR_A);
0572         meminfo_buff->avail[i].base =
0573             cudbg_mbytes_to_bytes(EDRAM1_BASE_G(hi));
0574         meminfo_buff->avail[i].limit =
0575             meminfo_buff->avail[i].base +
0576             cudbg_mbytes_to_bytes(EDRAM1_SIZE_G(hi));
0577         meminfo_buff->avail[i].idx = 1;
0578         i++;
0579     }
0580 
0581     if (is_t5(padap->params.chip)) {
0582         if (lo & EXT_MEM0_ENABLE_F) {
0583             hi = t4_read_reg(padap, MA_EXT_MEMORY0_BAR_A);
0584             meminfo_buff->avail[i].base =
0585                 cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
0586             meminfo_buff->avail[i].limit =
0587                 meminfo_buff->avail[i].base +
0588                 cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
0589             meminfo_buff->avail[i].idx = 3;
0590             i++;
0591         }
0592 
0593         if (lo & EXT_MEM1_ENABLE_F) {
0594             hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
0595             meminfo_buff->avail[i].base =
0596                 cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
0597             meminfo_buff->avail[i].limit =
0598                 meminfo_buff->avail[i].base +
0599                 cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
0600             meminfo_buff->avail[i].idx = 4;
0601             i++;
0602         }
0603     } else {
0604         if (lo & EXT_MEM_ENABLE_F) {
0605             hi = t4_read_reg(padap, MA_EXT_MEMORY_BAR_A);
0606             meminfo_buff->avail[i].base =
0607                 cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
0608             meminfo_buff->avail[i].limit =
0609                 meminfo_buff->avail[i].base +
0610                 cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
0611             meminfo_buff->avail[i].idx = 2;
0612             i++;
0613         }
0614 
0615         if (lo & HMA_MUX_F) {
0616             hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
0617             meminfo_buff->avail[i].base =
0618                 cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
0619             meminfo_buff->avail[i].limit =
0620                 meminfo_buff->avail[i].base +
0621                 cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
0622             meminfo_buff->avail[i].idx = 5;
0623             i++;
0624         }
0625     }
0626 
0627     if (!i) /* no memory available */
0628         return CUDBG_STATUS_ENTITY_NOT_FOUND;
0629 
0630     meminfo_buff->avail_c = i;
0631     sort(meminfo_buff->avail, i, sizeof(struct cudbg_mem_desc),
0632          cudbg_mem_desc_cmp, NULL);
0633     (md++)->base = t4_read_reg(padap, SGE_DBQ_CTXT_BADDR_A);
0634     (md++)->base = t4_read_reg(padap, SGE_IMSG_CTXT_BADDR_A);
0635     (md++)->base = t4_read_reg(padap, SGE_FLM_CACHE_BADDR_A);
0636     (md++)->base = t4_read_reg(padap, TP_CMM_TCB_BASE_A);
0637     (md++)->base = t4_read_reg(padap, TP_CMM_MM_BASE_A);
0638     (md++)->base = t4_read_reg(padap, TP_CMM_TIMER_BASE_A);
0639     (md++)->base = t4_read_reg(padap, TP_CMM_MM_RX_FLST_BASE_A);
0640     (md++)->base = t4_read_reg(padap, TP_CMM_MM_TX_FLST_BASE_A);
0641     (md++)->base = t4_read_reg(padap, TP_CMM_MM_PS_FLST_BASE_A);
0642 
0643     /* the next few have explicit upper bounds */
0644     md->base = t4_read_reg(padap, TP_PMM_TX_BASE_A);
0645     md->limit = md->base - 1 +
0646             t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A) *
0647             PMTXMAXPAGE_G(t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A));
0648     md++;
0649 
0650     md->base = t4_read_reg(padap, TP_PMM_RX_BASE_A);
0651     md->limit = md->base - 1 +
0652             t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) *
0653             PMRXMAXPAGE_G(t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A));
0654     md++;
0655 
0656     if (t4_read_reg(padap, LE_DB_CONFIG_A) & HASHEN_F) {
0657         if (CHELSIO_CHIP_VERSION(padap->params.chip) <= CHELSIO_T5) {
0658             hi = t4_read_reg(padap, LE_DB_TID_HASHBASE_A) / 4;
0659             md->base = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
0660         } else {
0661             hi = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
0662             md->base = t4_read_reg(padap,
0663                            LE_DB_HASH_TBL_BASE_ADDR_A);
0664         }
0665         md->limit = 0;
0666     } else {
0667         md->base = 0;
0668         md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
0669     }
0670     md++;
0671 
0672 #define ulp_region(reg) do { \
0673     md->base = t4_read_reg(padap, ULP_ ## reg ## _LLIMIT_A);\
0674     (md++)->limit = t4_read_reg(padap, ULP_ ## reg ## _ULIMIT_A);\
0675 } while (0)
0676 
0677     ulp_region(RX_ISCSI);
0678     ulp_region(RX_TDDP);
0679     ulp_region(TX_TPT);
0680     ulp_region(RX_STAG);
0681     ulp_region(RX_RQ);
0682     ulp_region(RX_RQUDP);
0683     ulp_region(RX_PBL);
0684     ulp_region(TX_PBL);
0685 #undef ulp_region
0686     md->base = 0;
0687     md->idx = ARRAY_SIZE(cudbg_region);
0688     if (!is_t4(padap->params.chip)) {
0689         u32 fifo_size = t4_read_reg(padap, SGE_DBVFIFO_SIZE_A);
0690         u32 sge_ctrl = t4_read_reg(padap, SGE_CONTROL2_A);
0691         u32 size = 0;
0692 
0693         if (is_t5(padap->params.chip)) {
0694             if (sge_ctrl & VFIFO_ENABLE_F)
0695                 size = DBVFIFO_SIZE_G(fifo_size);
0696         } else {
0697             size = T6_DBVFIFO_SIZE_G(fifo_size);
0698         }
0699 
0700         if (size) {
0701             md->base = BASEADDR_G(t4_read_reg(padap,
0702                               SGE_DBVFIFO_BADDR_A));
0703             md->limit = md->base + (size << 2) - 1;
0704         }
0705     }
0706 
0707     md++;
0708 
0709     md->base = t4_read_reg(padap, ULP_RX_CTX_BASE_A);
0710     md->limit = 0;
0711     md++;
0712     md->base = t4_read_reg(padap, ULP_TX_ERR_TABLE_BASE_A);
0713     md->limit = 0;
0714     md++;
0715 
0716     md->base = padap->vres.ocq.start;
0717     if (padap->vres.ocq.size)
0718         md->limit = md->base + padap->vres.ocq.size - 1;
0719     else
0720         md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
0721     md++;
0722 
0723     /* add any address-space holes, there can be up to 3 */
0724     for (n = 0; n < i - 1; n++)
0725         if (meminfo_buff->avail[n].limit <
0726             meminfo_buff->avail[n + 1].base)
0727             (md++)->base = meminfo_buff->avail[n].limit;
0728 
0729     if (meminfo_buff->avail[n].limit)
0730         (md++)->base = meminfo_buff->avail[n].limit;
0731 
0732     n = md - meminfo_buff->mem;
0733     meminfo_buff->mem_c = n;
0734 
0735     sort(meminfo_buff->mem, n, sizeof(struct cudbg_mem_desc),
0736          cudbg_mem_desc_cmp, NULL);
0737 
0738     lo = t4_read_reg(padap, CIM_SDRAM_BASE_ADDR_A);
0739     hi = t4_read_reg(padap, CIM_SDRAM_ADDR_SIZE_A) + lo - 1;
0740     meminfo_buff->up_ram_lo = lo;
0741     meminfo_buff->up_ram_hi = hi;
0742 
0743     lo = t4_read_reg(padap, CIM_EXTMEM2_BASE_ADDR_A);
0744     hi = t4_read_reg(padap, CIM_EXTMEM2_ADDR_SIZE_A) + lo - 1;
0745     meminfo_buff->up_extmem2_lo = lo;
0746     meminfo_buff->up_extmem2_hi = hi;
0747 
0748     lo = t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A);
0749     for (i = 0, meminfo_buff->free_rx_cnt = 0; i < 2; i++)
0750         meminfo_buff->free_rx_cnt +=
0751             FREERXPAGECOUNT_G(t4_read_reg(padap,
0752                               TP_FLM_FREE_RX_CNT_A));
0753 
0754     meminfo_buff->rx_pages_data[0] =  PMRXMAXPAGE_G(lo);
0755     meminfo_buff->rx_pages_data[1] =
0756         t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) >> 10;
0757     meminfo_buff->rx_pages_data[2] = (lo & PMRXNUMCHN_F) ? 2 : 1;
0758 
0759     lo = t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A);
0760     hi = t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A);
0761     for (i = 0, meminfo_buff->free_tx_cnt = 0; i < 4; i++)
0762         meminfo_buff->free_tx_cnt +=
0763             FREETXPAGECOUNT_G(t4_read_reg(padap,
0764                               TP_FLM_FREE_TX_CNT_A));
0765 
0766     meminfo_buff->tx_pages_data[0] = PMTXMAXPAGE_G(lo);
0767     meminfo_buff->tx_pages_data[1] =
0768         hi >= (1 << 20) ? (hi >> 20) : (hi >> 10);
0769     meminfo_buff->tx_pages_data[2] =
0770         hi >= (1 << 20) ? 'M' : 'K';
0771     meminfo_buff->tx_pages_data[3] = 1 << PMTXNUMCHN_G(lo);
0772 
0773     meminfo_buff->p_structs = t4_read_reg(padap, TP_CMM_MM_MAX_PSTRUCT_A);
0774     meminfo_buff->p_structs_free_cnt =
0775         FREEPSTRUCTCOUNT_G(t4_read_reg(padap, TP_FLM_FREE_PS_CNT_A));
0776 
0777     for (i = 0; i < 4; i++) {
0778         if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
0779             lo = t4_read_reg(padap,
0780                      MPS_RX_MAC_BG_PG_CNT0_A + i * 4);
0781         else
0782             lo = t4_read_reg(padap, MPS_RX_PG_RSV0_A + i * 4);
0783         if (is_t5(padap->params.chip)) {
0784             used = T5_USED_G(lo);
0785             alloc = T5_ALLOC_G(lo);
0786         } else {
0787             used = USED_G(lo);
0788             alloc = ALLOC_G(lo);
0789         }
0790         meminfo_buff->port_used[i] = used;
0791         meminfo_buff->port_alloc[i] = alloc;
0792     }
0793 
0794     for (i = 0; i < padap->params.arch.nchan; i++) {
0795         if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
0796             lo = t4_read_reg(padap,
0797                      MPS_RX_LPBK_BG_PG_CNT0_A + i * 4);
0798         else
0799             lo = t4_read_reg(padap, MPS_RX_PG_RSV4_A + i * 4);
0800         if (is_t5(padap->params.chip)) {
0801             used = T5_USED_G(lo);
0802             alloc = T5_ALLOC_G(lo);
0803         } else {
0804             used = USED_G(lo);
0805             alloc = ALLOC_G(lo);
0806         }
0807         meminfo_buff->loopback_used[i] = used;
0808         meminfo_buff->loopback_alloc[i] = alloc;
0809     }
0810 
0811     return 0;
0812 }
0813 
0814 int cudbg_collect_reg_dump(struct cudbg_init *pdbg_init,
0815                struct cudbg_buffer *dbg_buff,
0816                struct cudbg_error *cudbg_err)
0817 {
0818     struct adapter *padap = pdbg_init->adap;
0819     struct cudbg_buffer temp_buff = { 0 };
0820     u32 buf_size = 0;
0821     int rc = 0;
0822 
0823     if (is_t4(padap->params.chip))
0824         buf_size = T4_REGMAP_SIZE;
0825     else if (is_t5(padap->params.chip) || is_t6(padap->params.chip))
0826         buf_size = T5_REGMAP_SIZE;
0827 
0828     rc = cudbg_get_buff(pdbg_init, dbg_buff, buf_size, &temp_buff);
0829     if (rc)
0830         return rc;
0831     t4_get_regs(padap, (void *)temp_buff.data, temp_buff.size);
0832     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
0833 }
0834 
0835 int cudbg_collect_fw_devlog(struct cudbg_init *pdbg_init,
0836                 struct cudbg_buffer *dbg_buff,
0837                 struct cudbg_error *cudbg_err)
0838 {
0839     struct adapter *padap = pdbg_init->adap;
0840     struct cudbg_buffer temp_buff = { 0 };
0841     struct devlog_params *dparams;
0842     int rc = 0;
0843 
0844     rc = t4_init_devlog_params(padap);
0845     if (rc < 0) {
0846         cudbg_err->sys_err = rc;
0847         return rc;
0848     }
0849 
0850     dparams = &padap->params.devlog;
0851     rc = cudbg_get_buff(pdbg_init, dbg_buff, dparams->size, &temp_buff);
0852     if (rc)
0853         return rc;
0854 
0855     /* Collect FW devlog */
0856     if (dparams->start != 0) {
0857         spin_lock(&padap->win0_lock);
0858         rc = t4_memory_rw(padap, padap->params.drv_memwin,
0859                   dparams->memtype, dparams->start,
0860                   dparams->size,
0861                   (__be32 *)(char *)temp_buff.data,
0862                   1);
0863         spin_unlock(&padap->win0_lock);
0864         if (rc) {
0865             cudbg_err->sys_err = rc;
0866             cudbg_put_buff(pdbg_init, &temp_buff);
0867             return rc;
0868         }
0869     }
0870     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
0871 }
0872 
0873 int cudbg_collect_cim_la(struct cudbg_init *pdbg_init,
0874              struct cudbg_buffer *dbg_buff,
0875              struct cudbg_error *cudbg_err)
0876 {
0877     struct adapter *padap = pdbg_init->adap;
0878     struct cudbg_buffer temp_buff = { 0 };
0879     int size, rc;
0880     u32 cfg = 0;
0881 
0882     if (is_t6(padap->params.chip)) {
0883         size = padap->params.cim_la_size / 10 + 1;
0884         size *= 10 * sizeof(u32);
0885     } else {
0886         size = padap->params.cim_la_size / 8;
0887         size *= 8 * sizeof(u32);
0888     }
0889 
0890     size += sizeof(cfg);
0891     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
0892     if (rc)
0893         return rc;
0894 
0895     rc = t4_cim_read(padap, UP_UP_DBG_LA_CFG_A, 1, &cfg);
0896     if (rc) {
0897         cudbg_err->sys_err = rc;
0898         cudbg_put_buff(pdbg_init, &temp_buff);
0899         return rc;
0900     }
0901 
0902     memcpy((char *)temp_buff.data, &cfg, sizeof(cfg));
0903     rc = t4_cim_read_la(padap,
0904                 (u32 *)((char *)temp_buff.data + sizeof(cfg)),
0905                 NULL);
0906     if (rc < 0) {
0907         cudbg_err->sys_err = rc;
0908         cudbg_put_buff(pdbg_init, &temp_buff);
0909         return rc;
0910     }
0911     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
0912 }
0913 
0914 int cudbg_collect_cim_ma_la(struct cudbg_init *pdbg_init,
0915                 struct cudbg_buffer *dbg_buff,
0916                 struct cudbg_error *cudbg_err)
0917 {
0918     struct adapter *padap = pdbg_init->adap;
0919     struct cudbg_buffer temp_buff = { 0 };
0920     int size, rc;
0921 
0922     size = 2 * CIM_MALA_SIZE * 5 * sizeof(u32);
0923     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
0924     if (rc)
0925         return rc;
0926 
0927     t4_cim_read_ma_la(padap,
0928               (u32 *)temp_buff.data,
0929               (u32 *)((char *)temp_buff.data +
0930                   5 * CIM_MALA_SIZE));
0931     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
0932 }
0933 
0934 int cudbg_collect_cim_qcfg(struct cudbg_init *pdbg_init,
0935                struct cudbg_buffer *dbg_buff,
0936                struct cudbg_error *cudbg_err)
0937 {
0938     struct adapter *padap = pdbg_init->adap;
0939     struct cudbg_buffer temp_buff = { 0 };
0940     struct cudbg_cim_qcfg *cim_qcfg_data;
0941     int rc;
0942 
0943     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_cim_qcfg),
0944                 &temp_buff);
0945     if (rc)
0946         return rc;
0947 
0948     cim_qcfg_data = (struct cudbg_cim_qcfg *)temp_buff.data;
0949     cim_qcfg_data->chip = padap->params.chip;
0950     rc = t4_cim_read(padap, UP_IBQ_0_RDADDR_A,
0951              ARRAY_SIZE(cim_qcfg_data->stat), cim_qcfg_data->stat);
0952     if (rc) {
0953         cudbg_err->sys_err = rc;
0954         cudbg_put_buff(pdbg_init, &temp_buff);
0955         return rc;
0956     }
0957 
0958     rc = t4_cim_read(padap, UP_OBQ_0_REALADDR_A,
0959              ARRAY_SIZE(cim_qcfg_data->obq_wr),
0960              cim_qcfg_data->obq_wr);
0961     if (rc) {
0962         cudbg_err->sys_err = rc;
0963         cudbg_put_buff(pdbg_init, &temp_buff);
0964         return rc;
0965     }
0966 
0967     t4_read_cimq_cfg(padap, cim_qcfg_data->base, cim_qcfg_data->size,
0968              cim_qcfg_data->thres);
0969     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
0970 }
0971 
0972 static int cudbg_read_cim_ibq(struct cudbg_init *pdbg_init,
0973                   struct cudbg_buffer *dbg_buff,
0974                   struct cudbg_error *cudbg_err, int qid)
0975 {
0976     struct adapter *padap = pdbg_init->adap;
0977     struct cudbg_buffer temp_buff = { 0 };
0978     int no_of_read_words, rc = 0;
0979     u32 qsize;
0980 
0981     /* collect CIM IBQ */
0982     qsize = CIM_IBQ_SIZE * 4 * sizeof(u32);
0983     rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
0984     if (rc)
0985         return rc;
0986 
0987     /* t4_read_cim_ibq will return no. of read words or error */
0988     no_of_read_words = t4_read_cim_ibq(padap, qid,
0989                        (u32 *)temp_buff.data, qsize);
0990     /* no_of_read_words is less than or equal to 0 means error */
0991     if (no_of_read_words <= 0) {
0992         if (!no_of_read_words)
0993             rc = CUDBG_SYSTEM_ERROR;
0994         else
0995             rc = no_of_read_words;
0996         cudbg_err->sys_err = rc;
0997         cudbg_put_buff(pdbg_init, &temp_buff);
0998         return rc;
0999     }
1000     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1001 }
1002 
1003 int cudbg_collect_cim_ibq_tp0(struct cudbg_init *pdbg_init,
1004                   struct cudbg_buffer *dbg_buff,
1005                   struct cudbg_error *cudbg_err)
1006 {
1007     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 0);
1008 }
1009 
1010 int cudbg_collect_cim_ibq_tp1(struct cudbg_init *pdbg_init,
1011                   struct cudbg_buffer *dbg_buff,
1012                   struct cudbg_error *cudbg_err)
1013 {
1014     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 1);
1015 }
1016 
1017 int cudbg_collect_cim_ibq_ulp(struct cudbg_init *pdbg_init,
1018                   struct cudbg_buffer *dbg_buff,
1019                   struct cudbg_error *cudbg_err)
1020 {
1021     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 2);
1022 }
1023 
1024 int cudbg_collect_cim_ibq_sge0(struct cudbg_init *pdbg_init,
1025                    struct cudbg_buffer *dbg_buff,
1026                    struct cudbg_error *cudbg_err)
1027 {
1028     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 3);
1029 }
1030 
1031 int cudbg_collect_cim_ibq_sge1(struct cudbg_init *pdbg_init,
1032                    struct cudbg_buffer *dbg_buff,
1033                    struct cudbg_error *cudbg_err)
1034 {
1035     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 4);
1036 }
1037 
1038 int cudbg_collect_cim_ibq_ncsi(struct cudbg_init *pdbg_init,
1039                    struct cudbg_buffer *dbg_buff,
1040                    struct cudbg_error *cudbg_err)
1041 {
1042     return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 5);
1043 }
1044 
1045 u32 cudbg_cim_obq_size(struct adapter *padap, int qid)
1046 {
1047     u32 value;
1048 
1049     t4_write_reg(padap, CIM_QUEUE_CONFIG_REF_A, OBQSELECT_F |
1050              QUENUMSELECT_V(qid));
1051     value = t4_read_reg(padap, CIM_QUEUE_CONFIG_CTRL_A);
1052     value = CIMQSIZE_G(value) * 64; /* size in number of words */
1053     return value * sizeof(u32);
1054 }
1055 
1056 static int cudbg_read_cim_obq(struct cudbg_init *pdbg_init,
1057                   struct cudbg_buffer *dbg_buff,
1058                   struct cudbg_error *cudbg_err, int qid)
1059 {
1060     struct adapter *padap = pdbg_init->adap;
1061     struct cudbg_buffer temp_buff = { 0 };
1062     int no_of_read_words, rc = 0;
1063     u32 qsize;
1064 
1065     /* collect CIM OBQ */
1066     qsize =  cudbg_cim_obq_size(padap, qid);
1067     rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
1068     if (rc)
1069         return rc;
1070 
1071     /* t4_read_cim_obq will return no. of read words or error */
1072     no_of_read_words = t4_read_cim_obq(padap, qid,
1073                        (u32 *)temp_buff.data, qsize);
1074     /* no_of_read_words is less than or equal to 0 means error */
1075     if (no_of_read_words <= 0) {
1076         if (!no_of_read_words)
1077             rc = CUDBG_SYSTEM_ERROR;
1078         else
1079             rc = no_of_read_words;
1080         cudbg_err->sys_err = rc;
1081         cudbg_put_buff(pdbg_init, &temp_buff);
1082         return rc;
1083     }
1084     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1085 }
1086 
1087 int cudbg_collect_cim_obq_ulp0(struct cudbg_init *pdbg_init,
1088                    struct cudbg_buffer *dbg_buff,
1089                    struct cudbg_error *cudbg_err)
1090 {
1091     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 0);
1092 }
1093 
1094 int cudbg_collect_cim_obq_ulp1(struct cudbg_init *pdbg_init,
1095                    struct cudbg_buffer *dbg_buff,
1096                    struct cudbg_error *cudbg_err)
1097 {
1098     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 1);
1099 }
1100 
1101 int cudbg_collect_cim_obq_ulp2(struct cudbg_init *pdbg_init,
1102                    struct cudbg_buffer *dbg_buff,
1103                    struct cudbg_error *cudbg_err)
1104 {
1105     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 2);
1106 }
1107 
1108 int cudbg_collect_cim_obq_ulp3(struct cudbg_init *pdbg_init,
1109                    struct cudbg_buffer *dbg_buff,
1110                    struct cudbg_error *cudbg_err)
1111 {
1112     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 3);
1113 }
1114 
1115 int cudbg_collect_cim_obq_sge(struct cudbg_init *pdbg_init,
1116                   struct cudbg_buffer *dbg_buff,
1117                   struct cudbg_error *cudbg_err)
1118 {
1119     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 4);
1120 }
1121 
1122 int cudbg_collect_cim_obq_ncsi(struct cudbg_init *pdbg_init,
1123                    struct cudbg_buffer *dbg_buff,
1124                    struct cudbg_error *cudbg_err)
1125 {
1126     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 5);
1127 }
1128 
1129 int cudbg_collect_obq_sge_rx_q0(struct cudbg_init *pdbg_init,
1130                 struct cudbg_buffer *dbg_buff,
1131                 struct cudbg_error *cudbg_err)
1132 {
1133     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 6);
1134 }
1135 
1136 int cudbg_collect_obq_sge_rx_q1(struct cudbg_init *pdbg_init,
1137                 struct cudbg_buffer *dbg_buff,
1138                 struct cudbg_error *cudbg_err)
1139 {
1140     return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 7);
1141 }
1142 
1143 static int cudbg_meminfo_get_mem_index(struct adapter *padap,
1144                        struct cudbg_meminfo *mem_info,
1145                        u8 mem_type, u8 *idx)
1146 {
1147     u8 i, flag;
1148 
1149     switch (mem_type) {
1150     case MEM_EDC0:
1151         flag = EDC0_FLAG;
1152         break;
1153     case MEM_EDC1:
1154         flag = EDC1_FLAG;
1155         break;
1156     case MEM_MC0:
1157         /* Some T5 cards have both MC0 and MC1. */
1158         flag = is_t5(padap->params.chip) ? MC0_FLAG : MC_FLAG;
1159         break;
1160     case MEM_MC1:
1161         flag = MC1_FLAG;
1162         break;
1163     case MEM_HMA:
1164         flag = HMA_FLAG;
1165         break;
1166     default:
1167         return CUDBG_STATUS_ENTITY_NOT_FOUND;
1168     }
1169 
1170     for (i = 0; i < mem_info->avail_c; i++) {
1171         if (mem_info->avail[i].idx == flag) {
1172             *idx = i;
1173             return 0;
1174         }
1175     }
1176 
1177     return CUDBG_STATUS_ENTITY_NOT_FOUND;
1178 }
1179 
1180 /* Fetch the @region_name's start and end from @meminfo. */
1181 static int cudbg_get_mem_region(struct adapter *padap,
1182                 struct cudbg_meminfo *meminfo,
1183                 u8 mem_type, const char *region_name,
1184                 struct cudbg_mem_desc *mem_desc)
1185 {
1186     u8 mc, found = 0;
1187     u32 idx = 0;
1188     int rc, i;
1189 
1190     rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc);
1191     if (rc)
1192         return rc;
1193 
1194     i = match_string(cudbg_region, ARRAY_SIZE(cudbg_region), region_name);
1195     if (i < 0)
1196         return -EINVAL;
1197 
1198     idx = i;
1199     for (i = 0; i < meminfo->mem_c; i++) {
1200         if (meminfo->mem[i].idx >= ARRAY_SIZE(cudbg_region))
1201             continue; /* Skip holes */
1202 
1203         if (!(meminfo->mem[i].limit))
1204             meminfo->mem[i].limit =
1205                 i < meminfo->mem_c - 1 ?
1206                 meminfo->mem[i + 1].base - 1 : ~0;
1207 
1208         if (meminfo->mem[i].idx == idx) {
1209             /* Check if the region exists in @mem_type memory */
1210             if (meminfo->mem[i].base < meminfo->avail[mc].base &&
1211                 meminfo->mem[i].limit < meminfo->avail[mc].base)
1212                 return -EINVAL;
1213 
1214             if (meminfo->mem[i].base > meminfo->avail[mc].limit)
1215                 return -EINVAL;
1216 
1217             memcpy(mem_desc, &meminfo->mem[i],
1218                    sizeof(struct cudbg_mem_desc));
1219             found = 1;
1220             break;
1221         }
1222     }
1223     if (!found)
1224         return -EINVAL;
1225 
1226     return 0;
1227 }
1228 
1229 /* Fetch and update the start and end of the requested memory region w.r.t 0
1230  * in the corresponding EDC/MC/HMA.
1231  */
1232 static int cudbg_get_mem_relative(struct adapter *padap,
1233                   struct cudbg_meminfo *meminfo,
1234                   u8 mem_type, u32 *out_base, u32 *out_end)
1235 {
1236     u8 mc_idx;
1237     int rc;
1238 
1239     rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc_idx);
1240     if (rc)
1241         return rc;
1242 
1243     if (*out_base < meminfo->avail[mc_idx].base)
1244         *out_base = 0;
1245     else
1246         *out_base -= meminfo->avail[mc_idx].base;
1247 
1248     if (*out_end > meminfo->avail[mc_idx].limit)
1249         *out_end = meminfo->avail[mc_idx].limit;
1250     else
1251         *out_end -= meminfo->avail[mc_idx].base;
1252 
1253     return 0;
1254 }
1255 
1256 /* Get TX and RX Payload region */
1257 static int cudbg_get_payload_range(struct adapter *padap, u8 mem_type,
1258                    const char *region_name,
1259                    struct cudbg_region_info *payload)
1260 {
1261     struct cudbg_mem_desc mem_desc = { 0 };
1262     struct cudbg_meminfo meminfo;
1263     int rc;
1264 
1265     rc = cudbg_fill_meminfo(padap, &meminfo);
1266     if (rc)
1267         return rc;
1268 
1269     rc = cudbg_get_mem_region(padap, &meminfo, mem_type, region_name,
1270                   &mem_desc);
1271     if (rc) {
1272         payload->exist = false;
1273         return 0;
1274     }
1275 
1276     payload->exist = true;
1277     payload->start = mem_desc.base;
1278     payload->end = mem_desc.limit;
1279 
1280     return cudbg_get_mem_relative(padap, &meminfo, mem_type,
1281                       &payload->start, &payload->end);
1282 }
1283 
1284 static int cudbg_memory_read(struct cudbg_init *pdbg_init, int win,
1285                  int mtype, u32 addr, u32 len, void *hbuf)
1286 {
1287     u32 win_pf, memoffset, mem_aperture, mem_base;
1288     struct adapter *adap = pdbg_init->adap;
1289     u32 pos, offset, resid;
1290     u32 *res_buf;
1291     u64 *buf;
1292     int ret;
1293 
1294     /* Argument sanity checks ...
1295      */
1296     if (addr & 0x3 || (uintptr_t)hbuf & 0x3)
1297         return -EINVAL;
1298 
1299     buf = (u64 *)hbuf;
1300 
1301     /* Try to do 64-bit reads.  Residual will be handled later. */
1302     resid = len & 0x7;
1303     len -= resid;
1304 
1305     ret = t4_memory_rw_init(adap, win, mtype, &memoffset, &mem_base,
1306                 &mem_aperture);
1307     if (ret)
1308         return ret;
1309 
1310     addr = addr + memoffset;
1311     win_pf = is_t4(adap->params.chip) ? 0 : PFNUM_V(adap->pf);
1312 
1313     pos = addr & ~(mem_aperture - 1);
1314     offset = addr - pos;
1315 
1316     /* Set up initial PCI-E Memory Window to cover the start of our
1317      * transfer.
1318      */
1319     t4_memory_update_win(adap, win, pos | win_pf);
1320 
1321     /* Transfer data from the adapter */
1322     while (len > 0) {
1323         *buf++ = le64_to_cpu((__force __le64)
1324                      t4_read_reg64(adap, mem_base + offset));
1325         offset += sizeof(u64);
1326         len -= sizeof(u64);
1327 
1328         /* If we've reached the end of our current window aperture,
1329          * move the PCI-E Memory Window on to the next.
1330          */
1331         if (offset == mem_aperture) {
1332             pos += mem_aperture;
1333             offset = 0;
1334             t4_memory_update_win(adap, win, pos | win_pf);
1335         }
1336     }
1337 
1338     res_buf = (u32 *)buf;
1339     /* Read residual in 32-bit multiples */
1340     while (resid > sizeof(u32)) {
1341         *res_buf++ = le32_to_cpu((__force __le32)
1342                      t4_read_reg(adap, mem_base + offset));
1343         offset += sizeof(u32);
1344         resid -= sizeof(u32);
1345 
1346         /* If we've reached the end of our current window aperture,
1347          * move the PCI-E Memory Window on to the next.
1348          */
1349         if (offset == mem_aperture) {
1350             pos += mem_aperture;
1351             offset = 0;
1352             t4_memory_update_win(adap, win, pos | win_pf);
1353         }
1354     }
1355 
1356     /* Transfer residual < 32-bits */
1357     if (resid)
1358         t4_memory_rw_residual(adap, resid, mem_base + offset,
1359                       (u8 *)res_buf, T4_MEMORY_READ);
1360 
1361     return 0;
1362 }
1363 
1364 #define CUDBG_YIELD_ITERATION 256
1365 
1366 static int cudbg_read_fw_mem(struct cudbg_init *pdbg_init,
1367                  struct cudbg_buffer *dbg_buff, u8 mem_type,
1368                  unsigned long tot_len,
1369                  struct cudbg_error *cudbg_err)
1370 {
1371     static const char * const region_name[] = { "Tx payload:",
1372                             "Rx payload:" };
1373     unsigned long bytes, bytes_left, bytes_read = 0;
1374     struct adapter *padap = pdbg_init->adap;
1375     struct cudbg_buffer temp_buff = { 0 };
1376     struct cudbg_region_info payload[2];
1377     u32 yield_count = 0;
1378     int rc = 0;
1379     u8 i;
1380 
1381     /* Get TX/RX Payload region range if they exist */
1382     memset(payload, 0, sizeof(payload));
1383     for (i = 0; i < ARRAY_SIZE(region_name); i++) {
1384         rc = cudbg_get_payload_range(padap, mem_type, region_name[i],
1385                          &payload[i]);
1386         if (rc)
1387             return rc;
1388 
1389         if (payload[i].exist) {
1390             /* Align start and end to avoid wrap around */
1391             payload[i].start = roundup(payload[i].start,
1392                            CUDBG_CHUNK_SIZE);
1393             payload[i].end = rounddown(payload[i].end,
1394                            CUDBG_CHUNK_SIZE);
1395         }
1396     }
1397 
1398     bytes_left = tot_len;
1399     while (bytes_left > 0) {
1400         /* As MC size is huge and read through PIO access, this
1401          * loop will hold cpu for a longer time. OS may think that
1402          * the process is hanged and will generate CPU stall traces.
1403          * So yield the cpu regularly.
1404          */
1405         yield_count++;
1406         if (!(yield_count % CUDBG_YIELD_ITERATION))
1407             schedule();
1408 
1409         bytes = min_t(unsigned long, bytes_left,
1410                   (unsigned long)CUDBG_CHUNK_SIZE);
1411         rc = cudbg_get_buff(pdbg_init, dbg_buff, bytes, &temp_buff);
1412         if (rc)
1413             return rc;
1414 
1415         for (i = 0; i < ARRAY_SIZE(payload); i++)
1416             if (payload[i].exist &&
1417                 bytes_read >= payload[i].start &&
1418                 bytes_read + bytes <= payload[i].end)
1419                 /* TX and RX Payload regions can't overlap */
1420                 goto skip_read;
1421 
1422         spin_lock(&padap->win0_lock);
1423         rc = cudbg_memory_read(pdbg_init, MEMWIN_NIC, mem_type,
1424                        bytes_read, bytes, temp_buff.data);
1425         spin_unlock(&padap->win0_lock);
1426         if (rc) {
1427             cudbg_err->sys_err = rc;
1428             cudbg_put_buff(pdbg_init, &temp_buff);
1429             return rc;
1430         }
1431 
1432 skip_read:
1433         bytes_left -= bytes;
1434         bytes_read += bytes;
1435         rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
1436                           dbg_buff);
1437         if (rc) {
1438             cudbg_put_buff(pdbg_init, &temp_buff);
1439             return rc;
1440         }
1441     }
1442     return rc;
1443 }
1444 
1445 static void cudbg_t4_fwcache(struct cudbg_init *pdbg_init,
1446                  struct cudbg_error *cudbg_err)
1447 {
1448     struct adapter *padap = pdbg_init->adap;
1449     int rc;
1450 
1451     if (is_fw_attached(pdbg_init)) {
1452         /* Flush uP dcache before reading edcX/mcX  */
1453         rc = t4_fwcache(padap, FW_PARAM_DEV_FWCACHE_FLUSH);
1454         if (rc)
1455             cudbg_err->sys_warn = rc;
1456     }
1457 }
1458 
1459 static int cudbg_mem_region_size(struct cudbg_init *pdbg_init,
1460                  struct cudbg_error *cudbg_err,
1461                  u8 mem_type, unsigned long *region_size)
1462 {
1463     struct adapter *padap = pdbg_init->adap;
1464     struct cudbg_meminfo mem_info;
1465     u8 mc_idx;
1466     int rc;
1467 
1468     memset(&mem_info, 0, sizeof(struct cudbg_meminfo));
1469     rc = cudbg_fill_meminfo(padap, &mem_info);
1470     if (rc) {
1471         cudbg_err->sys_err = rc;
1472         return rc;
1473     }
1474 
1475     cudbg_t4_fwcache(pdbg_init, cudbg_err);
1476     rc = cudbg_meminfo_get_mem_index(padap, &mem_info, mem_type, &mc_idx);
1477     if (rc) {
1478         cudbg_err->sys_err = rc;
1479         return rc;
1480     }
1481 
1482     if (region_size)
1483         *region_size = mem_info.avail[mc_idx].limit -
1484                    mem_info.avail[mc_idx].base;
1485 
1486     return 0;
1487 }
1488 
1489 static int cudbg_collect_mem_region(struct cudbg_init *pdbg_init,
1490                     struct cudbg_buffer *dbg_buff,
1491                     struct cudbg_error *cudbg_err,
1492                     u8 mem_type)
1493 {
1494     unsigned long size = 0;
1495     int rc;
1496 
1497     rc = cudbg_mem_region_size(pdbg_init, cudbg_err, mem_type, &size);
1498     if (rc)
1499         return rc;
1500 
1501     return cudbg_read_fw_mem(pdbg_init, dbg_buff, mem_type, size,
1502                  cudbg_err);
1503 }
1504 
1505 int cudbg_collect_edc0_meminfo(struct cudbg_init *pdbg_init,
1506                    struct cudbg_buffer *dbg_buff,
1507                    struct cudbg_error *cudbg_err)
1508 {
1509     return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1510                     MEM_EDC0);
1511 }
1512 
1513 int cudbg_collect_edc1_meminfo(struct cudbg_init *pdbg_init,
1514                    struct cudbg_buffer *dbg_buff,
1515                    struct cudbg_error *cudbg_err)
1516 {
1517     return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1518                     MEM_EDC1);
1519 }
1520 
1521 int cudbg_collect_mc0_meminfo(struct cudbg_init *pdbg_init,
1522                   struct cudbg_buffer *dbg_buff,
1523                   struct cudbg_error *cudbg_err)
1524 {
1525     return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1526                     MEM_MC0);
1527 }
1528 
1529 int cudbg_collect_mc1_meminfo(struct cudbg_init *pdbg_init,
1530                   struct cudbg_buffer *dbg_buff,
1531                   struct cudbg_error *cudbg_err)
1532 {
1533     return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1534                     MEM_MC1);
1535 }
1536 
1537 int cudbg_collect_hma_meminfo(struct cudbg_init *pdbg_init,
1538                   struct cudbg_buffer *dbg_buff,
1539                   struct cudbg_error *cudbg_err)
1540 {
1541     return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1542                     MEM_HMA);
1543 }
1544 
1545 int cudbg_collect_rss(struct cudbg_init *pdbg_init,
1546               struct cudbg_buffer *dbg_buff,
1547               struct cudbg_error *cudbg_err)
1548 {
1549     struct adapter *padap = pdbg_init->adap;
1550     struct cudbg_buffer temp_buff = { 0 };
1551     int rc, nentries;
1552 
1553     nentries = t4_chip_rss_size(padap);
1554     rc = cudbg_get_buff(pdbg_init, dbg_buff, nentries * sizeof(u16),
1555                 &temp_buff);
1556     if (rc)
1557         return rc;
1558 
1559     rc = t4_read_rss(padap, (u16 *)temp_buff.data);
1560     if (rc) {
1561         cudbg_err->sys_err = rc;
1562         cudbg_put_buff(pdbg_init, &temp_buff);
1563         return rc;
1564     }
1565     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1566 }
1567 
1568 int cudbg_collect_rss_vf_config(struct cudbg_init *pdbg_init,
1569                 struct cudbg_buffer *dbg_buff,
1570                 struct cudbg_error *cudbg_err)
1571 {
1572     struct adapter *padap = pdbg_init->adap;
1573     struct cudbg_buffer temp_buff = { 0 };
1574     struct cudbg_rss_vf_conf *vfconf;
1575     int vf, rc, vf_count;
1576 
1577     vf_count = padap->params.arch.vfcount;
1578     rc = cudbg_get_buff(pdbg_init, dbg_buff,
1579                 vf_count * sizeof(struct cudbg_rss_vf_conf),
1580                 &temp_buff);
1581     if (rc)
1582         return rc;
1583 
1584     vfconf = (struct cudbg_rss_vf_conf *)temp_buff.data;
1585     for (vf = 0; vf < vf_count; vf++)
1586         t4_read_rss_vf_config(padap, vf, &vfconf[vf].rss_vf_vfl,
1587                       &vfconf[vf].rss_vf_vfh, true);
1588     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1589 }
1590 
1591 int cudbg_collect_path_mtu(struct cudbg_init *pdbg_init,
1592                struct cudbg_buffer *dbg_buff,
1593                struct cudbg_error *cudbg_err)
1594 {
1595     struct adapter *padap = pdbg_init->adap;
1596     struct cudbg_buffer temp_buff = { 0 };
1597     int rc;
1598 
1599     rc = cudbg_get_buff(pdbg_init, dbg_buff, NMTUS * sizeof(u16),
1600                 &temp_buff);
1601     if (rc)
1602         return rc;
1603 
1604     t4_read_mtu_tbl(padap, (u16 *)temp_buff.data, NULL);
1605     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1606 }
1607 
1608 int cudbg_collect_pm_stats(struct cudbg_init *pdbg_init,
1609                struct cudbg_buffer *dbg_buff,
1610                struct cudbg_error *cudbg_err)
1611 {
1612     struct adapter *padap = pdbg_init->adap;
1613     struct cudbg_buffer temp_buff = { 0 };
1614     struct cudbg_pm_stats *pm_stats_buff;
1615     int rc;
1616 
1617     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_pm_stats),
1618                 &temp_buff);
1619     if (rc)
1620         return rc;
1621 
1622     pm_stats_buff = (struct cudbg_pm_stats *)temp_buff.data;
1623     t4_pmtx_get_stats(padap, pm_stats_buff->tx_cnt, pm_stats_buff->tx_cyc);
1624     t4_pmrx_get_stats(padap, pm_stats_buff->rx_cnt, pm_stats_buff->rx_cyc);
1625     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1626 }
1627 
1628 int cudbg_collect_hw_sched(struct cudbg_init *pdbg_init,
1629                struct cudbg_buffer *dbg_buff,
1630                struct cudbg_error *cudbg_err)
1631 {
1632     struct adapter *padap = pdbg_init->adap;
1633     struct cudbg_buffer temp_buff = { 0 };
1634     struct cudbg_hw_sched *hw_sched_buff;
1635     int i, rc = 0;
1636 
1637     if (!padap->params.vpd.cclk)
1638         return CUDBG_STATUS_CCLK_NOT_DEFINED;
1639 
1640     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_hw_sched),
1641                 &temp_buff);
1642 
1643     if (rc)
1644         return rc;
1645 
1646     hw_sched_buff = (struct cudbg_hw_sched *)temp_buff.data;
1647     hw_sched_buff->map = t4_read_reg(padap, TP_TX_MOD_QUEUE_REQ_MAP_A);
1648     hw_sched_buff->mode = TIMERMODE_G(t4_read_reg(padap, TP_MOD_CONFIG_A));
1649     t4_read_pace_tbl(padap, hw_sched_buff->pace_tab);
1650     for (i = 0; i < NTX_SCHED; ++i)
1651         t4_get_tx_sched(padap, i, &hw_sched_buff->kbps[i],
1652                 &hw_sched_buff->ipg[i], true);
1653     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1654 }
1655 
1656 int cudbg_collect_tp_indirect(struct cudbg_init *pdbg_init,
1657                   struct cudbg_buffer *dbg_buff,
1658                   struct cudbg_error *cudbg_err)
1659 {
1660     struct adapter *padap = pdbg_init->adap;
1661     struct cudbg_buffer temp_buff = { 0 };
1662     struct ireg_buf *ch_tp_pio;
1663     int i, rc, n = 0;
1664     u32 size;
1665 
1666     if (is_t5(padap->params.chip))
1667         n = sizeof(t5_tp_pio_array) +
1668             sizeof(t5_tp_tm_pio_array) +
1669             sizeof(t5_tp_mib_index_array);
1670     else
1671         n = sizeof(t6_tp_pio_array) +
1672             sizeof(t6_tp_tm_pio_array) +
1673             sizeof(t6_tp_mib_index_array);
1674 
1675     n = n / (IREG_NUM_ELEM * sizeof(u32));
1676     size = sizeof(struct ireg_buf) * n;
1677     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1678     if (rc)
1679         return rc;
1680 
1681     ch_tp_pio = (struct ireg_buf *)temp_buff.data;
1682 
1683     /* TP_PIO */
1684     if (is_t5(padap->params.chip))
1685         n = sizeof(t5_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1686     else if (is_t6(padap->params.chip))
1687         n = sizeof(t6_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1688 
1689     for (i = 0; i < n; i++) {
1690         struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1691         u32 *buff = ch_tp_pio->outbuf;
1692 
1693         if (is_t5(padap->params.chip)) {
1694             tp_pio->ireg_addr = t5_tp_pio_array[i][0];
1695             tp_pio->ireg_data = t5_tp_pio_array[i][1];
1696             tp_pio->ireg_local_offset = t5_tp_pio_array[i][2];
1697             tp_pio->ireg_offset_range = t5_tp_pio_array[i][3];
1698         } else if (is_t6(padap->params.chip)) {
1699             tp_pio->ireg_addr = t6_tp_pio_array[i][0];
1700             tp_pio->ireg_data = t6_tp_pio_array[i][1];
1701             tp_pio->ireg_local_offset = t6_tp_pio_array[i][2];
1702             tp_pio->ireg_offset_range = t6_tp_pio_array[i][3];
1703         }
1704         t4_tp_pio_read(padap, buff, tp_pio->ireg_offset_range,
1705                    tp_pio->ireg_local_offset, true);
1706         ch_tp_pio++;
1707     }
1708 
1709     /* TP_TM_PIO */
1710     if (is_t5(padap->params.chip))
1711         n = sizeof(t5_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1712     else if (is_t6(padap->params.chip))
1713         n = sizeof(t6_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1714 
1715     for (i = 0; i < n; i++) {
1716         struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1717         u32 *buff = ch_tp_pio->outbuf;
1718 
1719         if (is_t5(padap->params.chip)) {
1720             tp_pio->ireg_addr = t5_tp_tm_pio_array[i][0];
1721             tp_pio->ireg_data = t5_tp_tm_pio_array[i][1];
1722             tp_pio->ireg_local_offset = t5_tp_tm_pio_array[i][2];
1723             tp_pio->ireg_offset_range = t5_tp_tm_pio_array[i][3];
1724         } else if (is_t6(padap->params.chip)) {
1725             tp_pio->ireg_addr = t6_tp_tm_pio_array[i][0];
1726             tp_pio->ireg_data = t6_tp_tm_pio_array[i][1];
1727             tp_pio->ireg_local_offset = t6_tp_tm_pio_array[i][2];
1728             tp_pio->ireg_offset_range = t6_tp_tm_pio_array[i][3];
1729         }
1730         t4_tp_tm_pio_read(padap, buff, tp_pio->ireg_offset_range,
1731                   tp_pio->ireg_local_offset, true);
1732         ch_tp_pio++;
1733     }
1734 
1735     /* TP_MIB_INDEX */
1736     if (is_t5(padap->params.chip))
1737         n = sizeof(t5_tp_mib_index_array) /
1738             (IREG_NUM_ELEM * sizeof(u32));
1739     else if (is_t6(padap->params.chip))
1740         n = sizeof(t6_tp_mib_index_array) /
1741             (IREG_NUM_ELEM * sizeof(u32));
1742 
1743     for (i = 0; i < n ; i++) {
1744         struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1745         u32 *buff = ch_tp_pio->outbuf;
1746 
1747         if (is_t5(padap->params.chip)) {
1748             tp_pio->ireg_addr = t5_tp_mib_index_array[i][0];
1749             tp_pio->ireg_data = t5_tp_mib_index_array[i][1];
1750             tp_pio->ireg_local_offset =
1751                 t5_tp_mib_index_array[i][2];
1752             tp_pio->ireg_offset_range =
1753                 t5_tp_mib_index_array[i][3];
1754         } else if (is_t6(padap->params.chip)) {
1755             tp_pio->ireg_addr = t6_tp_mib_index_array[i][0];
1756             tp_pio->ireg_data = t6_tp_mib_index_array[i][1];
1757             tp_pio->ireg_local_offset =
1758                 t6_tp_mib_index_array[i][2];
1759             tp_pio->ireg_offset_range =
1760                 t6_tp_mib_index_array[i][3];
1761         }
1762         t4_tp_mib_read(padap, buff, tp_pio->ireg_offset_range,
1763                    tp_pio->ireg_local_offset, true);
1764         ch_tp_pio++;
1765     }
1766     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1767 }
1768 
1769 static void cudbg_read_sge_qbase_indirect_reg(struct adapter *padap,
1770                           struct sge_qbase_reg_field *qbase,
1771                           u32 func, bool is_pf)
1772 {
1773     u32 *buff, i;
1774 
1775     if (is_pf) {
1776         buff = qbase->pf_data_value[func];
1777     } else {
1778         buff = qbase->vf_data_value[func];
1779         /* In SGE_QBASE_INDEX,
1780          * Entries 0->7 are PF0->7, Entries 8->263 are VFID0->256.
1781          */
1782         func += 8;
1783     }
1784 
1785     t4_write_reg(padap, qbase->reg_addr, func);
1786     for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++, buff++)
1787         *buff = t4_read_reg(padap, qbase->reg_data[i]);
1788 }
1789 
1790 int cudbg_collect_sge_indirect(struct cudbg_init *pdbg_init,
1791                    struct cudbg_buffer *dbg_buff,
1792                    struct cudbg_error *cudbg_err)
1793 {
1794     struct adapter *padap = pdbg_init->adap;
1795     struct cudbg_buffer temp_buff = { 0 };
1796     struct sge_qbase_reg_field *sge_qbase;
1797     struct ireg_buf *ch_sge_dbg;
1798     u8 padap_running = 0;
1799     int i, rc;
1800     u32 size;
1801 
1802     /* Accessing SGE_QBASE_MAP[0-3] and SGE_QBASE_INDEX regs can
1803      * lead to SGE missing doorbells under heavy traffic. So, only
1804      * collect them when adapter is idle.
1805      */
1806     for_each_port(padap, i) {
1807         padap_running = netif_running(padap->port[i]);
1808         if (padap_running)
1809             break;
1810     }
1811 
1812     size = sizeof(*ch_sge_dbg) * 2;
1813     if (!padap_running)
1814         size += sizeof(*sge_qbase);
1815 
1816     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1817     if (rc)
1818         return rc;
1819 
1820     ch_sge_dbg = (struct ireg_buf *)temp_buff.data;
1821     for (i = 0; i < 2; i++) {
1822         struct ireg_field *sge_pio = &ch_sge_dbg->tp_pio;
1823         u32 *buff = ch_sge_dbg->outbuf;
1824 
1825         sge_pio->ireg_addr = t5_sge_dbg_index_array[i][0];
1826         sge_pio->ireg_data = t5_sge_dbg_index_array[i][1];
1827         sge_pio->ireg_local_offset = t5_sge_dbg_index_array[i][2];
1828         sge_pio->ireg_offset_range = t5_sge_dbg_index_array[i][3];
1829         t4_read_indirect(padap,
1830                  sge_pio->ireg_addr,
1831                  sge_pio->ireg_data,
1832                  buff,
1833                  sge_pio->ireg_offset_range,
1834                  sge_pio->ireg_local_offset);
1835         ch_sge_dbg++;
1836     }
1837 
1838     if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5 &&
1839         !padap_running) {
1840         sge_qbase = (struct sge_qbase_reg_field *)ch_sge_dbg;
1841         /* 1 addr reg SGE_QBASE_INDEX and 4 data reg
1842          * SGE_QBASE_MAP[0-3]
1843          */
1844         sge_qbase->reg_addr = t6_sge_qbase_index_array[0];
1845         for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++)
1846             sge_qbase->reg_data[i] =
1847                 t6_sge_qbase_index_array[i + 1];
1848 
1849         for (i = 0; i <= PCIE_FW_MASTER_M; i++)
1850             cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1851                               i, true);
1852 
1853         for (i = 0; i < padap->params.arch.vfcount; i++)
1854             cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1855                               i, false);
1856 
1857         sge_qbase->vfcount = padap->params.arch.vfcount;
1858     }
1859 
1860     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1861 }
1862 
1863 int cudbg_collect_ulprx_la(struct cudbg_init *pdbg_init,
1864                struct cudbg_buffer *dbg_buff,
1865                struct cudbg_error *cudbg_err)
1866 {
1867     struct adapter *padap = pdbg_init->adap;
1868     struct cudbg_buffer temp_buff = { 0 };
1869     struct cudbg_ulprx_la *ulprx_la_buff;
1870     int rc;
1871 
1872     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_ulprx_la),
1873                 &temp_buff);
1874     if (rc)
1875         return rc;
1876 
1877     ulprx_la_buff = (struct cudbg_ulprx_la *)temp_buff.data;
1878     t4_ulprx_read_la(padap, (u32 *)ulprx_la_buff->data);
1879     ulprx_la_buff->size = ULPRX_LA_SIZE;
1880     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1881 }
1882 
1883 int cudbg_collect_tp_la(struct cudbg_init *pdbg_init,
1884             struct cudbg_buffer *dbg_buff,
1885             struct cudbg_error *cudbg_err)
1886 {
1887     struct adapter *padap = pdbg_init->adap;
1888     struct cudbg_buffer temp_buff = { 0 };
1889     struct cudbg_tp_la *tp_la_buff;
1890     int size, rc;
1891 
1892     size = sizeof(struct cudbg_tp_la) + TPLA_SIZE *  sizeof(u64);
1893     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1894     if (rc)
1895         return rc;
1896 
1897     tp_la_buff = (struct cudbg_tp_la *)temp_buff.data;
1898     tp_la_buff->mode = DBGLAMODE_G(t4_read_reg(padap, TP_DBG_LA_CONFIG_A));
1899     t4_tp_read_la(padap, (u64 *)tp_la_buff->data, NULL);
1900     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1901 }
1902 
1903 int cudbg_collect_meminfo(struct cudbg_init *pdbg_init,
1904               struct cudbg_buffer *dbg_buff,
1905               struct cudbg_error *cudbg_err)
1906 {
1907     struct adapter *padap = pdbg_init->adap;
1908     struct cudbg_buffer temp_buff = { 0 };
1909     struct cudbg_meminfo *meminfo_buff;
1910     struct cudbg_ver_hdr *ver_hdr;
1911     int rc;
1912 
1913     rc = cudbg_get_buff(pdbg_init, dbg_buff,
1914                 sizeof(struct cudbg_ver_hdr) +
1915                 sizeof(struct cudbg_meminfo),
1916                 &temp_buff);
1917     if (rc)
1918         return rc;
1919 
1920     ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
1921     ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
1922     ver_hdr->revision = CUDBG_MEMINFO_REV;
1923     ver_hdr->size = sizeof(struct cudbg_meminfo);
1924 
1925     meminfo_buff = (struct cudbg_meminfo *)(temp_buff.data +
1926                         sizeof(*ver_hdr));
1927     rc = cudbg_fill_meminfo(padap, meminfo_buff);
1928     if (rc) {
1929         cudbg_err->sys_err = rc;
1930         cudbg_put_buff(pdbg_init, &temp_buff);
1931         return rc;
1932     }
1933 
1934     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1935 }
1936 
1937 int cudbg_collect_cim_pif_la(struct cudbg_init *pdbg_init,
1938                  struct cudbg_buffer *dbg_buff,
1939                  struct cudbg_error *cudbg_err)
1940 {
1941     struct cudbg_cim_pif_la *cim_pif_la_buff;
1942     struct adapter *padap = pdbg_init->adap;
1943     struct cudbg_buffer temp_buff = { 0 };
1944     int size, rc;
1945 
1946     size = sizeof(struct cudbg_cim_pif_la) +
1947            2 * CIM_PIFLA_SIZE * 6 * sizeof(u32);
1948     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1949     if (rc)
1950         return rc;
1951 
1952     cim_pif_la_buff = (struct cudbg_cim_pif_la *)temp_buff.data;
1953     cim_pif_la_buff->size = CIM_PIFLA_SIZE;
1954     t4_cim_read_pif_la(padap, (u32 *)cim_pif_la_buff->data,
1955                (u32 *)cim_pif_la_buff->data + 6 * CIM_PIFLA_SIZE,
1956                NULL, NULL);
1957     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1958 }
1959 
1960 int cudbg_collect_clk_info(struct cudbg_init *pdbg_init,
1961                struct cudbg_buffer *dbg_buff,
1962                struct cudbg_error *cudbg_err)
1963 {
1964     struct adapter *padap = pdbg_init->adap;
1965     struct cudbg_buffer temp_buff = { 0 };
1966     struct cudbg_clk_info *clk_info_buff;
1967     u64 tp_tick_us;
1968     int rc;
1969 
1970     if (!padap->params.vpd.cclk)
1971         return CUDBG_STATUS_CCLK_NOT_DEFINED;
1972 
1973     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_clk_info),
1974                 &temp_buff);
1975     if (rc)
1976         return rc;
1977 
1978     clk_info_buff = (struct cudbg_clk_info *)temp_buff.data;
1979     clk_info_buff->cclk_ps = 1000000000 / padap->params.vpd.cclk; /* psec */
1980     clk_info_buff->res = t4_read_reg(padap, TP_TIMER_RESOLUTION_A);
1981     clk_info_buff->tre = TIMERRESOLUTION_G(clk_info_buff->res);
1982     clk_info_buff->dack_re = DELAYEDACKRESOLUTION_G(clk_info_buff->res);
1983     tp_tick_us = (clk_info_buff->cclk_ps << clk_info_buff->tre) / 1000000;
1984 
1985     clk_info_buff->dack_timer =
1986         (clk_info_buff->cclk_ps << clk_info_buff->dack_re) / 1000000 *
1987         t4_read_reg(padap, TP_DACK_TIMER_A);
1988     clk_info_buff->retransmit_min =
1989         tp_tick_us * t4_read_reg(padap, TP_RXT_MIN_A);
1990     clk_info_buff->retransmit_max =
1991         tp_tick_us * t4_read_reg(padap, TP_RXT_MAX_A);
1992     clk_info_buff->persist_timer_min =
1993         tp_tick_us * t4_read_reg(padap, TP_PERS_MIN_A);
1994     clk_info_buff->persist_timer_max =
1995         tp_tick_us * t4_read_reg(padap, TP_PERS_MAX_A);
1996     clk_info_buff->keepalive_idle_timer =
1997         tp_tick_us * t4_read_reg(padap, TP_KEEP_IDLE_A);
1998     clk_info_buff->keepalive_interval =
1999         tp_tick_us * t4_read_reg(padap, TP_KEEP_INTVL_A);
2000     clk_info_buff->initial_srtt =
2001         tp_tick_us * INITSRTT_G(t4_read_reg(padap, TP_INIT_SRTT_A));
2002     clk_info_buff->finwait2_timer =
2003         tp_tick_us * t4_read_reg(padap, TP_FINWAIT2_TIMER_A);
2004 
2005     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2006 }
2007 
2008 int cudbg_collect_pcie_indirect(struct cudbg_init *pdbg_init,
2009                 struct cudbg_buffer *dbg_buff,
2010                 struct cudbg_error *cudbg_err)
2011 {
2012     struct adapter *padap = pdbg_init->adap;
2013     struct cudbg_buffer temp_buff = { 0 };
2014     struct ireg_buf *ch_pcie;
2015     int i, rc, n;
2016     u32 size;
2017 
2018     n = sizeof(t5_pcie_pdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
2019     size = sizeof(struct ireg_buf) * n * 2;
2020     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2021     if (rc)
2022         return rc;
2023 
2024     ch_pcie = (struct ireg_buf *)temp_buff.data;
2025     /* PCIE_PDBG */
2026     for (i = 0; i < n; i++) {
2027         struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
2028         u32 *buff = ch_pcie->outbuf;
2029 
2030         pcie_pio->ireg_addr = t5_pcie_pdbg_array[i][0];
2031         pcie_pio->ireg_data = t5_pcie_pdbg_array[i][1];
2032         pcie_pio->ireg_local_offset = t5_pcie_pdbg_array[i][2];
2033         pcie_pio->ireg_offset_range = t5_pcie_pdbg_array[i][3];
2034         t4_read_indirect(padap,
2035                  pcie_pio->ireg_addr,
2036                  pcie_pio->ireg_data,
2037                  buff,
2038                  pcie_pio->ireg_offset_range,
2039                  pcie_pio->ireg_local_offset);
2040         ch_pcie++;
2041     }
2042 
2043     /* PCIE_CDBG */
2044     n = sizeof(t5_pcie_cdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
2045     for (i = 0; i < n; i++) {
2046         struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
2047         u32 *buff = ch_pcie->outbuf;
2048 
2049         pcie_pio->ireg_addr = t5_pcie_cdbg_array[i][0];
2050         pcie_pio->ireg_data = t5_pcie_cdbg_array[i][1];
2051         pcie_pio->ireg_local_offset = t5_pcie_cdbg_array[i][2];
2052         pcie_pio->ireg_offset_range = t5_pcie_cdbg_array[i][3];
2053         t4_read_indirect(padap,
2054                  pcie_pio->ireg_addr,
2055                  pcie_pio->ireg_data,
2056                  buff,
2057                  pcie_pio->ireg_offset_range,
2058                  pcie_pio->ireg_local_offset);
2059         ch_pcie++;
2060     }
2061     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2062 }
2063 
2064 int cudbg_collect_pm_indirect(struct cudbg_init *pdbg_init,
2065                   struct cudbg_buffer *dbg_buff,
2066                   struct cudbg_error *cudbg_err)
2067 {
2068     struct adapter *padap = pdbg_init->adap;
2069     struct cudbg_buffer temp_buff = { 0 };
2070     struct ireg_buf *ch_pm;
2071     int i, rc, n;
2072     u32 size;
2073 
2074     n = sizeof(t5_pm_rx_array) / (IREG_NUM_ELEM * sizeof(u32));
2075     size = sizeof(struct ireg_buf) * n * 2;
2076     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2077     if (rc)
2078         return rc;
2079 
2080     ch_pm = (struct ireg_buf *)temp_buff.data;
2081     /* PM_RX */
2082     for (i = 0; i < n; i++) {
2083         struct ireg_field *pm_pio = &ch_pm->tp_pio;
2084         u32 *buff = ch_pm->outbuf;
2085 
2086         pm_pio->ireg_addr = t5_pm_rx_array[i][0];
2087         pm_pio->ireg_data = t5_pm_rx_array[i][1];
2088         pm_pio->ireg_local_offset = t5_pm_rx_array[i][2];
2089         pm_pio->ireg_offset_range = t5_pm_rx_array[i][3];
2090         t4_read_indirect(padap,
2091                  pm_pio->ireg_addr,
2092                  pm_pio->ireg_data,
2093                  buff,
2094                  pm_pio->ireg_offset_range,
2095                  pm_pio->ireg_local_offset);
2096         ch_pm++;
2097     }
2098 
2099     /* PM_TX */
2100     n = sizeof(t5_pm_tx_array) / (IREG_NUM_ELEM * sizeof(u32));
2101     for (i = 0; i < n; i++) {
2102         struct ireg_field *pm_pio = &ch_pm->tp_pio;
2103         u32 *buff = ch_pm->outbuf;
2104 
2105         pm_pio->ireg_addr = t5_pm_tx_array[i][0];
2106         pm_pio->ireg_data = t5_pm_tx_array[i][1];
2107         pm_pio->ireg_local_offset = t5_pm_tx_array[i][2];
2108         pm_pio->ireg_offset_range = t5_pm_tx_array[i][3];
2109         t4_read_indirect(padap,
2110                  pm_pio->ireg_addr,
2111                  pm_pio->ireg_data,
2112                  buff,
2113                  pm_pio->ireg_offset_range,
2114                  pm_pio->ireg_local_offset);
2115         ch_pm++;
2116     }
2117     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2118 }
2119 
2120 int cudbg_collect_tid(struct cudbg_init *pdbg_init,
2121               struct cudbg_buffer *dbg_buff,
2122               struct cudbg_error *cudbg_err)
2123 {
2124     struct adapter *padap = pdbg_init->adap;
2125     struct cudbg_tid_info_region_rev1 *tid1;
2126     struct cudbg_buffer temp_buff = { 0 };
2127     struct cudbg_tid_info_region *tid;
2128     u32 para[2], val[2];
2129     int rc;
2130 
2131     rc = cudbg_get_buff(pdbg_init, dbg_buff,
2132                 sizeof(struct cudbg_tid_info_region_rev1),
2133                 &temp_buff);
2134     if (rc)
2135         return rc;
2136 
2137     tid1 = (struct cudbg_tid_info_region_rev1 *)temp_buff.data;
2138     tid = &tid1->tid;
2139     tid1->ver_hdr.signature = CUDBG_ENTITY_SIGNATURE;
2140     tid1->ver_hdr.revision = CUDBG_TID_INFO_REV;
2141     tid1->ver_hdr.size = sizeof(struct cudbg_tid_info_region_rev1) -
2142                  sizeof(struct cudbg_ver_hdr);
2143 
2144     /* If firmware is not attached/alive, use backdoor register
2145      * access to collect dump.
2146      */
2147     if (!is_fw_attached(pdbg_init))
2148         goto fill_tid;
2149 
2150 #define FW_PARAM_PFVF_A(param) \
2151     (FW_PARAMS_MNEM_V(FW_PARAMS_MNEM_PFVF) | \
2152      FW_PARAMS_PARAM_X_V(FW_PARAMS_PARAM_PFVF_##param) | \
2153      FW_PARAMS_PARAM_Y_V(0) | \
2154      FW_PARAMS_PARAM_Z_V(0))
2155 
2156     para[0] = FW_PARAM_PFVF_A(ETHOFLD_START);
2157     para[1] = FW_PARAM_PFVF_A(ETHOFLD_END);
2158     rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2, para, val);
2159     if (rc <  0) {
2160         cudbg_err->sys_err = rc;
2161         cudbg_put_buff(pdbg_init, &temp_buff);
2162         return rc;
2163     }
2164     tid->uotid_base = val[0];
2165     tid->nuotids = val[1] - val[0] + 1;
2166 
2167     if (is_t5(padap->params.chip)) {
2168         tid->sb = t4_read_reg(padap, LE_DB_SERVER_INDEX_A) / 4;
2169     } else if (is_t6(padap->params.chip)) {
2170         tid1->tid_start =
2171             t4_read_reg(padap, LE_DB_ACTIVE_TABLE_START_INDEX_A);
2172         tid->sb = t4_read_reg(padap, LE_DB_SRVR_START_INDEX_A);
2173 
2174         para[0] = FW_PARAM_PFVF_A(HPFILTER_START);
2175         para[1] = FW_PARAM_PFVF_A(HPFILTER_END);
2176         rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2,
2177                      para, val);
2178         if (rc < 0) {
2179             cudbg_err->sys_err = rc;
2180             cudbg_put_buff(pdbg_init, &temp_buff);
2181             return rc;
2182         }
2183         tid->hpftid_base = val[0];
2184         tid->nhpftids = val[1] - val[0] + 1;
2185     }
2186 
2187 #undef FW_PARAM_PFVF_A
2188 
2189 fill_tid:
2190     tid->ntids = padap->tids.ntids;
2191     tid->nstids = padap->tids.nstids;
2192     tid->stid_base = padap->tids.stid_base;
2193     tid->hash_base = padap->tids.hash_base;
2194 
2195     tid->natids = padap->tids.natids;
2196     tid->nftids = padap->tids.nftids;
2197     tid->ftid_base = padap->tids.ftid_base;
2198     tid->aftid_base = padap->tids.aftid_base;
2199     tid->aftid_end = padap->tids.aftid_end;
2200 
2201     tid->sftid_base = padap->tids.sftid_base;
2202     tid->nsftids = padap->tids.nsftids;
2203 
2204     tid->flags = padap->flags;
2205     tid->le_db_conf = t4_read_reg(padap, LE_DB_CONFIG_A);
2206     tid->ip_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV4_A);
2207     tid->ipv6_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV6_A);
2208 
2209     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2210 }
2211 
2212 int cudbg_collect_pcie_config(struct cudbg_init *pdbg_init,
2213                   struct cudbg_buffer *dbg_buff,
2214                   struct cudbg_error *cudbg_err)
2215 {
2216     struct adapter *padap = pdbg_init->adap;
2217     struct cudbg_buffer temp_buff = { 0 };
2218     u32 size, *value, j;
2219     int i, rc, n;
2220 
2221     size = sizeof(u32) * CUDBG_NUM_PCIE_CONFIG_REGS;
2222     n = sizeof(t5_pcie_config_array) / (2 * sizeof(u32));
2223     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2224     if (rc)
2225         return rc;
2226 
2227     value = (u32 *)temp_buff.data;
2228     for (i = 0; i < n; i++) {
2229         for (j = t5_pcie_config_array[i][0];
2230              j <= t5_pcie_config_array[i][1]; j += 4) {
2231             t4_hw_pci_read_cfg4(padap, j, value);
2232             value++;
2233         }
2234     }
2235     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2236 }
2237 
2238 static int cudbg_sge_ctxt_check_valid(u32 *buf, int type)
2239 {
2240     int index, bit, bit_pos = 0;
2241 
2242     switch (type) {
2243     case CTXT_EGRESS:
2244         bit_pos = 176;
2245         break;
2246     case CTXT_INGRESS:
2247         bit_pos = 141;
2248         break;
2249     case CTXT_FLM:
2250         bit_pos = 89;
2251         break;
2252     }
2253     index = bit_pos / 32;
2254     bit =  bit_pos % 32;
2255     return buf[index] & (1U << bit);
2256 }
2257 
2258 static int cudbg_get_ctxt_region_info(struct adapter *padap,
2259                       struct cudbg_region_info *ctx_info,
2260                       u8 *mem_type)
2261 {
2262     struct cudbg_mem_desc mem_desc;
2263     struct cudbg_meminfo meminfo;
2264     u32 i, j, value, found;
2265     u8 flq;
2266     int rc;
2267 
2268     rc = cudbg_fill_meminfo(padap, &meminfo);
2269     if (rc)
2270         return rc;
2271 
2272     /* Get EGRESS and INGRESS context region size */
2273     for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
2274         found = 0;
2275         memset(&mem_desc, 0, sizeof(struct cudbg_mem_desc));
2276         for (j = 0; j < ARRAY_SIZE(meminfo.avail); j++) {
2277             rc = cudbg_get_mem_region(padap, &meminfo, j,
2278                           cudbg_region[i],
2279                           &mem_desc);
2280             if (!rc) {
2281                 found = 1;
2282                 rc = cudbg_get_mem_relative(padap, &meminfo, j,
2283                                 &mem_desc.base,
2284                                 &mem_desc.limit);
2285                 if (rc) {
2286                     ctx_info[i].exist = false;
2287                     break;
2288                 }
2289                 ctx_info[i].exist = true;
2290                 ctx_info[i].start = mem_desc.base;
2291                 ctx_info[i].end = mem_desc.limit;
2292                 mem_type[i] = j;
2293                 break;
2294             }
2295         }
2296         if (!found)
2297             ctx_info[i].exist = false;
2298     }
2299 
2300     /* Get FLM and CNM max qid. */
2301     value = t4_read_reg(padap, SGE_FLM_CFG_A);
2302 
2303     /* Get number of data freelist queues */
2304     flq = HDRSTARTFLQ_G(value);
2305     ctx_info[CTXT_FLM].exist = true;
2306     ctx_info[CTXT_FLM].end = (CUDBG_MAX_FL_QIDS >> flq) * SGE_CTXT_SIZE;
2307 
2308     /* The number of CONM contexts are same as number of freelist
2309      * queues.
2310      */
2311     ctx_info[CTXT_CNM].exist = true;
2312     ctx_info[CTXT_CNM].end = ctx_info[CTXT_FLM].end;
2313 
2314     return 0;
2315 }
2316 
2317 int cudbg_dump_context_size(struct adapter *padap)
2318 {
2319     struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
2320     u8 mem_type[CTXT_INGRESS + 1] = { 0 };
2321     u32 i, size = 0;
2322     int rc;
2323 
2324     /* Get max valid qid for each type of queue */
2325     rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
2326     if (rc)
2327         return rc;
2328 
2329     for (i = 0; i < CTXT_CNM; i++) {
2330         if (!region_info[i].exist) {
2331             if (i == CTXT_EGRESS || i == CTXT_INGRESS)
2332                 size += CUDBG_LOWMEM_MAX_CTXT_QIDS *
2333                     SGE_CTXT_SIZE;
2334             continue;
2335         }
2336 
2337         size += (region_info[i].end - region_info[i].start + 1) /
2338             SGE_CTXT_SIZE;
2339     }
2340     return size * sizeof(struct cudbg_ch_cntxt);
2341 }
2342 
2343 static void cudbg_read_sge_ctxt(struct cudbg_init *pdbg_init, u32 cid,
2344                 enum ctxt_type ctype, u32 *data)
2345 {
2346     struct adapter *padap = pdbg_init->adap;
2347     int rc = -1;
2348 
2349     /* Under heavy traffic, the SGE Queue contexts registers will be
2350      * frequently accessed by firmware.
2351      *
2352      * To avoid conflicts with firmware, always ask firmware to fetch
2353      * the SGE Queue contexts via mailbox. On failure, fallback to
2354      * accessing hardware registers directly.
2355      */
2356     if (is_fw_attached(pdbg_init))
2357         rc = t4_sge_ctxt_rd(padap, padap->mbox, cid, ctype, data);
2358     if (rc)
2359         t4_sge_ctxt_rd_bd(padap, cid, ctype, data);
2360 }
2361 
2362 static void cudbg_get_sge_ctxt_fw(struct cudbg_init *pdbg_init, u32 max_qid,
2363                   u8 ctxt_type,
2364                   struct cudbg_ch_cntxt **out_buff)
2365 {
2366     struct cudbg_ch_cntxt *buff = *out_buff;
2367     int rc;
2368     u32 j;
2369 
2370     for (j = 0; j < max_qid; j++) {
2371         cudbg_read_sge_ctxt(pdbg_init, j, ctxt_type, buff->data);
2372         rc = cudbg_sge_ctxt_check_valid(buff->data, ctxt_type);
2373         if (!rc)
2374             continue;
2375 
2376         buff->cntxt_type = ctxt_type;
2377         buff->cntxt_id = j;
2378         buff++;
2379         if (ctxt_type == CTXT_FLM) {
2380             cudbg_read_sge_ctxt(pdbg_init, j, CTXT_CNM, buff->data);
2381             buff->cntxt_type = CTXT_CNM;
2382             buff->cntxt_id = j;
2383             buff++;
2384         }
2385     }
2386 
2387     *out_buff = buff;
2388 }
2389 
2390 int cudbg_collect_dump_context(struct cudbg_init *pdbg_init,
2391                    struct cudbg_buffer *dbg_buff,
2392                    struct cudbg_error *cudbg_err)
2393 {
2394     struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
2395     struct adapter *padap = pdbg_init->adap;
2396     u32 j, size, max_ctx_size, max_ctx_qid;
2397     u8 mem_type[CTXT_INGRESS + 1] = { 0 };
2398     struct cudbg_buffer temp_buff = { 0 };
2399     struct cudbg_ch_cntxt *buff;
2400     u8 *ctx_buf;
2401     u8 i, k;
2402     int rc;
2403 
2404     /* Get max valid qid for each type of queue */
2405     rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
2406     if (rc)
2407         return rc;
2408 
2409     rc = cudbg_dump_context_size(padap);
2410     if (rc <= 0)
2411         return CUDBG_STATUS_ENTITY_NOT_FOUND;
2412 
2413     size = rc;
2414     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2415     if (rc)
2416         return rc;
2417 
2418     /* Get buffer with enough space to read the biggest context
2419      * region in memory.
2420      */
2421     max_ctx_size = max(region_info[CTXT_EGRESS].end -
2422                region_info[CTXT_EGRESS].start + 1,
2423                region_info[CTXT_INGRESS].end -
2424                region_info[CTXT_INGRESS].start + 1);
2425 
2426     ctx_buf = kvzalloc(max_ctx_size, GFP_KERNEL);
2427     if (!ctx_buf) {
2428         cudbg_put_buff(pdbg_init, &temp_buff);
2429         return -ENOMEM;
2430     }
2431 
2432     buff = (struct cudbg_ch_cntxt *)temp_buff.data;
2433 
2434     /* Collect EGRESS and INGRESS context data.
2435      * In case of failures, fallback to collecting via FW or
2436      * backdoor access.
2437      */
2438     for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
2439         if (!region_info[i].exist) {
2440             max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2441             cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2442                           &buff);
2443             continue;
2444         }
2445 
2446         max_ctx_size = region_info[i].end - region_info[i].start + 1;
2447         max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2448 
2449         /* If firmware is not attached/alive, use backdoor register
2450          * access to collect dump.
2451          */
2452         if (is_fw_attached(pdbg_init)) {
2453             t4_sge_ctxt_flush(padap, padap->mbox, i);
2454 
2455             rc = t4_memory_rw(padap, MEMWIN_NIC, mem_type[i],
2456                       region_info[i].start, max_ctx_size,
2457                       (__be32 *)ctx_buf, 1);
2458         }
2459 
2460         if (rc || !is_fw_attached(pdbg_init)) {
2461             max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2462             cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2463                           &buff);
2464             continue;
2465         }
2466 
2467         for (j = 0; j < max_ctx_qid; j++) {
2468             __be64 *dst_off;
2469             u64 *src_off;
2470 
2471             src_off = (u64 *)(ctx_buf + j * SGE_CTXT_SIZE);
2472             dst_off = (__be64 *)buff->data;
2473 
2474             /* The data is stored in 64-bit cpu order.  Convert it
2475              * to big endian before parsing.
2476              */
2477             for (k = 0; k < SGE_CTXT_SIZE / sizeof(u64); k++)
2478                 dst_off[k] = cpu_to_be64(src_off[k]);
2479 
2480             rc = cudbg_sge_ctxt_check_valid(buff->data, i);
2481             if (!rc)
2482                 continue;
2483 
2484             buff->cntxt_type = i;
2485             buff->cntxt_id = j;
2486             buff++;
2487         }
2488     }
2489 
2490     kvfree(ctx_buf);
2491 
2492     /* Collect FREELIST and CONGESTION MANAGER contexts */
2493     max_ctx_size = region_info[CTXT_FLM].end -
2494                region_info[CTXT_FLM].start + 1;
2495     max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2496     /* Since FLM and CONM are 1-to-1 mapped, the below function
2497      * will fetch both FLM and CONM contexts.
2498      */
2499     cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, CTXT_FLM, &buff);
2500 
2501     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2502 }
2503 
2504 static inline void cudbg_tcamxy2valmask(u64 x, u64 y, u8 *addr, u64 *mask)
2505 {
2506     *mask = x | y;
2507     y = (__force u64)cpu_to_be64(y);
2508     memcpy(addr, (char *)&y + 2, ETH_ALEN);
2509 }
2510 
2511 static void cudbg_mps_rpl_backdoor(struct adapter *padap,
2512                    struct fw_ldst_mps_rplc *mps_rplc)
2513 {
2514     if (is_t5(padap->params.chip)) {
2515         mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2516                               MPS_VF_RPLCT_MAP3_A));
2517         mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2518                               MPS_VF_RPLCT_MAP2_A));
2519         mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2520                               MPS_VF_RPLCT_MAP1_A));
2521         mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2522                               MPS_VF_RPLCT_MAP0_A));
2523     } else {
2524         mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2525                               MPS_VF_RPLCT_MAP7_A));
2526         mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2527                               MPS_VF_RPLCT_MAP6_A));
2528         mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2529                               MPS_VF_RPLCT_MAP5_A));
2530         mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2531                               MPS_VF_RPLCT_MAP4_A));
2532     }
2533     mps_rplc->rplc127_96 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP3_A));
2534     mps_rplc->rplc95_64 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP2_A));
2535     mps_rplc->rplc63_32 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP1_A));
2536     mps_rplc->rplc31_0 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP0_A));
2537 }
2538 
2539 static int cudbg_collect_tcam_index(struct cudbg_init *pdbg_init,
2540                     struct cudbg_mps_tcam *tcam, u32 idx)
2541 {
2542     struct adapter *padap = pdbg_init->adap;
2543     u64 tcamy, tcamx, val;
2544     u32 ctl, data2;
2545     int rc = 0;
2546 
2547     if (CHELSIO_CHIP_VERSION(padap->params.chip) >= CHELSIO_T6) {
2548         /* CtlReqID   - 1: use Host Driver Requester ID
2549          * CtlCmdType - 0: Read, 1: Write
2550          * CtlTcamSel - 0: TCAM0, 1: TCAM1
2551          * CtlXYBitSel- 0: Y bit, 1: X bit
2552          */
2553 
2554         /* Read tcamy */
2555         ctl = CTLREQID_V(1) | CTLCMDTYPE_V(0) | CTLXYBITSEL_V(0);
2556         if (idx < 256)
2557             ctl |= CTLTCAMINDEX_V(idx) | CTLTCAMSEL_V(0);
2558         else
2559             ctl |= CTLTCAMINDEX_V(idx - 256) | CTLTCAMSEL_V(1);
2560 
2561         t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2562         val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2563         tcamy = DMACH_G(val) << 32;
2564         tcamy |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2565         data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2566         tcam->lookup_type = DATALKPTYPE_G(data2);
2567 
2568         /* 0 - Outer header, 1 - Inner header
2569          * [71:48] bit locations are overloaded for
2570          * outer vs. inner lookup types.
2571          */
2572         if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2573             /* Inner header VNI */
2574             tcam->vniy = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2575             tcam->vniy = (tcam->vniy << 16) | VIDL_G(val);
2576             tcam->dip_hit = data2 & DATADIPHIT_F;
2577         } else {
2578             tcam->vlan_vld = data2 & DATAVIDH2_F;
2579             tcam->ivlan = VIDL_G(val);
2580         }
2581 
2582         tcam->port_num = DATAPORTNUM_G(data2);
2583 
2584         /* Read tcamx. Change the control param */
2585         ctl |= CTLXYBITSEL_V(1);
2586         t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2587         val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2588         tcamx = DMACH_G(val) << 32;
2589         tcamx |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2590         data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2591         if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2592             /* Inner header VNI mask */
2593             tcam->vnix = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2594             tcam->vnix = (tcam->vnix << 16) | VIDL_G(val);
2595         }
2596     } else {
2597         tcamy = t4_read_reg64(padap, MPS_CLS_TCAM_Y_L(idx));
2598         tcamx = t4_read_reg64(padap, MPS_CLS_TCAM_X_L(idx));
2599     }
2600 
2601     /* If no entry, return */
2602     if (tcamx & tcamy)
2603         return rc;
2604 
2605     tcam->cls_lo = t4_read_reg(padap, MPS_CLS_SRAM_L(idx));
2606     tcam->cls_hi = t4_read_reg(padap, MPS_CLS_SRAM_H(idx));
2607 
2608     if (is_t5(padap->params.chip))
2609         tcam->repli = (tcam->cls_lo & REPLICATE_F);
2610     else if (is_t6(padap->params.chip))
2611         tcam->repli = (tcam->cls_lo & T6_REPLICATE_F);
2612 
2613     if (tcam->repli) {
2614         struct fw_ldst_cmd ldst_cmd;
2615         struct fw_ldst_mps_rplc mps_rplc;
2616 
2617         memset(&ldst_cmd, 0, sizeof(ldst_cmd));
2618         ldst_cmd.op_to_addrspace =
2619             htonl(FW_CMD_OP_V(FW_LDST_CMD) |
2620                   FW_CMD_REQUEST_F | FW_CMD_READ_F |
2621                   FW_LDST_CMD_ADDRSPACE_V(FW_LDST_ADDRSPC_MPS));
2622         ldst_cmd.cycles_to_len16 = htonl(FW_LEN16(ldst_cmd));
2623         ldst_cmd.u.mps.rplc.fid_idx =
2624             htons(FW_LDST_CMD_FID_V(FW_LDST_MPS_RPLC) |
2625                   FW_LDST_CMD_IDX_V(idx));
2626 
2627         /* If firmware is not attached/alive, use backdoor register
2628          * access to collect dump.
2629          */
2630         if (is_fw_attached(pdbg_init))
2631             rc = t4_wr_mbox(padap, padap->mbox, &ldst_cmd,
2632                     sizeof(ldst_cmd), &ldst_cmd);
2633 
2634         if (rc || !is_fw_attached(pdbg_init)) {
2635             cudbg_mps_rpl_backdoor(padap, &mps_rplc);
2636             /* Ignore error since we collected directly from
2637              * reading registers.
2638              */
2639             rc = 0;
2640         } else {
2641             mps_rplc = ldst_cmd.u.mps.rplc;
2642         }
2643 
2644         tcam->rplc[0] = ntohl(mps_rplc.rplc31_0);
2645         tcam->rplc[1] = ntohl(mps_rplc.rplc63_32);
2646         tcam->rplc[2] = ntohl(mps_rplc.rplc95_64);
2647         tcam->rplc[3] = ntohl(mps_rplc.rplc127_96);
2648         if (padap->params.arch.mps_rplc_size > CUDBG_MAX_RPLC_SIZE) {
2649             tcam->rplc[4] = ntohl(mps_rplc.rplc159_128);
2650             tcam->rplc[5] = ntohl(mps_rplc.rplc191_160);
2651             tcam->rplc[6] = ntohl(mps_rplc.rplc223_192);
2652             tcam->rplc[7] = ntohl(mps_rplc.rplc255_224);
2653         }
2654     }
2655     cudbg_tcamxy2valmask(tcamx, tcamy, tcam->addr, &tcam->mask);
2656     tcam->idx = idx;
2657     tcam->rplc_size = padap->params.arch.mps_rplc_size;
2658     return rc;
2659 }
2660 
2661 int cudbg_collect_mps_tcam(struct cudbg_init *pdbg_init,
2662                struct cudbg_buffer *dbg_buff,
2663                struct cudbg_error *cudbg_err)
2664 {
2665     struct adapter *padap = pdbg_init->adap;
2666     struct cudbg_buffer temp_buff = { 0 };
2667     u32 size = 0, i, n, total_size = 0;
2668     struct cudbg_mps_tcam *tcam;
2669     int rc;
2670 
2671     n = padap->params.arch.mps_tcam_size;
2672     size = sizeof(struct cudbg_mps_tcam) * n;
2673     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2674     if (rc)
2675         return rc;
2676 
2677     tcam = (struct cudbg_mps_tcam *)temp_buff.data;
2678     for (i = 0; i < n; i++) {
2679         rc = cudbg_collect_tcam_index(pdbg_init, tcam, i);
2680         if (rc) {
2681             cudbg_err->sys_err = rc;
2682             cudbg_put_buff(pdbg_init, &temp_buff);
2683             return rc;
2684         }
2685         total_size += sizeof(struct cudbg_mps_tcam);
2686         tcam++;
2687     }
2688 
2689     if (!total_size) {
2690         rc = CUDBG_SYSTEM_ERROR;
2691         cudbg_err->sys_err = rc;
2692         cudbg_put_buff(pdbg_init, &temp_buff);
2693         return rc;
2694     }
2695     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2696 }
2697 
2698 int cudbg_collect_vpd_data(struct cudbg_init *pdbg_init,
2699                struct cudbg_buffer *dbg_buff,
2700                struct cudbg_error *cudbg_err)
2701 {
2702     struct adapter *padap = pdbg_init->adap;
2703     struct cudbg_buffer temp_buff = { 0 };
2704     char vpd_str[CUDBG_VPD_VER_LEN + 1];
2705     struct cudbg_vpd_data *vpd_data;
2706     struct vpd_params vpd = { 0 };
2707     u32 vpd_vers, fw_vers;
2708     int rc;
2709 
2710     rc = t4_get_raw_vpd_params(padap, &vpd);
2711     if (rc)
2712         return rc;
2713 
2714     rc = t4_get_fw_version(padap, &fw_vers);
2715     if (rc)
2716         return rc;
2717 
2718     rc = cudbg_read_vpd_reg(padap, CUDBG_VPD_VER_ADDR, CUDBG_VPD_VER_LEN,
2719                 vpd_str);
2720     if (rc)
2721         return rc;
2722 
2723     vpd_str[CUDBG_VPD_VER_LEN] = '\0';
2724     rc = kstrtouint(vpd_str, 0, &vpd_vers);
2725     if (rc)
2726         return rc;
2727 
2728     rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_vpd_data),
2729                 &temp_buff);
2730     if (rc)
2731         return rc;
2732 
2733     vpd_data = (struct cudbg_vpd_data *)temp_buff.data;
2734     memcpy(vpd_data->sn, vpd.sn, SERNUM_LEN + 1);
2735     memcpy(vpd_data->bn, vpd.pn, PN_LEN + 1);
2736     memcpy(vpd_data->na, vpd.na, MACADDR_LEN + 1);
2737     memcpy(vpd_data->mn, vpd.id, ID_LEN + 1);
2738     vpd_data->scfg_vers = t4_read_reg(padap, PCIE_STATIC_SPARE2_A);
2739     vpd_data->vpd_vers = vpd_vers;
2740     vpd_data->fw_major = FW_HDR_FW_VER_MAJOR_G(fw_vers);
2741     vpd_data->fw_minor = FW_HDR_FW_VER_MINOR_G(fw_vers);
2742     vpd_data->fw_micro = FW_HDR_FW_VER_MICRO_G(fw_vers);
2743     vpd_data->fw_build = FW_HDR_FW_VER_BUILD_G(fw_vers);
2744     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2745 }
2746 
2747 static int cudbg_read_tid(struct cudbg_init *pdbg_init, u32 tid,
2748               struct cudbg_tid_data *tid_data)
2749 {
2750     struct adapter *padap = pdbg_init->adap;
2751     int i, cmd_retry = 8;
2752     u32 val;
2753 
2754     /* Fill REQ_DATA regs with 0's */
2755     for (i = 0; i < NUM_LE_DB_DBGI_REQ_DATA_INSTANCES; i++)
2756         t4_write_reg(padap, LE_DB_DBGI_REQ_DATA_A + (i << 2), 0);
2757 
2758     /* Write DBIG command */
2759     val = DBGICMD_V(4) | DBGITID_V(tid);
2760     t4_write_reg(padap, LE_DB_DBGI_REQ_TCAM_CMD_A, val);
2761     tid_data->dbig_cmd = val;
2762 
2763     val = DBGICMDSTRT_F | DBGICMDMODE_V(1); /* LE mode */
2764     t4_write_reg(padap, LE_DB_DBGI_CONFIG_A, val);
2765     tid_data->dbig_conf = val;
2766 
2767     /* Poll the DBGICMDBUSY bit */
2768     val = 1;
2769     while (val) {
2770         val = t4_read_reg(padap, LE_DB_DBGI_CONFIG_A);
2771         val = val & DBGICMDBUSY_F;
2772         cmd_retry--;
2773         if (!cmd_retry)
2774             return CUDBG_SYSTEM_ERROR;
2775     }
2776 
2777     /* Check RESP status */
2778     val = t4_read_reg(padap, LE_DB_DBGI_RSP_STATUS_A);
2779     tid_data->dbig_rsp_stat = val;
2780     if (!(val & 1))
2781         return CUDBG_SYSTEM_ERROR;
2782 
2783     /* Read RESP data */
2784     for (i = 0; i < NUM_LE_DB_DBGI_RSP_DATA_INSTANCES; i++)
2785         tid_data->data[i] = t4_read_reg(padap,
2786                         LE_DB_DBGI_RSP_DATA_A +
2787                         (i << 2));
2788     tid_data->tid = tid;
2789     return 0;
2790 }
2791 
2792 static int cudbg_get_le_type(u32 tid, struct cudbg_tcam tcam_region)
2793 {
2794     int type = LE_ET_UNKNOWN;
2795 
2796     if (tid < tcam_region.server_start)
2797         type = LE_ET_TCAM_CON;
2798     else if (tid < tcam_region.filter_start)
2799         type = LE_ET_TCAM_SERVER;
2800     else if (tid < tcam_region.clip_start)
2801         type = LE_ET_TCAM_FILTER;
2802     else if (tid < tcam_region.routing_start)
2803         type = LE_ET_TCAM_CLIP;
2804     else if (tid < tcam_region.tid_hash_base)
2805         type = LE_ET_TCAM_ROUTING;
2806     else if (tid < tcam_region.max_tid)
2807         type = LE_ET_HASH_CON;
2808     else
2809         type = LE_ET_INVALID_TID;
2810 
2811     return type;
2812 }
2813 
2814 static int cudbg_is_ipv6_entry(struct cudbg_tid_data *tid_data,
2815                    struct cudbg_tcam tcam_region)
2816 {
2817     int ipv6 = 0;
2818     int le_type;
2819 
2820     le_type = cudbg_get_le_type(tid_data->tid, tcam_region);
2821     if (tid_data->tid & 1)
2822         return 0;
2823 
2824     if (le_type == LE_ET_HASH_CON) {
2825         ipv6 = tid_data->data[16] & 0x8000;
2826     } else if (le_type == LE_ET_TCAM_CON) {
2827         ipv6 = tid_data->data[16] & 0x8000;
2828         if (ipv6)
2829             ipv6 = tid_data->data[9] == 0x00C00000;
2830     } else {
2831         ipv6 = 0;
2832     }
2833     return ipv6;
2834 }
2835 
2836 void cudbg_fill_le_tcam_info(struct adapter *padap,
2837                  struct cudbg_tcam *tcam_region)
2838 {
2839     u32 value;
2840 
2841     /* Get the LE regions */
2842     value = t4_read_reg(padap, LE_DB_TID_HASHBASE_A); /* hash base index */
2843     tcam_region->tid_hash_base = value;
2844 
2845     /* Get routing table index */
2846     value = t4_read_reg(padap, LE_DB_ROUTING_TABLE_INDEX_A);
2847     tcam_region->routing_start = value;
2848 
2849     /* Get clip table index. For T6 there is separate CLIP TCAM */
2850     if (is_t6(padap->params.chip))
2851         value = t4_read_reg(padap, LE_DB_CLCAM_TID_BASE_A);
2852     else
2853         value = t4_read_reg(padap, LE_DB_CLIP_TABLE_INDEX_A);
2854     tcam_region->clip_start = value;
2855 
2856     /* Get filter table index */
2857     value = t4_read_reg(padap, LE_DB_FILTER_TABLE_INDEX_A);
2858     tcam_region->filter_start = value;
2859 
2860     /* Get server table index */
2861     value = t4_read_reg(padap, LE_DB_SERVER_INDEX_A);
2862     tcam_region->server_start = value;
2863 
2864     /* Check whether hash is enabled and calculate the max tids */
2865     value = t4_read_reg(padap, LE_DB_CONFIG_A);
2866     if ((value >> HASHEN_S) & 1) {
2867         value = t4_read_reg(padap, LE_DB_HASH_CONFIG_A);
2868         if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5) {
2869             tcam_region->max_tid = (value & 0xFFFFF) +
2870                            tcam_region->tid_hash_base;
2871         } else {
2872             value = HASHTIDSIZE_G(value);
2873             value = 1 << value;
2874             tcam_region->max_tid = value +
2875                            tcam_region->tid_hash_base;
2876         }
2877     } else { /* hash not enabled */
2878         if (is_t6(padap->params.chip))
2879             tcam_region->max_tid = (value & ASLIPCOMPEN_F) ?
2880                            CUDBG_MAX_TID_COMP_EN :
2881                            CUDBG_MAX_TID_COMP_DIS;
2882         else
2883             tcam_region->max_tid = CUDBG_MAX_TCAM_TID;
2884     }
2885 
2886     if (is_t6(padap->params.chip))
2887         tcam_region->max_tid += CUDBG_T6_CLIP;
2888 }
2889 
2890 int cudbg_collect_le_tcam(struct cudbg_init *pdbg_init,
2891               struct cudbg_buffer *dbg_buff,
2892               struct cudbg_error *cudbg_err)
2893 {
2894     struct adapter *padap = pdbg_init->adap;
2895     struct cudbg_buffer temp_buff = { 0 };
2896     struct cudbg_tcam tcam_region = { 0 };
2897     struct cudbg_tid_data *tid_data;
2898     u32 bytes = 0;
2899     int rc, size;
2900     u32 i;
2901 
2902     cudbg_fill_le_tcam_info(padap, &tcam_region);
2903 
2904     size = sizeof(struct cudbg_tid_data) * tcam_region.max_tid;
2905     size += sizeof(struct cudbg_tcam);
2906     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2907     if (rc)
2908         return rc;
2909 
2910     memcpy(temp_buff.data, &tcam_region, sizeof(struct cudbg_tcam));
2911     bytes = sizeof(struct cudbg_tcam);
2912     tid_data = (struct cudbg_tid_data *)(temp_buff.data + bytes);
2913     /* read all tid */
2914     for (i = 0; i < tcam_region.max_tid; ) {
2915         rc = cudbg_read_tid(pdbg_init, i, tid_data);
2916         if (rc) {
2917             cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
2918             /* Update tcam header and exit */
2919             tcam_region.max_tid = i;
2920             memcpy(temp_buff.data, &tcam_region,
2921                    sizeof(struct cudbg_tcam));
2922             goto out;
2923         }
2924 
2925         if (cudbg_is_ipv6_entry(tid_data, tcam_region)) {
2926             /* T6 CLIP TCAM: ipv6 takes 4 entries */
2927             if (is_t6(padap->params.chip) &&
2928                 i >= tcam_region.clip_start &&
2929                 i < tcam_region.clip_start + CUDBG_T6_CLIP)
2930                 i += 4;
2931             else /* Main TCAM: ipv6 takes two tids */
2932                 i += 2;
2933         } else {
2934             i++;
2935         }
2936 
2937         tid_data++;
2938         bytes += sizeof(struct cudbg_tid_data);
2939     }
2940 
2941 out:
2942     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2943 }
2944 
2945 int cudbg_collect_cctrl(struct cudbg_init *pdbg_init,
2946             struct cudbg_buffer *dbg_buff,
2947             struct cudbg_error *cudbg_err)
2948 {
2949     struct adapter *padap = pdbg_init->adap;
2950     struct cudbg_buffer temp_buff = { 0 };
2951     u32 size;
2952     int rc;
2953 
2954     size = sizeof(u16) * NMTUS * NCCTRL_WIN;
2955     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2956     if (rc)
2957         return rc;
2958 
2959     t4_read_cong_tbl(padap, (void *)temp_buff.data);
2960     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2961 }
2962 
2963 int cudbg_collect_ma_indirect(struct cudbg_init *pdbg_init,
2964                   struct cudbg_buffer *dbg_buff,
2965                   struct cudbg_error *cudbg_err)
2966 {
2967     struct adapter *padap = pdbg_init->adap;
2968     struct cudbg_buffer temp_buff = { 0 };
2969     struct ireg_buf *ma_indr;
2970     int i, rc, n;
2971     u32 size, j;
2972 
2973     if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
2974         return CUDBG_STATUS_ENTITY_NOT_FOUND;
2975 
2976     n = sizeof(t6_ma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
2977     size = sizeof(struct ireg_buf) * n * 2;
2978     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2979     if (rc)
2980         return rc;
2981 
2982     ma_indr = (struct ireg_buf *)temp_buff.data;
2983     for (i = 0; i < n; i++) {
2984         struct ireg_field *ma_fli = &ma_indr->tp_pio;
2985         u32 *buff = ma_indr->outbuf;
2986 
2987         ma_fli->ireg_addr = t6_ma_ireg_array[i][0];
2988         ma_fli->ireg_data = t6_ma_ireg_array[i][1];
2989         ma_fli->ireg_local_offset = t6_ma_ireg_array[i][2];
2990         ma_fli->ireg_offset_range = t6_ma_ireg_array[i][3];
2991         t4_read_indirect(padap, ma_fli->ireg_addr, ma_fli->ireg_data,
2992                  buff, ma_fli->ireg_offset_range,
2993                  ma_fli->ireg_local_offset);
2994         ma_indr++;
2995     }
2996 
2997     n = sizeof(t6_ma_ireg_array2) / (IREG_NUM_ELEM * sizeof(u32));
2998     for (i = 0; i < n; i++) {
2999         struct ireg_field *ma_fli = &ma_indr->tp_pio;
3000         u32 *buff = ma_indr->outbuf;
3001 
3002         ma_fli->ireg_addr = t6_ma_ireg_array2[i][0];
3003         ma_fli->ireg_data = t6_ma_ireg_array2[i][1];
3004         ma_fli->ireg_local_offset = t6_ma_ireg_array2[i][2];
3005         for (j = 0; j < t6_ma_ireg_array2[i][3]; j++) {
3006             t4_read_indirect(padap, ma_fli->ireg_addr,
3007                      ma_fli->ireg_data, buff, 1,
3008                      ma_fli->ireg_local_offset);
3009             buff++;
3010             ma_fli->ireg_local_offset += 0x20;
3011         }
3012         ma_indr++;
3013     }
3014     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3015 }
3016 
3017 int cudbg_collect_ulptx_la(struct cudbg_init *pdbg_init,
3018                struct cudbg_buffer *dbg_buff,
3019                struct cudbg_error *cudbg_err)
3020 {
3021     struct adapter *padap = pdbg_init->adap;
3022     struct cudbg_buffer temp_buff = { 0 };
3023     struct cudbg_ulptx_la *ulptx_la_buff;
3024     struct cudbg_ver_hdr *ver_hdr;
3025     u32 i, j;
3026     int rc;
3027 
3028     rc = cudbg_get_buff(pdbg_init, dbg_buff,
3029                 sizeof(struct cudbg_ver_hdr) +
3030                 sizeof(struct cudbg_ulptx_la),
3031                 &temp_buff);
3032     if (rc)
3033         return rc;
3034 
3035     ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
3036     ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
3037     ver_hdr->revision = CUDBG_ULPTX_LA_REV;
3038     ver_hdr->size = sizeof(struct cudbg_ulptx_la);
3039 
3040     ulptx_la_buff = (struct cudbg_ulptx_la *)(temp_buff.data +
3041                           sizeof(*ver_hdr));
3042     for (i = 0; i < CUDBG_NUM_ULPTX; i++) {
3043         ulptx_la_buff->rdptr[i] = t4_read_reg(padap,
3044                               ULP_TX_LA_RDPTR_0_A +
3045                               0x10 * i);
3046         ulptx_la_buff->wrptr[i] = t4_read_reg(padap,
3047                               ULP_TX_LA_WRPTR_0_A +
3048                               0x10 * i);
3049         ulptx_la_buff->rddata[i] = t4_read_reg(padap,
3050                                ULP_TX_LA_RDDATA_0_A +
3051                                0x10 * i);
3052         for (j = 0; j < CUDBG_NUM_ULPTX_READ; j++)
3053             ulptx_la_buff->rd_data[i][j] =
3054                 t4_read_reg(padap,
3055                         ULP_TX_LA_RDDATA_0_A + 0x10 * i);
3056     }
3057 
3058     for (i = 0; i < CUDBG_NUM_ULPTX_ASIC_READ; i++) {
3059         t4_write_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A, 0x1);
3060         ulptx_la_buff->rdptr_asic[i] =
3061                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A);
3062         ulptx_la_buff->rddata_asic[i][0] =
3063                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_0_A);
3064         ulptx_la_buff->rddata_asic[i][1] =
3065                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_1_A);
3066         ulptx_la_buff->rddata_asic[i][2] =
3067                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_2_A);
3068         ulptx_la_buff->rddata_asic[i][3] =
3069                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_3_A);
3070         ulptx_la_buff->rddata_asic[i][4] =
3071                 t4_read_reg(padap, ULP_TX_ASIC_DEBUG_4_A);
3072         ulptx_la_buff->rddata_asic[i][5] =
3073                 t4_read_reg(padap, PM_RX_BASE_ADDR);
3074     }
3075 
3076     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3077 }
3078 
3079 int cudbg_collect_up_cim_indirect(struct cudbg_init *pdbg_init,
3080                   struct cudbg_buffer *dbg_buff,
3081                   struct cudbg_error *cudbg_err)
3082 {
3083     struct adapter *padap = pdbg_init->adap;
3084     struct cudbg_buffer temp_buff = { 0 };
3085     u32 local_offset, local_range;
3086     struct ireg_buf *up_cim;
3087     u32 size, j, iter;
3088     u32 instance = 0;
3089     int i, rc, n;
3090 
3091     if (is_t5(padap->params.chip))
3092         n = sizeof(t5_up_cim_reg_array) /
3093             ((IREG_NUM_ELEM + 1) * sizeof(u32));
3094     else if (is_t6(padap->params.chip))
3095         n = sizeof(t6_up_cim_reg_array) /
3096             ((IREG_NUM_ELEM + 1) * sizeof(u32));
3097     else
3098         return CUDBG_STATUS_NOT_IMPLEMENTED;
3099 
3100     size = sizeof(struct ireg_buf) * n;
3101     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3102     if (rc)
3103         return rc;
3104 
3105     up_cim = (struct ireg_buf *)temp_buff.data;
3106     for (i = 0; i < n; i++) {
3107         struct ireg_field *up_cim_reg = &up_cim->tp_pio;
3108         u32 *buff = up_cim->outbuf;
3109 
3110         if (is_t5(padap->params.chip)) {
3111             up_cim_reg->ireg_addr = t5_up_cim_reg_array[i][0];
3112             up_cim_reg->ireg_data = t5_up_cim_reg_array[i][1];
3113             up_cim_reg->ireg_local_offset =
3114                         t5_up_cim_reg_array[i][2];
3115             up_cim_reg->ireg_offset_range =
3116                         t5_up_cim_reg_array[i][3];
3117             instance = t5_up_cim_reg_array[i][4];
3118         } else if (is_t6(padap->params.chip)) {
3119             up_cim_reg->ireg_addr = t6_up_cim_reg_array[i][0];
3120             up_cim_reg->ireg_data = t6_up_cim_reg_array[i][1];
3121             up_cim_reg->ireg_local_offset =
3122                         t6_up_cim_reg_array[i][2];
3123             up_cim_reg->ireg_offset_range =
3124                         t6_up_cim_reg_array[i][3];
3125             instance = t6_up_cim_reg_array[i][4];
3126         }
3127 
3128         switch (instance) {
3129         case NUM_CIM_CTL_TSCH_CHANNEL_INSTANCES:
3130             iter = up_cim_reg->ireg_offset_range;
3131             local_offset = 0x120;
3132             local_range = 1;
3133             break;
3134         case NUM_CIM_CTL_TSCH_CHANNEL_TSCH_CLASS_INSTANCES:
3135             iter = up_cim_reg->ireg_offset_range;
3136             local_offset = 0x10;
3137             local_range = 1;
3138             break;
3139         default:
3140             iter = 1;
3141             local_offset = 0;
3142             local_range = up_cim_reg->ireg_offset_range;
3143             break;
3144         }
3145 
3146         for (j = 0; j < iter; j++, buff++) {
3147             rc = t4_cim_read(padap,
3148                      up_cim_reg->ireg_local_offset +
3149                      (j * local_offset), local_range, buff);
3150             if (rc) {
3151                 cudbg_put_buff(pdbg_init, &temp_buff);
3152                 return rc;
3153             }
3154         }
3155         up_cim++;
3156     }
3157     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3158 }
3159 
3160 int cudbg_collect_pbt_tables(struct cudbg_init *pdbg_init,
3161                  struct cudbg_buffer *dbg_buff,
3162                  struct cudbg_error *cudbg_err)
3163 {
3164     struct adapter *padap = pdbg_init->adap;
3165     struct cudbg_buffer temp_buff = { 0 };
3166     struct cudbg_pbt_tables *pbt;
3167     int i, rc;
3168     u32 addr;
3169 
3170     rc = cudbg_get_buff(pdbg_init, dbg_buff,
3171                 sizeof(struct cudbg_pbt_tables),
3172                 &temp_buff);
3173     if (rc)
3174         return rc;
3175 
3176     pbt = (struct cudbg_pbt_tables *)temp_buff.data;
3177     /* PBT dynamic entries */
3178     addr = CUDBG_CHAC_PBT_ADDR;
3179     for (i = 0; i < CUDBG_PBT_DYNAMIC_ENTRIES; i++) {
3180         rc = t4_cim_read(padap, addr + (i * 4), 1,
3181                  &pbt->pbt_dynamic[i]);
3182         if (rc) {
3183             cudbg_err->sys_err = rc;
3184             cudbg_put_buff(pdbg_init, &temp_buff);
3185             return rc;
3186         }
3187     }
3188 
3189     /* PBT static entries */
3190     /* static entries start when bit 6 is set */
3191     addr = CUDBG_CHAC_PBT_ADDR + (1 << 6);
3192     for (i = 0; i < CUDBG_PBT_STATIC_ENTRIES; i++) {
3193         rc = t4_cim_read(padap, addr + (i * 4), 1,
3194                  &pbt->pbt_static[i]);
3195         if (rc) {
3196             cudbg_err->sys_err = rc;
3197             cudbg_put_buff(pdbg_init, &temp_buff);
3198             return rc;
3199         }
3200     }
3201 
3202     /* LRF entries */
3203     addr = CUDBG_CHAC_PBT_LRF;
3204     for (i = 0; i < CUDBG_LRF_ENTRIES; i++) {
3205         rc = t4_cim_read(padap, addr + (i * 4), 1,
3206                  &pbt->lrf_table[i]);
3207         if (rc) {
3208             cudbg_err->sys_err = rc;
3209             cudbg_put_buff(pdbg_init, &temp_buff);
3210             return rc;
3211         }
3212     }
3213 
3214     /* PBT data entries */
3215     addr = CUDBG_CHAC_PBT_DATA;
3216     for (i = 0; i < CUDBG_PBT_DATA_ENTRIES; i++) {
3217         rc = t4_cim_read(padap, addr + (i * 4), 1,
3218                  &pbt->pbt_data[i]);
3219         if (rc) {
3220             cudbg_err->sys_err = rc;
3221             cudbg_put_buff(pdbg_init, &temp_buff);
3222             return rc;
3223         }
3224     }
3225     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3226 }
3227 
3228 int cudbg_collect_mbox_log(struct cudbg_init *pdbg_init,
3229                struct cudbg_buffer *dbg_buff,
3230                struct cudbg_error *cudbg_err)
3231 {
3232     struct adapter *padap = pdbg_init->adap;
3233     struct cudbg_mbox_log *mboxlog = NULL;
3234     struct cudbg_buffer temp_buff = { 0 };
3235     struct mbox_cmd_log *log = NULL;
3236     struct mbox_cmd *entry;
3237     unsigned int entry_idx;
3238     u16 mbox_cmds;
3239     int i, k, rc;
3240     u64 flit;
3241     u32 size;
3242 
3243     log = padap->mbox_log;
3244     mbox_cmds = padap->mbox_log->size;
3245     size = sizeof(struct cudbg_mbox_log) * mbox_cmds;
3246     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3247     if (rc)
3248         return rc;
3249 
3250     mboxlog = (struct cudbg_mbox_log *)temp_buff.data;
3251     for (k = 0; k < mbox_cmds; k++) {
3252         entry_idx = log->cursor + k;
3253         if (entry_idx >= log->size)
3254             entry_idx -= log->size;
3255 
3256         entry = mbox_cmd_log_entry(log, entry_idx);
3257         /* skip over unused entries */
3258         if (entry->timestamp == 0)
3259             continue;
3260 
3261         memcpy(&mboxlog->entry, entry, sizeof(struct mbox_cmd));
3262         for (i = 0; i < MBOX_LEN / 8; i++) {
3263             flit = entry->cmd[i];
3264             mboxlog->hi[i] = (u32)(flit >> 32);
3265             mboxlog->lo[i] = (u32)flit;
3266         }
3267         mboxlog++;
3268     }
3269     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3270 }
3271 
3272 int cudbg_collect_hma_indirect(struct cudbg_init *pdbg_init,
3273                    struct cudbg_buffer *dbg_buff,
3274                    struct cudbg_error *cudbg_err)
3275 {
3276     struct adapter *padap = pdbg_init->adap;
3277     struct cudbg_buffer temp_buff = { 0 };
3278     struct ireg_buf *hma_indr;
3279     int i, rc, n;
3280     u32 size;
3281 
3282     if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
3283         return CUDBG_STATUS_ENTITY_NOT_FOUND;
3284 
3285     n = sizeof(t6_hma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
3286     size = sizeof(struct ireg_buf) * n;
3287     rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3288     if (rc)
3289         return rc;
3290 
3291     hma_indr = (struct ireg_buf *)temp_buff.data;
3292     for (i = 0; i < n; i++) {
3293         struct ireg_field *hma_fli = &hma_indr->tp_pio;
3294         u32 *buff = hma_indr->outbuf;
3295 
3296         hma_fli->ireg_addr = t6_hma_ireg_array[i][0];
3297         hma_fli->ireg_data = t6_hma_ireg_array[i][1];
3298         hma_fli->ireg_local_offset = t6_hma_ireg_array[i][2];
3299         hma_fli->ireg_offset_range = t6_hma_ireg_array[i][3];
3300         t4_read_indirect(padap, hma_fli->ireg_addr, hma_fli->ireg_data,
3301                  buff, hma_fli->ireg_offset_range,
3302                  hma_fli->ireg_local_offset);
3303         hma_indr++;
3304     }
3305     return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3306 }
3307 
3308 void cudbg_fill_qdesc_num_and_size(const struct adapter *padap,
3309                    u32 *num, u32 *size)
3310 {
3311     u32 tot_entries = 0, tot_size = 0;
3312 
3313     /* NIC TXQ, RXQ, FLQ, and CTRLQ */
3314     tot_entries += MAX_ETH_QSETS * 3;
3315     tot_entries += MAX_CTRL_QUEUES;
3316 
3317     tot_size += MAX_ETH_QSETS * MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3318     tot_size += MAX_ETH_QSETS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
3319     tot_size += MAX_ETH_QSETS * MAX_RX_BUFFERS * MAX_FL_DESC_SIZE;
3320     tot_size += MAX_CTRL_QUEUES * MAX_CTRL_TXQ_ENTRIES *
3321             MAX_CTRL_TXQ_DESC_SIZE;
3322 
3323     /* FW_EVTQ and INTRQ */
3324     tot_entries += INGQ_EXTRAS;
3325     tot_size += INGQ_EXTRAS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
3326 
3327     /* PTP_TXQ */
3328     tot_entries += 1;
3329     tot_size += MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3330 
3331     /* ULD TXQ, RXQ, and FLQ */
3332     tot_entries += CXGB4_TX_MAX * MAX_OFLD_QSETS;
3333     tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS * 2;
3334 
3335     tot_size += CXGB4_TX_MAX * MAX_OFLD_QSETS * MAX_TXQ_ENTRIES *
3336             MAX_TXQ_DESC_SIZE;
3337     tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RSPQ_ENTRIES *
3338             MAX_RXQ_DESC_SIZE;
3339     tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RX_BUFFERS *
3340             MAX_FL_DESC_SIZE;
3341 
3342     /* ULD CIQ */
3343     tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS;
3344     tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * SGE_MAX_IQ_SIZE *
3345             MAX_RXQ_DESC_SIZE;
3346 
3347     /* ETHOFLD TXQ, RXQ, and FLQ */
3348     tot_entries += MAX_OFLD_QSETS * 3;
3349     tot_size += MAX_OFLD_QSETS * MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3350 
3351     tot_size += sizeof(struct cudbg_ver_hdr) +
3352             sizeof(struct cudbg_qdesc_info) +
3353             sizeof(struct cudbg_qdesc_entry) * tot_entries;
3354 
3355     if (num)
3356         *num = tot_entries;
3357 
3358     if (size)
3359         *size = tot_size;
3360 }
3361 
3362 int cudbg_collect_qdesc(struct cudbg_init *pdbg_init,
3363             struct cudbg_buffer *dbg_buff,
3364             struct cudbg_error *cudbg_err)
3365 {
3366     u32 num_queues = 0, tot_entries = 0, size = 0;
3367     struct adapter *padap = pdbg_init->adap;
3368     struct cudbg_buffer temp_buff = { 0 };
3369     struct cudbg_qdesc_entry *qdesc_entry;
3370     struct cudbg_qdesc_info *qdesc_info;
3371     struct cudbg_ver_hdr *ver_hdr;
3372     struct sge *s = &padap->sge;
3373     u32 i, j, cur_off, tot_len;
3374     u8 *data;
3375     int rc;
3376 
3377     cudbg_fill_qdesc_num_and_size(padap, &tot_entries, &size);
3378     size = min_t(u32, size, CUDBG_DUMP_BUFF_SIZE);
3379     tot_len = size;
3380     data = kvzalloc(size, GFP_KERNEL);
3381     if (!data)
3382         return -ENOMEM;
3383 
3384     ver_hdr = (struct cudbg_ver_hdr *)data;
3385     ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
3386     ver_hdr->revision = CUDBG_QDESC_REV;
3387     ver_hdr->size = sizeof(struct cudbg_qdesc_info);
3388     size -= sizeof(*ver_hdr);
3389 
3390     qdesc_info = (struct cudbg_qdesc_info *)(data +
3391                          sizeof(*ver_hdr));
3392     size -= sizeof(*qdesc_info);
3393     qdesc_entry = (struct cudbg_qdesc_entry *)qdesc_info->data;
3394 
3395 #define QDESC_GET(q, desc, type, label) do { \
3396     if (size <= 0) { \
3397         goto label; \
3398     } \
3399     if (desc) { \
3400         cudbg_fill_qdesc_##q(q, type, qdesc_entry); \
3401         size -= sizeof(*qdesc_entry) + qdesc_entry->data_size; \
3402         num_queues++; \
3403         qdesc_entry = cudbg_next_qdesc(qdesc_entry); \
3404     } \
3405 } while (0)
3406 
3407 #define QDESC_GET_TXQ(q, type, label) do { \
3408     struct sge_txq *txq = (struct sge_txq *)q; \
3409     QDESC_GET(txq, txq->desc, type, label); \
3410 } while (0)
3411 
3412 #define QDESC_GET_RXQ(q, type, label) do { \
3413     struct sge_rspq *rxq = (struct sge_rspq *)q; \
3414     QDESC_GET(rxq, rxq->desc, type, label); \
3415 } while (0)
3416 
3417 #define QDESC_GET_FLQ(q, type, label) do { \
3418     struct sge_fl *flq = (struct sge_fl *)q; \
3419     QDESC_GET(flq, flq->desc, type, label); \
3420 } while (0)
3421 
3422     /* NIC TXQ */
3423     for (i = 0; i < s->ethqsets; i++)
3424         QDESC_GET_TXQ(&s->ethtxq[i].q, CUDBG_QTYPE_NIC_TXQ, out);
3425 
3426     /* NIC RXQ */
3427     for (i = 0; i < s->ethqsets; i++)
3428         QDESC_GET_RXQ(&s->ethrxq[i].rspq, CUDBG_QTYPE_NIC_RXQ, out);
3429 
3430     /* NIC FLQ */
3431     for (i = 0; i < s->ethqsets; i++)
3432         QDESC_GET_FLQ(&s->ethrxq[i].fl, CUDBG_QTYPE_NIC_FLQ, out);
3433 
3434     /* NIC CTRLQ */
3435     for (i = 0; i < padap->params.nports; i++)
3436         QDESC_GET_TXQ(&s->ctrlq[i].q, CUDBG_QTYPE_CTRLQ, out);
3437 
3438     /* FW_EVTQ */
3439     QDESC_GET_RXQ(&s->fw_evtq, CUDBG_QTYPE_FWEVTQ, out);
3440 
3441     /* INTRQ */
3442     QDESC_GET_RXQ(&s->intrq, CUDBG_QTYPE_INTRQ, out);
3443 
3444     /* PTP_TXQ */
3445     QDESC_GET_TXQ(&s->ptptxq.q, CUDBG_QTYPE_PTP_TXQ, out);
3446 
3447     /* ULD Queues */
3448     mutex_lock(&uld_mutex);
3449 
3450     if (s->uld_txq_info) {
3451         struct sge_uld_txq_info *utxq;
3452 
3453         /* ULD TXQ */
3454         for (j = 0; j < CXGB4_TX_MAX; j++) {
3455             if (!s->uld_txq_info[j])
3456                 continue;
3457 
3458             utxq = s->uld_txq_info[j];
3459             for (i = 0; i < utxq->ntxq; i++)
3460                 QDESC_GET_TXQ(&utxq->uldtxq[i].q,
3461                           cudbg_uld_txq_to_qtype(j),
3462                           out_unlock_uld);
3463         }
3464     }
3465 
3466     if (s->uld_rxq_info) {
3467         struct sge_uld_rxq_info *urxq;
3468         u32 base;
3469 
3470         /* ULD RXQ */
3471         for (j = 0; j < CXGB4_ULD_MAX; j++) {
3472             if (!s->uld_rxq_info[j])
3473                 continue;
3474 
3475             urxq = s->uld_rxq_info[j];
3476             for (i = 0; i < urxq->nrxq; i++)
3477                 QDESC_GET_RXQ(&urxq->uldrxq[i].rspq,
3478                           cudbg_uld_rxq_to_qtype(j),
3479                           out_unlock_uld);
3480         }
3481 
3482         /* ULD FLQ */
3483         for (j = 0; j < CXGB4_ULD_MAX; j++) {
3484             if (!s->uld_rxq_info[j])
3485                 continue;
3486 
3487             urxq = s->uld_rxq_info[j];
3488             for (i = 0; i < urxq->nrxq; i++)
3489                 QDESC_GET_FLQ(&urxq->uldrxq[i].fl,
3490                           cudbg_uld_flq_to_qtype(j),
3491                           out_unlock_uld);
3492         }
3493 
3494         /* ULD CIQ */
3495         for (j = 0; j < CXGB4_ULD_MAX; j++) {
3496             if (!s->uld_rxq_info[j])
3497                 continue;
3498 
3499             urxq = s->uld_rxq_info[j];
3500             base = urxq->nrxq;
3501             for (i = 0; i < urxq->nciq; i++)
3502                 QDESC_GET_RXQ(&urxq->uldrxq[base + i].rspq,
3503                           cudbg_uld_ciq_to_qtype(j),
3504                           out_unlock_uld);
3505         }
3506     }
3507     mutex_unlock(&uld_mutex);
3508 
3509     if (!padap->tc_mqprio)
3510         goto out;
3511 
3512     mutex_lock(&padap->tc_mqprio->mqprio_mutex);
3513     /* ETHOFLD TXQ */
3514     if (s->eohw_txq)
3515         for (i = 0; i < s->eoqsets; i++)
3516             QDESC_GET_TXQ(&s->eohw_txq[i].q,
3517                       CUDBG_QTYPE_ETHOFLD_TXQ, out_unlock_mqprio);
3518 
3519     /* ETHOFLD RXQ and FLQ */
3520     if (s->eohw_rxq) {
3521         for (i = 0; i < s->eoqsets; i++)
3522             QDESC_GET_RXQ(&s->eohw_rxq[i].rspq,
3523                       CUDBG_QTYPE_ETHOFLD_RXQ, out_unlock_mqprio);
3524 
3525         for (i = 0; i < s->eoqsets; i++)
3526             QDESC_GET_FLQ(&s->eohw_rxq[i].fl,
3527                       CUDBG_QTYPE_ETHOFLD_FLQ, out_unlock_mqprio);
3528     }
3529 
3530 out_unlock_mqprio:
3531     mutex_unlock(&padap->tc_mqprio->mqprio_mutex);
3532 
3533 out:
3534     qdesc_info->qdesc_entry_size = sizeof(*qdesc_entry);
3535     qdesc_info->num_queues = num_queues;
3536     cur_off = 0;
3537     while (tot_len) {
3538         u32 chunk_size = min_t(u32, tot_len, CUDBG_CHUNK_SIZE);
3539 
3540         rc = cudbg_get_buff(pdbg_init, dbg_buff, chunk_size,
3541                     &temp_buff);
3542         if (rc) {
3543             cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3544             goto out_free;
3545         }
3546 
3547         memcpy(temp_buff.data, data + cur_off, chunk_size);
3548         tot_len -= chunk_size;
3549         cur_off += chunk_size;
3550         rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
3551                           dbg_buff);
3552         if (rc) {
3553             cudbg_put_buff(pdbg_init, &temp_buff);
3554             cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3555             goto out_free;
3556         }
3557     }
3558 
3559 out_free:
3560     kvfree(data);
3561 
3562 #undef QDESC_GET_FLQ
3563 #undef QDESC_GET_RXQ
3564 #undef QDESC_GET_TXQ
3565 #undef QDESC_GET
3566 
3567     return rc;
3568 
3569 out_unlock_uld:
3570     mutex_unlock(&uld_mutex);
3571     goto out;
3572 }
3573 
3574 int cudbg_collect_flash(struct cudbg_init *pdbg_init,
3575             struct cudbg_buffer *dbg_buff,
3576             struct cudbg_error *cudbg_err)
3577 {
3578     struct adapter *padap = pdbg_init->adap;
3579     u32 count = padap->params.sf_size, n;
3580     struct cudbg_buffer temp_buff = {0};
3581     u32 addr, i;
3582     int rc;
3583 
3584     addr = FLASH_EXP_ROM_START;
3585 
3586     for (i = 0; i < count; i += SF_PAGE_SIZE) {
3587         n = min_t(u32, count - i, SF_PAGE_SIZE);
3588 
3589         rc = cudbg_get_buff(pdbg_init, dbg_buff, n, &temp_buff);
3590         if (rc) {
3591             cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3592             goto out;
3593         }
3594         rc = t4_read_flash(padap, addr, n, (u32 *)temp_buff.data, 0);
3595         if (rc)
3596             goto out;
3597 
3598         addr += (n * 4);
3599         rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
3600                           dbg_buff);
3601         if (rc) {
3602             cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3603             goto out;
3604         }
3605     }
3606 
3607 out:
3608     return rc;
3609 }