1 /* SPDX-License-Identifier: GPL-2.0 */
/*
 * Common code shared by the skx_edac driver and the Intel 10nm server
 * EDAC driver. Originally split out from the skx_edac driver.
 *
 * Copyright (c) 2018, Intel Corporation.
 */
9 #ifndef _SKX_COMM_EDAC_H
10 #define _SKX_COMM_EDAC_H
12 #include <linux/bits.h>
/*
 * skx_printk - emit a message through edac_printk() with the "skx" tag.
 * @level: forwarded unchanged as the first argument of edac_printk()
 * @fmt:   printf-style format string; any further arguments follow it
 */
#define skx_printk(level, fmt, ...)				\
	edac_printk(level, "skx", fmt, ##__VA_ARGS__)
/*
 * skx_mc_printk - emit a per-memory-controller message through
 * edac_mc_chipset_printk() with the "skx" tag.
 * @mci:   forwarded unchanged as the first argument
 * @level: forwarded unchanged as the second argument
 * @fmt:   printf-style format string; any further arguments follow it
 */
#define skx_mc_printk(mci, level, fmt, ...)			\
	edac_mc_chipset_printk(mci, level, "skx", fmt, ##__VA_ARGS__)
/*
 * Get a bit field at register value <v>, from bit <lo> to bit <hi>
 * (both inclusive). The field is isolated with GENMASK_ULL() and then
 * shifted down so that bit <lo> becomes bit 0 of the result.
 */
#define GET_BITFIELD(v, lo, hi)	\
	(((v) & GENMASK_ULL((hi), (lo))) >> (lo))
/* Skylake-generation (skx) topology limits. */
#define SKX_NUM_IMC		2	/* Memory controllers per socket */
#define SKX_NUM_CHANNELS	3	/* Channels per memory controller */
#define SKX_NUM_DIMMS		2	/* Max DIMMS per channel */
/*
 * Larger of two values. Defined ahead of its first use below, and only
 * when no MAX() is already provided by an earlier header. Each argument
 * may be evaluated twice, so pass side-effect-free expressions only.
 */
#ifndef MAX
#define MAX(a, b)	((a) > (b) ? (a) : (b))
#endif

/* i10nm DDR limits: memory controllers, channels and DIMMs. */
#define I10NM_NUM_DDR_IMC	12
#define I10NM_NUM_DDR_CHANNELS	2
#define I10NM_NUM_DDR_DIMMS	2

/* i10nm HBM limits: memory controllers, channels and DIMMs. */
#define I10NM_NUM_HBM_IMC	16
#define I10NM_NUM_HBM_CHANNELS	2
#define I10NM_NUM_HBM_DIMMS	1

/* i10nm totals: controllers add up, the other limits take the larger kind. */
#define I10NM_NUM_IMC		(I10NM_NUM_DDR_IMC + I10NM_NUM_HBM_IMC)
#define I10NM_NUM_CHANNELS	MAX(I10NM_NUM_DDR_CHANNELS, I10NM_NUM_HBM_CHANNELS)
#define I10NM_NUM_DIMMS		MAX(I10NM_NUM_DDR_DIMMS, I10NM_NUM_HBM_DIMMS)

/* Limits large enough for both the skx and the i10nm values above. */
#define NUM_IMC			MAX(SKX_NUM_IMC, I10NM_NUM_IMC)
#define NUM_CHANNELS		MAX(SKX_NUM_CHANNELS, I10NM_NUM_CHANNELS)
#define NUM_DIMMS		MAX(SKX_NUM_DIMMS, I10NM_NUM_DIMMS)
/* Bit 15 of register value <r>; non-zero means a DIMM is present. */
#define IS_DIMM_PRESENT(r)		GET_BITFIELD(r, 15, 15)
/* Bit <i> of register value <r>; non-zero means an NVDIMM is present. */
#define IS_NVDIMM_PRESENT(r, i)		GET_BITFIELD(r, i, i)
/* ECC mode field: the four bits 62:59 of the MCi_MISC value <m>. */
#define MCI_MISC_ECC_MODE(m)	(((m) >> 59) & 15)
#define MCI_MISC_ECC_DDRT	8	/* read from DDRT */
/*
 * According to Intel Architecture spec vol 3B,
 * Table 15-10 "IA32_MCi_Status [15:0] Compound Error Code Encoding"
 * memory errors should fit one of these masks:
 *	000f 0000 1mmm cccc (binary)
 *	000f 0010 1mmm cccc (binary)	[RAM used as cache]
 * where:
 *	f = Correction Report Filtering Bit. If 1, subsequent errors
 *	    NOTE(review): the rest of this sentence is missing from this
 *	    copy of the header; restore it from the upstream file.
 *
 * The mask below drops bit 12 (f) and bits 6:0 (mmm cccc), leaving only
 * the fixed bits of the two patterns above for comparison.
 */
#define MCACOD_MEM_ERR_MASK	0xef80
/*
 * Errors from either the memory of the 1-level memory system or the
 * 2nd level memory (the slow "far" memory) of the 2-level memory system.
 */
#define MCACOD_MEM_CTL_ERR	0x80
/*
 * Errors from the 1st level memory (the fast "near" memory as cache)
 * of the 2-level memory system.
 */
#define MCACOD_EXT_MEM_ERR	0x280
/*
 * Each CPU socket contains some PCI devices that provide global
 * information, and also some that are local to each of the two
 * memory controllers on the die.
 */
89 struct list_head list;
92 struct pci_dev *sad_all;
93 struct pci_dev *util_all;
94 struct pci_dev *uracu; /* for i10nm CPU */
95 struct pci_dev *pcu_cr3; /* for HBM memory detection */
98 struct mem_ctl_info *mci;
99 struct pci_dev *mdev; /* for i10nm CPU */
100 void __iomem *mbase; /* for i10nm CPU */
101 int chan_mmio_sz; /* for i10nm CPU */
102 int num_channels; /* channels per memory controller */
103 int num_dimms; /* dimms per channel */
105 u8 mc; /* system wide mc# */
106 u8 lmc; /* socket relative mc# */
109 struct pci_dev *cdev;
110 struct pci_dev *edev;
111 u32 retry_rd_err_log_s;
112 u32 retry_rd_err_log_d;
113 u32 retry_rd_err_log_d2;
121 } chan[NUM_CHANNELS];
143 INDEX_NM_MEMCTRL = INDEX_NM_FIRST,
/* One-bit 64-bit masks, one per INDEX_NM_* index value. */
#define BIT_NM_MEMCTRL	BIT_ULL(INDEX_NM_MEMCTRL)
#define BIT_NM_CHANNEL	BIT_ULL(INDEX_NM_CHANNEL)
#define BIT_NM_DIMM	BIT_ULL(INDEX_NM_DIMM)
#define BIT_NM_CS	BIT_ULL(INDEX_NM_CS)
155 struct decoded_addr {
174 bool decoded_by_adxl;
185 /* Configuration agent device ID */
186 unsigned int decs_did;
187 /* Default bus number configuration register offset */
188 int busno_cfg_offset;
189 /* DDR memory controllers per socket */
191 /* DDR channels per DDR memory controller */
193 /* DDR DIMMs per DDR memory channel */
195 /* Per DDR channel memory-mapped I/O size */
196 int ddr_chan_mmio_sz;
197 /* HBM memory controllers per socket */
199 /* HBM channels per HBM memory controller */
201 /* HBM DIMMs per HBM memory channel */
203 /* Per HBM channel memory-mapped I/O size */
204 int hbm_chan_mmio_sz;
207 struct pci_bdf sad_all_bdf;
209 struct pci_bdf pcu_cr3_bdf;
210 /* UTIL device BDF */
211 struct pci_bdf util_all_bdf;
212 /* URACU device BDF */
213 struct pci_bdf uracu_bdf;
214 /* DDR mdev device BDF */
215 struct pci_bdf ddr_mdev_bdf;
216 /* HBM mdev device BDF */
217 struct pci_bdf hbm_mdev_bdf;
219 /* Offsets of retry_rd_err_log registers */
221 u32 *offsets_scrub_hbm0;
222 u32 *offsets_scrub_hbm1;
224 u32 *offsets_demand2;
225 u32 *offsets_demand_hbm0;
226 u32 *offsets_demand_hbm1;
/*
 * DIMM-configuration callback type; skx_register_mci() takes one of these.
 * Receives the memory controller <mci> and the resource configuration <cfg>.
 */
typedef int (*get_dimm_config_f)(struct mem_ctl_info *mci,
				 struct res_config *cfg);

/* Address-decode callback type; installed with skx_set_decode(). */
typedef bool (*skx_decode_f)(struct decoded_addr *res);

/*
 * Retry-log callback type; installed with skx_set_decode().
 * <msg>/<len> look like an output buffer and its size — TODO confirm
 * against the implementations.
 */
typedef void (*skx_show_retry_log_f)(struct decoded_addr *res, char *msg,
				     int len, bool scrub_err);
234 int __init skx_adxl_get(void);
235 void __exit skx_adxl_put(void);
236 void skx_set_decode(skx_decode_f decode, skx_show_retry_log_f show_retry_log);
237 void skx_set_mem_cfg(bool mem_cfg_2lm);
239 int skx_get_src_id(struct skx_dev *d, int off, u8 *id);
240 int skx_get_node_id(struct skx_dev *d, u8 *id);
242 int skx_get_all_bus_mappings(struct res_config *cfg, struct list_head **list);
244 int skx_get_hi_lo(unsigned int did, int off[], u64 *tolm, u64 *tohm);
246 int skx_get_dimm_info(u32 mtr, u32 mcmtr, u32 amap, struct dimm_info *dimm,
247 struct skx_imc *imc, int chan, int dimmno,
248 struct res_config *cfg);
/*
 * NVDIMM counterpart of skx_get_dimm_info(): fill in <dimm> for DIMM
 * <dimmno> on channel <chan> of controller <imc>. <mod_str> is a
 * caller-supplied string (presumably the module name — confirm).
 */
int skx_get_nvdimm_info(struct dimm_info *dimm, struct skx_imc *imc,
			int chan, int dimmno, const char *mod_str);
253 int skx_register_mci(struct skx_imc *imc, struct pci_dev *pdev,
254 const char *ctl_name, const char *mod_str,
255 get_dimm_config_f get_dimm_config,
256 struct res_config *cfg);
258 int skx_mce_check_error(struct notifier_block *nb, unsigned long val,
/* Teardown entry point of the common code; takes no arguments and returns nothing. */
void skx_remove(void);
263 #endif /* _SKX_COMM_EDAC_H */