xref: /openbmc/linux/drivers/edac/pnd2_edac.c (revision 6614a3c3164a5df2b54abb0b3559f51041cf705b)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Driver for Pondicherry2 memory controller.
4  *
5  * Copyright (c) 2016, Intel Corporation.
6  *
7  * [Derived from sb_edac.c]
8  *
9  * Translation of system physical addresses to DIMM addresses
10  * is a two stage process:
11  *
12  * First the Pondicherry 2 memory controller handles slice and channel interleaving
13  * in "sys2pmi()". This is (almost) completley common between platforms.
14  *
15  * Then a platform specific dunit (DIMM unit) completes the process to provide DIMM,
16  * rank, bank, row and column using the appropriate "dunit_ops" functions/parameters.
17  */
18 
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/pci.h>
22 #include <linux/pci_ids.h>
23 #include <linux/slab.h>
24 #include <linux/delay.h>
25 #include <linux/edac.h>
26 #include <linux/mmzone.h>
27 #include <linux/smp.h>
28 #include <linux/bitmap.h>
29 #include <linux/math64.h>
30 #include <linux/mod_devicetable.h>
31 #include <linux/platform_data/x86/p2sb.h>
32 
33 #include <asm/cpu_device_id.h>
34 #include <asm/intel-family.h>
35 #include <asm/processor.h>
36 #include <asm/mce.h>
37 
38 #include "edac_mc.h"
39 #include "edac_module.h"
40 #include "pnd2_edac.h"
41 
42 #define EDAC_MOD_STR		"pnd2_edac"
43 
44 #define APL_NUM_CHANNELS	4
45 #define DNV_NUM_CHANNELS	2
46 #define DNV_MAX_DIMMS		2 /* Max DIMMs per channel */
47 
48 enum type {
49 	APL,
50 	DNV, /* All requests go to PMI CH0 on each slice (CH1 disabled) */
51 };
52 
53 struct dram_addr {
54 	int chan;
55 	int dimm;
56 	int rank;
57 	int bank;
58 	int row;
59 	int col;
60 };
61 
62 struct pnd2_pvt {
63 	int dimm_geom[APL_NUM_CHANNELS];
64 	u64 tolm, tohm;
65 };
66 
67 /*
68  * System address space is divided into multiple regions with
69  * different interleave rules in each. The as0/as1 regions
70  * have no interleaving at all. The as2 region is interleaved
71  * between two channels. The mot region is magic and may overlap
72  * other regions, with its interleave rules taking precedence.
73  * Addresses not in any of these regions are interleaved across
74  * all four channels.
75  */
76 static struct region {
77 	u64	base;
78 	u64	limit;
79 	u8	enabled;
80 } mot, as0, as1, as2;
81 
82 static struct dunit_ops {
83 	char *name;
84 	enum type type;
85 	int pmiaddr_shift;
86 	int pmiidx_shift;
87 	int channels;
88 	int dimms_per_channel;
89 	int (*rd_reg)(int port, int off, int op, void *data, size_t sz, char *name);
90 	int (*get_registers)(void);
91 	int (*check_ecc)(void);
92 	void (*mk_region)(char *name, struct region *rp, void *asym);
93 	void (*get_dimm_config)(struct mem_ctl_info *mci);
94 	int (*pmi2mem)(struct mem_ctl_info *mci, u64 pmiaddr, u32 pmiidx,
95 				   struct dram_addr *daddr, char *msg);
96 } *ops;
97 
98 static struct mem_ctl_info *pnd2_mci;
99 
100 #define PND2_MSG_SIZE	256
101 
102 /* Debug macros */
103 #define pnd2_printk(level, fmt, arg...)			\
104 	edac_printk(level, "pnd2", fmt, ##arg)
105 
106 #define pnd2_mc_printk(mci, level, fmt, arg...)	\
107 	edac_mc_chipset_printk(mci, level, "pnd2", fmt, ##arg)
108 
109 #define MOT_CHAN_INTLV_BIT_1SLC_2CH 12
110 #define MOT_CHAN_INTLV_BIT_2SLC_2CH 13
111 #define SELECTOR_DISABLED (-1)
112 #define _4GB (1ul << 32)
113 
114 #define PMI_ADDRESS_WIDTH	31
115 #define PND_MAX_PHYS_BIT	39
116 
117 #define APL_ASYMSHIFT		28
118 #define DNV_ASYMSHIFT		31
119 #define CH_HASH_MASK_LSB	6
120 #define SLICE_HASH_MASK_LSB	6
121 #define MOT_SLC_INTLV_BIT	12
122 #define LOG2_PMI_ADDR_GRANULARITY	5
123 #define MOT_SHIFT	24
124 
125 #define GET_BITFIELD(v, lo, hi)	(((v) & GENMASK_ULL(hi, lo)) >> (lo))
126 #define U64_LSHIFT(val, s)	((u64)(val) << (s))
127 
128 /*
129  * On Apollo Lake we access memory controller registers via a
130  * side-band mailbox style interface in a hidden PCI device
131  * configuration space.
132  */
133 static struct pci_bus	*p2sb_bus;
134 #define P2SB_DEVFN	PCI_DEVFN(0xd, 0)
135 #define P2SB_ADDR_OFF	0xd0
136 #define P2SB_DATA_OFF	0xd4
137 #define P2SB_STAT_OFF	0xd8
138 #define P2SB_ROUT_OFF	0xda
139 #define P2SB_EADD_OFF	0xdc
140 #define P2SB_HIDE_OFF	0xe1
141 
142 #define P2SB_BUSY	1
143 
144 #define P2SB_READ(size, off, ptr) \
145 	pci_bus_read_config_##size(p2sb_bus, P2SB_DEVFN, off, ptr)
146 #define P2SB_WRITE(size, off, val) \
147 	pci_bus_write_config_##size(p2sb_bus, P2SB_DEVFN, off, val)
148 
149 static bool p2sb_is_busy(u16 *status)
150 {
151 	P2SB_READ(word, P2SB_STAT_OFF, status);
152 
153 	return !!(*status & P2SB_BUSY);
154 }
155 
156 static int _apl_rd_reg(int port, int off, int op, u32 *data)
157 {
158 	int retries = 0xff, ret;
159 	u16 status;
160 	u8 hidden;
161 
162 	/* Unhide the P2SB device, if it's hidden */
163 	P2SB_READ(byte, P2SB_HIDE_OFF, &hidden);
164 	if (hidden)
165 		P2SB_WRITE(byte, P2SB_HIDE_OFF, 0);
166 
167 	if (p2sb_is_busy(&status)) {
168 		ret = -EAGAIN;
169 		goto out;
170 	}
171 
172 	P2SB_WRITE(dword, P2SB_ADDR_OFF, (port << 24) | off);
173 	P2SB_WRITE(dword, P2SB_DATA_OFF, 0);
174 	P2SB_WRITE(dword, P2SB_EADD_OFF, 0);
175 	P2SB_WRITE(word, P2SB_ROUT_OFF, 0);
176 	P2SB_WRITE(word, P2SB_STAT_OFF, (op << 8) | P2SB_BUSY);
177 
178 	while (p2sb_is_busy(&status)) {
179 		if (retries-- == 0) {
180 			ret = -EBUSY;
181 			goto out;
182 		}
183 	}
184 
185 	P2SB_READ(dword, P2SB_DATA_OFF, data);
186 	ret = (status >> 1) & 0x3;
187 out:
188 	/* Hide the P2SB device, if it was hidden before */
189 	if (hidden)
190 		P2SB_WRITE(byte, P2SB_HIDE_OFF, hidden);
191 
192 	return ret;
193 }
194 
195 static int apl_rd_reg(int port, int off, int op, void *data, size_t sz, char *name)
196 {
197 	int ret = 0;
198 
199 	edac_dbg(2, "Read %s port=%x off=%x op=%x\n", name, port, off, op);
200 	switch (sz) {
201 	case 8:
202 		ret = _apl_rd_reg(port, off + 4, op, (u32 *)(data + 4));
203 		fallthrough;
204 	case 4:
205 		ret |= _apl_rd_reg(port, off, op, (u32 *)data);
206 		pnd2_printk(KERN_DEBUG, "%s=%x%08x ret=%d\n", name,
207 					sz == 8 ? *((u32 *)(data + 4)) : 0, *((u32 *)data), ret);
208 		break;
209 	}
210 
211 	return ret;
212 }
213 
214 static u64 get_mem_ctrl_hub_base_addr(void)
215 {
216 	struct b_cr_mchbar_lo_pci lo;
217 	struct b_cr_mchbar_hi_pci hi;
218 	struct pci_dev *pdev;
219 
220 	pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x1980, NULL);
221 	if (pdev) {
222 		pci_read_config_dword(pdev, 0x48, (u32 *)&lo);
223 		pci_read_config_dword(pdev, 0x4c, (u32 *)&hi);
224 		pci_dev_put(pdev);
225 	} else {
226 		return 0;
227 	}
228 
229 	if (!lo.enable) {
230 		edac_dbg(2, "MMIO via memory controller hub base address is disabled!\n");
231 		return 0;
232 	}
233 
234 	return U64_LSHIFT(hi.base, 32) | U64_LSHIFT(lo.base, 15);
235 }
236 
237 #define DNV_MCHBAR_SIZE  0x8000
238 #define DNV_SB_PORT_SIZE 0x10000
239 static int dnv_rd_reg(int port, int off, int op, void *data, size_t sz, char *name)
240 {
241 	struct pci_dev *pdev;
242 	void __iomem *base;
243 	struct resource r;
244 	int ret;
245 
246 	if (op == 4) {
247 		pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x1980, NULL);
248 		if (!pdev)
249 			return -ENODEV;
250 
251 		pci_read_config_dword(pdev, off, data);
252 		pci_dev_put(pdev);
253 	} else {
254 		/* MMIO via memory controller hub base address */
255 		if (op == 0 && port == 0x4c) {
256 			memset(&r, 0, sizeof(r));
257 
258 			r.start = get_mem_ctrl_hub_base_addr();
259 			if (!r.start)
260 				return -ENODEV;
261 			r.end = r.start + DNV_MCHBAR_SIZE - 1;
262 		} else {
263 			/* MMIO via sideband register base address */
264 			ret = p2sb_bar(NULL, 0, &r);
265 			if (ret)
266 				return ret;
267 
268 			r.start += (port << 16);
269 			r.end = r.start + DNV_SB_PORT_SIZE - 1;
270 		}
271 
272 		base = ioremap(r.start, resource_size(&r));
273 		if (!base)
274 			return -ENODEV;
275 
276 		if (sz == 8)
277 			*(u64 *)data = readq(base + off);
278 		else
279 			*(u32 *)data = readl(base + off);
280 
281 		iounmap(base);
282 	}
283 
284 	edac_dbg(2, "Read %s=%.8x_%.8x\n", name,
285 			(sz == 8) ? *(u32 *)(data + 4) : 0, *(u32 *)data);
286 
287 	return 0;
288 }
289 
290 #define RD_REGP(regp, regname, port)	\
291 	ops->rd_reg(port,					\
292 		regname##_offset,				\
293 		regname##_r_opcode,				\
294 		regp, sizeof(struct regname),	\
295 		#regname)
296 
297 #define RD_REG(regp, regname)			\
298 	ops->rd_reg(regname ## _port,		\
299 		regname##_offset,				\
300 		regname##_r_opcode,				\
301 		regp, sizeof(struct regname),	\
302 		#regname)
303 
304 static u64 top_lm, top_hm;
305 static bool two_slices;
306 static bool two_channels; /* Both PMI channels in one slice enabled */
307 
308 static u8 sym_chan_mask;
309 static u8 asym_chan_mask;
310 static u8 chan_mask;
311 
312 static int slice_selector = -1;
313 static int chan_selector = -1;
314 static u64 slice_hash_mask;
315 static u64 chan_hash_mask;
316 
317 static void mk_region(char *name, struct region *rp, u64 base, u64 limit)
318 {
319 	rp->enabled = 1;
320 	rp->base = base;
321 	rp->limit = limit;
322 	edac_dbg(2, "Region:%s [%llx, %llx]\n", name, base, limit);
323 }
324 
325 static void mk_region_mask(char *name, struct region *rp, u64 base, u64 mask)
326 {
327 	if (mask == 0) {
328 		pr_info(FW_BUG "MOT mask cannot be zero\n");
329 		return;
330 	}
331 	if (mask != GENMASK_ULL(PND_MAX_PHYS_BIT, __ffs(mask))) {
332 		pr_info(FW_BUG "MOT mask not power of two\n");
333 		return;
334 	}
335 	if (base & ~mask) {
336 		pr_info(FW_BUG "MOT region base/mask alignment error\n");
337 		return;
338 	}
339 	rp->base = base;
340 	rp->limit = (base | ~mask) & GENMASK_ULL(PND_MAX_PHYS_BIT, 0);
341 	rp->enabled = 1;
342 	edac_dbg(2, "Region:%s [%llx, %llx]\n", name, base, rp->limit);
343 }
344 
345 static bool in_region(struct region *rp, u64 addr)
346 {
347 	if (!rp->enabled)
348 		return false;
349 
350 	return rp->base <= addr && addr <= rp->limit;
351 }
352 
353 static int gen_sym_mask(struct b_cr_slice_channel_hash *p)
354 {
355 	int mask = 0;
356 
357 	if (!p->slice_0_mem_disabled)
358 		mask |= p->sym_slice0_channel_enabled;
359 
360 	if (!p->slice_1_disabled)
361 		mask |= p->sym_slice1_channel_enabled << 2;
362 
363 	if (p->ch_1_disabled || p->enable_pmi_dual_data_mode)
364 		mask &= 0x5;
365 
366 	return mask;
367 }
368 
369 static int gen_asym_mask(struct b_cr_slice_channel_hash *p,
370 			 struct b_cr_asym_mem_region0_mchbar *as0,
371 			 struct b_cr_asym_mem_region1_mchbar *as1,
372 			 struct b_cr_asym_2way_mem_region_mchbar *as2way)
373 {
374 	const int intlv[] = { 0x5, 0xA, 0x3, 0xC };
375 	int mask = 0;
376 
377 	if (as2way->asym_2way_interleave_enable)
378 		mask = intlv[as2way->asym_2way_intlv_mode];
379 	if (as0->slice0_asym_enable)
380 		mask |= (1 << as0->slice0_asym_channel_select);
381 	if (as1->slice1_asym_enable)
382 		mask |= (4 << as1->slice1_asym_channel_select);
383 	if (p->slice_0_mem_disabled)
384 		mask &= 0xc;
385 	if (p->slice_1_disabled)
386 		mask &= 0x3;
387 	if (p->ch_1_disabled || p->enable_pmi_dual_data_mode)
388 		mask &= 0x5;
389 
390 	return mask;
391 }
392 
393 static struct b_cr_tolud_pci tolud;
394 static struct b_cr_touud_lo_pci touud_lo;
395 static struct b_cr_touud_hi_pci touud_hi;
396 static struct b_cr_asym_mem_region0_mchbar asym0;
397 static struct b_cr_asym_mem_region1_mchbar asym1;
398 static struct b_cr_asym_2way_mem_region_mchbar asym_2way;
399 static struct b_cr_mot_out_base_mchbar mot_base;
400 static struct b_cr_mot_out_mask_mchbar mot_mask;
401 static struct b_cr_slice_channel_hash chash;
402 
403 /* Apollo Lake dunit */
404 /*
405  * Validated on board with just two DIMMs in the [0] and [2] positions
406  * in this array. Other port number matches documentation, but caution
407  * advised.
408  */
409 static const int apl_dports[APL_NUM_CHANNELS] = { 0x18, 0x10, 0x11, 0x19 };
410 static struct d_cr_drp0 drp0[APL_NUM_CHANNELS];
411 
412 /* Denverton dunit */
413 static const int dnv_dports[DNV_NUM_CHANNELS] = { 0x10, 0x12 };
414 static struct d_cr_dsch dsch;
415 static struct d_cr_ecc_ctrl ecc_ctrl[DNV_NUM_CHANNELS];
416 static struct d_cr_drp drp[DNV_NUM_CHANNELS];
417 static struct d_cr_dmap dmap[DNV_NUM_CHANNELS];
418 static struct d_cr_dmap1 dmap1[DNV_NUM_CHANNELS];
419 static struct d_cr_dmap2 dmap2[DNV_NUM_CHANNELS];
420 static struct d_cr_dmap3 dmap3[DNV_NUM_CHANNELS];
421 static struct d_cr_dmap4 dmap4[DNV_NUM_CHANNELS];
422 static struct d_cr_dmap5 dmap5[DNV_NUM_CHANNELS];
423 
424 static void apl_mk_region(char *name, struct region *rp, void *asym)
425 {
426 	struct b_cr_asym_mem_region0_mchbar *a = asym;
427 
428 	mk_region(name, rp,
429 			  U64_LSHIFT(a->slice0_asym_base, APL_ASYMSHIFT),
430 			  U64_LSHIFT(a->slice0_asym_limit, APL_ASYMSHIFT) +
431 			  GENMASK_ULL(APL_ASYMSHIFT - 1, 0));
432 }
433 
434 static void dnv_mk_region(char *name, struct region *rp, void *asym)
435 {
436 	struct b_cr_asym_mem_region_denverton *a = asym;
437 
438 	mk_region(name, rp,
439 			  U64_LSHIFT(a->slice_asym_base, DNV_ASYMSHIFT),
440 			  U64_LSHIFT(a->slice_asym_limit, DNV_ASYMSHIFT) +
441 			  GENMASK_ULL(DNV_ASYMSHIFT - 1, 0));
442 }
443 
444 static int apl_get_registers(void)
445 {
446 	int ret = -ENODEV;
447 	int i;
448 
449 	if (RD_REG(&asym_2way, b_cr_asym_2way_mem_region_mchbar))
450 		return -ENODEV;
451 
452 	/*
453 	 * RD_REGP() will fail for unpopulated or non-existent
454 	 * DIMM slots. Return success if we find at least one DIMM.
455 	 */
456 	for (i = 0; i < APL_NUM_CHANNELS; i++)
457 		if (!RD_REGP(&drp0[i], d_cr_drp0, apl_dports[i]))
458 			ret = 0;
459 
460 	return ret;
461 }
462 
463 static int dnv_get_registers(void)
464 {
465 	int i;
466 
467 	if (RD_REG(&dsch, d_cr_dsch))
468 		return -ENODEV;
469 
470 	for (i = 0; i < DNV_NUM_CHANNELS; i++)
471 		if (RD_REGP(&ecc_ctrl[i], d_cr_ecc_ctrl, dnv_dports[i]) ||
472 			RD_REGP(&drp[i], d_cr_drp, dnv_dports[i]) ||
473 			RD_REGP(&dmap[i], d_cr_dmap, dnv_dports[i]) ||
474 			RD_REGP(&dmap1[i], d_cr_dmap1, dnv_dports[i]) ||
475 			RD_REGP(&dmap2[i], d_cr_dmap2, dnv_dports[i]) ||
476 			RD_REGP(&dmap3[i], d_cr_dmap3, dnv_dports[i]) ||
477 			RD_REGP(&dmap4[i], d_cr_dmap4, dnv_dports[i]) ||
478 			RD_REGP(&dmap5[i], d_cr_dmap5, dnv_dports[i]))
479 			return -ENODEV;
480 
481 	return 0;
482 }
483 
484 /*
485  * Read all the h/w config registers once here (they don't
486  * change at run time. Figure out which address ranges have
487  * which interleave characteristics.
488  */
489 static int get_registers(void)
490 {
491 	const int intlv[] = { 10, 11, 12, 12 };
492 
493 	if (RD_REG(&tolud, b_cr_tolud_pci) ||
494 		RD_REG(&touud_lo, b_cr_touud_lo_pci) ||
495 		RD_REG(&touud_hi, b_cr_touud_hi_pci) ||
496 		RD_REG(&asym0, b_cr_asym_mem_region0_mchbar) ||
497 		RD_REG(&asym1, b_cr_asym_mem_region1_mchbar) ||
498 		RD_REG(&mot_base, b_cr_mot_out_base_mchbar) ||
499 		RD_REG(&mot_mask, b_cr_mot_out_mask_mchbar) ||
500 		RD_REG(&chash, b_cr_slice_channel_hash))
501 		return -ENODEV;
502 
503 	if (ops->get_registers())
504 		return -ENODEV;
505 
506 	if (ops->type == DNV) {
507 		/* PMI channel idx (always 0) for asymmetric region */
508 		asym0.slice0_asym_channel_select = 0;
509 		asym1.slice1_asym_channel_select = 0;
510 		/* PMI channel bitmap (always 1) for symmetric region */
511 		chash.sym_slice0_channel_enabled = 0x1;
512 		chash.sym_slice1_channel_enabled = 0x1;
513 	}
514 
515 	if (asym0.slice0_asym_enable)
516 		ops->mk_region("as0", &as0, &asym0);
517 
518 	if (asym1.slice1_asym_enable)
519 		ops->mk_region("as1", &as1, &asym1);
520 
521 	if (asym_2way.asym_2way_interleave_enable) {
522 		mk_region("as2way", &as2,
523 				  U64_LSHIFT(asym_2way.asym_2way_base, APL_ASYMSHIFT),
524 				  U64_LSHIFT(asym_2way.asym_2way_limit, APL_ASYMSHIFT) +
525 				  GENMASK_ULL(APL_ASYMSHIFT - 1, 0));
526 	}
527 
528 	if (mot_base.imr_en) {
529 		mk_region_mask("mot", &mot,
530 					   U64_LSHIFT(mot_base.mot_out_base, MOT_SHIFT),
531 					   U64_LSHIFT(mot_mask.mot_out_mask, MOT_SHIFT));
532 	}
533 
534 	top_lm = U64_LSHIFT(tolud.tolud, 20);
535 	top_hm = U64_LSHIFT(touud_hi.touud, 32) | U64_LSHIFT(touud_lo.touud, 20);
536 
537 	two_slices = !chash.slice_1_disabled &&
538 				 !chash.slice_0_mem_disabled &&
539 				 (chash.sym_slice0_channel_enabled != 0) &&
540 				 (chash.sym_slice1_channel_enabled != 0);
541 	two_channels = !chash.ch_1_disabled &&
542 				 !chash.enable_pmi_dual_data_mode &&
543 				 ((chash.sym_slice0_channel_enabled == 3) ||
544 				 (chash.sym_slice1_channel_enabled == 3));
545 
546 	sym_chan_mask = gen_sym_mask(&chash);
547 	asym_chan_mask = gen_asym_mask(&chash, &asym0, &asym1, &asym_2way);
548 	chan_mask = sym_chan_mask | asym_chan_mask;
549 
550 	if (two_slices && !two_channels) {
551 		if (chash.hvm_mode)
552 			slice_selector = 29;
553 		else
554 			slice_selector = intlv[chash.interleave_mode];
555 	} else if (!two_slices && two_channels) {
556 		if (chash.hvm_mode)
557 			chan_selector = 29;
558 		else
559 			chan_selector = intlv[chash.interleave_mode];
560 	} else if (two_slices && two_channels) {
561 		if (chash.hvm_mode) {
562 			slice_selector = 29;
563 			chan_selector = 30;
564 		} else {
565 			slice_selector = intlv[chash.interleave_mode];
566 			chan_selector = intlv[chash.interleave_mode] + 1;
567 		}
568 	}
569 
570 	if (two_slices) {
571 		if (!chash.hvm_mode)
572 			slice_hash_mask = chash.slice_hash_mask << SLICE_HASH_MASK_LSB;
573 		if (!two_channels)
574 			slice_hash_mask |= BIT_ULL(slice_selector);
575 	}
576 
577 	if (two_channels) {
578 		if (!chash.hvm_mode)
579 			chan_hash_mask = chash.ch_hash_mask << CH_HASH_MASK_LSB;
580 		if (!two_slices)
581 			chan_hash_mask |= BIT_ULL(chan_selector);
582 	}
583 
584 	return 0;
585 }
586 
587 /* Get a contiguous memory address (remove the MMIO gap) */
588 static u64 remove_mmio_gap(u64 sys)
589 {
590 	return (sys < _4GB) ? sys : sys - (_4GB - top_lm);
591 }
592 
593 /* Squeeze out one address bit, shift upper part down to fill gap */
594 static void remove_addr_bit(u64 *addr, int bitidx)
595 {
596 	u64	mask;
597 
598 	if (bitidx == -1)
599 		return;
600 
601 	mask = (1ull << bitidx) - 1;
602 	*addr = ((*addr >> 1) & ~mask) | (*addr & mask);
603 }
604 
605 /* XOR all the bits from addr specified in mask */
606 static int hash_by_mask(u64 addr, u64 mask)
607 {
608 	u64 result = addr & mask;
609 
610 	result = (result >> 32) ^ result;
611 	result = (result >> 16) ^ result;
612 	result = (result >> 8) ^ result;
613 	result = (result >> 4) ^ result;
614 	result = (result >> 2) ^ result;
615 	result = (result >> 1) ^ result;
616 
617 	return (int)result & 1;
618 }
619 
620 /*
621  * First stage decode. Take the system address and figure out which
622  * second stage will deal with it based on interleave modes.
623  */
624 static int sys2pmi(const u64 addr, u32 *pmiidx, u64 *pmiaddr, char *msg)
625 {
626 	u64 contig_addr, contig_base, contig_offset, contig_base_adj;
627 	int mot_intlv_bit = two_slices ? MOT_CHAN_INTLV_BIT_2SLC_2CH :
628 						MOT_CHAN_INTLV_BIT_1SLC_2CH;
629 	int slice_intlv_bit_rm = SELECTOR_DISABLED;
630 	int chan_intlv_bit_rm = SELECTOR_DISABLED;
631 	/* Determine if address is in the MOT region. */
632 	bool mot_hit = in_region(&mot, addr);
633 	/* Calculate the number of symmetric regions enabled. */
634 	int sym_channels = hweight8(sym_chan_mask);
635 
636 	/*
637 	 * The amount we need to shift the asym base can be determined by the
638 	 * number of enabled symmetric channels.
639 	 * NOTE: This can only work because symmetric memory is not supposed
640 	 * to do a 3-way interleave.
641 	 */
642 	int sym_chan_shift = sym_channels >> 1;
643 
644 	/* Give up if address is out of range, or in MMIO gap */
645 	if (addr >= (1ul << PND_MAX_PHYS_BIT) ||
646 	   (addr >= top_lm && addr < _4GB) || addr >= top_hm) {
647 		snprintf(msg, PND2_MSG_SIZE, "Error address 0x%llx is not DRAM", addr);
648 		return -EINVAL;
649 	}
650 
651 	/* Get a contiguous memory address (remove the MMIO gap) */
652 	contig_addr = remove_mmio_gap(addr);
653 
654 	if (in_region(&as0, addr)) {
655 		*pmiidx = asym0.slice0_asym_channel_select;
656 
657 		contig_base = remove_mmio_gap(as0.base);
658 		contig_offset = contig_addr - contig_base;
659 		contig_base_adj = (contig_base >> sym_chan_shift) *
660 						  ((chash.sym_slice0_channel_enabled >> (*pmiidx & 1)) & 1);
661 		contig_addr = contig_offset + ((sym_channels > 0) ? contig_base_adj : 0ull);
662 	} else if (in_region(&as1, addr)) {
663 		*pmiidx = 2u + asym1.slice1_asym_channel_select;
664 
665 		contig_base = remove_mmio_gap(as1.base);
666 		contig_offset = contig_addr - contig_base;
667 		contig_base_adj = (contig_base >> sym_chan_shift) *
668 						  ((chash.sym_slice1_channel_enabled >> (*pmiidx & 1)) & 1);
669 		contig_addr = contig_offset + ((sym_channels > 0) ? contig_base_adj : 0ull);
670 	} else if (in_region(&as2, addr) && (asym_2way.asym_2way_intlv_mode == 0x3ul)) {
671 		bool channel1;
672 
673 		mot_intlv_bit = MOT_CHAN_INTLV_BIT_1SLC_2CH;
674 		*pmiidx = (asym_2way.asym_2way_intlv_mode & 1) << 1;
675 		channel1 = mot_hit ? ((bool)((addr >> mot_intlv_bit) & 1)) :
676 			hash_by_mask(contig_addr, chan_hash_mask);
677 		*pmiidx |= (u32)channel1;
678 
679 		contig_base = remove_mmio_gap(as2.base);
680 		chan_intlv_bit_rm = mot_hit ? mot_intlv_bit : chan_selector;
681 		contig_offset = contig_addr - contig_base;
682 		remove_addr_bit(&contig_offset, chan_intlv_bit_rm);
683 		contig_addr = (contig_base >> sym_chan_shift) + contig_offset;
684 	} else {
685 		/* Otherwise we're in normal, boring symmetric mode. */
686 		*pmiidx = 0u;
687 
688 		if (two_slices) {
689 			bool slice1;
690 
691 			if (mot_hit) {
692 				slice_intlv_bit_rm = MOT_SLC_INTLV_BIT;
693 				slice1 = (addr >> MOT_SLC_INTLV_BIT) & 1;
694 			} else {
695 				slice_intlv_bit_rm = slice_selector;
696 				slice1 = hash_by_mask(addr, slice_hash_mask);
697 			}
698 
699 			*pmiidx = (u32)slice1 << 1;
700 		}
701 
702 		if (two_channels) {
703 			bool channel1;
704 
705 			mot_intlv_bit = two_slices ? MOT_CHAN_INTLV_BIT_2SLC_2CH :
706 							MOT_CHAN_INTLV_BIT_1SLC_2CH;
707 
708 			if (mot_hit) {
709 				chan_intlv_bit_rm = mot_intlv_bit;
710 				channel1 = (addr >> mot_intlv_bit) & 1;
711 			} else {
712 				chan_intlv_bit_rm = chan_selector;
713 				channel1 = hash_by_mask(contig_addr, chan_hash_mask);
714 			}
715 
716 			*pmiidx |= (u32)channel1;
717 		}
718 	}
719 
720 	/* Remove the chan_selector bit first */
721 	remove_addr_bit(&contig_addr, chan_intlv_bit_rm);
722 	/* Remove the slice bit (we remove it second because it must be lower */
723 	remove_addr_bit(&contig_addr, slice_intlv_bit_rm);
724 	*pmiaddr = contig_addr;
725 
726 	return 0;
727 }
728 
729 /* Translate PMI address to memory (rank, row, bank, column) */
730 #define C(n) (0x10 | (n))	/* column */
731 #define B(n) (0x20 | (n))	/* bank */
732 #define R(n) (0x40 | (n))	/* row */
733 #define RS   (0x80)			/* rank */
734 
735 /* addrdec values */
736 #define AMAP_1KB	0
737 #define AMAP_2KB	1
738 #define AMAP_4KB	2
739 #define AMAP_RSVD	3
740 
741 /* dden values */
742 #define DEN_4Gb		0
743 #define DEN_8Gb		2
744 
745 /* dwid values */
746 #define X8		0
747 #define X16		1
748 
749 static struct dimm_geometry {
750 	u8	addrdec;
751 	u8	dden;
752 	u8	dwid;
753 	u8	rowbits, colbits;
754 	u16	bits[PMI_ADDRESS_WIDTH];
755 } dimms[] = {
756 	{
757 		.addrdec = AMAP_1KB, .dden = DEN_4Gb, .dwid = X16,
758 		.rowbits = 15, .colbits = 10,
759 		.bits = {
760 			C(2),  C(3),  C(4),  C(5),  C(6),  B(0),  B(1),  B(2),  R(0),
761 			R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),  R(9),
762 			R(10), C(7),  C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
763 			0,     0,     0,     0
764 		}
765 	},
766 	{
767 		.addrdec = AMAP_1KB, .dden = DEN_4Gb, .dwid = X8,
768 		.rowbits = 16, .colbits = 10,
769 		.bits = {
770 			C(2),  C(3),  C(4),  C(5),  C(6),  B(0),  B(1),  B(2),  R(0),
771 			R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),  R(9),
772 			R(10), C(7),  C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
773 			R(15), 0,     0,     0
774 		}
775 	},
776 	{
777 		.addrdec = AMAP_1KB, .dden = DEN_8Gb, .dwid = X16,
778 		.rowbits = 16, .colbits = 10,
779 		.bits = {
780 			C(2),  C(3),  C(4),  C(5),  C(6),  B(0),  B(1),  B(2),  R(0),
781 			R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),  R(9),
782 			R(10), C(7),  C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
783 			R(15), 0,     0,     0
784 		}
785 	},
786 	{
787 		.addrdec = AMAP_1KB, .dden = DEN_8Gb, .dwid = X8,
788 		.rowbits = 16, .colbits = 11,
789 		.bits = {
790 			C(2),  C(3),  C(4),  C(5),  C(6),  B(0),  B(1),  B(2),  R(0),
791 			R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),  R(9),
792 			R(10), C(7),  C(8),  C(9),  R(11), RS,    C(11), R(12), R(13),
793 			R(14), R(15), 0,     0
794 		}
795 	},
796 	{
797 		.addrdec = AMAP_2KB, .dden = DEN_4Gb, .dwid = X16,
798 		.rowbits = 15, .colbits = 10,
799 		.bits = {
800 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  B(0),  B(1),  B(2),
801 			R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),
802 			R(9),  R(10), C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
803 			0,     0,     0,     0
804 		}
805 	},
806 	{
807 		.addrdec = AMAP_2KB, .dden = DEN_4Gb, .dwid = X8,
808 		.rowbits = 16, .colbits = 10,
809 		.bits = {
810 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  B(0),  B(1),  B(2),
811 			R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),
812 			R(9),  R(10), C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
813 			R(15), 0,     0,     0
814 		}
815 	},
816 	{
817 		.addrdec = AMAP_2KB, .dden = DEN_8Gb, .dwid = X16,
818 		.rowbits = 16, .colbits = 10,
819 		.bits = {
820 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  B(0),  B(1),  B(2),
821 			R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),
822 			R(9),  R(10), C(8),  C(9),  R(11), RS,    R(12), R(13), R(14),
823 			R(15), 0,     0,     0
824 		}
825 	},
826 	{
827 		.addrdec = AMAP_2KB, .dden = DEN_8Gb, .dwid = X8,
828 		.rowbits = 16, .colbits = 11,
829 		.bits = {
830 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  B(0),  B(1),  B(2),
831 			R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),  R(8),
832 			R(9),  R(10), C(8),  C(9),  R(11), RS,    C(11), R(12), R(13),
833 			R(14), R(15), 0,     0
834 		}
835 	},
836 	{
837 		.addrdec = AMAP_4KB, .dden = DEN_4Gb, .dwid = X16,
838 		.rowbits = 15, .colbits = 10,
839 		.bits = {
840 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  C(8),  B(0),  B(1),
841 			B(2),  R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),
842 			R(8),  R(9),  R(10), C(9),  R(11), RS,    R(12), R(13), R(14),
843 			0,     0,     0,     0
844 		}
845 	},
846 	{
847 		.addrdec = AMAP_4KB, .dden = DEN_4Gb, .dwid = X8,
848 		.rowbits = 16, .colbits = 10,
849 		.bits = {
850 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  C(8),  B(0),  B(1),
851 			B(2),  R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),
852 			R(8),  R(9),  R(10), C(9),  R(11), RS,    R(12), R(13), R(14),
853 			R(15), 0,     0,     0
854 		}
855 	},
856 	{
857 		.addrdec = AMAP_4KB, .dden = DEN_8Gb, .dwid = X16,
858 		.rowbits = 16, .colbits = 10,
859 		.bits = {
860 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  C(8),  B(0),  B(1),
861 			B(2),  R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),
862 			R(8),  R(9),  R(10), C(9),  R(11), RS,    R(12), R(13), R(14),
863 			R(15), 0,     0,     0
864 		}
865 	},
866 	{
867 		.addrdec = AMAP_4KB, .dden = DEN_8Gb, .dwid = X8,
868 		.rowbits = 16, .colbits = 11,
869 		.bits = {
870 			C(2),  C(3),  C(4),  C(5),  C(6),  C(7),  C(8),  B(0),  B(1),
871 			B(2),  R(0),  R(1),  R(2),  R(3),  R(4),  R(5),  R(6),  R(7),
872 			R(8),  R(9),  R(10), C(9),  R(11), RS,    C(11), R(12), R(13),
873 			R(14), R(15), 0,     0
874 		}
875 	}
876 };
877 
878 static int bank_hash(u64 pmiaddr, int idx, int shft)
879 {
880 	int bhash = 0;
881 
882 	switch (idx) {
883 	case 0:
884 		bhash ^= ((pmiaddr >> (12 + shft)) ^ (pmiaddr >> (9 + shft))) & 1;
885 		break;
886 	case 1:
887 		bhash ^= (((pmiaddr >> (10 + shft)) ^ (pmiaddr >> (8 + shft))) & 1) << 1;
888 		bhash ^= ((pmiaddr >> 22) & 1) << 1;
889 		break;
890 	case 2:
891 		bhash ^= (((pmiaddr >> (13 + shft)) ^ (pmiaddr >> (11 + shft))) & 1) << 2;
892 		break;
893 	}
894 
895 	return bhash;
896 }
897 
898 static int rank_hash(u64 pmiaddr)
899 {
900 	return ((pmiaddr >> 16) ^ (pmiaddr >> 10)) & 1;
901 }
902 
903 /* Second stage decode. Compute rank, bank, row & column. */
904 static int apl_pmi2mem(struct mem_ctl_info *mci, u64 pmiaddr, u32 pmiidx,
905 		       struct dram_addr *daddr, char *msg)
906 {
907 	struct d_cr_drp0 *cr_drp0 = &drp0[pmiidx];
908 	struct pnd2_pvt *pvt = mci->pvt_info;
909 	int g = pvt->dimm_geom[pmiidx];
910 	struct dimm_geometry *d = &dimms[g];
911 	int column = 0, bank = 0, row = 0, rank = 0;
912 	int i, idx, type, skiprs = 0;
913 
914 	for (i = 0; i < PMI_ADDRESS_WIDTH; i++) {
915 		int	bit = (pmiaddr >> i) & 1;
916 
917 		if (i + skiprs >= PMI_ADDRESS_WIDTH) {
918 			snprintf(msg, PND2_MSG_SIZE, "Bad dimm_geometry[] table\n");
919 			return -EINVAL;
920 		}
921 
922 		type = d->bits[i + skiprs] & ~0xf;
923 		idx = d->bits[i + skiprs] & 0xf;
924 
925 		/*
926 		 * On single rank DIMMs ignore the rank select bit
927 		 * and shift remainder of "bits[]" down one place.
928 		 */
929 		if (type == RS && (cr_drp0->rken0 + cr_drp0->rken1) == 1) {
930 			skiprs = 1;
931 			type = d->bits[i + skiprs] & ~0xf;
932 			idx = d->bits[i + skiprs] & 0xf;
933 		}
934 
935 		switch (type) {
936 		case C(0):
937 			column |= (bit << idx);
938 			break;
939 		case B(0):
940 			bank |= (bit << idx);
941 			if (cr_drp0->bahen)
942 				bank ^= bank_hash(pmiaddr, idx, d->addrdec);
943 			break;
944 		case R(0):
945 			row |= (bit << idx);
946 			break;
947 		case RS:
948 			rank = bit;
949 			if (cr_drp0->rsien)
950 				rank ^= rank_hash(pmiaddr);
951 			break;
952 		default:
953 			if (bit) {
954 				snprintf(msg, PND2_MSG_SIZE, "Bad translation\n");
955 				return -EINVAL;
956 			}
957 			goto done;
958 		}
959 	}
960 
961 done:
962 	daddr->col = column;
963 	daddr->bank = bank;
964 	daddr->row = row;
965 	daddr->rank = rank;
966 	daddr->dimm = 0;
967 
968 	return 0;
969 }
970 
971 /* Pluck bit "in" from pmiaddr and return value shifted to bit "out" */
972 #define dnv_get_bit(pmi, in, out) ((int)(((pmi) >> (in)) & 1u) << (out))
973 
974 static int dnv_pmi2mem(struct mem_ctl_info *mci, u64 pmiaddr, u32 pmiidx,
975 					   struct dram_addr *daddr, char *msg)
976 {
977 	/* Rank 0 or 1 */
978 	daddr->rank = dnv_get_bit(pmiaddr, dmap[pmiidx].rs0 + 13, 0);
979 	/* Rank 2 or 3 */
980 	daddr->rank |= dnv_get_bit(pmiaddr, dmap[pmiidx].rs1 + 13, 1);
981 
982 	/*
983 	 * Normally ranks 0,1 are DIMM0, and 2,3 are DIMM1, but we
984 	 * flip them if DIMM1 is larger than DIMM0.
985 	 */
986 	daddr->dimm = (daddr->rank >= 2) ^ drp[pmiidx].dimmflip;
987 
988 	daddr->bank = dnv_get_bit(pmiaddr, dmap[pmiidx].ba0 + 6, 0);
989 	daddr->bank |= dnv_get_bit(pmiaddr, dmap[pmiidx].ba1 + 6, 1);
990 	daddr->bank |= dnv_get_bit(pmiaddr, dmap[pmiidx].bg0 + 6, 2);
991 	if (dsch.ddr4en)
992 		daddr->bank |= dnv_get_bit(pmiaddr, dmap[pmiidx].bg1 + 6, 3);
993 	if (dmap1[pmiidx].bxor) {
994 		if (dsch.ddr4en) {
995 			daddr->bank ^= dnv_get_bit(pmiaddr, dmap3[pmiidx].row6 + 6, 0);
996 			daddr->bank ^= dnv_get_bit(pmiaddr, dmap3[pmiidx].row7 + 6, 1);
997 			if (dsch.chan_width == 0)
998 				/* 64/72 bit dram channel width */
999 				daddr->bank ^= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca3 + 6, 2);
1000 			else
1001 				/* 32/40 bit dram channel width */
1002 				daddr->bank ^= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca4 + 6, 2);
1003 			daddr->bank ^= dnv_get_bit(pmiaddr, dmap2[pmiidx].row2 + 6, 3);
1004 		} else {
1005 			daddr->bank ^= dnv_get_bit(pmiaddr, dmap2[pmiidx].row2 + 6, 0);
1006 			daddr->bank ^= dnv_get_bit(pmiaddr, dmap3[pmiidx].row6 + 6, 1);
1007 			if (dsch.chan_width == 0)
1008 				daddr->bank ^= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca3 + 6, 2);
1009 			else
1010 				daddr->bank ^= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca4 + 6, 2);
1011 		}
1012 	}
1013 
1014 	daddr->row = dnv_get_bit(pmiaddr, dmap2[pmiidx].row0 + 6, 0);
1015 	daddr->row |= dnv_get_bit(pmiaddr, dmap2[pmiidx].row1 + 6, 1);
1016 	daddr->row |= dnv_get_bit(pmiaddr, dmap2[pmiidx].row2 + 6, 2);
1017 	daddr->row |= dnv_get_bit(pmiaddr, dmap2[pmiidx].row3 + 6, 3);
1018 	daddr->row |= dnv_get_bit(pmiaddr, dmap2[pmiidx].row4 + 6, 4);
1019 	daddr->row |= dnv_get_bit(pmiaddr, dmap2[pmiidx].row5 + 6, 5);
1020 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row6 + 6, 6);
1021 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row7 + 6, 7);
1022 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row8 + 6, 8);
1023 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row9 + 6, 9);
1024 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row10 + 6, 10);
1025 	daddr->row |= dnv_get_bit(pmiaddr, dmap3[pmiidx].row11 + 6, 11);
1026 	daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row12 + 6, 12);
1027 	daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row13 + 6, 13);
1028 	if (dmap4[pmiidx].row14 != 31)
1029 		daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row14 + 6, 14);
1030 	if (dmap4[pmiidx].row15 != 31)
1031 		daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row15 + 6, 15);
1032 	if (dmap4[pmiidx].row16 != 31)
1033 		daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row16 + 6, 16);
1034 	if (dmap4[pmiidx].row17 != 31)
1035 		daddr->row |= dnv_get_bit(pmiaddr, dmap4[pmiidx].row17 + 6, 17);
1036 
1037 	daddr->col = dnv_get_bit(pmiaddr, dmap5[pmiidx].ca3 + 6, 3);
1038 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca4 + 6, 4);
1039 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca5 + 6, 5);
1040 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca6 + 6, 6);
1041 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca7 + 6, 7);
1042 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca8 + 6, 8);
1043 	daddr->col |= dnv_get_bit(pmiaddr, dmap5[pmiidx].ca9 + 6, 9);
1044 	if (!dsch.ddr4en && dmap1[pmiidx].ca11 != 0x3f)
1045 		daddr->col |= dnv_get_bit(pmiaddr, dmap1[pmiidx].ca11 + 13, 11);
1046 
1047 	return 0;
1048 }
1049 
1050 static int check_channel(int ch)
1051 {
1052 	if (drp0[ch].dramtype != 0) {
1053 		pnd2_printk(KERN_INFO, "Unsupported DIMM in channel %d\n", ch);
1054 		return 1;
1055 	} else if (drp0[ch].eccen == 0) {
1056 		pnd2_printk(KERN_INFO, "ECC disabled on channel %d\n", ch);
1057 		return 1;
1058 	}
1059 	return 0;
1060 }
1061 
1062 static int apl_check_ecc_active(void)
1063 {
1064 	int	i, ret = 0;
1065 
1066 	/* Check dramtype and ECC mode for each present DIMM */
1067 	for (i = 0; i < APL_NUM_CHANNELS; i++)
1068 		if (chan_mask & BIT(i))
1069 			ret += check_channel(i);
1070 	return ret ? -EINVAL : 0;
1071 }
1072 
1073 #define DIMMS_PRESENT(d) ((d)->rken0 + (d)->rken1 + (d)->rken2 + (d)->rken3)
1074 
1075 static int check_unit(int ch)
1076 {
1077 	struct d_cr_drp *d = &drp[ch];
1078 
1079 	if (DIMMS_PRESENT(d) && !ecc_ctrl[ch].eccen) {
1080 		pnd2_printk(KERN_INFO, "ECC disabled on channel %d\n", ch);
1081 		return 1;
1082 	}
1083 	return 0;
1084 }
1085 
1086 static int dnv_check_ecc_active(void)
1087 {
1088 	int	i, ret = 0;
1089 
1090 	for (i = 0; i < DNV_NUM_CHANNELS; i++)
1091 		ret += check_unit(i);
1092 	return ret ? -EINVAL : 0;
1093 }
1094 
1095 static int get_memory_error_data(struct mem_ctl_info *mci, u64 addr,
1096 								 struct dram_addr *daddr, char *msg)
1097 {
1098 	u64	pmiaddr;
1099 	u32	pmiidx;
1100 	int	ret;
1101 
1102 	ret = sys2pmi(addr, &pmiidx, &pmiaddr, msg);
1103 	if (ret)
1104 		return ret;
1105 
1106 	pmiaddr >>= ops->pmiaddr_shift;
1107 	/* pmi channel idx to dimm channel idx */
1108 	pmiidx >>= ops->pmiidx_shift;
1109 	daddr->chan = pmiidx;
1110 
1111 	ret = ops->pmi2mem(mci, pmiaddr, pmiidx, daddr, msg);
1112 	if (ret)
1113 		return ret;
1114 
1115 	edac_dbg(0, "SysAddr=%llx PmiAddr=%llx Channel=%d DIMM=%d Rank=%d Bank=%d Row=%d Column=%d\n",
1116 			 addr, pmiaddr, daddr->chan, daddr->dimm, daddr->rank, daddr->bank, daddr->row, daddr->col);
1117 
1118 	return 0;
1119 }
1120 
1121 static void pnd2_mce_output_error(struct mem_ctl_info *mci, const struct mce *m,
1122 				  struct dram_addr *daddr)
1123 {
1124 	enum hw_event_mc_err_type tp_event;
1125 	char *optype, msg[PND2_MSG_SIZE];
1126 	bool ripv = m->mcgstatus & MCG_STATUS_RIPV;
1127 	bool overflow = m->status & MCI_STATUS_OVER;
1128 	bool uc_err = m->status & MCI_STATUS_UC;
1129 	bool recov = m->status & MCI_STATUS_S;
1130 	u32 core_err_cnt = GET_BITFIELD(m->status, 38, 52);
1131 	u32 mscod = GET_BITFIELD(m->status, 16, 31);
1132 	u32 errcode = GET_BITFIELD(m->status, 0, 15);
1133 	u32 optypenum = GET_BITFIELD(m->status, 4, 6);
1134 	int rc;
1135 
1136 	tp_event = uc_err ? (ripv ? HW_EVENT_ERR_UNCORRECTED : HW_EVENT_ERR_FATAL) :
1137 						 HW_EVENT_ERR_CORRECTED;
1138 
1139 	/*
1140 	 * According with Table 15-9 of the Intel Architecture spec vol 3A,
1141 	 * memory errors should fit in this mask:
1142 	 *	000f 0000 1mmm cccc (binary)
1143 	 * where:
1144 	 *	f = Correction Report Filtering Bit. If 1, subsequent errors
1145 	 *	    won't be shown
1146 	 *	mmm = error type
1147 	 *	cccc = channel
1148 	 * If the mask doesn't match, report an error to the parsing logic
1149 	 */
1150 	if (!((errcode & 0xef80) == 0x80)) {
1151 		optype = "Can't parse: it is not a mem";
1152 	} else {
1153 		switch (optypenum) {
1154 		case 0:
1155 			optype = "generic undef request error";
1156 			break;
1157 		case 1:
1158 			optype = "memory read error";
1159 			break;
1160 		case 2:
1161 			optype = "memory write error";
1162 			break;
1163 		case 3:
1164 			optype = "addr/cmd error";
1165 			break;
1166 		case 4:
1167 			optype = "memory scrubbing error";
1168 			break;
1169 		default:
1170 			optype = "reserved";
1171 			break;
1172 		}
1173 	}
1174 
1175 	/* Only decode errors with an valid address (ADDRV) */
1176 	if (!(m->status & MCI_STATUS_ADDRV))
1177 		return;
1178 
1179 	rc = get_memory_error_data(mci, m->addr, daddr, msg);
1180 	if (rc)
1181 		goto address_error;
1182 
1183 	snprintf(msg, sizeof(msg),
1184 		 "%s%s err_code:%04x:%04x channel:%d DIMM:%d rank:%d row:%d bank:%d col:%d",
1185 		 overflow ? " OVERFLOW" : "", (uc_err && recov) ? " recoverable" : "", mscod,
1186 		 errcode, daddr->chan, daddr->dimm, daddr->rank, daddr->row, daddr->bank, daddr->col);
1187 
1188 	edac_dbg(0, "%s\n", msg);
1189 
1190 	/* Call the helper to output message */
1191 	edac_mc_handle_error(tp_event, mci, core_err_cnt, m->addr >> PAGE_SHIFT,
1192 						 m->addr & ~PAGE_MASK, 0, daddr->chan, daddr->dimm, -1, optype, msg);
1193 
1194 	return;
1195 
1196 address_error:
1197 	edac_mc_handle_error(tp_event, mci, core_err_cnt, 0, 0, 0, -1, -1, -1, msg, "");
1198 }
1199 
1200 static void apl_get_dimm_config(struct mem_ctl_info *mci)
1201 {
1202 	struct pnd2_pvt	*pvt = mci->pvt_info;
1203 	struct dimm_info *dimm;
1204 	struct d_cr_drp0 *d;
1205 	u64	capacity;
1206 	int	i, g;
1207 
1208 	for (i = 0; i < APL_NUM_CHANNELS; i++) {
1209 		if (!(chan_mask & BIT(i)))
1210 			continue;
1211 
1212 		dimm = edac_get_dimm(mci, i, 0, 0);
1213 		if (!dimm) {
1214 			edac_dbg(0, "No allocated DIMM for channel %d\n", i);
1215 			continue;
1216 		}
1217 
1218 		d = &drp0[i];
1219 		for (g = 0; g < ARRAY_SIZE(dimms); g++)
1220 			if (dimms[g].addrdec == d->addrdec &&
1221 			    dimms[g].dden == d->dden &&
1222 			    dimms[g].dwid == d->dwid)
1223 				break;
1224 
1225 		if (g == ARRAY_SIZE(dimms)) {
1226 			edac_dbg(0, "Channel %d: unrecognized DIMM\n", i);
1227 			continue;
1228 		}
1229 
1230 		pvt->dimm_geom[i] = g;
1231 		capacity = (d->rken0 + d->rken1) * 8 * (1ul << dimms[g].rowbits) *
1232 				   (1ul << dimms[g].colbits);
1233 		edac_dbg(0, "Channel %d: %lld MByte DIMM\n", i, capacity >> (20 - 3));
1234 		dimm->nr_pages = MiB_TO_PAGES(capacity >> (20 - 3));
1235 		dimm->grain = 32;
1236 		dimm->dtype = (d->dwid == 0) ? DEV_X8 : DEV_X16;
1237 		dimm->mtype = MEM_DDR3;
1238 		dimm->edac_mode = EDAC_SECDED;
1239 		snprintf(dimm->label, sizeof(dimm->label), "Slice#%d_Chan#%d", i / 2, i % 2);
1240 	}
1241 }
1242 
1243 static const int dnv_dtypes[] = {
1244 	DEV_X8, DEV_X4, DEV_X16, DEV_UNKNOWN
1245 };
1246 
1247 static void dnv_get_dimm_config(struct mem_ctl_info *mci)
1248 {
1249 	int	i, j, ranks_of_dimm[DNV_MAX_DIMMS], banks, rowbits, colbits, memtype;
1250 	struct dimm_info *dimm;
1251 	struct d_cr_drp *d;
1252 	u64	capacity;
1253 
1254 	if (dsch.ddr4en) {
1255 		memtype = MEM_DDR4;
1256 		banks = 16;
1257 		colbits = 10;
1258 	} else {
1259 		memtype = MEM_DDR3;
1260 		banks = 8;
1261 	}
1262 
1263 	for (i = 0; i < DNV_NUM_CHANNELS; i++) {
1264 		if (dmap4[i].row14 == 31)
1265 			rowbits = 14;
1266 		else if (dmap4[i].row15 == 31)
1267 			rowbits = 15;
1268 		else if (dmap4[i].row16 == 31)
1269 			rowbits = 16;
1270 		else if (dmap4[i].row17 == 31)
1271 			rowbits = 17;
1272 		else
1273 			rowbits = 18;
1274 
1275 		if (memtype == MEM_DDR3) {
1276 			if (dmap1[i].ca11 != 0x3f)
1277 				colbits = 12;
1278 			else
1279 				colbits = 10;
1280 		}
1281 
1282 		d = &drp[i];
1283 		/* DIMM0 is present if rank0 and/or rank1 is enabled */
1284 		ranks_of_dimm[0] = d->rken0 + d->rken1;
1285 		/* DIMM1 is present if rank2 and/or rank3 is enabled */
1286 		ranks_of_dimm[1] = d->rken2 + d->rken3;
1287 
1288 		for (j = 0; j < DNV_MAX_DIMMS; j++) {
1289 			if (!ranks_of_dimm[j])
1290 				continue;
1291 
1292 			dimm = edac_get_dimm(mci, i, j, 0);
1293 			if (!dimm) {
1294 				edac_dbg(0, "No allocated DIMM for channel %d DIMM %d\n", i, j);
1295 				continue;
1296 			}
1297 
1298 			capacity = ranks_of_dimm[j] * banks * (1ul << rowbits) * (1ul << colbits);
1299 			edac_dbg(0, "Channel %d DIMM %d: %lld MByte DIMM\n", i, j, capacity >> (20 - 3));
1300 			dimm->nr_pages = MiB_TO_PAGES(capacity >> (20 - 3));
1301 			dimm->grain = 32;
1302 			dimm->dtype = dnv_dtypes[j ? d->dimmdwid0 : d->dimmdwid1];
1303 			dimm->mtype = memtype;
1304 			dimm->edac_mode = EDAC_SECDED;
1305 			snprintf(dimm->label, sizeof(dimm->label), "Chan#%d_DIMM#%d", i, j);
1306 		}
1307 	}
1308 }
1309 
1310 static int pnd2_register_mci(struct mem_ctl_info **ppmci)
1311 {
1312 	struct edac_mc_layer layers[2];
1313 	struct mem_ctl_info *mci;
1314 	struct pnd2_pvt *pvt;
1315 	int rc;
1316 
1317 	rc = ops->check_ecc();
1318 	if (rc < 0)
1319 		return rc;
1320 
1321 	/* Allocate a new MC control structure */
1322 	layers[0].type = EDAC_MC_LAYER_CHANNEL;
1323 	layers[0].size = ops->channels;
1324 	layers[0].is_virt_csrow = false;
1325 	layers[1].type = EDAC_MC_LAYER_SLOT;
1326 	layers[1].size = ops->dimms_per_channel;
1327 	layers[1].is_virt_csrow = true;
1328 	mci = edac_mc_alloc(0, ARRAY_SIZE(layers), layers, sizeof(*pvt));
1329 	if (!mci)
1330 		return -ENOMEM;
1331 
1332 	pvt = mci->pvt_info;
1333 	memset(pvt, 0, sizeof(*pvt));
1334 
1335 	mci->mod_name = EDAC_MOD_STR;
1336 	mci->dev_name = ops->name;
1337 	mci->ctl_name = "Pondicherry2";
1338 
1339 	/* Get dimm basic config and the memory layout */
1340 	ops->get_dimm_config(mci);
1341 
1342 	if (edac_mc_add_mc(mci)) {
1343 		edac_dbg(0, "MC: failed edac_mc_add_mc()\n");
1344 		edac_mc_free(mci);
1345 		return -EINVAL;
1346 	}
1347 
1348 	*ppmci = mci;
1349 
1350 	return 0;
1351 }
1352 
1353 static void pnd2_unregister_mci(struct mem_ctl_info *mci)
1354 {
1355 	if (unlikely(!mci || !mci->pvt_info)) {
1356 		pnd2_printk(KERN_ERR, "Couldn't find mci handler\n");
1357 		return;
1358 	}
1359 
1360 	/* Remove MC sysfs nodes */
1361 	edac_mc_del_mc(NULL);
1362 	edac_dbg(1, "%s: free mci struct\n", mci->ctl_name);
1363 	edac_mc_free(mci);
1364 }
1365 
1366 /*
1367  * Callback function registered with core kernel mce code.
1368  * Called once for each logged error.
1369  */
1370 static int pnd2_mce_check_error(struct notifier_block *nb, unsigned long val, void *data)
1371 {
1372 	struct mce *mce = (struct mce *)data;
1373 	struct mem_ctl_info *mci;
1374 	struct dram_addr daddr;
1375 	char *type;
1376 
1377 	mci = pnd2_mci;
1378 	if (!mci || (mce->kflags & MCE_HANDLED_CEC))
1379 		return NOTIFY_DONE;
1380 
1381 	/*
1382 	 * Just let mcelog handle it if the error is
1383 	 * outside the memory controller. A memory error
1384 	 * is indicated by bit 7 = 1 and bits = 8-11,13-15 = 0.
1385 	 * bit 12 has an special meaning.
1386 	 */
1387 	if ((mce->status & 0xefff) >> 7 != 1)
1388 		return NOTIFY_DONE;
1389 
1390 	if (mce->mcgstatus & MCG_STATUS_MCIP)
1391 		type = "Exception";
1392 	else
1393 		type = "Event";
1394 
1395 	pnd2_mc_printk(mci, KERN_INFO, "HANDLING MCE MEMORY ERROR\n");
1396 	pnd2_mc_printk(mci, KERN_INFO, "CPU %u: Machine Check %s: %llx Bank %u: %llx\n",
1397 				   mce->extcpu, type, mce->mcgstatus, mce->bank, mce->status);
1398 	pnd2_mc_printk(mci, KERN_INFO, "TSC %llx ", mce->tsc);
1399 	pnd2_mc_printk(mci, KERN_INFO, "ADDR %llx ", mce->addr);
1400 	pnd2_mc_printk(mci, KERN_INFO, "MISC %llx ", mce->misc);
1401 	pnd2_mc_printk(mci, KERN_INFO, "PROCESSOR %u:%x TIME %llu SOCKET %u APIC %x\n",
1402 				   mce->cpuvendor, mce->cpuid, mce->time, mce->socketid, mce->apicid);
1403 
1404 	pnd2_mce_output_error(mci, mce, &daddr);
1405 
1406 	/* Advice mcelog that the error were handled */
1407 	mce->kflags |= MCE_HANDLED_EDAC;
1408 	return NOTIFY_OK;
1409 }
1410 
1411 static struct notifier_block pnd2_mce_dec = {
1412 	.notifier_call	= pnd2_mce_check_error,
1413 	.priority	= MCE_PRIO_EDAC,
1414 };
1415 
1416 #ifdef CONFIG_EDAC_DEBUG
1417 /*
1418  * Write an address to this file to exercise the address decode
1419  * logic in this driver.
1420  */
1421 static u64 pnd2_fake_addr;
1422 #define PND2_BLOB_SIZE 1024
1423 static char pnd2_result[PND2_BLOB_SIZE];
1424 static struct dentry *pnd2_test;
1425 static struct debugfs_blob_wrapper pnd2_blob = {
1426 	.data = pnd2_result,
1427 	.size = 0
1428 };
1429 
1430 static int debugfs_u64_set(void *data, u64 val)
1431 {
1432 	struct dram_addr daddr;
1433 	struct mce m;
1434 
1435 	*(u64 *)data = val;
1436 	m.mcgstatus = 0;
1437 	/* ADDRV + MemRd + Unknown channel */
1438 	m.status = MCI_STATUS_ADDRV + 0x9f;
1439 	m.addr = val;
1440 	pnd2_mce_output_error(pnd2_mci, &m, &daddr);
1441 	snprintf(pnd2_blob.data, PND2_BLOB_SIZE,
1442 			 "SysAddr=%llx Channel=%d DIMM=%d Rank=%d Bank=%d Row=%d Column=%d\n",
1443 			 m.addr, daddr.chan, daddr.dimm, daddr.rank, daddr.bank, daddr.row, daddr.col);
1444 	pnd2_blob.size = strlen(pnd2_blob.data);
1445 
1446 	return 0;
1447 }
1448 DEFINE_DEBUGFS_ATTRIBUTE(fops_u64_wo, NULL, debugfs_u64_set, "%llu\n");
1449 
1450 static void setup_pnd2_debug(void)
1451 {
1452 	pnd2_test = edac_debugfs_create_dir("pnd2_test");
1453 	edac_debugfs_create_file("pnd2_debug_addr", 0200, pnd2_test,
1454 							 &pnd2_fake_addr, &fops_u64_wo);
1455 	debugfs_create_blob("pnd2_debug_results", 0400, pnd2_test, &pnd2_blob);
1456 }
1457 
1458 static void teardown_pnd2_debug(void)
1459 {
1460 	debugfs_remove_recursive(pnd2_test);
1461 }
1462 #else
1463 static void setup_pnd2_debug(void)	{}
1464 static void teardown_pnd2_debug(void)	{}
1465 #endif /* CONFIG_EDAC_DEBUG */
1466 
1467 
1468 static int pnd2_probe(void)
1469 {
1470 	int rc;
1471 
1472 	edac_dbg(2, "\n");
1473 	rc = get_registers();
1474 	if (rc)
1475 		return rc;
1476 
1477 	return pnd2_register_mci(&pnd2_mci);
1478 }
1479 
1480 static void pnd2_remove(void)
1481 {
1482 	edac_dbg(0, "\n");
1483 	pnd2_unregister_mci(pnd2_mci);
1484 }
1485 
1486 static struct dunit_ops apl_ops = {
1487 		.name			= "pnd2/apl",
1488 		.type			= APL,
1489 		.pmiaddr_shift		= LOG2_PMI_ADDR_GRANULARITY,
1490 		.pmiidx_shift		= 0,
1491 		.channels		= APL_NUM_CHANNELS,
1492 		.dimms_per_channel	= 1,
1493 		.rd_reg			= apl_rd_reg,
1494 		.get_registers		= apl_get_registers,
1495 		.check_ecc		= apl_check_ecc_active,
1496 		.mk_region		= apl_mk_region,
1497 		.get_dimm_config	= apl_get_dimm_config,
1498 		.pmi2mem		= apl_pmi2mem,
1499 };
1500 
1501 static struct dunit_ops dnv_ops = {
1502 		.name			= "pnd2/dnv",
1503 		.type			= DNV,
1504 		.pmiaddr_shift		= 0,
1505 		.pmiidx_shift		= 1,
1506 		.channels		= DNV_NUM_CHANNELS,
1507 		.dimms_per_channel	= 2,
1508 		.rd_reg			= dnv_rd_reg,
1509 		.get_registers		= dnv_get_registers,
1510 		.check_ecc		= dnv_check_ecc_active,
1511 		.mk_region		= dnv_mk_region,
1512 		.get_dimm_config	= dnv_get_dimm_config,
1513 		.pmi2mem		= dnv_pmi2mem,
1514 };
1515 
1516 static const struct x86_cpu_id pnd2_cpuids[] = {
1517 	X86_MATCH_INTEL_FAM6_MODEL(ATOM_GOLDMONT,	&apl_ops),
1518 	X86_MATCH_INTEL_FAM6_MODEL(ATOM_GOLDMONT_D,	&dnv_ops),
1519 	{ }
1520 };
1521 MODULE_DEVICE_TABLE(x86cpu, pnd2_cpuids);
1522 
1523 static int __init pnd2_init(void)
1524 {
1525 	const struct x86_cpu_id *id;
1526 	const char *owner;
1527 	int rc;
1528 
1529 	edac_dbg(2, "\n");
1530 
1531 	owner = edac_get_owner();
1532 	if (owner && strncmp(owner, EDAC_MOD_STR, sizeof(EDAC_MOD_STR)))
1533 		return -EBUSY;
1534 
1535 	if (cpu_feature_enabled(X86_FEATURE_HYPERVISOR))
1536 		return -ENODEV;
1537 
1538 	id = x86_match_cpu(pnd2_cpuids);
1539 	if (!id)
1540 		return -ENODEV;
1541 
1542 	ops = (struct dunit_ops *)id->driver_data;
1543 
1544 	if (ops->type == APL) {
1545 		p2sb_bus = pci_find_bus(0, 0);
1546 		if (!p2sb_bus)
1547 			return -ENODEV;
1548 	}
1549 
1550 	/* Ensure that the OPSTATE is set correctly for POLL or NMI */
1551 	opstate_init();
1552 
1553 	rc = pnd2_probe();
1554 	if (rc < 0) {
1555 		pnd2_printk(KERN_ERR, "Failed to register device with error %d.\n", rc);
1556 		return rc;
1557 	}
1558 
1559 	if (!pnd2_mci)
1560 		return -ENODEV;
1561 
1562 	mce_register_decode_chain(&pnd2_mce_dec);
1563 	setup_pnd2_debug();
1564 
1565 	return 0;
1566 }
1567 
1568 static void __exit pnd2_exit(void)
1569 {
1570 	edac_dbg(2, "\n");
1571 	teardown_pnd2_debug();
1572 	mce_unregister_decode_chain(&pnd2_mce_dec);
1573 	pnd2_remove();
1574 }
1575 
1576 module_init(pnd2_init);
1577 module_exit(pnd2_exit);
1578 
1579 module_param(edac_op_state, int, 0444);
1580 MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI");
1581 
1582 MODULE_LICENSE("GPL v2");
1583 MODULE_AUTHOR("Tony Luck");
1584 MODULE_DESCRIPTION("MC Driver for Intel SoC using Pondicherry memory controller");
1585