| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666 |
- // SPDX-License-Identifier: GPL-2.0
- /*
- * Driver for Intel client SoC with integrated memory controller using IBECC
- *
- * Copyright (C) 2020 Intel Corporation
- *
- * The In-Band ECC (IBECC) IP provides ECC protection to all or specific
- * regions of the physical memory space. It's used for memory controllers
- * that don't support the out-of-band ECC which often needs an additional
- * storage device to each channel for storing ECC data.
- */
- #include <linux/module.h>
- #include <linux/init.h>
- #include <linux/pci.h>
- #include <linux/slab.h>
- #include <linux/irq_work.h>
- #include <linux/llist.h>
- #include <linux/genalloc.h>
- #include <linux/edac.h>
- #include <linux/bits.h>
- #include <linux/bitfield.h>
- #include <linux/io.h>
- #include <asm/mach_traps.h>
- #include <asm/nmi.h>
- #include <asm/mce.h>
- #include "edac_mc.h"
- #include "edac_module.h"
- #define IGEN6_REVISION "v2.5.1"
- #define EDAC_MOD_STR "igen6_edac"
- #define IGEN6_NMI_NAME "igen6_ibecc"
- /* Debug macros */
- #define igen6_printk(level, fmt, arg...) \
- edac_printk(level, "igen6", fmt, ##arg)
- #define igen6_mc_printk(mci, level, fmt, arg...) \
- edac_mc_chipset_printk(mci, level, "igen6", fmt, ##arg)
- #define GET_BITFIELD(v, lo, hi) (((v) & GENMASK_ULL(hi, lo)) >> (lo))
- #define NUM_IMC 2 /* Max memory controllers */
- #define NUM_CHANNELS 2 /* Max channels */
- #define NUM_DIMMS 2 /* Max DIMMs per channel */
- #define _4GB BIT_ULL(32)
- /* Size of physical memory */
- #define TOM_OFFSET 0xa0
- /* Top of low usable DRAM */
- #define TOLUD_OFFSET 0xbc
- /* Capability register C */
- #define CAPID_C_OFFSET 0xec
- #define CAPID_C_IBECC BIT(15)
- /* Capability register E */
- #define CAPID_E_OFFSET 0xf0
- #define CAPID_E_IBECC BIT(12)
- #define CAPID_E_IBECC_BIT18 BIT(18)
- /* Error Status */
- #define ERRSTS_OFFSET 0xc8
- #define ERRSTS_CE BIT_ULL(6)
- #define ERRSTS_UE BIT_ULL(7)
- /* Error Command */
- #define ERRCMD_OFFSET 0xca
- #define ERRCMD_CE BIT_ULL(6)
- #define ERRCMD_UE BIT_ULL(7)
- /* IBECC MMIO base address */
- #define IBECC_BASE (res_cfg->ibecc_base)
- #define IBECC_ACTIVATE_OFFSET IBECC_BASE
- #define IBECC_ACTIVATE_EN BIT(0)
- /* IBECC error log */
- #define ECC_ERROR_LOG_OFFSET (IBECC_BASE + res_cfg->ibecc_error_log_offset)
- #define ECC_ERROR_LOG_CE BIT_ULL(62)
- #define ECC_ERROR_LOG_UE BIT_ULL(63)
- #define ECC_ERROR_LOG_SYND(v) GET_BITFIELD(v, 46, 61)
- /* Host MMIO base address */
- #define MCHBAR_OFFSET 0x48
- #define MCHBAR_EN BIT_ULL(0)
- #define MCHBAR_SIZE 0x10000
- /* Parameters for the channel decode stage */
- #define IMC_BASE (res_cfg->imc_base)
- #define MAD_INTER_CHANNEL_OFFSET IMC_BASE
- #define MAD_INTER_CHANNEL_DDR_TYPE(v) GET_BITFIELD(v, 0, 2)
- #define MAD_INTER_CHANNEL_ECHM(v) GET_BITFIELD(v, 3, 3)
- #define MAD_INTER_CHANNEL_CH_L_MAP(v) GET_BITFIELD(v, 4, 4)
- #define MAD_INTER_CHANNEL_CH_S_SIZE(v) ((u64)GET_BITFIELD(v, 12, 19) << 29)
- /* Parameters for DRAM decode stage */
- #define MAD_INTRA_CH0_OFFSET (IMC_BASE + 4)
- #define MAD_INTRA_CH_DIMM_L_MAP(v) GET_BITFIELD(v, 0, 0)
- /* DIMM characteristics */
- #define MAD_DIMM_CH0_OFFSET (IMC_BASE + 0xc)
- #define MAD_DIMM_CH_DIMM_L_SIZE(v) ((u64)GET_BITFIELD(v, 0, 6) << 29)
- #define MAD_DIMM_CH_DLW(v) GET_BITFIELD(v, 7, 8)
- #define MAD_DIMM_CH_DIMM_S_SIZE(v) ((u64)GET_BITFIELD(v, 16, 22) << 29)
- #define MAD_DIMM_CH_DSW(v) GET_BITFIELD(v, 24, 25)
- /* Hash for memory controller selection */
- #define MAD_MC_HASH_OFFSET (IMC_BASE + 0x1b8)
- #define MAC_MC_HASH_LSB(v) GET_BITFIELD(v, 1, 3)
- /* Hash for channel selection */
- #define CHANNEL_HASH_OFFSET (IMC_BASE + 0x24)
- /* Hash for enhanced channel selection */
- #define CHANNEL_EHASH_OFFSET (IMC_BASE + 0x28)
- #define CHANNEL_HASH_MASK(v) (GET_BITFIELD(v, 6, 19) << 6)
- #define CHANNEL_HASH_LSB_MASK_BIT(v) GET_BITFIELD(v, 24, 26)
- #define CHANNEL_HASH_MODE(v) GET_BITFIELD(v, 28, 28)
- /* Parameters for memory slice decode stage */
- #define MEM_SLICE_HASH_MASK(v) (GET_BITFIELD(v, 6, 19) << 6)
- #define MEM_SLICE_HASH_LSB_MASK_BIT(v) GET_BITFIELD(v, 24, 26)
- static struct res_config {
- bool machine_check;
- /* The number of present memory controllers. */
- int num_imc;
- /* Host MMIO configuration */
- u64 reg_mchbar_mask;
- /* Top of memory */
- u64 reg_tom_mask;
- /* Top of upper usable DRAM */
- u64 reg_touud_mask;
- /* IBECC error log */
- u64 reg_eccerrlog_addr_mask;
- u32 imc_base;
- u32 cmf_base;
- u32 cmf_size;
- u32 ms_hash_offset;
- u32 ibecc_base;
- u32 ibecc_error_log_offset;
- bool (*ibecc_available)(struct pci_dev *pdev);
- /* Extract error address logged in IBECC */
- u64 (*err_addr)(u64 ecclog);
- /* Convert error address logged in IBECC to system physical address */
- u64 (*err_addr_to_sys_addr)(u64 eaddr, int mc);
- /* Convert error address logged in IBECC to integrated memory controller address */
- u64 (*err_addr_to_imc_addr)(u64 eaddr, int mc);
- } *res_cfg;
- struct igen6_imc {
- int mc;
- struct mem_ctl_info *mci;
- struct pci_dev *pdev;
- struct device dev;
- void __iomem *window;
- u64 size;
- u64 ch_s_size;
- int ch_l_map;
- u64 dimm_s_size[NUM_CHANNELS];
- u64 dimm_l_size[NUM_CHANNELS];
- int dimm_l_map[NUM_CHANNELS];
- };
- static struct igen6_pvt {
- struct igen6_imc imc[NUM_IMC];
- u64 ms_hash;
- u64 ms_s_size;
- int ms_l_map;
- } *igen6_pvt;
- /* The top of low usable DRAM */
- static u32 igen6_tolud;
- /* The size of physical memory */
- static u64 igen6_tom;
- struct decoded_addr {
- int mc;
- u64 imc_addr;
- u64 sys_addr;
- int channel_idx;
- u64 channel_addr;
- int sub_channel_idx;
- u64 sub_channel_addr;
- };
- struct ecclog_node {
- struct llist_node llnode;
- int mc;
- u64 ecclog;
- };
- /*
- * In the NMI handler, the driver uses the lock-less memory allocator
- * to allocate memory to store the IBECC error logs and links the logs
- * to the lock-less list. Delay printk() and the work of error reporting
- * to EDAC core in a worker.
- */
- #define ECCLOG_POOL_SIZE PAGE_SIZE
- static LLIST_HEAD(ecclog_llist);
- static struct gen_pool *ecclog_pool;
- static char ecclog_buf[ECCLOG_POOL_SIZE];
- static struct irq_work ecclog_irq_work;
- static struct work_struct ecclog_work;
- /* Compute die IDs for Elkhart Lake with IBECC */
- #define DID_EHL_SKU5 0x4514
- #define DID_EHL_SKU6 0x4528
- #define DID_EHL_SKU7 0x452a
- #define DID_EHL_SKU8 0x4516
- #define DID_EHL_SKU9 0x452c
- #define DID_EHL_SKU10 0x452e
- #define DID_EHL_SKU11 0x4532
- #define DID_EHL_SKU12 0x4518
- #define DID_EHL_SKU13 0x451a
- #define DID_EHL_SKU14 0x4534
- #define DID_EHL_SKU15 0x4536
- /* Compute die IDs for ICL-NNPI with IBECC */
- #define DID_ICL_SKU8 0x4581
- #define DID_ICL_SKU10 0x4585
- #define DID_ICL_SKU11 0x4589
- #define DID_ICL_SKU12 0x458d
- /* Compute die IDs for Tiger Lake with IBECC */
- #define DID_TGL_SKU 0x9a14
- /* Compute die IDs for Alder Lake with IBECC */
- #define DID_ADL_SKU1 0x4601
- #define DID_ADL_SKU2 0x4602
- #define DID_ADL_SKU3 0x4621
- #define DID_ADL_SKU4 0x4641
- /* Compute die IDs for Alder Lake-N with IBECC */
- #define DID_ADL_N_SKU1 0x4614
- #define DID_ADL_N_SKU2 0x4617
- #define DID_ADL_N_SKU3 0x461b
- #define DID_ADL_N_SKU4 0x461c
- #define DID_ADL_N_SKU5 0x4673
- #define DID_ADL_N_SKU6 0x4674
- #define DID_ADL_N_SKU7 0x4675
- #define DID_ADL_N_SKU8 0x4677
- #define DID_ADL_N_SKU9 0x4678
- #define DID_ADL_N_SKU10 0x4679
- #define DID_ADL_N_SKU11 0x467c
- #define DID_ADL_N_SKU12 0x4632
- /* Compute die IDs for Arizona Beach with IBECC */
- #define DID_AZB_SKU1 0x4676
- /* Compute did IDs for Amston Lake with IBECC */
- #define DID_ASL_SKU1 0x464a
- #define DID_ASL_SKU2 0x4646
- #define DID_ASL_SKU3 0x4652
- /* Compute die IDs for Raptor Lake-P with IBECC */
- #define DID_RPL_P_SKU1 0xa706
- #define DID_RPL_P_SKU2 0xa707
- #define DID_RPL_P_SKU3 0xa708
- #define DID_RPL_P_SKU4 0xa716
- #define DID_RPL_P_SKU5 0xa718
- /* Compute die IDs for Meteor Lake-PS with IBECC */
- #define DID_MTL_PS_SKU1 0x7d21
- #define DID_MTL_PS_SKU2 0x7d22
- #define DID_MTL_PS_SKU3 0x7d23
- #define DID_MTL_PS_SKU4 0x7d24
- /* Compute die IDs for Meteor Lake-P with IBECC */
- #define DID_MTL_P_SKU1 0x7d01
- #define DID_MTL_P_SKU2 0x7d02
- #define DID_MTL_P_SKU3 0x7d14
- /* Compute die IDs for Arrow Lake-UH with IBECC */
- #define DID_ARL_UH_SKU1 0x7d06
- #define DID_ARL_UH_SKU2 0x7d20
- #define DID_ARL_UH_SKU3 0x7d30
- /* Compute die IDs for Panther Lake-H with IBECC */
- #define DID_PTL_H_SKU1 0xb000
- #define DID_PTL_H_SKU2 0xb001
- #define DID_PTL_H_SKU3 0xb002
- #define DID_PTL_H_SKU4 0xb003
- #define DID_PTL_H_SKU5 0xb004
- #define DID_PTL_H_SKU6 0xb005
- #define DID_PTL_H_SKU7 0xb008
- #define DID_PTL_H_SKU8 0xb011
- #define DID_PTL_H_SKU9 0xb014
- #define DID_PTL_H_SKU10 0xb015
- #define DID_PTL_H_SKU11 0xb028
- #define DID_PTL_H_SKU12 0xb029
- #define DID_PTL_H_SKU13 0xb02a
- /* Compute die IDs for Wildcat Lake with IBECC */
- #define DID_WCL_SKU1 0xfd00
- static int get_mchbar(struct pci_dev *pdev, u64 *mchbar)
- {
- union {
- u64 v;
- struct {
- u32 v_lo;
- u32 v_hi;
- };
- } u;
- if (pci_read_config_dword(pdev, MCHBAR_OFFSET, &u.v_lo)) {
- igen6_printk(KERN_ERR, "Failed to read lower MCHBAR\n");
- return -ENODEV;
- }
- if (pci_read_config_dword(pdev, MCHBAR_OFFSET + 4, &u.v_hi)) {
- igen6_printk(KERN_ERR, "Failed to read upper MCHBAR\n");
- return -ENODEV;
- }
- if (!(u.v & MCHBAR_EN)) {
- igen6_printk(KERN_ERR, "MCHBAR is disabled\n");
- return -ENODEV;
- }
- *mchbar = u.v & res_cfg->reg_mchbar_mask;
- edac_dbg(2, "MCHBAR 0x%llx (reg 0x%llx)\n", *mchbar, u.v);
- return 0;
- }
- static bool ehl_ibecc_available(struct pci_dev *pdev)
- {
- u32 v;
- if (pci_read_config_dword(pdev, CAPID_C_OFFSET, &v))
- return false;
- return !!(CAPID_C_IBECC & v);
- }
- static u64 ehl_err_addr_to_sys_addr(u64 eaddr, int mc)
- {
- return eaddr;
- }
- static u64 ehl_err_addr_to_imc_addr(u64 eaddr, int mc)
- {
- if (eaddr < igen6_tolud)
- return eaddr;
- if (igen6_tom <= _4GB)
- return eaddr + igen6_tolud - _4GB;
- if (eaddr >= igen6_tom)
- return eaddr + igen6_tolud - igen6_tom;
- return eaddr;
- }
- static bool icl_ibecc_available(struct pci_dev *pdev)
- {
- u32 v;
- if (pci_read_config_dword(pdev, CAPID_C_OFFSET, &v))
- return false;
- return !(CAPID_C_IBECC & v) &&
- (boot_cpu_data.x86_stepping >= 1);
- }
- static bool tgl_ibecc_available(struct pci_dev *pdev)
- {
- u32 v;
- if (pci_read_config_dword(pdev, CAPID_E_OFFSET, &v))
- return false;
- return !(CAPID_E_IBECC & v);
- }
- static bool mtl_p_ibecc_available(struct pci_dev *pdev)
- {
- u32 v;
- if (pci_read_config_dword(pdev, CAPID_E_OFFSET, &v))
- return false;
- return !(CAPID_E_IBECC_BIT18 & v);
- }
- static bool mtl_ps_ibecc_available(struct pci_dev *pdev)
- {
- #define MCHBAR_MEMSS_IBECCDIS 0x13c00
- void __iomem *window;
- u64 mchbar;
- u32 val;
- if (get_mchbar(pdev, &mchbar))
- return false;
- window = ioremap(mchbar, MCHBAR_SIZE * 2);
- if (!window) {
- igen6_printk(KERN_ERR, "Failed to ioremap 0x%llx\n", mchbar);
- return false;
- }
- val = readl(window + MCHBAR_MEMSS_IBECCDIS);
- iounmap(window);
- /* Bit6: 1 - IBECC is disabled, 0 - IBECC isn't disabled */
- return !GET_BITFIELD(val, 6, 6);
- }
- static u64 mem_addr_to_sys_addr(u64 maddr)
- {
- if (maddr < igen6_tolud)
- return maddr;
- if (igen6_tom <= _4GB)
- return maddr - igen6_tolud + _4GB;
- if (maddr < _4GB)
- return maddr - igen6_tolud + igen6_tom;
- return maddr;
- }
- static u64 mem_slice_hash(u64 addr, u64 mask, u64 hash_init, int intlv_bit)
- {
- u64 hash_addr = addr & mask, hash = hash_init;
- u64 intlv = (addr >> intlv_bit) & 1;
- int i;
- for (i = 6; i < 20; i++)
- hash ^= (hash_addr >> i) & 1;
- return hash ^ intlv;
- }
- static u64 tgl_err_addr_to_mem_addr(u64 eaddr, int mc)
- {
- u64 maddr, hash, mask, ms_s_size;
- int intlv_bit;
- u32 ms_hash;
- ms_s_size = igen6_pvt->ms_s_size;
- if (eaddr >= ms_s_size)
- return eaddr + ms_s_size;
- ms_hash = igen6_pvt->ms_hash;
- mask = MEM_SLICE_HASH_MASK(ms_hash);
- intlv_bit = MEM_SLICE_HASH_LSB_MASK_BIT(ms_hash) + 6;
- maddr = GET_BITFIELD(eaddr, intlv_bit, 63) << (intlv_bit + 1) |
- GET_BITFIELD(eaddr, 0, intlv_bit - 1);
- hash = mem_slice_hash(maddr, mask, mc, intlv_bit);
- return maddr | (hash << intlv_bit);
- }
- static u64 tgl_err_addr_to_sys_addr(u64 eaddr, int mc)
- {
- u64 maddr = tgl_err_addr_to_mem_addr(eaddr, mc);
- return mem_addr_to_sys_addr(maddr);
- }
- static u64 tgl_err_addr_to_imc_addr(u64 eaddr, int mc)
- {
- return eaddr;
- }
- static u64 adl_err_addr_to_sys_addr(u64 eaddr, int mc)
- {
- return mem_addr_to_sys_addr(eaddr);
- }
- static u64 adl_err_addr_to_imc_addr(u64 eaddr, int mc)
- {
- u64 imc_addr, ms_s_size = igen6_pvt->ms_s_size;
- struct igen6_imc *imc = &igen6_pvt->imc[mc];
- int intlv_bit;
- u32 mc_hash;
- if (eaddr >= 2 * ms_s_size)
- return eaddr - ms_s_size;
- mc_hash = readl(imc->window + MAD_MC_HASH_OFFSET);
- intlv_bit = MAC_MC_HASH_LSB(mc_hash) + 6;
- imc_addr = GET_BITFIELD(eaddr, intlv_bit + 1, 63) << intlv_bit |
- GET_BITFIELD(eaddr, 0, intlv_bit - 1);
- return imc_addr;
- }
- static u64 rpl_p_err_addr(u64 ecclog)
- {
- return field_get(res_cfg->reg_eccerrlog_addr_mask, ecclog);
- }
- static struct res_config ehl_cfg = {
- .num_imc = 1,
- .reg_mchbar_mask = GENMASK_ULL(38, 16),
- .reg_tom_mask = GENMASK_ULL(38, 20),
- .reg_touud_mask = GENMASK_ULL(38, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0x5000,
- .ibecc_base = 0xdc00,
- .ibecc_available = ehl_ibecc_available,
- .ibecc_error_log_offset = 0x170,
- .err_addr_to_sys_addr = ehl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = ehl_err_addr_to_imc_addr,
- };
- static struct res_config icl_cfg = {
- .num_imc = 1,
- .reg_mchbar_mask = GENMASK_ULL(38, 16),
- .reg_tom_mask = GENMASK_ULL(38, 20),
- .reg_touud_mask = GENMASK_ULL(38, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0x5000,
- .ibecc_base = 0xd800,
- .ibecc_error_log_offset = 0x170,
- .ibecc_available = icl_ibecc_available,
- .err_addr_to_sys_addr = ehl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = ehl_err_addr_to_imc_addr,
- };
- static struct res_config tgl_cfg = {
- .machine_check = true,
- .num_imc = 2,
- .reg_mchbar_mask = GENMASK_ULL(38, 17),
- .reg_tom_mask = GENMASK_ULL(38, 20),
- .reg_touud_mask = GENMASK_ULL(38, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0x5000,
- .cmf_base = 0x11000,
- .cmf_size = 0x800,
- .ms_hash_offset = 0xac,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x170,
- .ibecc_available = tgl_ibecc_available,
- .err_addr_to_sys_addr = tgl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = tgl_err_addr_to_imc_addr,
- };
- static struct res_config adl_cfg = {
- .machine_check = true,
- .num_imc = 2,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(45, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x68,
- .ibecc_available = tgl_ibecc_available,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct res_config adl_n_cfg = {
- .machine_check = true,
- .num_imc = 1,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(45, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x68,
- .ibecc_available = tgl_ibecc_available,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct res_config rpl_p_cfg = {
- .machine_check = true,
- .num_imc = 2,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(45, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x68,
- .ibecc_available = tgl_ibecc_available,
- .err_addr = rpl_p_err_addr,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct res_config mtl_ps_cfg = {
- .machine_check = true,
- .num_imc = 2,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x170,
- .ibecc_available = mtl_ps_ibecc_available,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct res_config mtl_p_cfg = {
- .machine_check = true,
- .num_imc = 2,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x170,
- .ibecc_available = mtl_p_ibecc_available,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct res_config wcl_cfg = {
- .machine_check = true,
- .num_imc = 1,
- .reg_mchbar_mask = GENMASK_ULL(41, 17),
- .reg_tom_mask = GENMASK_ULL(41, 20),
- .reg_touud_mask = GENMASK_ULL(41, 20),
- .reg_eccerrlog_addr_mask = GENMASK_ULL(38, 5),
- .imc_base = 0xd800,
- .ibecc_base = 0xd400,
- .ibecc_error_log_offset = 0x170,
- .ibecc_available = mtl_p_ibecc_available,
- .err_addr_to_sys_addr = adl_err_addr_to_sys_addr,
- .err_addr_to_imc_addr = adl_err_addr_to_imc_addr,
- };
- static struct pci_device_id igen6_pci_tbl[] = {
- { PCI_VDEVICE(INTEL, DID_EHL_SKU5), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU6), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU7), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU8), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU9), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU10), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU11), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU12), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU13), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU14), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_EHL_SKU15), (kernel_ulong_t)&ehl_cfg },
- { PCI_VDEVICE(INTEL, DID_ICL_SKU8), (kernel_ulong_t)&icl_cfg },
- { PCI_VDEVICE(INTEL, DID_ICL_SKU10), (kernel_ulong_t)&icl_cfg },
- { PCI_VDEVICE(INTEL, DID_ICL_SKU11), (kernel_ulong_t)&icl_cfg },
- { PCI_VDEVICE(INTEL, DID_ICL_SKU12), (kernel_ulong_t)&icl_cfg },
- { PCI_VDEVICE(INTEL, DID_TGL_SKU), (kernel_ulong_t)&tgl_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_SKU1), (kernel_ulong_t)&adl_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_SKU2), (kernel_ulong_t)&adl_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_SKU3), (kernel_ulong_t)&adl_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_SKU4), (kernel_ulong_t)&adl_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU1), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU2), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU3), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU4), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU5), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU6), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU7), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU8), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU9), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU10), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU11), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ADL_N_SKU12), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_AZB_SKU1), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ASL_SKU1), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ASL_SKU2), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_ASL_SKU3), (kernel_ulong_t)&adl_n_cfg },
- { PCI_VDEVICE(INTEL, DID_RPL_P_SKU1), (kernel_ulong_t)&rpl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_RPL_P_SKU2), (kernel_ulong_t)&rpl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_RPL_P_SKU3), (kernel_ulong_t)&rpl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_RPL_P_SKU4), (kernel_ulong_t)&rpl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_RPL_P_SKU5), (kernel_ulong_t)&rpl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_PS_SKU1), (kernel_ulong_t)&mtl_ps_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_PS_SKU2), (kernel_ulong_t)&mtl_ps_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_PS_SKU3), (kernel_ulong_t)&mtl_ps_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_PS_SKU4), (kernel_ulong_t)&mtl_ps_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_P_SKU1), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_P_SKU2), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_MTL_P_SKU3), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_ARL_UH_SKU1), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_ARL_UH_SKU2), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_ARL_UH_SKU3), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU1), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU2), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU3), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU4), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU5), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU6), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU7), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU8), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU9), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU10), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU11), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU12), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_PTL_H_SKU13), (kernel_ulong_t)&mtl_p_cfg },
- { PCI_VDEVICE(INTEL, DID_WCL_SKU1), (kernel_ulong_t)&wcl_cfg },
- { },
- };
- MODULE_DEVICE_TABLE(pci, igen6_pci_tbl);
- static enum dev_type get_width(int dimm_l, u32 mad_dimm)
- {
- u32 w = dimm_l ? MAD_DIMM_CH_DLW(mad_dimm) :
- MAD_DIMM_CH_DSW(mad_dimm);
- switch (w) {
- case 0:
- return DEV_X8;
- case 1:
- return DEV_X16;
- case 2:
- return DEV_X32;
- default:
- return DEV_UNKNOWN;
- }
- }
- static enum mem_type get_memory_type(u32 mad_inter)
- {
- u32 t = MAD_INTER_CHANNEL_DDR_TYPE(mad_inter);
- switch (t) {
- case 0:
- return MEM_DDR4;
- case 1:
- return MEM_DDR3;
- case 2:
- return MEM_LPDDR3;
- case 3:
- return MEM_LPDDR4;
- case 4:
- return MEM_WIO2;
- default:
- return MEM_UNKNOWN;
- }
- }
- static int decode_chan_idx(u64 addr, u64 mask, int intlv_bit)
- {
- u64 hash_addr = addr & mask, hash = 0;
- u64 intlv = (addr >> intlv_bit) & 1;
- int i;
- for (i = 6; i < 20; i++)
- hash ^= (hash_addr >> i) & 1;
- return (int)hash ^ intlv;
- }
- static u64 decode_channel_addr(u64 addr, int intlv_bit)
- {
- u64 channel_addr;
- /* Remove the interleave bit and shift upper part down to fill gap */
- channel_addr = GET_BITFIELD(addr, intlv_bit + 1, 63) << intlv_bit;
- channel_addr |= GET_BITFIELD(addr, 0, intlv_bit - 1);
- return channel_addr;
- }
- static void decode_addr(u64 addr, u32 hash, u64 s_size, int l_map,
- int *idx, u64 *sub_addr)
- {
- int intlv_bit = CHANNEL_HASH_LSB_MASK_BIT(hash) + 6;
- if (addr > 2 * s_size) {
- *sub_addr = addr - s_size;
- *idx = l_map;
- return;
- }
- if (CHANNEL_HASH_MODE(hash)) {
- *sub_addr = decode_channel_addr(addr, intlv_bit);
- *idx = decode_chan_idx(addr, CHANNEL_HASH_MASK(hash), intlv_bit);
- } else {
- *sub_addr = decode_channel_addr(addr, 6);
- *idx = GET_BITFIELD(addr, 6, 6);
- }
- }
- static int igen6_decode(struct decoded_addr *res)
- {
- struct igen6_imc *imc = &igen6_pvt->imc[res->mc];
- u64 addr = res->imc_addr, sub_addr, s_size;
- int idx, l_map;
- u32 hash;
- if (addr >= igen6_tom) {
- edac_dbg(0, "Address 0x%llx out of range\n", addr);
- return -EINVAL;
- }
- /* Decode channel */
- hash = readl(imc->window + CHANNEL_HASH_OFFSET);
- s_size = imc->ch_s_size;
- l_map = imc->ch_l_map;
- decode_addr(addr, hash, s_size, l_map, &idx, &sub_addr);
- res->channel_idx = idx;
- res->channel_addr = sub_addr;
- /* Decode sub-channel/DIMM */
- hash = readl(imc->window + CHANNEL_EHASH_OFFSET);
- s_size = imc->dimm_s_size[idx];
- l_map = imc->dimm_l_map[idx];
- decode_addr(res->channel_addr, hash, s_size, l_map, &idx, &sub_addr);
- res->sub_channel_idx = idx;
- res->sub_channel_addr = sub_addr;
- return 0;
- }
- static void igen6_output_error(struct decoded_addr *res,
- struct mem_ctl_info *mci, u64 ecclog)
- {
- enum hw_event_mc_err_type type = ecclog & ECC_ERROR_LOG_UE ?
- HW_EVENT_ERR_UNCORRECTED :
- HW_EVENT_ERR_CORRECTED;
- edac_mc_handle_error(type, mci, 1,
- res->sys_addr >> PAGE_SHIFT,
- res->sys_addr & ~PAGE_MASK,
- ECC_ERROR_LOG_SYND(ecclog),
- res->channel_idx, res->sub_channel_idx,
- -1, "", "");
- }
- static struct gen_pool *ecclog_gen_pool_create(void)
- {
- struct gen_pool *pool;
- pool = gen_pool_create(ilog2(sizeof(struct ecclog_node)), -1);
- if (!pool)
- return NULL;
- if (gen_pool_add(pool, (unsigned long)ecclog_buf, ECCLOG_POOL_SIZE, -1)) {
- gen_pool_destroy(pool);
- return NULL;
- }
- return pool;
- }
- static int ecclog_gen_pool_add(int mc, u64 ecclog)
- {
- struct ecclog_node *node;
- node = (void *)gen_pool_alloc(ecclog_pool, sizeof(*node));
- if (!node)
- return -ENOMEM;
- node->mc = mc;
- node->ecclog = ecclog;
- llist_add(&node->llnode, &ecclog_llist);
- return 0;
- }
- /*
- * Either the memory-mapped I/O status register ECC_ERROR_LOG or the PCI
- * configuration space status register ERRSTS can indicate whether a
- * correctable error or an uncorrectable error occurred. We only use the
- * ECC_ERROR_LOG register to check error type, but need to clear both
- * registers to enable future error events.
- */
- static u64 ecclog_read_and_clear(struct igen6_imc *imc)
- {
- u64 ecclog = readq(imc->window + ECC_ERROR_LOG_OFFSET);
- /*
- * Quirk: The ECC_ERROR_LOG register of certain SoCs may contain
- * the invalid value ~0. This will result in a flood of invalid
- * error reports in polling mode. Skip it.
- */
- if (ecclog == ~0)
- return 0;
- /* Neither a CE nor a UE. Skip it.*/
- if (!(ecclog & (ECC_ERROR_LOG_CE | ECC_ERROR_LOG_UE)))
- return 0;
- /* Clear CE/UE bits by writing 1s */
- writeq(ecclog, imc->window + ECC_ERROR_LOG_OFFSET);
- return ecclog;
- }
- static void errsts_clear(struct igen6_imc *imc)
- {
- u16 errsts;
- if (pci_read_config_word(imc->pdev, ERRSTS_OFFSET, &errsts)) {
- igen6_printk(KERN_ERR, "Failed to read ERRSTS\n");
- return;
- }
- /* Clear CE/UE bits by writing 1s */
- if (errsts & (ERRSTS_CE | ERRSTS_UE))
- pci_write_config_word(imc->pdev, ERRSTS_OFFSET, errsts);
- }
- static int errcmd_enable_error_reporting(bool enable)
- {
- struct igen6_imc *imc = &igen6_pvt->imc[0];
- u16 errcmd;
- int rc;
- rc = pci_read_config_word(imc->pdev, ERRCMD_OFFSET, &errcmd);
- if (rc)
- return pcibios_err_to_errno(rc);
- if (enable)
- errcmd |= ERRCMD_CE | ERRSTS_UE;
- else
- errcmd &= ~(ERRCMD_CE | ERRSTS_UE);
- rc = pci_write_config_word(imc->pdev, ERRCMD_OFFSET, errcmd);
- if (rc)
- return pcibios_err_to_errno(rc);
- return 0;
- }
- static int ecclog_handler(void)
- {
- struct igen6_imc *imc;
- int i, n = 0;
- u64 ecclog;
- for (i = 0; i < res_cfg->num_imc; i++) {
- imc = &igen6_pvt->imc[i];
- /* errsts_clear() isn't NMI-safe. Delay it in the IRQ context */
- ecclog = ecclog_read_and_clear(imc);
- if (!ecclog)
- continue;
- if (!ecclog_gen_pool_add(i, ecclog))
- irq_work_queue(&ecclog_irq_work);
- n++;
- }
- return n;
- }
- static void ecclog_work_cb(struct work_struct *work)
- {
- struct ecclog_node *node, *tmp;
- struct mem_ctl_info *mci;
- struct llist_node *head;
- struct decoded_addr res;
- u64 eaddr;
- head = llist_del_all(&ecclog_llist);
- if (!head)
- return;
- llist_for_each_entry_safe(node, tmp, head, llnode) {
- memset(&res, 0, sizeof(res));
- if (res_cfg->err_addr)
- eaddr = res_cfg->err_addr(node->ecclog);
- else
- eaddr = node->ecclog & res_cfg->reg_eccerrlog_addr_mask;
- res.mc = node->mc;
- res.sys_addr = res_cfg->err_addr_to_sys_addr(eaddr, res.mc);
- res.imc_addr = res_cfg->err_addr_to_imc_addr(eaddr, res.mc);
- mci = igen6_pvt->imc[res.mc].mci;
- edac_dbg(2, "MC %d, ecclog = 0x%llx\n", node->mc, node->ecclog);
- igen6_mc_printk(mci, KERN_DEBUG, "HANDLING IBECC MEMORY ERROR\n");
- igen6_mc_printk(mci, KERN_DEBUG, "ADDR 0x%llx ", res.sys_addr);
- if (!igen6_decode(&res))
- igen6_output_error(&res, mci, node->ecclog);
- gen_pool_free(ecclog_pool, (unsigned long)node, sizeof(*node));
- }
- }
- static void ecclog_irq_work_cb(struct irq_work *irq_work)
- {
- int i;
- for (i = 0; i < res_cfg->num_imc; i++)
- errsts_clear(&igen6_pvt->imc[i]);
- if (!llist_empty(&ecclog_llist))
- schedule_work(&ecclog_work);
- }
- static int ecclog_nmi_handler(unsigned int cmd, struct pt_regs *regs)
- {
- unsigned char reason;
- if (!ecclog_handler())
- return NMI_DONE;
- /*
- * Both In-Band ECC correctable error and uncorrectable error are
- * reported by SERR# NMI. The NMI generic code (see pci_serr_error())
- * doesn't clear the bit NMI_REASON_CLEAR_SERR (in port 0x61) to
- * re-enable the SERR# NMI after NMI handling. So clear this bit here
- * to re-enable SERR# NMI for receiving future In-Band ECC errors.
- */
- reason = x86_platform.get_nmi_reason() & NMI_REASON_CLEAR_MASK;
- reason |= NMI_REASON_CLEAR_SERR;
- outb(reason, NMI_REASON_PORT);
- reason &= ~NMI_REASON_CLEAR_SERR;
- outb(reason, NMI_REASON_PORT);
- return NMI_HANDLED;
- }
- static int ecclog_mce_handler(struct notifier_block *nb, unsigned long val,
- void *data)
- {
- struct mce *mce = (struct mce *)data;
- char *type;
- if (mce->kflags & MCE_HANDLED_CEC)
- return NOTIFY_DONE;
- /*
- * Ignore unless this is a memory related error.
- * We don't check the bit MCI_STATUS_ADDRV of MCi_STATUS here,
- * since this bit isn't set on some CPU (e.g., Tiger Lake UP3).
- */
- if ((mce->status & 0xefff) >> 7 != 1)
- return NOTIFY_DONE;
- if (mce->mcgstatus & MCG_STATUS_MCIP)
- type = "Exception";
- else
- type = "Event";
- edac_dbg(0, "CPU %d: Machine Check %s: 0x%llx Bank %d: 0x%llx\n",
- mce->extcpu, type, mce->mcgstatus,
- mce->bank, mce->status);
- edac_dbg(0, "TSC 0x%llx\n", mce->tsc);
- edac_dbg(0, "ADDR 0x%llx\n", mce->addr);
- edac_dbg(0, "MISC 0x%llx\n", mce->misc);
- edac_dbg(0, "PROCESSOR %u:0x%x TIME %llu SOCKET %u APIC 0x%x\n",
- mce->cpuvendor, mce->cpuid, mce->time,
- mce->socketid, mce->apicid);
- /*
- * We just use the Machine Check for the memory error notification.
- * Each memory controller is associated with an IBECC instance.
- * Directly read and clear the error information(error address and
- * error type) on all the IBECC instances so that we know on which
- * memory controller the memory error(s) occurred.
- */
- if (!ecclog_handler())
- return NOTIFY_DONE;
- mce->kflags |= MCE_HANDLED_EDAC;
- return NOTIFY_DONE;
- }
- static struct notifier_block ecclog_mce_dec = {
- .notifier_call = ecclog_mce_handler,
- .priority = MCE_PRIO_EDAC,
- };
- static bool igen6_check_ecc(struct igen6_imc *imc)
- {
- u32 activate = readl(imc->window + IBECC_ACTIVATE_OFFSET);
- return !!(activate & IBECC_ACTIVATE_EN);
- }
- static int igen6_get_dimm_config(struct mem_ctl_info *mci)
- {
- struct igen6_imc *imc = mci->pvt_info;
- u32 mad_inter, mad_intra, mad_dimm;
- int i, j, ndimms, mc = imc->mc;
- struct dimm_info *dimm;
- enum mem_type mtype;
- enum dev_type dtype;
- u64 dsize;
- bool ecc;
- edac_dbg(2, "\n");
- mad_inter = readl(imc->window + MAD_INTER_CHANNEL_OFFSET);
- mtype = get_memory_type(mad_inter);
- ecc = igen6_check_ecc(imc);
- imc->ch_s_size = MAD_INTER_CHANNEL_CH_S_SIZE(mad_inter);
- imc->ch_l_map = MAD_INTER_CHANNEL_CH_L_MAP(mad_inter);
- for (i = 0; i < NUM_CHANNELS; i++) {
- mad_intra = readl(imc->window + MAD_INTRA_CH0_OFFSET + i * 4);
- mad_dimm = readl(imc->window + MAD_DIMM_CH0_OFFSET + i * 4);
- imc->dimm_l_size[i] = MAD_DIMM_CH_DIMM_L_SIZE(mad_dimm);
- imc->dimm_s_size[i] = MAD_DIMM_CH_DIMM_S_SIZE(mad_dimm);
- imc->dimm_l_map[i] = MAD_INTRA_CH_DIMM_L_MAP(mad_intra);
- imc->size += imc->dimm_s_size[i];
- imc->size += imc->dimm_l_size[i];
- ndimms = 0;
- for (j = 0; j < NUM_DIMMS; j++) {
- dimm = edac_get_dimm(mci, i, j, 0);
- if (j ^ imc->dimm_l_map[i]) {
- dtype = get_width(0, mad_dimm);
- dsize = imc->dimm_s_size[i];
- } else {
- dtype = get_width(1, mad_dimm);
- dsize = imc->dimm_l_size[i];
- }
- if (!dsize)
- continue;
- dimm->grain = 64;
- dimm->mtype = mtype;
- dimm->dtype = dtype;
- dimm->nr_pages = MiB_TO_PAGES(dsize >> 20);
- dimm->edac_mode = EDAC_SECDED;
- snprintf(dimm->label, sizeof(dimm->label),
- "MC#%d_Chan#%d_DIMM#%d", mc, i, j);
- edac_dbg(0, "MC %d, Channel %d, DIMM %d, Size %llu MiB (%u pages)\n",
- mc, i, j, dsize >> 20, dimm->nr_pages);
- ndimms++;
- }
- if (ndimms && !ecc) {
- igen6_printk(KERN_ERR, "MC%d In-Band ECC is disabled\n", mc);
- return -ENODEV;
- }
- }
- edac_dbg(0, "MC %d, total size %llu MiB\n", mc, imc->size >> 20);
- return 0;
- }
- #ifdef CONFIG_EDAC_DEBUG
- /* Top of upper usable DRAM */
- static u64 igen6_touud;
- #define TOUUD_OFFSET 0xa8
- static void igen6_reg_dump(struct igen6_imc *imc)
- {
- int i;
- edac_dbg(2, "CHANNEL_HASH : 0x%x\n",
- readl(imc->window + CHANNEL_HASH_OFFSET));
- edac_dbg(2, "CHANNEL_EHASH : 0x%x\n",
- readl(imc->window + CHANNEL_EHASH_OFFSET));
- edac_dbg(2, "MAD_INTER_CHANNEL: 0x%x\n",
- readl(imc->window + MAD_INTER_CHANNEL_OFFSET));
- edac_dbg(2, "ECC_ERROR_LOG : 0x%llx\n",
- readq(imc->window + ECC_ERROR_LOG_OFFSET));
- for (i = 0; i < NUM_CHANNELS; i++) {
- edac_dbg(2, "MAD_INTRA_CH%d : 0x%x\n", i,
- readl(imc->window + MAD_INTRA_CH0_OFFSET + i * 4));
- edac_dbg(2, "MAD_DIMM_CH%d : 0x%x\n", i,
- readl(imc->window + MAD_DIMM_CH0_OFFSET + i * 4));
- }
- edac_dbg(2, "TOLUD : 0x%x", igen6_tolud);
- edac_dbg(2, "TOUUD : 0x%llx", igen6_touud);
- edac_dbg(2, "TOM : 0x%llx", igen6_tom);
- }
- static struct dentry *igen6_test;
- static int debugfs_u64_set(void *data, u64 val)
- {
- u64 ecclog;
- if ((val >= igen6_tolud && val < _4GB) || val >= igen6_touud) {
- edac_dbg(0, "Address 0x%llx out of range\n", val);
- return 0;
- }
- pr_warn_once("Fake error to 0x%llx injected via debugfs\n", val);
- ecclog = (val & res_cfg->reg_eccerrlog_addr_mask) | ECC_ERROR_LOG_CE;
- if (!ecclog_gen_pool_add(0, ecclog))
- irq_work_queue(&ecclog_irq_work);
- return 0;
- }
- DEFINE_SIMPLE_ATTRIBUTE(fops_u64_wo, NULL, debugfs_u64_set, "%llu\n");
- static void igen6_debug_setup(void)
- {
- igen6_test = edac_debugfs_create_dir("igen6_test");
- if (!igen6_test)
- return;
- if (!edac_debugfs_create_file("addr", 0200, igen6_test,
- NULL, &fops_u64_wo)) {
- debugfs_remove(igen6_test);
- igen6_test = NULL;
- }
- }
- static void igen6_debug_teardown(void)
- {
- debugfs_remove_recursive(igen6_test);
- }
- #else
- static void igen6_reg_dump(struct igen6_imc *imc) {}
- static void igen6_debug_setup(void) {}
- static void igen6_debug_teardown(void) {}
- #endif
- static int igen6_pci_setup(struct pci_dev *pdev, u64 *mchbar)
- {
- union {
- u64 v;
- struct {
- u32 v_lo;
- u32 v_hi;
- };
- } u;
- edac_dbg(2, "\n");
- if (!res_cfg->ibecc_available(pdev)) {
- edac_dbg(2, "No In-Band ECC IP\n");
- goto fail;
- }
- if (pci_read_config_dword(pdev, TOLUD_OFFSET, &igen6_tolud)) {
- igen6_printk(KERN_ERR, "Failed to read TOLUD\n");
- goto fail;
- }
- igen6_tolud &= GENMASK(31, 20);
- if (pci_read_config_dword(pdev, TOM_OFFSET, &u.v_lo)) {
- igen6_printk(KERN_ERR, "Failed to read lower TOM\n");
- goto fail;
- }
- if (pci_read_config_dword(pdev, TOM_OFFSET + 4, &u.v_hi)) {
- igen6_printk(KERN_ERR, "Failed to read upper TOM\n");
- goto fail;
- }
- igen6_tom = u.v & res_cfg->reg_tom_mask;
- if (get_mchbar(pdev, mchbar))
- goto fail;
- #ifdef CONFIG_EDAC_DEBUG
- if (pci_read_config_dword(pdev, TOUUD_OFFSET, &u.v_lo))
- edac_dbg(2, "Failed to read lower TOUUD\n");
- else if (pci_read_config_dword(pdev, TOUUD_OFFSET + 4, &u.v_hi))
- edac_dbg(2, "Failed to read upper TOUUD\n");
- else
- igen6_touud = u.v & res_cfg->reg_touud_mask;
- #endif
- return 0;
- fail:
- return -ENODEV;
- }
- static void igen6_check(struct mem_ctl_info *mci)
- {
- struct igen6_imc *imc = mci->pvt_info;
- u64 ecclog;
- /* errsts_clear() isn't NMI-safe. Delay it in the IRQ context */
- ecclog = ecclog_read_and_clear(imc);
- if (!ecclog)
- return;
- if (!ecclog_gen_pool_add(imc->mc, ecclog))
- irq_work_queue(&ecclog_irq_work);
- }
- /* Check whether the memory controller is absent. */
- static bool igen6_imc_absent(void __iomem *window)
- {
- return readl(window + MAD_INTER_CHANNEL_OFFSET) == ~0;
- }
- static int igen6_register_mci(int mc, void __iomem *window, struct pci_dev *pdev)
- {
- struct edac_mc_layer layers[2];
- struct mem_ctl_info *mci;
- struct igen6_imc *imc;
- int rc;
- edac_dbg(2, "\n");
- layers[0].type = EDAC_MC_LAYER_CHANNEL;
- layers[0].size = NUM_CHANNELS;
- layers[0].is_virt_csrow = false;
- layers[1].type = EDAC_MC_LAYER_SLOT;
- layers[1].size = NUM_DIMMS;
- layers[1].is_virt_csrow = true;
- mci = edac_mc_alloc(mc, ARRAY_SIZE(layers), layers, 0);
- if (!mci) {
- rc = -ENOMEM;
- goto fail;
- }
- mci->ctl_name = kasprintf(GFP_KERNEL, "Intel_client_SoC MC#%d", mc);
- if (!mci->ctl_name) {
- rc = -ENOMEM;
- goto fail2;
- }
- mci->mtype_cap = MEM_FLAG_LPDDR4 | MEM_FLAG_DDR4;
- mci->edac_ctl_cap = EDAC_FLAG_SECDED;
- mci->edac_cap = EDAC_FLAG_SECDED;
- mci->mod_name = EDAC_MOD_STR;
- mci->dev_name = pci_name(pdev);
- if (edac_op_state == EDAC_OPSTATE_POLL)
- mci->edac_check = igen6_check;
- mci->pvt_info = &igen6_pvt->imc[mc];
- imc = mci->pvt_info;
- device_initialize(&imc->dev);
- /*
- * EDAC core uses mci->pdev(pointer of structure device) as
- * memory controller ID. The client SoCs attach one or more
- * memory controllers to single pci_dev (single pci_dev->dev
- * can be for multiple memory controllers).
- *
- * To make mci->pdev unique, assign pci_dev->dev to mci->pdev
- * for the first memory controller and assign a unique imc->dev
- * to mci->pdev for each non-first memory controller.
- */
- mci->pdev = mc ? &imc->dev : &pdev->dev;
- imc->mc = mc;
- imc->pdev = pdev;
- imc->window = window;
- igen6_reg_dump(imc);
- rc = igen6_get_dimm_config(mci);
- if (rc)
- goto fail3;
- rc = edac_mc_add_mc(mci);
- if (rc) {
- igen6_printk(KERN_ERR, "Failed to register mci#%d\n", mc);
- goto fail3;
- }
- imc->mci = mci;
- return 0;
- fail3:
- put_device(&imc->dev);
- mci->pvt_info = NULL;
- kfree(mci->ctl_name);
- fail2:
- edac_mc_free(mci);
- fail:
- return rc;
- }
- static void igen6_unregister_mcis(void)
- {
- struct mem_ctl_info *mci;
- struct igen6_imc *imc;
- int i;
- edac_dbg(2, "\n");
- for (i = 0; i < res_cfg->num_imc; i++) {
- imc = &igen6_pvt->imc[i];
- mci = imc->mci;
- if (!mci)
- continue;
- edac_mc_del_mc(mci->pdev);
- kfree(mci->ctl_name);
- mci->pvt_info = NULL;
- edac_mc_free(mci);
- put_device(&imc->dev);
- iounmap(imc->window);
- }
- }
- static int igen6_register_mcis(struct pci_dev *pdev, u64 mchbar)
- {
- void __iomem *window;
- int lmc, pmc, rc;
- u64 base;
- for (lmc = 0, pmc = 0; pmc < NUM_IMC; pmc++) {
- base = mchbar + pmc * MCHBAR_SIZE;
- window = ioremap(base, MCHBAR_SIZE);
- if (!window) {
- igen6_printk(KERN_ERR, "Failed to ioremap 0x%llx for mc%d\n", base, pmc);
- rc = -ENOMEM;
- goto out_unregister_mcis;
- }
- if (igen6_imc_absent(window)) {
- iounmap(window);
- edac_dbg(2, "Skip absent mc%d\n", pmc);
- continue;
- }
- rc = igen6_register_mci(lmc, window, pdev);
- if (rc)
- goto out_iounmap;
- /* Done, if all present MCs are detected and registered. */
- if (++lmc >= res_cfg->num_imc)
- break;
- }
- if (!lmc) {
- igen6_printk(KERN_ERR, "No mc found.\n");
- return -ENODEV;
- }
- if (lmc < res_cfg->num_imc) {
- igen6_printk(KERN_DEBUG, "Expected %d mcs, but only %d detected.",
- res_cfg->num_imc, lmc);
- res_cfg->num_imc = lmc;
- }
- return 0;
- out_iounmap:
- iounmap(window);
- out_unregister_mcis:
- igen6_unregister_mcis();
- return rc;
- }
- static int igen6_mem_slice_setup(u64 mchbar)
- {
- struct igen6_imc *imc = &igen6_pvt->imc[0];
- u64 base = mchbar + res_cfg->cmf_base;
- u32 offset = res_cfg->ms_hash_offset;
- u32 size = res_cfg->cmf_size;
- u64 ms_s_size, ms_hash;
- void __iomem *cmf;
- int ms_l_map;
- edac_dbg(2, "\n");
- if (imc[0].size < imc[1].size) {
- ms_s_size = imc[0].size;
- ms_l_map = 1;
- } else {
- ms_s_size = imc[1].size;
- ms_l_map = 0;
- }
- igen6_pvt->ms_s_size = ms_s_size;
- igen6_pvt->ms_l_map = ms_l_map;
- edac_dbg(0, "ms_s_size: %llu MiB, ms_l_map %d\n",
- ms_s_size >> 20, ms_l_map);
- if (!size)
- return 0;
- cmf = ioremap(base, size);
- if (!cmf) {
- igen6_printk(KERN_ERR, "Failed to ioremap cmf 0x%llx\n", base);
- return -ENODEV;
- }
- ms_hash = readq(cmf + offset);
- igen6_pvt->ms_hash = ms_hash;
- edac_dbg(0, "MEM_SLICE_HASH: 0x%llx\n", ms_hash);
- iounmap(cmf);
- return 0;
- }
- static int register_err_handler(void)
- {
- int rc;
- if (res_cfg->machine_check) {
- mce_register_decode_chain(&ecclog_mce_dec);
- return 0;
- }
- rc = register_nmi_handler(NMI_SERR, ecclog_nmi_handler,
- 0, IGEN6_NMI_NAME);
- if (rc) {
- igen6_printk(KERN_ERR, "Failed to register NMI handler\n");
- return rc;
- }
- return 0;
- }
- static void unregister_err_handler(void)
- {
- if (res_cfg->machine_check) {
- mce_unregister_decode_chain(&ecclog_mce_dec);
- return;
- }
- unregister_nmi_handler(NMI_SERR, IGEN6_NMI_NAME);
- }
- static void opstate_set(const struct res_config *cfg, const struct pci_device_id *ent)
- {
- /*
- * Quirk: Certain SoCs' error reporting interrupts don't work.
- * Force polling mode for them to ensure that memory error
- * events can be handled.
- */
- if (ent->device == DID_ADL_N_SKU4) {
- edac_op_state = EDAC_OPSTATE_POLL;
- return;
- }
- /* Set the mode according to the configuration data. */
- if (cfg->machine_check)
- edac_op_state = EDAC_OPSTATE_INT;
- else
- edac_op_state = EDAC_OPSTATE_NMI;
- }
- static int igen6_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
- {
- u64 mchbar;
- int rc;
- edac_dbg(2, "\n");
- igen6_pvt = kzalloc_obj(*igen6_pvt);
- if (!igen6_pvt)
- return -ENOMEM;
- res_cfg = (struct res_config *)ent->driver_data;
- rc = igen6_pci_setup(pdev, &mchbar);
- if (rc)
- goto fail;
- opstate_set(res_cfg, ent);
- rc = igen6_register_mcis(pdev, mchbar);
- if (rc)
- goto fail;
- if (res_cfg->num_imc > 1) {
- rc = igen6_mem_slice_setup(mchbar);
- if (rc)
- goto fail2;
- }
- ecclog_pool = ecclog_gen_pool_create();
- if (!ecclog_pool) {
- rc = -ENOMEM;
- goto fail2;
- }
- INIT_WORK(&ecclog_work, ecclog_work_cb);
- init_irq_work(&ecclog_irq_work, ecclog_irq_work_cb);
- rc = register_err_handler();
- if (rc)
- goto fail3;
- /* Enable error reporting */
- rc = errcmd_enable_error_reporting(true);
- if (rc) {
- igen6_printk(KERN_ERR, "Failed to enable error reporting\n");
- goto fail4;
- }
- /* Check if any pending errors before/during the registration of the error handler */
- ecclog_handler();
- igen6_debug_setup();
- return 0;
- fail4:
- unregister_nmi_handler(NMI_SERR, IGEN6_NMI_NAME);
- fail3:
- gen_pool_destroy(ecclog_pool);
- fail2:
- igen6_unregister_mcis();
- fail:
- kfree(igen6_pvt);
- return rc;
- }
- static void igen6_remove(struct pci_dev *pdev)
- {
- edac_dbg(2, "\n");
- igen6_debug_teardown();
- errcmd_enable_error_reporting(false);
- unregister_err_handler();
- irq_work_sync(&ecclog_irq_work);
- flush_work(&ecclog_work);
- gen_pool_destroy(ecclog_pool);
- igen6_unregister_mcis();
- kfree(igen6_pvt);
- }
- static struct pci_driver igen6_driver = {
- .name = EDAC_MOD_STR,
- .probe = igen6_probe,
- .remove = igen6_remove,
- .id_table = igen6_pci_tbl,
- };
- static int __init igen6_init(void)
- {
- const char *owner;
- int rc;
- edac_dbg(2, "\n");
- if (ghes_get_devices())
- return -EBUSY;
- owner = edac_get_owner();
- if (owner && strncmp(owner, EDAC_MOD_STR, sizeof(EDAC_MOD_STR)))
- return -EBUSY;
- rc = pci_register_driver(&igen6_driver);
- if (rc)
- return rc;
- igen6_printk(KERN_INFO, "%s\n", IGEN6_REVISION);
- return 0;
- }
- static void __exit igen6_exit(void)
- {
- edac_dbg(2, "\n");
- pci_unregister_driver(&igen6_driver);
- }
- module_init(igen6_init);
- module_exit(igen6_exit);
- MODULE_LICENSE("GPL v2");
- MODULE_AUTHOR("Qiuxu Zhuo");
- MODULE_DESCRIPTION("MC Driver for Intel client SoC using In-Band ECC");
|