11772Sjl139090 /* 21772Sjl139090 * CDDL HEADER START 31772Sjl139090 * 41772Sjl139090 * The contents of this file are subject to the terms of the 51772Sjl139090 * Common Development and Distribution License (the "License"). 61772Sjl139090 * You may not use this file except in compliance with the License. 71772Sjl139090 * 81772Sjl139090 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 91772Sjl139090 * or http://www.opensolaris.org/os/licensing. 101772Sjl139090 * See the License for the specific language governing permissions 111772Sjl139090 * and limitations under the License. 121772Sjl139090 * 131772Sjl139090 * When distributing Covered Code, include this CDDL HEADER in each 141772Sjl139090 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 151772Sjl139090 * If applicable, add the following below this CDDL HEADER, with the 161772Sjl139090 * fields enclosed by brackets "[]" replaced with your own identifying 171772Sjl139090 * information: Portions Copyright [yyyy] [name of copyright owner] 181772Sjl139090 * 191772Sjl139090 * CDDL HEADER END 201772Sjl139090 */ 211772Sjl139090 /* 22*5979Sjimand * Copyright 2008 Sun Microsystems, Inc. All rights reserved. 232241Shuah * Use is subject to license terms. 242241Shuah */ 252241Shuah /* 265310Sdhain * All Rights Reserved, Copyright (c) FUJITSU LIMITED 2007 271772Sjl139090 */ 281772Sjl139090 291772Sjl139090 #pragma ident "%Z%%M% %I% %E% SMI" 301772Sjl139090 311772Sjl139090 #include <sys/types.h> 321772Sjl139090 #include <sys/sysmacros.h> 331772Sjl139090 #include <sys/conf.h> 341772Sjl139090 #include <sys/modctl.h> 351772Sjl139090 #include <sys/stat.h> 361772Sjl139090 #include <sys/async.h> 372241Shuah #include <sys/machcpuvar.h> 381772Sjl139090 #include <sys/machsystm.h> 392214Sav145390 #include <sys/promif.h> 401772Sjl139090 #include <sys/ksynch.h> 411772Sjl139090 #include <sys/ddi.h> 421772Sjl139090 #include <sys/sunddi.h> 435080Swh31274 #include <sys/sunndi.h> 441772Sjl139090 #include <sys/ddifm.h> 451772Sjl139090 #include <sys/fm/protocol.h> 461772Sjl139090 #include <sys/fm/util.h> 471772Sjl139090 #include <sys/kmem.h> 481772Sjl139090 #include <sys/fm/io/opl_mc_fm.h> 491772Sjl139090 #include <sys/memlist.h> 501772Sjl139090 #include <sys/param.h> 512214Sav145390 #include <sys/disp.h> 521772Sjl139090 #include <vm/page.h> 531772Sjl139090 #include <sys/mc-opl.h> 542214Sav145390 #include <sys/opl.h> 552214Sav145390 #include <sys/opl_dimm.h> 562214Sav145390 #include <sys/scfd/scfostoescf.h> 572494Shyw #include <sys/cpu_module.h> 582494Shyw #include <vm/seg_kmem.h> 592494Shyw #include <sys/vmem.h> 602494Shyw #include <vm/hat_sfmmu.h> 612494Shyw #include <sys/vmsystm.h> 622662Shyw #include <sys/membar.h> 631772Sjl139090 641772Sjl139090 /* 651772Sjl139090 * Function prototypes 661772Sjl139090 */ 671772Sjl139090 static int mc_open(dev_t *, int, int, cred_t *); 681772Sjl139090 static int mc_close(dev_t, int, int, cred_t *); 691772Sjl139090 static int mc_ioctl(dev_t, int, intptr_t, int, cred_t *, int *); 701772Sjl139090 static int mc_attach(dev_info_t *, ddi_attach_cmd_t); 711772Sjl139090 static int mc_detach(dev_info_t *, ddi_detach_cmd_t); 721772Sjl139090 732214Sav145390 static int mc_poll_init(void); 742214Sav145390 static void mc_poll_fini(void); 751772Sjl139090 static int mc_board_add(mc_opl_t *mcp); 761772Sjl139090 static int mc_board_del(mc_opl_t *mcp); 771772Sjl139090 static int mc_suspend(mc_opl_t *mcp, uint32_t flag); 781772Sjl139090 static int mc_resume(mc_opl_t *mcp, uint32_t flag); 792214Sav145390 int opl_mc_suspend(void); 802214Sav145390 int opl_mc_resume(void); 811772Sjl139090 821772Sjl139090 static void insert_mcp(mc_opl_t *mcp); 831772Sjl139090 static void delete_mcp(mc_opl_t *mcp); 841772Sjl139090 851772Sjl139090 static int pa_to_maddr(mc_opl_t *mcp, uint64_t pa, mc_addr_t *maddr); 861772Sjl139090 872662Shyw static int mc_rangecheck_pa(mc_opl_t *mcp, uint64_t pa); 881772Sjl139090 891772Sjl139090 int mc_get_mem_unum(int, uint64_t, char *, int, int *); 902214Sav145390 int mc_get_mem_addr(char *unum, char *sid, uint64_t offset, uint64_t *paddr); 912214Sav145390 int mc_get_mem_offset(uint64_t paddr, uint64_t *offp); 922214Sav145390 int mc_get_mem_sid(char *unum, char *buf, int buflen, int *lenp); 932214Sav145390 int mc_get_mem_sid_dimm(mc_opl_t *mcp, char *dname, char *buf, 942214Sav145390 int buflen, int *lenp); 952214Sav145390 mc_dimm_info_t *mc_get_dimm_list(mc_opl_t *mcp); 962214Sav145390 mc_dimm_info_t *mc_prepare_dimmlist(board_dimm_info_t *bd_dimmp); 972214Sav145390 int mc_set_mem_sid(mc_opl_t *mcp, char *buf, int buflen, int lsb, int bank, 982214Sav145390 uint32_t mf_type, uint32_t d_slot); 992214Sav145390 static void mc_free_dimm_list(mc_dimm_info_t *d); 1001772Sjl139090 static void mc_get_mlist(mc_opl_t *); 1012214Sav145390 static void mc_polling(void); 1022214Sav145390 static int mc_opl_get_physical_board(int); 1032214Sav145390 1045310Sdhain static void mc_clear_rewrite(mc_opl_t *mcp, int i); 1055310Sdhain static void mc_set_rewrite(mc_opl_t *mcp, int bank, uint32_t addr, int state); 1065310Sdhain 1072214Sav145390 #ifdef DEBUG 1082214Sav145390 static int mc_ioctl_debug(dev_t, int, intptr_t, int, cred_t *, int *); 1092214Sav145390 void mc_dump_dimm(char *buf, int dnamesz, int serialsz, int partnumsz); 1102214Sav145390 void mc_dump_dimm_info(board_dimm_info_t *bd_dimmp); 1112214Sav145390 #endif 1121772Sjl139090 1131772Sjl139090 #pragma weak opl_get_physical_board 1141772Sjl139090 extern int opl_get_physical_board(int); 1152214Sav145390 extern int plat_max_boards(void); 1161772Sjl139090 1171772Sjl139090 /* 1181772Sjl139090 * Configuration data structures 1191772Sjl139090 */ 1201772Sjl139090 static struct cb_ops mc_cb_ops = { 1211772Sjl139090 mc_open, /* open */ 1221772Sjl139090 mc_close, /* close */ 1231772Sjl139090 nulldev, /* strategy */ 1241772Sjl139090 nulldev, /* print */ 1251772Sjl139090 nodev, /* dump */ 1261772Sjl139090 nulldev, /* read */ 1271772Sjl139090 nulldev, /* write */ 1281772Sjl139090 mc_ioctl, /* ioctl */ 1291772Sjl139090 nodev, /* devmap */ 1301772Sjl139090 nodev, /* mmap */ 1311772Sjl139090 nodev, /* segmap */ 1321772Sjl139090 nochpoll, /* poll */ 1331772Sjl139090 ddi_prop_op, /* cb_prop_op */ 1341772Sjl139090 0, /* streamtab */ 1351772Sjl139090 D_MP | D_NEW | D_HOTPLUG, /* Driver compatibility flag */ 1361772Sjl139090 CB_REV, /* rev */ 1371772Sjl139090 nodev, /* cb_aread */ 1381772Sjl139090 nodev /* cb_awrite */ 1391772Sjl139090 }; 1401772Sjl139090 1411772Sjl139090 static struct dev_ops mc_ops = { 1421772Sjl139090 DEVO_REV, /* rev */ 1431772Sjl139090 0, /* refcnt */ 1441772Sjl139090 ddi_getinfo_1to1, /* getinfo */ 1451772Sjl139090 nulldev, /* identify */ 1461772Sjl139090 nulldev, /* probe */ 1471772Sjl139090 mc_attach, /* attach */ 1481772Sjl139090 mc_detach, /* detach */ 1491772Sjl139090 nulldev, /* reset */ 1501772Sjl139090 &mc_cb_ops, /* cb_ops */ 1511772Sjl139090 (struct bus_ops *)0, /* bus_ops */ 1521772Sjl139090 nulldev /* power */ 1531772Sjl139090 }; 1541772Sjl139090 1551772Sjl139090 /* 1561772Sjl139090 * Driver globals 1571772Sjl139090 */ 1582214Sav145390 1592214Sav145390 static enum { 1602214Sav145390 MODEL_FF1 = 0, 1612214Sav145390 MODEL_FF2 = 1, 1622214Sav145390 MODEL_DC = 2 1632214Sav145390 } plat_model = MODEL_DC; /* The default behaviour is DC */ 1642214Sav145390 1652214Sav145390 static struct plat_model_names { 1662214Sav145390 const char *unit_name; 1672214Sav145390 const char *mem_name; 1682214Sav145390 } model_names[] = { 1692214Sav145390 { "MBU_A", "MEMB" }, 1702214Sav145390 { "MBU_B", "MEMB" }, 1712214Sav145390 { "CMU", "" } 1722214Sav145390 }; 1732214Sav145390 1742214Sav145390 /* 1752214Sav145390 * The DIMM Names for DC platform. 1762214Sav145390 * The index into this table is made up of (bank, dslot), 1772214Sav145390 * Where dslot occupies bits 0-1 and bank occupies 2-4. 1782214Sav145390 */ 1792214Sav145390 static char *mc_dc_dimm_unum_table[OPL_MAX_DIMMS] = { 1802214Sav145390 /* --------CMUnn----------- */ 1812214Sav145390 /* --CS0-----|--CS1------ */ 1822214Sav145390 /* -H-|--L-- | -H- | -L-- */ 1832501Sraghuram "03A", "02A", "03B", "02B", /* Bank 0 (MAC 0 bank 0) */ 1842501Sraghuram "13A", "12A", "13B", "12B", /* Bank 1 (MAC 0 bank 1) */ 1852501Sraghuram "23A", "22A", "23B", "22B", /* Bank 2 (MAC 1 bank 0) */ 1862501Sraghuram "33A", "32A", "33B", "32B", /* Bank 3 (MAC 1 bank 1) */ 1872501Sraghuram "01A", "00A", "01B", "00B", /* Bank 4 (MAC 2 bank 0) */ 1882501Sraghuram "11A", "10A", "11B", "10B", /* Bank 5 (MAC 2 bank 1) */ 1892501Sraghuram "21A", "20A", "21B", "20B", /* Bank 6 (MAC 3 bank 0) */ 1902501Sraghuram "31A", "30A", "31B", "30B" /* Bank 7 (MAC 3 bank 1) */ 1912214Sav145390 }; 1922214Sav145390 1932214Sav145390 /* 1942214Sav145390 * The DIMM Names for FF1/FF2 platforms. 1952214Sav145390 * The index into this table is made up of (board, bank, dslot), 1962214Sav145390 * Where dslot occupies bits 0-1, bank occupies 2-4 and 1972214Sav145390 * board occupies the bit 5. 1982214Sav145390 */ 1992214Sav145390 static char *mc_ff_dimm_unum_table[2 * OPL_MAX_DIMMS] = { 2002214Sav145390 /* --------CMU0---------- */ 2012214Sav145390 /* --CS0-----|--CS1------ */ 2022214Sav145390 /* -H-|--L-- | -H- | -L-- */ 2032501Sraghuram "03A", "02A", "03B", "02B", /* Bank 0 (MAC 0 bank 0) */ 2042501Sraghuram "01A", "00A", "01B", "00B", /* Bank 1 (MAC 0 bank 1) */ 2052501Sraghuram "13A", "12A", "13B", "12B", /* Bank 2 (MAC 1 bank 0) */ 2062501Sraghuram "11A", "10A", "11B", "10B", /* Bank 3 (MAC 1 bank 1) */ 2072501Sraghuram "23A", "22A", "23B", "22B", /* Bank 4 (MAC 2 bank 0) */ 2082501Sraghuram "21A", "20A", "21B", "20B", /* Bank 5 (MAC 2 bank 1) */ 2092501Sraghuram "33A", "32A", "33B", "32B", /* Bank 6 (MAC 3 bank 0) */ 2102501Sraghuram "31A", "30A", "31B", "30B", /* Bank 7 (MAC 3 bank 1) */ 2112214Sav145390 /* --------CMU1---------- */ 2122214Sav145390 /* --CS0-----|--CS1------ */ 2132214Sav145390 /* -H-|--L-- | -H- | -L-- */ 2142501Sraghuram "43A", "42A", "43B", "42B", /* Bank 0 (MAC 0 bank 0) */ 2152501Sraghuram "41A", "40A", "41B", "40B", /* Bank 1 (MAC 0 bank 1) */ 2162501Sraghuram "53A", "52A", "53B", "52B", /* Bank 2 (MAC 1 bank 0) */ 2172501Sraghuram "51A", "50A", "51B", "50B", /* Bank 3 (MAC 1 bank 1) */ 2182501Sraghuram "63A", "62A", "63B", "62B", /* Bank 4 (MAC 2 bank 0) */ 2192501Sraghuram "61A", "60A", "61B", "60B", /* Bank 5 (MAC 2 bank 1) */ 2202501Sraghuram "73A", "72A", "73B", "72B", /* Bank 6 (MAC 3 bank 0) */ 2212501Sraghuram "71A", "70A", "71B", "70B" /* Bank 7 (MAC 3 bank 1) */ 2222214Sav145390 }; 2232214Sav145390 2242214Sav145390 #define BD_BK_SLOT_TO_INDEX(bd, bk, s) \ 2252214Sav145390 (((bd & 0x01) << 5) | ((bk & 0x07) << 2) | (s & 0x03)) 2262214Sav145390 2272214Sav145390 #define INDEX_TO_BANK(i) (((i) & 0x1C) >> 2) 2282214Sav145390 #define INDEX_TO_SLOT(i) ((i) & 0x03) 2292214Sav145390 2303045Sav145390 #define SLOT_TO_CS(slot) ((slot & 0x3) >> 1) 2313045Sav145390 2322214Sav145390 /* Isolation unit size is 64 MB */ 2332214Sav145390 #define MC_ISOLATION_BSIZE (64 * 1024 * 1024) 2342214Sav145390 2352214Sav145390 #define MC_MAX_SPEEDS 7 2362214Sav145390 2372214Sav145390 typedef struct { 2382214Sav145390 uint32_t mc_speeds; 2392214Sav145390 uint32_t mc_period; 2402214Sav145390 } mc_scan_speed_t; 2412214Sav145390 2422214Sav145390 #define MC_CNTL_SPEED_SHIFT 26 2432214Sav145390 2442867Shyw /* 2452867Shyw * In mirror mode, we normalized the bank idx to "even" since 2462867Shyw * the HW treats them as one unit w.r.t programming. 2472867Shyw * This bank index will be the "effective" bank index. 2482867Shyw * All mirrored bank state info on mc_period, mc_speedup_period 2492867Shyw * will be stored in the even bank structure to avoid code duplication. 2502867Shyw */ 2512867Shyw #define MIRROR_IDX(bankidx) (bankidx & ~1) 2522867Shyw 2532214Sav145390 static mc_scan_speed_t mc_scan_speeds[MC_MAX_SPEEDS] = { 2542214Sav145390 {0x6 << MC_CNTL_SPEED_SHIFT, 0}, 2552214Sav145390 {0x5 << MC_CNTL_SPEED_SHIFT, 32}, 2562214Sav145390 {0x4 << MC_CNTL_SPEED_SHIFT, 64}, 2572214Sav145390 {0x3 << MC_CNTL_SPEED_SHIFT, 128}, 2582214Sav145390 {0x2 << MC_CNTL_SPEED_SHIFT, 256}, 2592214Sav145390 {0x1 << MC_CNTL_SPEED_SHIFT, 512}, 2602214Sav145390 {0x0 << MC_CNTL_SPEED_SHIFT, 1024} 2612214Sav145390 }; 2622214Sav145390 2632214Sav145390 static uint32_t mc_max_speed = (0x6 << 26); 2642214Sav145390 2652214Sav145390 int mc_isolation_bsize = MC_ISOLATION_BSIZE; 2662214Sav145390 int mc_patrol_interval_sec = MC_PATROL_INTERVAL_SEC; 2672214Sav145390 int mc_max_scf_retry = 16; 2682214Sav145390 int mc_max_scf_logs = 64; 2692214Sav145390 int mc_max_errlog_processed = BANKNUM_PER_SB*2; 2702214Sav145390 int mc_scan_period = 12 * 60 * 60; /* 12 hours period */ 2712214Sav145390 int mc_max_rewrite_loop = 100; 2722214Sav145390 int mc_rewrite_delay = 10; 2732214Sav145390 /* 2742214Sav145390 * it takes SCF about 300 m.s. to process a requst. We can bail out 2752214Sav145390 * if it is busy. It does not pay to wait for it too long. 2762214Sav145390 */ 2772214Sav145390 int mc_max_scf_loop = 2; 2782214Sav145390 int mc_scf_delay = 100; 2792214Sav145390 int mc_pce_dropped = 0; 2802214Sav145390 int mc_poll_priority = MINCLSYSPRI; 2815310Sdhain int mc_max_rewrite_retry = 6 * 60; 2822214Sav145390 2832214Sav145390 2842214Sav145390 /* 2853152Sav145390 * Mutex hierarchy in mc-opl 2862214Sav145390 * If both mcmutex and mc_lock must be held, 2872214Sav145390 * mcmutex must be acquired first, and then mc_lock. 2882214Sav145390 */ 2892214Sav145390 2901772Sjl139090 static kmutex_t mcmutex; 2912214Sav145390 mc_opl_t *mc_instances[OPL_MAX_BOARDS]; 2922214Sav145390 2932214Sav145390 static kmutex_t mc_polling_lock; 2942214Sav145390 static kcondvar_t mc_polling_cv; 2952214Sav145390 static kcondvar_t mc_poll_exit_cv; 2962214Sav145390 static int mc_poll_cmd = 0; 2972214Sav145390 static int mc_pollthr_running = 0; 2982214Sav145390 int mc_timeout_period = 0; /* this is in m.s. */ 2991772Sjl139090 void *mc_statep; 3001772Sjl139090 3011772Sjl139090 #ifdef DEBUG 3021809Shyw int oplmc_debug = 0; 3031772Sjl139090 #endif 3041772Sjl139090 3052214Sav145390 static int mc_debug_show_all = 0; 3061772Sjl139090 3071772Sjl139090 extern struct mod_ops mod_driverops; 3081772Sjl139090 3091772Sjl139090 static struct modldrv modldrv = { 3101772Sjl139090 &mod_driverops, /* module type, this one is a driver */ 3112214Sav145390 "OPL Memory-controller %I%", /* module name */ 3121772Sjl139090 &mc_ops, /* driver ops */ 3131772Sjl139090 }; 3141772Sjl139090 3151772Sjl139090 static struct modlinkage modlinkage = { 3161772Sjl139090 MODREV_1, /* rev */ 3171772Sjl139090 (void *)&modldrv, 3181772Sjl139090 NULL 3191772Sjl139090 }; 3201772Sjl139090 3211772Sjl139090 #pragma weak opl_get_mem_unum 3222214Sav145390 #pragma weak opl_get_mem_sid 3232214Sav145390 #pragma weak opl_get_mem_offset 3242214Sav145390 #pragma weak opl_get_mem_addr 3252214Sav145390 3261772Sjl139090 extern int (*opl_get_mem_unum)(int, uint64_t, char *, int, int *); 3272214Sav145390 extern int (*opl_get_mem_sid)(char *unum, char *buf, int buflen, int *lenp); 3282214Sav145390 extern int (*opl_get_mem_offset)(uint64_t paddr, uint64_t *offp); 3292214Sav145390 extern int (*opl_get_mem_addr)(char *unum, char *sid, uint64_t offset, 3302214Sav145390 uint64_t *paddr); 3312214Sav145390 3321772Sjl139090 3331772Sjl139090 /* 3341772Sjl139090 * pseudo-mc node portid format 3351772Sjl139090 * 3361772Sjl139090 * [10] = 0 3371772Sjl139090 * [9] = 1 3381772Sjl139090 * [8] = LSB_ID[4] = 0 3391772Sjl139090 * [7:4] = LSB_ID[3:0] 3401772Sjl139090 * [3:0] = 0 3411772Sjl139090 * 3421772Sjl139090 */ 3431772Sjl139090 3441772Sjl139090 /* 3451772Sjl139090 * These are the module initialization routines. 3461772Sjl139090 */ 3471772Sjl139090 int 3481772Sjl139090 _init(void) 3491772Sjl139090 { 3502214Sav145390 int error; 3512214Sav145390 int plen; 3522214Sav145390 char model[20]; 3532214Sav145390 pnode_t node; 3541772Sjl139090 3551772Sjl139090 3561772Sjl139090 if ((error = ddi_soft_state_init(&mc_statep, 3571772Sjl139090 sizeof (mc_opl_t), 1)) != 0) 3581772Sjl139090 return (error); 3591772Sjl139090 3602214Sav145390 if ((error = mc_poll_init()) != 0) { 3612214Sav145390 ddi_soft_state_fini(&mc_statep); 3622214Sav145390 return (error); 3632214Sav145390 } 3642214Sav145390 3651772Sjl139090 mutex_init(&mcmutex, NULL, MUTEX_DRIVER, NULL); 3661772Sjl139090 if (&opl_get_mem_unum) 3671772Sjl139090 opl_get_mem_unum = mc_get_mem_unum; 3682214Sav145390 if (&opl_get_mem_sid) 3692214Sav145390 opl_get_mem_sid = mc_get_mem_sid; 3702214Sav145390 if (&opl_get_mem_offset) 3712214Sav145390 opl_get_mem_offset = mc_get_mem_offset; 3722214Sav145390 if (&opl_get_mem_addr) 3732214Sav145390 opl_get_mem_addr = mc_get_mem_addr; 3742214Sav145390 3752214Sav145390 node = prom_rootnode(); 3762214Sav145390 plen = prom_getproplen(node, "model"); 3772214Sav145390 3782214Sav145390 if (plen > 0 && plen < sizeof (model)) { 3792214Sav145390 (void) prom_getprop(node, "model", model); 3802214Sav145390 model[plen] = '\0'; 3812214Sav145390 if (strcmp(model, "FF1") == 0) 3822214Sav145390 plat_model = MODEL_FF1; 3832214Sav145390 else if (strcmp(model, "FF2") == 0) 3842214Sav145390 plat_model = MODEL_FF2; 3852214Sav145390 else if (strncmp(model, "DC", 2) == 0) 3862214Sav145390 plat_model = MODEL_DC; 3872214Sav145390 } 3881772Sjl139090 3891772Sjl139090 error = mod_install(&modlinkage); 3901772Sjl139090 if (error != 0) { 3911772Sjl139090 if (&opl_get_mem_unum) 3921772Sjl139090 opl_get_mem_unum = NULL; 3932214Sav145390 if (&opl_get_mem_sid) 3942214Sav145390 opl_get_mem_sid = NULL; 3952214Sav145390 if (&opl_get_mem_offset) 3962214Sav145390 opl_get_mem_offset = NULL; 3972214Sav145390 if (&opl_get_mem_addr) 3982214Sav145390 opl_get_mem_addr = NULL; 3991772Sjl139090 mutex_destroy(&mcmutex); 4002214Sav145390 mc_poll_fini(); 4011772Sjl139090 ddi_soft_state_fini(&mc_statep); 4021772Sjl139090 } 4031772Sjl139090 return (error); 4041772Sjl139090 } 4051772Sjl139090 4061772Sjl139090 int 4071772Sjl139090 _fini(void) 4081772Sjl139090 { 4091772Sjl139090 int error; 4101772Sjl139090 4111772Sjl139090 if ((error = mod_remove(&modlinkage)) != 0) 4121772Sjl139090 return (error); 4131772Sjl139090 4141772Sjl139090 if (&opl_get_mem_unum) 4151772Sjl139090 opl_get_mem_unum = NULL; 4162214Sav145390 if (&opl_get_mem_sid) 4172214Sav145390 opl_get_mem_sid = NULL; 4182214Sav145390 if (&opl_get_mem_offset) 4192214Sav145390 opl_get_mem_offset = NULL; 4202214Sav145390 if (&opl_get_mem_addr) 4212214Sav145390 opl_get_mem_addr = NULL; 4222214Sav145390 4232214Sav145390 mutex_destroy(&mcmutex); 4242214Sav145390 mc_poll_fini(); 4251772Sjl139090 ddi_soft_state_fini(&mc_statep); 4261772Sjl139090 4271772Sjl139090 return (0); 4281772Sjl139090 } 4291772Sjl139090 4301772Sjl139090 int 4311772Sjl139090 _info(struct modinfo *modinfop) 4321772Sjl139090 { 4331772Sjl139090 return (mod_info(&modlinkage, modinfop)); 4341772Sjl139090 } 4351772Sjl139090 4362214Sav145390 static void 4372214Sav145390 mc_polling_thread() 4382214Sav145390 { 4392214Sav145390 mutex_enter(&mc_polling_lock); 4402214Sav145390 mc_pollthr_running = 1; 4412214Sav145390 while (!(mc_poll_cmd & MC_POLL_EXIT)) { 4422214Sav145390 mc_polling(); 4432214Sav145390 cv_timedwait(&mc_polling_cv, &mc_polling_lock, 4442214Sav145390 ddi_get_lbolt() + mc_timeout_period); 4452214Sav145390 } 4462214Sav145390 mc_pollthr_running = 0; 4472214Sav145390 4482214Sav145390 /* 4492214Sav145390 * signal if any one is waiting for this thread to exit. 4502214Sav145390 */ 4512214Sav145390 cv_signal(&mc_poll_exit_cv); 4522214Sav145390 mutex_exit(&mc_polling_lock); 4532214Sav145390 thread_exit(); 4542214Sav145390 /* NOTREACHED */ 4552214Sav145390 } 4562214Sav145390 4572214Sav145390 static int 4582214Sav145390 mc_poll_init() 4592214Sav145390 { 4602214Sav145390 mutex_init(&mc_polling_lock, NULL, MUTEX_DRIVER, NULL); 4612214Sav145390 cv_init(&mc_polling_cv, NULL, CV_DRIVER, NULL); 4622214Sav145390 cv_init(&mc_poll_exit_cv, NULL, CV_DRIVER, NULL); 4632214Sav145390 return (0); 4642214Sav145390 } 4652214Sav145390 4662214Sav145390 static void 4672214Sav145390 mc_poll_fini() 4682214Sav145390 { 4692214Sav145390 mutex_enter(&mc_polling_lock); 4702214Sav145390 if (mc_pollthr_running) { 4712214Sav145390 mc_poll_cmd = MC_POLL_EXIT; 4722214Sav145390 cv_signal(&mc_polling_cv); 4732214Sav145390 while (mc_pollthr_running) { 4742214Sav145390 cv_wait(&mc_poll_exit_cv, &mc_polling_lock); 4752214Sav145390 } 4762214Sav145390 } 4772214Sav145390 mutex_exit(&mc_polling_lock); 4782214Sav145390 mutex_destroy(&mc_polling_lock); 4792214Sav145390 cv_destroy(&mc_polling_cv); 4802214Sav145390 cv_destroy(&mc_poll_exit_cv); 4812214Sav145390 } 4822214Sav145390 4831772Sjl139090 static int 4841772Sjl139090 mc_attach(dev_info_t *devi, ddi_attach_cmd_t cmd) 4851772Sjl139090 { 4861772Sjl139090 mc_opl_t *mcp; 4871772Sjl139090 int instance; 4882214Sav145390 int rv; 4891772Sjl139090 4901772Sjl139090 /* get the instance of this devi */ 4911772Sjl139090 instance = ddi_get_instance(devi); 4921772Sjl139090 4931772Sjl139090 switch (cmd) { 4941772Sjl139090 case DDI_ATTACH: 4951772Sjl139090 break; 4961772Sjl139090 case DDI_RESUME: 4971772Sjl139090 mcp = ddi_get_soft_state(mc_statep, instance); 4982214Sav145390 rv = mc_resume(mcp, MC_DRIVER_SUSPENDED); 4992214Sav145390 return (rv); 5001772Sjl139090 default: 5011772Sjl139090 return (DDI_FAILURE); 5021772Sjl139090 } 5031772Sjl139090 5041772Sjl139090 if (ddi_soft_state_zalloc(mc_statep, instance) != DDI_SUCCESS) 5051772Sjl139090 return (DDI_FAILURE); 5061772Sjl139090 5071772Sjl139090 if ((mcp = ddi_get_soft_state(mc_statep, instance)) == NULL) { 5081772Sjl139090 goto bad; 5091772Sjl139090 } 5101772Sjl139090 5112214Sav145390 if (mc_timeout_period == 0) { 5122214Sav145390 mc_patrol_interval_sec = (int)ddi_getprop(DDI_DEV_T_ANY, devi, 5135080Swh31274 DDI_PROP_DONTPASS, "mc-timeout-interval-sec", 5145080Swh31274 mc_patrol_interval_sec); 5155080Swh31274 mc_timeout_period = drv_usectohz(1000000 * 5165080Swh31274 mc_patrol_interval_sec / OPL_MAX_BOARDS); 5172214Sav145390 } 5182214Sav145390 5191772Sjl139090 /* set informations in mc state */ 5201772Sjl139090 mcp->mc_dip = devi; 5211772Sjl139090 5221772Sjl139090 if (mc_board_add(mcp)) 5231772Sjl139090 goto bad; 5241772Sjl139090 5251772Sjl139090 insert_mcp(mcp); 5262214Sav145390 5272214Sav145390 /* 5282214Sav145390 * Start the polling thread if it is not running already. 5292214Sav145390 */ 5302214Sav145390 mutex_enter(&mc_polling_lock); 5312214Sav145390 if (!mc_pollthr_running) { 5322214Sav145390 (void) thread_create(NULL, 0, (void (*)())mc_polling_thread, 5335080Swh31274 NULL, 0, &p0, TS_RUN, mc_poll_priority); 5342214Sav145390 } 5352214Sav145390 mutex_exit(&mc_polling_lock); 5361772Sjl139090 ddi_report_dev(devi); 5371772Sjl139090 5381772Sjl139090 return (DDI_SUCCESS); 5391772Sjl139090 5401772Sjl139090 bad: 5411772Sjl139090 ddi_soft_state_free(mc_statep, instance); 5421772Sjl139090 return (DDI_FAILURE); 5431772Sjl139090 } 5441772Sjl139090 5451772Sjl139090 /* ARGSUSED */ 5461772Sjl139090 static int 5471772Sjl139090 mc_detach(dev_info_t *devi, ddi_detach_cmd_t cmd) 5481772Sjl139090 { 5492214Sav145390 int rv; 5501772Sjl139090 int instance; 5511772Sjl139090 mc_opl_t *mcp; 5521772Sjl139090 5531772Sjl139090 /* get the instance of this devi */ 5541772Sjl139090 instance = ddi_get_instance(devi); 5551772Sjl139090 if ((mcp = ddi_get_soft_state(mc_statep, instance)) == NULL) { 5561772Sjl139090 return (DDI_FAILURE); 5571772Sjl139090 } 5581772Sjl139090 5591772Sjl139090 switch (cmd) { 5601772Sjl139090 case DDI_SUSPEND: 5612214Sav145390 rv = mc_suspend(mcp, MC_DRIVER_SUSPENDED); 5622214Sav145390 return (rv); 5631772Sjl139090 case DDI_DETACH: 5641772Sjl139090 break; 5651772Sjl139090 default: 5661772Sjl139090 return (DDI_FAILURE); 5671772Sjl139090 } 5681772Sjl139090 5692214Sav145390 delete_mcp(mcp); 5701772Sjl139090 if (mc_board_del(mcp) != DDI_SUCCESS) { 5711772Sjl139090 return (DDI_FAILURE); 5721772Sjl139090 } 5731772Sjl139090 5741772Sjl139090 /* free up the soft state */ 5751772Sjl139090 ddi_soft_state_free(mc_statep, instance); 5761772Sjl139090 5771772Sjl139090 return (DDI_SUCCESS); 5781772Sjl139090 } 5791772Sjl139090 5801772Sjl139090 /* ARGSUSED */ 5811772Sjl139090 static int 5821772Sjl139090 mc_open(dev_t *devp, int flag, int otyp, cred_t *credp) 5831772Sjl139090 { 5841772Sjl139090 return (0); 5851772Sjl139090 } 5861772Sjl139090 5871772Sjl139090 /* ARGSUSED */ 5881772Sjl139090 static int 5891772Sjl139090 mc_close(dev_t devp, int flag, int otyp, cred_t *credp) 5901772Sjl139090 { 5911772Sjl139090 return (0); 5921772Sjl139090 } 5931772Sjl139090 5941772Sjl139090 /* ARGSUSED */ 5951772Sjl139090 static int 5961772Sjl139090 mc_ioctl(dev_t dev, int cmd, intptr_t arg, int mode, cred_t *credp, 5971772Sjl139090 int *rvalp) 5981772Sjl139090 { 5992214Sav145390 #ifdef DEBUG 6002214Sav145390 return (mc_ioctl_debug(dev, cmd, arg, mode, credp, rvalp)); 6012214Sav145390 #else 6021772Sjl139090 return (ENXIO); 6032214Sav145390 #endif 6041772Sjl139090 } 6051772Sjl139090 6061772Sjl139090 /* 6071772Sjl139090 * PA validity check: 6082662Shyw * This function return 1 if the PA is a valid PA 6092662Shyw * in the running Solaris instance i.e. in physinstall 6102662Shyw * Otherwise, return 0. 6111772Sjl139090 */ 6121772Sjl139090 6131772Sjl139090 /* ARGSUSED */ 6141772Sjl139090 static int 6151772Sjl139090 pa_is_valid(mc_opl_t *mcp, uint64_t addr) 6161772Sjl139090 { 6171772Sjl139090 if (mcp->mlist == NULL) 6181772Sjl139090 mc_get_mlist(mcp); 6191772Sjl139090 6201772Sjl139090 if (mcp->mlist && address_in_memlist(mcp->mlist, addr, 0)) { 6211772Sjl139090 return (1); 6221772Sjl139090 } 6231772Sjl139090 return (0); 6241772Sjl139090 } 6251772Sjl139090 6261772Sjl139090 /* 6271772Sjl139090 * mac-pa translation routines. 6281772Sjl139090 * 6291772Sjl139090 * Input: mc driver state, (LSB#, Bank#, DIMM address) 6301772Sjl139090 * Output: physical address 6311772Sjl139090 * 6321772Sjl139090 * Valid - return value: 0 6331772Sjl139090 * Invalid - return value: -1 6341772Sjl139090 */ 6351772Sjl139090 static int 6361772Sjl139090 mcaddr_to_pa(mc_opl_t *mcp, mc_addr_t *maddr, uint64_t *pa) 6371772Sjl139090 { 6381772Sjl139090 int i; 6391772Sjl139090 uint64_t pa_offset = 0; 6401772Sjl139090 int cs = (maddr->ma_dimm_addr >> CS_SHIFT) & 1; 6411772Sjl139090 int bank = maddr->ma_bank; 6421772Sjl139090 mc_addr_t maddr1; 6431772Sjl139090 int bank0, bank1; 6441772Sjl139090 6451772Sjl139090 MC_LOG("mcaddr /LSB%d/B%d/%x\n", maddr->ma_bd, bank, 6465080Swh31274 maddr->ma_dimm_addr); 6471772Sjl139090 6481772Sjl139090 /* loc validity check */ 6491772Sjl139090 ASSERT(maddr->ma_bd >= 0 && OPL_BOARD_MAX > maddr->ma_bd); 6501772Sjl139090 ASSERT(bank >= 0 && OPL_BANK_MAX > bank); 6511772Sjl139090 6521772Sjl139090 /* Do translation */ 6531772Sjl139090 for (i = 0; i < PA_BITS_FOR_MAC; i++) { 6541772Sjl139090 int pa_bit = 0; 6551772Sjl139090 int mc_bit = mcp->mc_trans_table[cs][i]; 6561772Sjl139090 if (mc_bit < MC_ADDRESS_BITS) { 6571772Sjl139090 pa_bit = (maddr->ma_dimm_addr >> mc_bit) & 1; 6581772Sjl139090 } else if (mc_bit == MP_NONE) { 6591772Sjl139090 pa_bit = 0; 6601772Sjl139090 } else if (mc_bit == MP_BANK_0) { 6611772Sjl139090 pa_bit = bank & 1; 6621772Sjl139090 } else if (mc_bit == MP_BANK_1) { 6631772Sjl139090 pa_bit = (bank >> 1) & 1; 6641772Sjl139090 } else if (mc_bit == MP_BANK_2) { 6651772Sjl139090 pa_bit = (bank >> 2) & 1; 6661772Sjl139090 } 6671772Sjl139090 pa_offset |= ((uint64_t)pa_bit) << i; 6681772Sjl139090 } 6691772Sjl139090 *pa = mcp->mc_start_address + pa_offset; 6701772Sjl139090 MC_LOG("pa = %lx\n", *pa); 6711772Sjl139090 6721772Sjl139090 if (pa_to_maddr(mcp, *pa, &maddr1) == -1) { 6732214Sav145390 cmn_err(CE_WARN, "mcaddr_to_pa: /LSB%d/B%d/%x failed to " 6742214Sav145390 "convert PA %lx\n", maddr->ma_bd, bank, 6752214Sav145390 maddr->ma_dimm_addr, *pa); 6761772Sjl139090 return (-1); 6771772Sjl139090 } 6781772Sjl139090 6792214Sav145390 /* 6802214Sav145390 * In mirror mode, PA is always translated to the even bank. 6812214Sav145390 */ 6821772Sjl139090 if (IS_MIRROR(mcp, maddr->ma_bank)) { 6831772Sjl139090 bank0 = maddr->ma_bank & ~(1); 6841772Sjl139090 bank1 = maddr1.ma_bank & ~(1); 6851772Sjl139090 } else { 6861772Sjl139090 bank0 = maddr->ma_bank; 6871772Sjl139090 bank1 = maddr1.ma_bank; 6881772Sjl139090 } 6891772Sjl139090 /* 6901772Sjl139090 * there is no need to check ma_bd because it is generated from 6911772Sjl139090 * mcp. They are the same. 6921772Sjl139090 */ 6935080Swh31274 if ((bank0 == bank1) && (maddr->ma_dimm_addr == 6945080Swh31274 maddr1.ma_dimm_addr)) { 6951772Sjl139090 return (0); 6961772Sjl139090 } else { 6971772Sjl139090 cmn_err(CE_WARN, "Translation error source /LSB%d/B%d/%x, " 6985080Swh31274 "PA %lx, target /LSB%d/B%d/%x\n", maddr->ma_bd, bank, 6995080Swh31274 maddr->ma_dimm_addr, *pa, maddr1.ma_bd, maddr1.ma_bank, 7005080Swh31274 maddr1.ma_dimm_addr); 7011772Sjl139090 return (-1); 7021772Sjl139090 } 7031772Sjl139090 } 7041772Sjl139090 7051772Sjl139090 /* 7061772Sjl139090 * PA to CS (used by pa_to_maddr). 7071772Sjl139090 */ 7081772Sjl139090 static int 7091772Sjl139090 pa_to_cs(mc_opl_t *mcp, uint64_t pa_offset) 7101772Sjl139090 { 7111772Sjl139090 int i; 7122662Shyw int cs = 1; 7131772Sjl139090 7141772Sjl139090 for (i = 0; i < PA_BITS_FOR_MAC; i++) { 7151772Sjl139090 /* MAC address bit<29> is arranged on the same PA bit */ 7161772Sjl139090 /* on both table. So we may use any table. */ 7171772Sjl139090 if (mcp->mc_trans_table[0][i] == CS_SHIFT) { 7181772Sjl139090 cs = (pa_offset >> i) & 1; 7191772Sjl139090 break; 7201772Sjl139090 } 7211772Sjl139090 } 7221772Sjl139090 return (cs); 7231772Sjl139090 } 7241772Sjl139090 7251772Sjl139090 /* 7261772Sjl139090 * PA to DIMM (used by pa_to_maddr). 7271772Sjl139090 */ 7281772Sjl139090 /* ARGSUSED */ 7291772Sjl139090 static uint32_t 7301772Sjl139090 pa_to_dimm(mc_opl_t *mcp, uint64_t pa_offset) 7311772Sjl139090 { 7321772Sjl139090 int i; 7331772Sjl139090 int cs = pa_to_cs(mcp, pa_offset); 7341772Sjl139090 uint32_t dimm_addr = 0; 7351772Sjl139090 7361772Sjl139090 for (i = 0; i < PA_BITS_FOR_MAC; i++) { 7371772Sjl139090 int pa_bit_value = (pa_offset >> i) & 1; 7381772Sjl139090 int mc_bit = mcp->mc_trans_table[cs][i]; 7391772Sjl139090 if (mc_bit < MC_ADDRESS_BITS) { 7401772Sjl139090 dimm_addr |= pa_bit_value << mc_bit; 7411772Sjl139090 } 7421772Sjl139090 } 7432662Shyw dimm_addr |= cs << CS_SHIFT; 7441772Sjl139090 return (dimm_addr); 7451772Sjl139090 } 7461772Sjl139090 7471772Sjl139090 /* 7481772Sjl139090 * PA to Bank (used by pa_to_maddr). 7491772Sjl139090 */ 7501772Sjl139090 static int 7511772Sjl139090 pa_to_bank(mc_opl_t *mcp, uint64_t pa_offset) 7521772Sjl139090 { 7531772Sjl139090 int i; 7541772Sjl139090 int cs = pa_to_cs(mcp, pa_offset); 7551772Sjl139090 int bankno = mcp->mc_trans_table[cs][INDEX_OF_BANK_SUPPLEMENT_BIT]; 7561772Sjl139090 7571772Sjl139090 7581772Sjl139090 for (i = 0; i < PA_BITS_FOR_MAC; i++) { 7591772Sjl139090 int pa_bit_value = (pa_offset >> i) & 1; 7601772Sjl139090 int mc_bit = mcp->mc_trans_table[cs][i]; 7611772Sjl139090 switch (mc_bit) { 7621772Sjl139090 case MP_BANK_0: 7631772Sjl139090 bankno |= pa_bit_value; 7641772Sjl139090 break; 7651772Sjl139090 case MP_BANK_1: 7661772Sjl139090 bankno |= pa_bit_value << 1; 7671772Sjl139090 break; 7681772Sjl139090 case MP_BANK_2: 7691772Sjl139090 bankno |= pa_bit_value << 2; 7701772Sjl139090 break; 7711772Sjl139090 } 7721772Sjl139090 } 7731772Sjl139090 7741772Sjl139090 return (bankno); 7751772Sjl139090 } 7761772Sjl139090 7771772Sjl139090 /* 7781772Sjl139090 * PA to MAC address translation 7791772Sjl139090 * 7801772Sjl139090 * Input: MAC driver state, physicall adress 7811772Sjl139090 * Output: LSB#, Bank id, mac address 7821772Sjl139090 * 7831772Sjl139090 * Valid - return value: 0 7841772Sjl139090 * Invalid - return value: -1 7851772Sjl139090 */ 7861772Sjl139090 7871772Sjl139090 int 7881772Sjl139090 pa_to_maddr(mc_opl_t *mcp, uint64_t pa, mc_addr_t *maddr) 7891772Sjl139090 { 7901772Sjl139090 uint64_t pa_offset; 7911772Sjl139090 7922662Shyw if (!mc_rangecheck_pa(mcp, pa)) 7931772Sjl139090 return (-1); 7941772Sjl139090 7951772Sjl139090 /* Do translation */ 7961772Sjl139090 pa_offset = pa - mcp->mc_start_address; 7971772Sjl139090 7981772Sjl139090 maddr->ma_bd = mcp->mc_board_num; 7993045Sav145390 maddr->ma_phys_bd = mcp->mc_phys_board_num; 8001772Sjl139090 maddr->ma_bank = pa_to_bank(mcp, pa_offset); 8011772Sjl139090 maddr->ma_dimm_addr = pa_to_dimm(mcp, pa_offset); 8025080Swh31274 MC_LOG("pa %lx -> mcaddr /LSB%d/B%d/%x\n", pa_offset, maddr->ma_bd, 8035080Swh31274 maddr->ma_bank, maddr->ma_dimm_addr); 8041772Sjl139090 return (0); 8051772Sjl139090 } 8061772Sjl139090 8072214Sav145390 /* 8082214Sav145390 * UNUM format for DC is "/CMUnn/MEMxyZ", where 8092214Sav145390 * nn = 00..03 for DC1 and 00..07 for DC2 and 00..15 for DC3. 8102214Sav145390 * x = MAC 0..3 8112214Sav145390 * y = 0..3 (slot info). 8122214Sav145390 * Z = 'A' or 'B' 8132214Sav145390 * 8142214Sav145390 * UNUM format for FF1 is "/MBU_A/MEMBx/MEMyZ", where 8152214Sav145390 * x = 0..3 (MEMB number) 8162214Sav145390 * y = 0..3 (slot info). 8172214Sav145390 * Z = 'A' or 'B' 8182214Sav145390 * 8192214Sav145390 * UNUM format for FF2 is "/MBU_B/MEMBx/MEMyZ" 8202214Sav145390 * x = 0..7 (MEMB number) 8212214Sav145390 * y = 0..3 (slot info). 8222214Sav145390 * Z = 'A' or 'B' 8232214Sav145390 */ 8242214Sav145390 int 8253045Sav145390 mc_set_mem_unum(char *buf, int buflen, int sb, int bank, 8262214Sav145390 uint32_t mf_type, uint32_t d_slot) 8272214Sav145390 { 8282214Sav145390 char *dimmnm; 8292214Sav145390 char memb_num; 8303045Sav145390 int cs; 8312214Sav145390 int i; 8323045Sav145390 int j; 8333045Sav145390 8343045Sav145390 cs = SLOT_TO_CS(d_slot); 8352214Sav145390 8362214Sav145390 if (plat_model == MODEL_DC) { 8375275Stsien if (mf_type == FLT_TYPE_INTERMITTENT_CE || 8385275Stsien mf_type == FLT_TYPE_PERMANENT_CE) { 8392214Sav145390 i = BD_BK_SLOT_TO_INDEX(0, bank, d_slot); 8402214Sav145390 dimmnm = mc_dc_dimm_unum_table[i]; 8412214Sav145390 snprintf(buf, buflen, "/%s%02d/MEM%s", 8422214Sav145390 model_names[plat_model].unit_name, sb, dimmnm); 8432214Sav145390 } else { 8442214Sav145390 i = BD_BK_SLOT_TO_INDEX(0, bank, 0); 8453045Sav145390 j = (cs == 0) ? i : i + 2; 8463045Sav145390 snprintf(buf, buflen, "/%s%02d/MEM%s MEM%s", 8472214Sav145390 model_names[plat_model].unit_name, sb, 8483045Sav145390 mc_dc_dimm_unum_table[j], 8493045Sav145390 mc_dc_dimm_unum_table[j + 1]); 8502214Sav145390 } 8512214Sav145390 } else { 8525275Stsien if (mf_type == FLT_TYPE_INTERMITTENT_CE || 8535275Stsien mf_type == FLT_TYPE_PERMANENT_CE) { 8543045Sav145390 i = BD_BK_SLOT_TO_INDEX(sb, bank, d_slot); 8552214Sav145390 dimmnm = mc_ff_dimm_unum_table[i]; 8562214Sav145390 memb_num = dimmnm[0]; 8572214Sav145390 snprintf(buf, buflen, "/%s/%s%c/MEM%s", 8582214Sav145390 model_names[plat_model].unit_name, 8592214Sav145390 model_names[plat_model].mem_name, 8602214Sav145390 memb_num, &dimmnm[1]); 8612214Sav145390 } else { 8622214Sav145390 i = BD_BK_SLOT_TO_INDEX(sb, bank, 0); 8633045Sav145390 j = (cs == 0) ? i : i + 2; 8642214Sav145390 memb_num = mc_ff_dimm_unum_table[i][0], 8655080Swh31274 snprintf(buf, buflen, "/%s/%s%c/MEM%s MEM%s", 8662214Sav145390 model_names[plat_model].unit_name, 8672214Sav145390 model_names[plat_model].mem_name, memb_num, 8683045Sav145390 &mc_ff_dimm_unum_table[j][1], 8693045Sav145390 &mc_ff_dimm_unum_table[j + 1][1]); 8702214Sav145390 } 8712214Sav145390 } 8722214Sav145390 return (0); 8732214Sav145390 } 8742214Sav145390 8751772Sjl139090 static void 8761772Sjl139090 mc_ereport_post(mc_aflt_t *mc_aflt) 8771772Sjl139090 { 8781772Sjl139090 char buf[FM_MAX_CLASS]; 8791772Sjl139090 char device_path[MAXPATHLEN]; 8802214Sav145390 char sid[MAXPATHLEN]; 8811772Sjl139090 nv_alloc_t *nva = NULL; 8821772Sjl139090 nvlist_t *ereport, *detector, *resource; 8831772Sjl139090 errorq_elem_t *eqep; 8841772Sjl139090 int nflts; 8851772Sjl139090 mc_flt_stat_t *flt_stat; 8862214Sav145390 int i, n; 8872214Sav145390 int blen = MAXPATHLEN; 8882214Sav145390 char *p, *s = NULL; 8891772Sjl139090 uint32_t values[2], synd[2], dslot[2]; 8902214Sav145390 uint64_t offset = (uint64_t)-1; 8912214Sav145390 int ret = -1; 8921772Sjl139090 8931772Sjl139090 if (panicstr) { 8941772Sjl139090 eqep = errorq_reserve(ereport_errorq); 8951772Sjl139090 if (eqep == NULL) 8961772Sjl139090 return; 8971772Sjl139090 ereport = errorq_elem_nvl(ereport_errorq, eqep); 8981772Sjl139090 nva = errorq_elem_nva(ereport_errorq, eqep); 8991772Sjl139090 } else { 9001772Sjl139090 ereport = fm_nvlist_create(nva); 9011772Sjl139090 } 9021772Sjl139090 9031772Sjl139090 /* 9041772Sjl139090 * Create the scheme "dev" FMRI. 9051772Sjl139090 */ 9061772Sjl139090 detector = fm_nvlist_create(nva); 9071772Sjl139090 resource = fm_nvlist_create(nva); 9081772Sjl139090 9091772Sjl139090 nflts = mc_aflt->mflt_nflts; 9101772Sjl139090 9111772Sjl139090 ASSERT(nflts >= 1 && nflts <= 2); 9121772Sjl139090 9131772Sjl139090 flt_stat = mc_aflt->mflt_stat[0]; 9141772Sjl139090 (void) ddi_pathname(mc_aflt->mflt_mcp->mc_dip, device_path); 9151772Sjl139090 (void) fm_fmri_dev_set(detector, FM_DEV_SCHEME_VERSION, NULL, 9161772Sjl139090 device_path, NULL); 9171772Sjl139090 9181772Sjl139090 /* 9191772Sjl139090 * Encode all the common data into the ereport. 9201772Sjl139090 */ 9215080Swh31274 (void) snprintf(buf, FM_MAX_CLASS, "%s.%s-%s", MC_OPL_ERROR_CLASS, 9225080Swh31274 mc_aflt->mflt_is_ptrl ? MC_OPL_PTRL_SUBCLASS : MC_OPL_MI_SUBCLASS, 9235080Swh31274 mc_aflt->mflt_erpt_class); 9241772Sjl139090 9251772Sjl139090 MC_LOG("mc_ereport_post: ereport %s\n", buf); 9261772Sjl139090 9271772Sjl139090 9281772Sjl139090 fm_ereport_set(ereport, FM_EREPORT_VERSION, buf, 9295080Swh31274 fm_ena_generate(mc_aflt->mflt_id, FM_ENA_FMT1), detector, NULL); 9301772Sjl139090 9311772Sjl139090 /* 9321772Sjl139090 * Set payload. 9331772Sjl139090 */ 9341772Sjl139090 fm_payload_set(ereport, MC_OPL_BOARD, DATA_TYPE_UINT32, 9355080Swh31274 flt_stat->mf_flt_maddr.ma_bd, NULL); 9361772Sjl139090 9371772Sjl139090 fm_payload_set(ereport, MC_OPL_PA, DATA_TYPE_UINT64, 9385080Swh31274 flt_stat->mf_flt_paddr, NULL); 9391772Sjl139090 9405275Stsien if (flt_stat->mf_type == FLT_TYPE_INTERMITTENT_CE || 9415275Stsien flt_stat->mf_type == FLT_TYPE_PERMANENT_CE) { 9425080Swh31274 fm_payload_set(ereport, MC_OPL_FLT_TYPE, DATA_TYPE_UINT8, 9435080Swh31274 ECC_STICKY, NULL); 9441772Sjl139090 } 9451772Sjl139090 9461772Sjl139090 for (i = 0; i < nflts; i++) 9471772Sjl139090 values[i] = mc_aflt->mflt_stat[i]->mf_flt_maddr.ma_bank; 9481772Sjl139090 9495080Swh31274 fm_payload_set(ereport, MC_OPL_BANK, DATA_TYPE_UINT32_ARRAY, nflts, 9505080Swh31274 values, NULL); 9511772Sjl139090 9521772Sjl139090 for (i = 0; i < nflts; i++) 9531772Sjl139090 values[i] = mc_aflt->mflt_stat[i]->mf_cntl; 9541772Sjl139090 9555080Swh31274 fm_payload_set(ereport, MC_OPL_STATUS, DATA_TYPE_UINT32_ARRAY, nflts, 9565080Swh31274 values, NULL); 9571772Sjl139090 9581772Sjl139090 for (i = 0; i < nflts; i++) 9591772Sjl139090 values[i] = mc_aflt->mflt_stat[i]->mf_err_add; 9601772Sjl139090 9615275Stsien /* offset is set only for PCE and ICE */ 9625275Stsien if (mc_aflt->mflt_stat[0]->mf_type == FLT_TYPE_INTERMITTENT_CE || 9635275Stsien mc_aflt->mflt_stat[0]->mf_type == FLT_TYPE_PERMANENT_CE) { 9642214Sav145390 offset = values[0]; 9652214Sav145390 9662214Sav145390 } 9675080Swh31274 fm_payload_set(ereport, MC_OPL_ERR_ADD, DATA_TYPE_UINT32_ARRAY, nflts, 9685080Swh31274 values, NULL); 9691772Sjl139090 9701772Sjl139090 for (i = 0; i < nflts; i++) 9711772Sjl139090 values[i] = mc_aflt->mflt_stat[i]->mf_err_log; 9721772Sjl139090 9735080Swh31274 fm_payload_set(ereport, MC_OPL_ERR_LOG, DATA_TYPE_UINT32_ARRAY, nflts, 9745080Swh31274 values, NULL); 9751772Sjl139090 9761772Sjl139090 for (i = 0; i < nflts; i++) { 9771772Sjl139090 flt_stat = mc_aflt->mflt_stat[i]; 9781772Sjl139090 if (flt_stat->mf_errlog_valid) { 9791772Sjl139090 synd[i] = flt_stat->mf_synd; 9801772Sjl139090 dslot[i] = flt_stat->mf_dimm_slot; 9811772Sjl139090 values[i] = flt_stat->mf_dram_place; 9821772Sjl139090 } else { 9831772Sjl139090 synd[i] = 0; 9841772Sjl139090 dslot[i] = 0; 9851772Sjl139090 values[i] = 0; 9861772Sjl139090 } 9871772Sjl139090 } 9881772Sjl139090 9895080Swh31274 fm_payload_set(ereport, MC_OPL_ERR_SYND, DATA_TYPE_UINT32_ARRAY, nflts, 9905080Swh31274 synd, NULL); 9915080Swh31274 9925080Swh31274 fm_payload_set(ereport, MC_OPL_ERR_DIMMSLOT, DATA_TYPE_UINT32_ARRAY, 9935080Swh31274 nflts, dslot, NULL); 9945080Swh31274 9955080Swh31274 fm_payload_set(ereport, MC_OPL_ERR_DRAM, DATA_TYPE_UINT32_ARRAY, nflts, 9965080Swh31274 values, NULL); 9971772Sjl139090 9981772Sjl139090 device_path[0] = 0; 9991772Sjl139090 p = &device_path[0]; 10002214Sav145390 sid[0] = 0; 10012214Sav145390 s = &sid[0]; 10022214Sav145390 ret = 0; 10031772Sjl139090 10041772Sjl139090 for (i = 0; i < nflts; i++) { 10052214Sav145390 int bank; 10061772Sjl139090 10071772Sjl139090 flt_stat = mc_aflt->mflt_stat[i]; 10082214Sav145390 bank = flt_stat->mf_flt_maddr.ma_bank; 10095080Swh31274 ret = mc_set_mem_unum(p + strlen(p), blen, 10105080Swh31274 flt_stat->mf_flt_maddr.ma_phys_bd, bank, flt_stat->mf_type, 10115080Swh31274 flt_stat->mf_dimm_slot); 10122214Sav145390 10132214Sav145390 if (ret != 0) { 10142214Sav145390 cmn_err(CE_WARN, 10152214Sav145390 "mc_ereport_post: Failed to determine the unum " 10162214Sav145390 "for board=%d bank=%d type=0x%x slot=0x%x", 10172214Sav145390 flt_stat->mf_flt_maddr.ma_bd, bank, 10182214Sav145390 flt_stat->mf_type, flt_stat->mf_dimm_slot); 10192214Sav145390 continue; 10201772Sjl139090 } 10212214Sav145390 n = strlen(device_path); 10221772Sjl139090 blen = MAXPATHLEN - n; 10231772Sjl139090 p = &device_path[n]; 10241772Sjl139090 if (i < (nflts - 1)) { 10251772Sjl139090 snprintf(p, blen, " "); 10262214Sav145390 blen--; 10272214Sav145390 p++; 10282214Sav145390 } 10292214Sav145390 10302214Sav145390 if (ret == 0) { 10312214Sav145390 ret = mc_set_mem_sid(mc_aflt->mflt_mcp, s + strlen(s), 10323045Sav145390 blen, flt_stat->mf_flt_maddr.ma_phys_bd, bank, 10332214Sav145390 flt_stat->mf_type, flt_stat->mf_dimm_slot); 10342214Sav145390 10351772Sjl139090 } 10361772Sjl139090 } 10371772Sjl139090 10385080Swh31274 (void) fm_fmri_mem_set(resource, FM_MEM_SCHEME_VERSION, NULL, 10395080Swh31274 device_path, (ret == 0) ? sid : NULL, (ret == 0) ? offset : 10405080Swh31274 (uint64_t)-1); 10415080Swh31274 10425080Swh31274 fm_payload_set(ereport, MC_OPL_RESOURCE, DATA_TYPE_NVLIST, resource, 10435080Swh31274 NULL); 10441772Sjl139090 10451772Sjl139090 if (panicstr) { 10461772Sjl139090 errorq_commit(ereport_errorq, eqep, ERRORQ_SYNC); 10471772Sjl139090 } else { 10481772Sjl139090 (void) fm_ereport_post(ereport, EVCH_TRYHARD); 10491772Sjl139090 fm_nvlist_destroy(ereport, FM_NVA_FREE); 10501772Sjl139090 fm_nvlist_destroy(detector, FM_NVA_FREE); 10511772Sjl139090 fm_nvlist_destroy(resource, FM_NVA_FREE); 10521772Sjl139090 } 10531772Sjl139090 } 10541772Sjl139090 10552214Sav145390 10561772Sjl139090 static void 10571772Sjl139090 mc_err_drain(mc_aflt_t *mc_aflt) 10581772Sjl139090 { 10591772Sjl139090 int rv; 10601772Sjl139090 uint64_t pa = (uint64_t)(-1); 10612214Sav145390 int i; 10621772Sjl139090 10635080Swh31274 MC_LOG("mc_err_drain: %s\n", mc_aflt->mflt_erpt_class); 10641772Sjl139090 /* 10651772Sjl139090 * we come here only when we have: 10663152Sav145390 * In mirror mode: MUE, SUE 10675275Stsien * In normal mode: UE, Permanent CE, Intermittent CE 10681772Sjl139090 */ 10692214Sav145390 for (i = 0; i < mc_aflt->mflt_nflts; i++) { 10702214Sav145390 rv = mcaddr_to_pa(mc_aflt->mflt_mcp, 10715080Swh31274 &(mc_aflt->mflt_stat[i]->mf_flt_maddr), &pa); 10722662Shyw 10732662Shyw /* Ensure the pa is valid (not in isolated memory block) */ 10742662Shyw if (rv == 0 && pa_is_valid(mc_aflt->mflt_mcp, pa)) 10752214Sav145390 mc_aflt->mflt_stat[i]->mf_flt_paddr = pa; 10762214Sav145390 else 10772214Sav145390 mc_aflt->mflt_stat[i]->mf_flt_paddr = (uint64_t)-1; 10782214Sav145390 } 10792214Sav145390 10802662Shyw MC_LOG("mc_err_drain:pa = %lx\n", pa); 10812662Shyw 10822662Shyw switch (page_retire_check(pa, NULL)) { 10832662Shyw case 0: 10842662Shyw case EAGAIN: 10852662Shyw MC_LOG("Page retired or pending\n"); 10862662Shyw return; 10872662Shyw case EIO: 10882662Shyw /* 10895275Stsien * Do page retirement except for the PCE and ICE cases. 10902662Shyw * This is taken care by the OPL DE 10912662Shyw */ 10925275Stsien if (mc_aflt->mflt_stat[0]->mf_type != 10935275Stsien FLT_TYPE_INTERMITTENT_CE && 10945275Stsien mc_aflt->mflt_stat[0]->mf_type != FLT_TYPE_PERMANENT_CE) { 10952662Shyw MC_LOG("offline page at pa %lx error %x\n", pa, 10965080Swh31274 mc_aflt->mflt_pr); 10972662Shyw (void) page_retire(pa, mc_aflt->mflt_pr); 10981772Sjl139090 } 10992662Shyw break; 11002662Shyw case EINVAL: 11012662Shyw default: 11022662Shyw /* 11032662Shyw * Some memory do not have page structure so 11042662Shyw * we keep going in case of EINVAL. 11052662Shyw */ 11062662Shyw break; 11071772Sjl139090 } 11082214Sav145390 11092214Sav145390 for (i = 0; i < mc_aflt->mflt_nflts; i++) { 11102214Sav145390 mc_aflt_t mc_aflt0; 11112214Sav145390 if (mc_aflt->mflt_stat[i]->mf_flt_paddr != (uint64_t)-1) { 11122214Sav145390 mc_aflt0 = *mc_aflt; 11132214Sav145390 mc_aflt0.mflt_nflts = 1; 11142214Sav145390 mc_aflt0.mflt_stat[0] = mc_aflt->mflt_stat[i]; 11152214Sav145390 mc_ereport_post(&mc_aflt0); 11162214Sav145390 } 11172214Sav145390 } 11181772Sjl139090 } 11191772Sjl139090 11201772Sjl139090 /* 11211772Sjl139090 * The restart address is actually defined in unit of PA[37:6] 11221772Sjl139090 * the mac patrol will convert that to dimm offset. If the 11231772Sjl139090 * address is not in the bank, it will continue to search for 11241772Sjl139090 * the next PA that is within the bank. 11251772Sjl139090 * 11261772Sjl139090 * Also the mac patrol scans the dimms based on PA, not 11271772Sjl139090 * dimm offset. 11281772Sjl139090 */ 11291772Sjl139090 static int 11302662Shyw restart_patrol(mc_opl_t *mcp, int bank, mc_rsaddr_info_t *rsaddr_info) 11311772Sjl139090 { 11321772Sjl139090 uint64_t pa; 11331772Sjl139090 int rv; 11342662Shyw 11355310Sdhain if (MC_REWRITE_MODE(mcp, bank)) { 11365310Sdhain return (0); 11375310Sdhain } 11382662Shyw if (rsaddr_info == NULL || (rsaddr_info->mi_valid == 0)) { 11391772Sjl139090 MAC_PTRL_START(mcp, bank); 11401772Sjl139090 return (0); 11411772Sjl139090 } 11421772Sjl139090 11432662Shyw rv = mcaddr_to_pa(mcp, &rsaddr_info->mi_restartaddr, &pa); 11441772Sjl139090 if (rv != 0) { 11451772Sjl139090 MC_LOG("cannot convert mcaddr to pa. use auto restart\n"); 11461772Sjl139090 MAC_PTRL_START(mcp, bank); 11471772Sjl139090 return (0); 11481772Sjl139090 } 11491772Sjl139090 11502662Shyw if (!mc_rangecheck_pa(mcp, pa)) { 11511772Sjl139090 /* pa is not on this board, just retry */ 11521772Sjl139090 cmn_err(CE_WARN, "restart_patrol: invalid address %lx " 11535080Swh31274 "on board %d\n", pa, mcp->mc_board_num); 11541772Sjl139090 MAC_PTRL_START(mcp, bank); 11551772Sjl139090 return (0); 11561772Sjl139090 } 11571772Sjl139090 11581772Sjl139090 MC_LOG("restart_patrol: pa = %lx\n", pa); 11592662Shyw 11602662Shyw if (!rsaddr_info->mi_injectrestart) { 11612662Shyw /* 11623152Sav145390 * For non-error injection restart we need to 11632662Shyw * determine if the current restart pa/page is 11642662Shyw * a "good" page. A "good" page is a page that 11652662Shyw * has not been page retired. If the current 11662662Shyw * page that contains the pa is "good", we will 11672662Shyw * do a HW auto restart and let HW patrol continue 11682662Shyw * where it last stopped. Most desired scenario. 11692662Shyw * 11702662Shyw * If the current page is not "good", we will advance 11712662Shyw * to the next page to find the next "good" page and 11722662Shyw * restart the patrol from there. 11732662Shyw */ 11742662Shyw int wrapcount = 0; 11752662Shyw uint64_t origpa = pa; 11762662Shyw while (wrapcount < 2) { 11775080Swh31274 if (!pa_is_valid(mcp, pa)) { 11785310Sdhain /* 11795310Sdhain * Not in physinstall - advance to the 11805310Sdhain * next memory isolation blocksize 11815310Sdhain */ 11825310Sdhain MC_LOG("Invalid PA\n"); 11835310Sdhain pa = roundup(pa + 1, mc_isolation_bsize); 11845080Swh31274 } else { 11855310Sdhain int rv; 11865310Sdhain if ((rv = page_retire_check(pa, NULL)) != 0 && 11875310Sdhain rv != EAGAIN) { 11885080Swh31274 /* 11895080Swh31274 * The page is "good" (not retired), 11905080Swh31274 * we will use automatic HW restart 11915080Swh31274 * algorithm if this is the original 11925080Swh31274 * current starting page. 11935080Swh31274 */ 11945310Sdhain if (pa == origpa) { 11955310Sdhain MC_LOG("Page has no error. " 11965310Sdhain "Auto restart\n"); 11975310Sdhain MAC_PTRL_START(mcp, bank); 11985310Sdhain return (0); 11995310Sdhain } else { 12005310Sdhain /* 12015310Sdhain * found a subsequent good page 12025310Sdhain */ 12035310Sdhain break; 12042662Shyw } 12051772Sjl139090 } 12062662Shyw 12075310Sdhain /* 12085310Sdhain * Skip to the next page 12095310Sdhain */ 12105310Sdhain pa = roundup(pa + 1, PAGESIZE); 12115310Sdhain MC_LOG("Skipping bad page to %lx\n", pa); 12125310Sdhain } 12135310Sdhain 12145310Sdhain /* Check to see if we hit the end of the memory range */ 12155080Swh31274 if (pa >= (mcp->mc_start_address + mcp->mc_size)) { 12165310Sdhain MC_LOG("Wrap around\n"); 12175310Sdhain pa = mcp->mc_start_address; 12185310Sdhain wrapcount++; 12195080Swh31274 } 12202662Shyw } 12212662Shyw 12222662Shyw if (wrapcount > 1) { 12235080Swh31274 MC_LOG("Failed to find a good page. Just restart\n"); 12245080Swh31274 MAC_PTRL_START(mcp, bank); 12255080Swh31274 return (0); 12261772Sjl139090 } 12271772Sjl139090 } 12281772Sjl139090 12291772Sjl139090 /* 12302662Shyw * We reached here either: 12312662Shyw * 1. We are doing an error injection restart that specify 12322662Shyw * the exact pa/page to restart. OR 12332662Shyw * 2. We found a subsequent good page different from the 12342662Shyw * original restart pa/page. 12352662Shyw * Restart MAC patrol: PA[37:6] 12361772Sjl139090 */ 12371772Sjl139090 MC_LOG("restart at pa = %lx\n", pa); 12381772Sjl139090 ST_MAC_REG(MAC_RESTART_ADD(mcp, bank), MAC_RESTART_PA(pa)); 12391772Sjl139090 MAC_PTRL_START_ADD(mcp, bank); 12401772Sjl139090 12411772Sjl139090 return (0); 12421772Sjl139090 } 12431772Sjl139090 12445310Sdhain static void 12455310Sdhain mc_retry_info_put(mc_retry_info_t **q, mc_retry_info_t *p) 12465310Sdhain { 12475310Sdhain ASSERT(p != NULL); 12485310Sdhain p->ri_next = *q; 12495310Sdhain *q = p; 12505310Sdhain } 12515310Sdhain 12525310Sdhain static mc_retry_info_t * 12535310Sdhain mc_retry_info_get(mc_retry_info_t **q) 12545310Sdhain { 12555310Sdhain mc_retry_info_t *p; 12565310Sdhain 12575310Sdhain if ((p = *q) != NULL) { 12585310Sdhain *q = p->ri_next; 12595310Sdhain return (p); 12605310Sdhain } else { 12615310Sdhain return (NULL); 12625310Sdhain } 12635310Sdhain } 12645310Sdhain 12651772Sjl139090 /* 12661772Sjl139090 * Rewriting is used for two purposes. 12671772Sjl139090 * - to correct the error in memory. 12681772Sjl139090 * - to determine whether the error is permanent or intermittent. 12691772Sjl139090 * It's done by writing the address in MAC_BANKm_REWRITE_ADD 12701772Sjl139090 * and issuing REW_REQ command in MAC_BANKm_PTRL_CNRL. After that, 12711772Sjl139090 * REW_END (and REW_CE/REW_UE if some error detected) is set when 12721772Sjl139090 * rewrite operation is done. See 4.7.3 and 4.7.11 in Columbus2 PRM. 12731772Sjl139090 * 12741772Sjl139090 * Note that rewrite operation doesn't change RAW_UE to Marked UE. 12751772Sjl139090 * Therefore, we use it only CE case. 12761772Sjl139090 */ 12775310Sdhain 12781772Sjl139090 static uint32_t 12795310Sdhain do_rewrite(mc_opl_t *mcp, int bank, uint32_t dimm_addr, int retrying) 12801772Sjl139090 { 12811772Sjl139090 uint32_t cntl; 12821772Sjl139090 int count = 0; 12835310Sdhain int max_count; 12845310Sdhain int retry_state; 12855310Sdhain 12865310Sdhain if (retrying) 12875310Sdhain max_count = 1; 12885310Sdhain else 12895310Sdhain max_count = mc_max_rewrite_loop; 12905310Sdhain 12915310Sdhain retry_state = RETRY_STATE_PENDING; 12925310Sdhain 12935310Sdhain if (!retrying && MC_REWRITE_MODE(mcp, bank)) { 12945310Sdhain goto timeout; 12955310Sdhain } 12965310Sdhain 12975310Sdhain retry_state = RETRY_STATE_ACTIVE; 12981772Sjl139090 12991772Sjl139090 /* first wait to make sure PTRL_STATUS is 0 */ 13005310Sdhain while (count++ < max_count) { 13011772Sjl139090 cntl = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)); 13025310Sdhain if (!(cntl & MAC_CNTL_PTRL_STATUS)) { 13035310Sdhain count = 0; 13041772Sjl139090 break; 13055310Sdhain } 13062214Sav145390 drv_usecwait(mc_rewrite_delay); 13071772Sjl139090 } 13085310Sdhain if (count >= max_count) 13095310Sdhain goto timeout; 13101772Sjl139090 13111772Sjl139090 count = 0; 13121772Sjl139090 13131772Sjl139090 ST_MAC_REG(MAC_REWRITE_ADD(mcp, bank), dimm_addr); 13141772Sjl139090 MAC_REW_REQ(mcp, bank); 13151772Sjl139090 13165310Sdhain retry_state = RETRY_STATE_REWRITE; 13175310Sdhain 13181772Sjl139090 do { 13195310Sdhain if (count++ > max_count) { 13205310Sdhain goto timeout; 13212214Sav145390 } else { 13222214Sav145390 drv_usecwait(mc_rewrite_delay); 13232214Sav145390 } 13245310Sdhain cntl = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)); 13251772Sjl139090 /* 13261772Sjl139090 * If there are other MEMORY or PCI activities, this 13271772Sjl139090 * will be BUSY, else it should be set immediately 13281772Sjl139090 */ 13291772Sjl139090 } while (!(cntl & MAC_CNTL_REW_END)); 13301772Sjl139090 13311772Sjl139090 MAC_CLEAR_ERRS(mcp, bank, MAC_CNTL_REW_ERRS); 13321772Sjl139090 return (cntl); 13335310Sdhain timeout: 13345310Sdhain mc_set_rewrite(mcp, bank, dimm_addr, retry_state); 13355310Sdhain 13365310Sdhain return (0); 13371772Sjl139090 } 13385310Sdhain 13395310Sdhain void 13405310Sdhain mc_clear_rewrite(mc_opl_t *mcp, int bank) 13415310Sdhain { 13425310Sdhain struct mc_bank *bankp; 13435310Sdhain mc_retry_info_t *retry; 13445310Sdhain uint32_t rew_addr; 13455310Sdhain 13465310Sdhain bankp = &(mcp->mc_bank[bank]); 13475310Sdhain retry = bankp->mcb_active; 13485310Sdhain bankp->mcb_active = NULL; 13495310Sdhain mc_retry_info_put(&bankp->mcb_retry_freelist, retry); 13505310Sdhain 13515310Sdhain again: 13525310Sdhain bankp->mcb_rewrite_count = 0; 13535310Sdhain 13545310Sdhain while (retry = mc_retry_info_get(&bankp->mcb_retry_pending)) { 13555310Sdhain rew_addr = retry->ri_addr; 13565310Sdhain mc_retry_info_put(&bankp->mcb_retry_freelist, retry); 13575310Sdhain if (do_rewrite(mcp, bank, rew_addr, 1) == 0) 13585310Sdhain break; 13595310Sdhain } 13605310Sdhain 13615310Sdhain /* we break out if no more pending rewrite or we got timeout again */ 13625310Sdhain 13635310Sdhain if (!bankp->mcb_active && !bankp->mcb_retry_pending) { 13645310Sdhain if (!IS_MIRROR(mcp, bank)) { 13655310Sdhain MC_CLEAR_REWRITE_MODE(mcp, bank); 13665310Sdhain } else { 13675310Sdhain int mbank = bank ^ 1; 13685310Sdhain bankp = &(mcp->mc_bank[mbank]); 13695310Sdhain if (!bankp->mcb_active && !bankp->mcb_retry_pending) { 13705310Sdhain MC_CLEAR_REWRITE_MODE(mcp, bank); 13715310Sdhain MC_CLEAR_REWRITE_MODE(mcp, mbank); 13725310Sdhain } else { 13735310Sdhain bank = mbank; 13745310Sdhain goto again; 13755310Sdhain } 13765310Sdhain } 13775310Sdhain } 13785310Sdhain } 13795310Sdhain 13805310Sdhain void 13815310Sdhain mc_set_rewrite(mc_opl_t *mcp, int bank, uint32_t addr, int state) 13825310Sdhain { 13835310Sdhain mc_retry_info_t *retry; 13845310Sdhain struct mc_bank *bankp; 13855310Sdhain 13865310Sdhain bankp = &mcp->mc_bank[bank]; 13875310Sdhain 13885310Sdhain retry = mc_retry_info_get(&bankp->mcb_retry_freelist); 13895310Sdhain 13905310Sdhain ASSERT(retry != NULL); 13915310Sdhain 13925310Sdhain retry->ri_addr = addr; 13935310Sdhain retry->ri_state = state; 13945310Sdhain 13955310Sdhain MC_SET_REWRITE_MODE(mcp, bank); 13965310Sdhain 13975310Sdhain if ((state > RETRY_STATE_PENDING)) { 13985310Sdhain ASSERT(bankp->mcb_active == NULL); 13995310Sdhain bankp->mcb_active = retry; 14005310Sdhain } else { 14015310Sdhain mc_retry_info_put(&bankp->mcb_retry_pending, retry); 14025310Sdhain } 14035310Sdhain 14045310Sdhain if (IS_MIRROR(mcp, bank)) { 14055310Sdhain int mbank = bank ^1; 14065310Sdhain MC_SET_REWRITE_MODE(mcp, mbank); 14075310Sdhain } 14085310Sdhain } 14095310Sdhain 14101772Sjl139090 void 14111772Sjl139090 mc_process_scf_log(mc_opl_t *mcp) 14121772Sjl139090 { 14132214Sav145390 int count; 14142214Sav145390 int n = 0; 14151772Sjl139090 scf_log_t *p; 14161772Sjl139090 int bank; 14171772Sjl139090 14182214Sav145390 for (bank = 0; bank < BANKNUM_PER_SB; bank++) { 14195080Swh31274 while ((p = mcp->mc_scf_log[bank]) != NULL && 14205080Swh31274 (n < mc_max_errlog_processed)) { 14215310Sdhain ASSERT(bank == p->sl_bank); 14225310Sdhain count = 0; 14235310Sdhain while ((LD_MAC_REG(MAC_STATIC_ERR_ADD(mcp, p->sl_bank)) 14245310Sdhain & MAC_STATIC_ERR_VLD)) { 14255310Sdhain if (count++ >= (mc_max_scf_loop)) { 14265310Sdhain break; 14271772Sjl139090 } 14285310Sdhain drv_usecwait(mc_scf_delay); 14295310Sdhain } 14305310Sdhain 14315310Sdhain if (count < mc_max_scf_loop) { 14325310Sdhain ST_MAC_REG(MAC_STATIC_ERR_LOG(mcp, p->sl_bank), 14335310Sdhain p->sl_err_log); 14345310Sdhain 14355310Sdhain ST_MAC_REG(MAC_STATIC_ERR_ADD(mcp, p->sl_bank), 14365310Sdhain p->sl_err_add|MAC_STATIC_ERR_VLD); 14375310Sdhain mcp->mc_scf_retry[bank] = 0; 14385310Sdhain } else { 14395310Sdhain /* 14405310Sdhain * if we try too many times, just drop the req 14415310Sdhain */ 14425310Sdhain if (mcp->mc_scf_retry[bank]++ <= 14435310Sdhain mc_max_scf_retry) { 14445310Sdhain return; 14455080Swh31274 } else { 14465310Sdhain if ((++mc_pce_dropped & 0xff) == 0) { 14475310Sdhain cmn_err(CE_WARN, "Cannot " 14485310Sdhain "report Permanent CE to " 14495310Sdhain "SCF\n"); 14505080Swh31274 } 14515080Swh31274 } 14525310Sdhain } 14535310Sdhain n++; 14545310Sdhain mcp->mc_scf_log[bank] = p->sl_next; 14555310Sdhain mcp->mc_scf_total[bank]--; 14565310Sdhain ASSERT(mcp->mc_scf_total[bank] >= 0); 14575310Sdhain kmem_free(p, sizeof (scf_log_t)); 14581772Sjl139090 } 14591772Sjl139090 } 14601772Sjl139090 } 14611772Sjl139090 void 14621772Sjl139090 mc_queue_scf_log(mc_opl_t *mcp, mc_flt_stat_t *flt_stat, int bank) 14631772Sjl139090 { 14641772Sjl139090 scf_log_t *p; 14651772Sjl139090 14662214Sav145390 if (mcp->mc_scf_total[bank] >= mc_max_scf_logs) { 14672214Sav145390 if ((++mc_pce_dropped & 0xff) == 0) { 14685080Swh31274 cmn_err(CE_WARN, "Too many Permanent CE requests.\n"); 14692214Sav145390 } 14701772Sjl139090 return; 14711772Sjl139090 } 14721772Sjl139090 p = kmem_zalloc(sizeof (scf_log_t), KM_SLEEP); 14731772Sjl139090 p->sl_next = 0; 14741772Sjl139090 p->sl_err_add = flt_stat->mf_err_add; 14751772Sjl139090 p->sl_err_log = flt_stat->mf_err_log; 14761772Sjl139090 p->sl_bank = bank; 14771772Sjl139090 14782214Sav145390 if (mcp->mc_scf_log[bank] == NULL) { 14791772Sjl139090 /* 14801772Sjl139090 * we rely on mc_scf_log to detect NULL queue. 14811772Sjl139090 * mc_scf_log_tail is irrelevant is such case. 14821772Sjl139090 */ 14832214Sav145390 mcp->mc_scf_log_tail[bank] = mcp->mc_scf_log[bank] = p; 14841772Sjl139090 } else { 14852214Sav145390 mcp->mc_scf_log_tail[bank]->sl_next = p; 14862214Sav145390 mcp->mc_scf_log_tail[bank] = p; 14871772Sjl139090 } 14882214Sav145390 mcp->mc_scf_total[bank]++; 14891772Sjl139090 } 14901772Sjl139090 /* 14911772Sjl139090 * This routine determines what kind of CE happens, intermittent 14921772Sjl139090 * or permanent as follows. (See 4.7.3 in Columbus2 PRM.) 14931772Sjl139090 * - Do rewrite by issuing REW_REQ command to MAC_PTRL_CNTL register. 14941772Sjl139090 * - If CE is still detected on the same address even after doing 14951772Sjl139090 * rewrite operation twice, it is determined as permanent error. 14961772Sjl139090 * - If error is not detected anymore, it is determined as intermittent 14971772Sjl139090 * error. 14981772Sjl139090 * - If UE is detected due to rewrite operation, it should be treated 14991772Sjl139090 * as UE. 15001772Sjl139090 */ 15011772Sjl139090 15021772Sjl139090 /* ARGSUSED */ 15031772Sjl139090 static void 15041772Sjl139090 mc_scrub_ce(mc_opl_t *mcp, int bank, mc_flt_stat_t *flt_stat, int ptrl_error) 15051772Sjl139090 { 15061772Sjl139090 uint32_t cntl; 15071772Sjl139090 int i; 15081772Sjl139090 15091772Sjl139090 flt_stat->mf_type = FLT_TYPE_PERMANENT_CE; 15101772Sjl139090 /* 15111772Sjl139090 * rewrite request 1st time reads and correct error data 15121772Sjl139090 * and write to DIMM. 2nd rewrite request must be issued 15131772Sjl139090 * after REW_CE/UE/END is 0. When the 2nd request is completed, 15141772Sjl139090 * if REW_CE = 1, then it is permanent CE. 15151772Sjl139090 */ 15161772Sjl139090 for (i = 0; i < 2; i++) { 15175310Sdhain cntl = do_rewrite(mcp, bank, flt_stat->mf_err_add, 0); 15185310Sdhain 15195310Sdhain if (cntl == 0) { 15205310Sdhain /* timeout case */ 15215310Sdhain return; 15225310Sdhain } 15231772Sjl139090 /* 15241772Sjl139090 * If the error becomes UE or CMPE 15251772Sjl139090 * we return to the caller immediately. 15261772Sjl139090 */ 15271772Sjl139090 if (cntl & MAC_CNTL_REW_UE) { 15281772Sjl139090 if (ptrl_error) 15291772Sjl139090 flt_stat->mf_cntl |= MAC_CNTL_PTRL_UE; 15301772Sjl139090 else 15311772Sjl139090 flt_stat->mf_cntl |= MAC_CNTL_MI_UE; 15321772Sjl139090 flt_stat->mf_type = FLT_TYPE_UE; 15331772Sjl139090 return; 15341772Sjl139090 } 15351772Sjl139090 if (cntl & MAC_CNTL_REW_CMPE) { 15361772Sjl139090 if (ptrl_error) 15371772Sjl139090 flt_stat->mf_cntl |= MAC_CNTL_PTRL_CMPE; 15381772Sjl139090 else 15391772Sjl139090 flt_stat->mf_cntl |= MAC_CNTL_MI_CMPE; 15401772Sjl139090 flt_stat->mf_type = FLT_TYPE_CMPE; 15411772Sjl139090 return; 15421772Sjl139090 } 15431772Sjl139090 } 15441772Sjl139090 if (!(cntl & MAC_CNTL_REW_CE)) { 15451772Sjl139090 flt_stat->mf_type = FLT_TYPE_INTERMITTENT_CE; 15461772Sjl139090 } 15471772Sjl139090 15481772Sjl139090 if (flt_stat->mf_type == FLT_TYPE_PERMANENT_CE) { 15491772Sjl139090 /* report PERMANENT_CE to SP via SCF */ 15501772Sjl139090 if (!(flt_stat->mf_err_log & MAC_ERR_LOG_INVALID)) { 15511772Sjl139090 mc_queue_scf_log(mcp, flt_stat, bank); 15521772Sjl139090 } 15531772Sjl139090 } 15541772Sjl139090 } 15551772Sjl139090 15561772Sjl139090 #define IS_CMPE(cntl, f) ((cntl) & ((f) ? MAC_CNTL_PTRL_CMPE :\ 15571772Sjl139090 MAC_CNTL_MI_CMPE)) 15581772Sjl139090 #define IS_UE(cntl, f) ((cntl) & ((f) ? MAC_CNTL_PTRL_UE : MAC_CNTL_MI_UE)) 15591772Sjl139090 #define IS_CE(cntl, f) ((cntl) & ((f) ? MAC_CNTL_PTRL_CE : MAC_CNTL_MI_CE)) 15601772Sjl139090 #define IS_OK(cntl, f) (!((cntl) & ((f) ? MAC_CNTL_PTRL_ERRS : \ 15611772Sjl139090 MAC_CNTL_MI_ERRS))) 15621772Sjl139090 15631772Sjl139090 15641772Sjl139090 static int 15651772Sjl139090 IS_CE_ONLY(uint32_t cntl, int ptrl_error) 15661772Sjl139090 { 15671772Sjl139090 if (ptrl_error) { 15681772Sjl139090 return ((cntl & MAC_CNTL_PTRL_ERRS) == MAC_CNTL_PTRL_CE); 15691772Sjl139090 } else { 15701772Sjl139090 return ((cntl & MAC_CNTL_MI_ERRS) == MAC_CNTL_MI_CE); 15711772Sjl139090 } 15721772Sjl139090 } 15731772Sjl139090 15741772Sjl139090 void 15751772Sjl139090 mc_write_cntl(mc_opl_t *mcp, int bank, uint32_t value) 15761772Sjl139090 { 15772867Shyw int ebank = (IS_MIRROR(mcp, bank)) ? MIRROR_IDX(bank) : bank; 15782867Shyw 15792867Shyw if (mcp->mc_speedup_period[ebank] > 0) 15802214Sav145390 value |= mc_max_speed; 15812214Sav145390 else 15822214Sav145390 value |= mcp->mc_speed; 15831772Sjl139090 ST_MAC_REG(MAC_PTRL_CNTL(mcp, bank), value); 15841772Sjl139090 } 15851772Sjl139090 15861772Sjl139090 static void 15871772Sjl139090 mc_read_ptrl_reg(mc_opl_t *mcp, int bank, mc_flt_stat_t *flt_stat) 15881772Sjl139090 { 15891772Sjl139090 flt_stat->mf_cntl = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)) & 15905080Swh31274 MAC_CNTL_PTRL_ERRS; 15911772Sjl139090 flt_stat->mf_err_add = LD_MAC_REG(MAC_PTRL_ERR_ADD(mcp, bank)); 15921772Sjl139090 flt_stat->mf_err_log = LD_MAC_REG(MAC_PTRL_ERR_LOG(mcp, bank)); 15931772Sjl139090 flt_stat->mf_flt_maddr.ma_bd = mcp->mc_board_num; 15943045Sav145390 flt_stat->mf_flt_maddr.ma_phys_bd = mcp->mc_phys_board_num; 15951772Sjl139090 flt_stat->mf_flt_maddr.ma_bank = bank; 15961772Sjl139090 flt_stat->mf_flt_maddr.ma_dimm_addr = flt_stat->mf_err_add; 15971772Sjl139090 } 15981772Sjl139090 15991772Sjl139090 static void 16001772Sjl139090 mc_read_mi_reg(mc_opl_t *mcp, int bank, mc_flt_stat_t *flt_stat) 16011772Sjl139090 { 16021772Sjl139090 uint32_t status, old_status; 16031772Sjl139090 16045080Swh31274 status = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)) & MAC_CNTL_MI_ERRS; 16051772Sjl139090 old_status = 0; 16061772Sjl139090 16071772Sjl139090 /* we keep reading until the status is stable */ 16081772Sjl139090 while (old_status != status) { 16091772Sjl139090 old_status = status; 16105080Swh31274 flt_stat->mf_err_add = LD_MAC_REG(MAC_MI_ERR_ADD(mcp, bank)); 16115080Swh31274 flt_stat->mf_err_log = LD_MAC_REG(MAC_MI_ERR_LOG(mcp, bank)); 16121772Sjl139090 status = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)) & 16135080Swh31274 MAC_CNTL_MI_ERRS; 16141772Sjl139090 if (status == old_status) { 16151772Sjl139090 break; 16161772Sjl139090 } 16171772Sjl139090 } 16181772Sjl139090 16191772Sjl139090 flt_stat->mf_cntl = status; 16201772Sjl139090 flt_stat->mf_flt_maddr.ma_bd = mcp->mc_board_num; 16213045Sav145390 flt_stat->mf_flt_maddr.ma_phys_bd = mcp->mc_phys_board_num; 16221772Sjl139090 flt_stat->mf_flt_maddr.ma_bank = bank; 16231772Sjl139090 flt_stat->mf_flt_maddr.ma_dimm_addr = flt_stat->mf_err_add; 16241772Sjl139090 } 16251772Sjl139090 16261772Sjl139090 16271772Sjl139090 /* 16281772Sjl139090 * Error philosophy for mirror mode: 16291772Sjl139090 * 16301772Sjl139090 * PTRL (The error address for both banks are same, since ptrl stops if it 16311772Sjl139090 * detects error.) 16323152Sav145390 * - Compare error log CMPE. 16331772Sjl139090 * 16341772Sjl139090 * - UE-UE Report MUE. No rewrite. 16351772Sjl139090 * 16361772Sjl139090 * - UE-* UE-(CE/OK). Rewrite to scrub UE. Report SUE. 16371772Sjl139090 * 16381772Sjl139090 * - CE-* CE-(CE/OK). Scrub to determine if CE is permanent. 16391772Sjl139090 * If CE is permanent, inform SCF. Once for each 16401772Sjl139090 * Dimm. If CE becomes UE or CMPE, go back to above. 16411772Sjl139090 * 16421772Sjl139090 * 16431772Sjl139090 * MI (The error addresses for each bank are the same or different.) 16443152Sav145390 * - Compare error If addresses are the same. Just CMPE, so log CMPE. 16451772Sjl139090 * If addresses are different (this could happen 16463152Sav145390 * as a result of scrubbing. Report each separately. 16471772Sjl139090 * Only report error info on each side. 16481772Sjl139090 * 16491772Sjl139090 * - UE-UE Addresses are the same. Report MUE. 16501772Sjl139090 * Addresses are different. Report SUE on each bank. 16511772Sjl139090 * Rewrite to clear UE. 16521772Sjl139090 * 16531772Sjl139090 * - UE-* UE-(CE/OK) 16541772Sjl139090 * Rewrite to clear UE. Report SUE for the bank. 16551772Sjl139090 * 16561772Sjl139090 * - CE-* CE-(CE/OK). Scrub to determine if CE is permanent. 16571772Sjl139090 * If CE becomes UE or CMPE, go back to above. 16581772Sjl139090 * 16591772Sjl139090 */ 16601772Sjl139090 16611772Sjl139090 static int 16621772Sjl139090 mc_process_error_mir(mc_opl_t *mcp, mc_aflt_t *mc_aflt, mc_flt_stat_t *flt_stat) 16631772Sjl139090 { 16641772Sjl139090 int ptrl_error = mc_aflt->mflt_is_ptrl; 16651772Sjl139090 int i; 16661772Sjl139090 int rv = 0; 16675310Sdhain int bank; 16685310Sdhain int rewrite_timeout = 0; 16691772Sjl139090 16701772Sjl139090 MC_LOG("process mirror errors cntl[0] = %x, cntl[1] = %x\n", 16715080Swh31274 flt_stat[0].mf_cntl, flt_stat[1].mf_cntl); 16721772Sjl139090 16731772Sjl139090 if (ptrl_error) { 16745080Swh31274 if (((flt_stat[0].mf_cntl | flt_stat[1].mf_cntl) & 16755080Swh31274 MAC_CNTL_PTRL_ERRS) == 0) 16761772Sjl139090 return (0); 16771772Sjl139090 } else { 16785080Swh31274 if (((flt_stat[0].mf_cntl | flt_stat[1].mf_cntl) & 16795080Swh31274 MAC_CNTL_MI_ERRS) == 0) 16801772Sjl139090 return (0); 16811772Sjl139090 } 16821772Sjl139090 16831772Sjl139090 /* 16841772Sjl139090 * First we take care of the case of CE 16851772Sjl139090 * because they can become UE or CMPE 16861772Sjl139090 */ 16871772Sjl139090 for (i = 0; i < 2; i++) { 16881772Sjl139090 if (IS_CE_ONLY(flt_stat[i].mf_cntl, ptrl_error)) { 16895310Sdhain bank = flt_stat[i].mf_flt_maddr.ma_bank; 16905310Sdhain MC_LOG("CE detected on bank %d\n", bank); 16915310Sdhain mc_scrub_ce(mcp, bank, &flt_stat[i], ptrl_error); 16925310Sdhain if (MC_REWRITE_ACTIVE(mcp, bank)) { 16935310Sdhain rewrite_timeout = 1; 16945310Sdhain } 16951772Sjl139090 rv = 1; 16961772Sjl139090 } 16971772Sjl139090 } 16981772Sjl139090 16995310Sdhain if (rewrite_timeout) 17005310Sdhain return (0); 17015310Sdhain 17021772Sjl139090 /* The above scrubbing can turn CE into UE or CMPE */ 17031772Sjl139090 17041772Sjl139090 /* 17051772Sjl139090 * Now we distinguish two cases: same address or not 17061772Sjl139090 * the same address. It might seem more intuitive to 17071772Sjl139090 * distinguish PTRL v.s. MI error but it is more 17081772Sjl139090 * complicated that way. 17091772Sjl139090 */ 17101772Sjl139090 17111772Sjl139090 if (flt_stat[0].mf_err_add == flt_stat[1].mf_err_add) { 17121772Sjl139090 17131772Sjl139090 if (IS_CMPE(flt_stat[0].mf_cntl, ptrl_error) || 17141772Sjl139090 IS_CMPE(flt_stat[1].mf_cntl, ptrl_error)) { 17151772Sjl139090 flt_stat[0].mf_type = FLT_TYPE_CMPE; 17161772Sjl139090 flt_stat[1].mf_type = FLT_TYPE_CMPE; 17171772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_CMPE; 17181772Sjl139090 mc_aflt->mflt_nflts = 2; 17191772Sjl139090 mc_aflt->mflt_stat[0] = &flt_stat[0]; 17201772Sjl139090 mc_aflt->mflt_stat[1] = &flt_stat[1]; 17211772Sjl139090 mc_aflt->mflt_pr = PR_UE; 17223152Sav145390 /* 17233152Sav145390 * Compare error is result of MAC internal error, so 17243152Sav145390 * simply log it instead of publishing an ereport. SCF 17253152Sav145390 * diagnoses all the MAC internal and its i/f error. 17263152Sav145390 */ 17273152Sav145390 MC_LOG("cmpe error detected\n"); 17281772Sjl139090 return (1); 17291772Sjl139090 } 17301772Sjl139090 17311772Sjl139090 if (IS_UE(flt_stat[0].mf_cntl, ptrl_error) && 17325080Swh31274 IS_UE(flt_stat[1].mf_cntl, ptrl_error)) { 17331772Sjl139090 /* Both side are UE's */ 17341772Sjl139090 17351772Sjl139090 MAC_SET_ERRLOG_INFO(&flt_stat[0]); 17361772Sjl139090 MAC_SET_ERRLOG_INFO(&flt_stat[1]); 17371772Sjl139090 MC_LOG("MUE detected\n"); 17382214Sav145390 flt_stat[0].mf_type = FLT_TYPE_MUE; 17392214Sav145390 flt_stat[1].mf_type = FLT_TYPE_MUE; 17401772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_MUE; 17411772Sjl139090 mc_aflt->mflt_nflts = 2; 17421772Sjl139090 mc_aflt->mflt_stat[0] = &flt_stat[0]; 17431772Sjl139090 mc_aflt->mflt_stat[1] = &flt_stat[1]; 17441772Sjl139090 mc_aflt->mflt_pr = PR_UE; 17451772Sjl139090 mc_err_drain(mc_aflt); 17461772Sjl139090 return (1); 17471772Sjl139090 } 17481772Sjl139090 17491772Sjl139090 /* Now the only case is UE/CE, UE/OK, or don't care */ 17501772Sjl139090 for (i = 0; i < 2; i++) { 17515310Sdhain if (IS_UE(flt_stat[i].mf_cntl, ptrl_error)) { 17522214Sav145390 17532214Sav145390 /* rewrite can clear the one side UE error */ 17542214Sav145390 17551772Sjl139090 if (IS_OK(flt_stat[i^1].mf_cntl, ptrl_error)) { 17561772Sjl139090 (void) do_rewrite(mcp, 17571772Sjl139090 flt_stat[i].mf_flt_maddr.ma_bank, 17585310Sdhain flt_stat[i].mf_flt_maddr.ma_dimm_addr, 0); 17591772Sjl139090 } 17601772Sjl139090 flt_stat[i].mf_type = FLT_TYPE_UE; 17611772Sjl139090 MAC_SET_ERRLOG_INFO(&flt_stat[i]); 17621772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_SUE; 17631772Sjl139090 mc_aflt->mflt_stat[0] = &flt_stat[i]; 17641772Sjl139090 mc_aflt->mflt_nflts = 1; 17651772Sjl139090 mc_aflt->mflt_pr = PR_MCE; 17661772Sjl139090 mc_err_drain(mc_aflt); 17671772Sjl139090 /* Once we hit a UE/CE or UE/OK case, done */ 17681772Sjl139090 return (1); 17695310Sdhain } 17701772Sjl139090 } 17711772Sjl139090 17721772Sjl139090 } else { 17731772Sjl139090 /* 17741772Sjl139090 * addresses are different. That means errors 17751772Sjl139090 * on the 2 banks are not related at all. 17761772Sjl139090 */ 17771772Sjl139090 for (i = 0; i < 2; i++) { 17785080Swh31274 if (IS_CMPE(flt_stat[i].mf_cntl, ptrl_error)) { 17795080Swh31274 flt_stat[i].mf_type = FLT_TYPE_CMPE; 17805080Swh31274 mc_aflt->mflt_erpt_class = MC_OPL_CMPE; 17815080Swh31274 mc_aflt->mflt_nflts = 1; 17825080Swh31274 mc_aflt->mflt_stat[0] = &flt_stat[i]; 17835080Swh31274 mc_aflt->mflt_pr = PR_UE; 17845080Swh31274 /* 17855080Swh31274 * Compare error is result of MAC internal 17865080Swh31274 * error, so simply log it instead of 17875080Swh31274 * publishing an ereport. SCF diagnoses all 17885080Swh31274 * the MAC internal and its interface error. 17895080Swh31274 */ 17905080Swh31274 MC_LOG("cmpe error detected\n"); 17915080Swh31274 /* no more report on this bank */ 17925080Swh31274 flt_stat[i].mf_cntl = 0; 17935080Swh31274 rv = 1; 17945080Swh31274 } 17951772Sjl139090 } 17961772Sjl139090 17972214Sav145390 /* rewrite can clear the one side UE error */ 17982214Sav145390 17991772Sjl139090 for (i = 0; i < 2; i++) { 18005080Swh31274 if (IS_UE(flt_stat[i].mf_cntl, ptrl_error)) { 18015080Swh31274 (void) do_rewrite(mcp, 18025080Swh31274 flt_stat[i].mf_flt_maddr.ma_bank, 18035310Sdhain flt_stat[i].mf_flt_maddr.ma_dimm_addr, 18045310Sdhain 0); 18055080Swh31274 flt_stat[i].mf_type = FLT_TYPE_UE; 18065080Swh31274 MAC_SET_ERRLOG_INFO(&flt_stat[i]); 18075080Swh31274 mc_aflt->mflt_erpt_class = MC_OPL_SUE; 18085080Swh31274 mc_aflt->mflt_stat[0] = &flt_stat[i]; 18095080Swh31274 mc_aflt->mflt_nflts = 1; 18105080Swh31274 mc_aflt->mflt_pr = PR_MCE; 18115080Swh31274 mc_err_drain(mc_aflt); 18125080Swh31274 rv = 1; 18135080Swh31274 } 18141772Sjl139090 } 18151772Sjl139090 } 18161772Sjl139090 return (rv); 18171772Sjl139090 } 18181772Sjl139090 static void 18192662Shyw mc_error_handler_mir(mc_opl_t *mcp, int bank, mc_rsaddr_info_t *rsaddr) 18201772Sjl139090 { 18211772Sjl139090 mc_aflt_t mc_aflt; 18221772Sjl139090 mc_flt_stat_t flt_stat[2], mi_flt_stat[2]; 18232214Sav145390 int i; 18242214Sav145390 int mi_valid; 18252214Sav145390 18262662Shyw ASSERT(rsaddr); 18272662Shyw 18281772Sjl139090 bzero(&mc_aflt, sizeof (mc_aflt_t)); 18291772Sjl139090 bzero(&flt_stat, 2 * sizeof (mc_flt_stat_t)); 18301772Sjl139090 bzero(&mi_flt_stat, 2 * sizeof (mc_flt_stat_t)); 18311772Sjl139090 18323373Sbm42561 18331772Sjl139090 mc_aflt.mflt_mcp = mcp; 18341772Sjl139090 mc_aflt.mflt_id = gethrtime(); 18351772Sjl139090 18361772Sjl139090 /* Now read all the registers into flt_stat */ 18371772Sjl139090 18382214Sav145390 for (i = 0; i < 2; i++) { 18392214Sav145390 MC_LOG("Reading registers of bank %d\n", bank); 18402214Sav145390 /* patrol registers */ 18412214Sav145390 mc_read_ptrl_reg(mcp, bank, &flt_stat[i]); 18422214Sav145390 18432662Shyw /* 18442662Shyw * In mirror mode, it is possible that only one bank 18452662Shyw * may report the error. We need to check for it to 18462662Shyw * ensure we pick the right addr value for patrol restart. 18472662Shyw * Note that if both banks reported errors, we pick the 18482662Shyw * 2nd one. Both banks should reported the same error address. 18492662Shyw */ 18502662Shyw if (flt_stat[i].mf_cntl & MAC_CNTL_PTRL_ERRS) 18512662Shyw rsaddr->mi_restartaddr = flt_stat[i].mf_flt_maddr; 18522214Sav145390 18532214Sav145390 MC_LOG("ptrl registers cntl %x add %x log %x\n", 18545080Swh31274 flt_stat[i].mf_cntl, flt_stat[i].mf_err_add, 18555080Swh31274 flt_stat[i].mf_err_log); 18562214Sav145390 18572214Sav145390 /* MI registers */ 18582214Sav145390 mc_read_mi_reg(mcp, bank, &mi_flt_stat[i]); 18592214Sav145390 18602214Sav145390 MC_LOG("MI registers cntl %x add %x log %x\n", 18615080Swh31274 mi_flt_stat[i].mf_cntl, mi_flt_stat[i].mf_err_add, 18625080Swh31274 mi_flt_stat[i].mf_err_log); 18632214Sav145390 18642214Sav145390 bank = bank^1; 18652214Sav145390 } 18661772Sjl139090 18671772Sjl139090 /* clear errors once we read all the registers */ 18685080Swh31274 MAC_CLEAR_ERRS(mcp, bank, (MAC_CNTL_PTRL_ERRS|MAC_CNTL_MI_ERRS)); 18691772Sjl139090 18702214Sav145390 MAC_CLEAR_ERRS(mcp, bank ^ 1, (MAC_CNTL_PTRL_ERRS|MAC_CNTL_MI_ERRS)); 18712214Sav145390 18722214Sav145390 /* Process MI errors first */ 18732214Sav145390 18742214Sav145390 /* if not error mode, cntl1 is 0 */ 18752214Sav145390 if ((mi_flt_stat[0].mf_err_add & MAC_ERR_ADD_INVALID) || 18765080Swh31274 (mi_flt_stat[0].mf_err_log & MAC_ERR_LOG_INVALID)) 18772214Sav145390 mi_flt_stat[0].mf_cntl = 0; 18782214Sav145390 18792214Sav145390 if ((mi_flt_stat[1].mf_err_add & MAC_ERR_ADD_INVALID) || 18805080Swh31274 (mi_flt_stat[1].mf_err_log & MAC_ERR_LOG_INVALID)) 18812214Sav145390 mi_flt_stat[1].mf_cntl = 0; 18822214Sav145390 18832214Sav145390 mc_aflt.mflt_is_ptrl = 0; 18842214Sav145390 mi_valid = mc_process_error_mir(mcp, &mc_aflt, &mi_flt_stat[0]); 18852214Sav145390 18862214Sav145390 if ((((flt_stat[0].mf_cntl & MAC_CNTL_PTRL_ERRS) >> 18875080Swh31274 MAC_CNTL_PTRL_ERR_SHIFT) == ((mi_flt_stat[0].mf_cntl & 18885080Swh31274 MAC_CNTL_MI_ERRS) >> MAC_CNTL_MI_ERR_SHIFT)) && 18895080Swh31274 (flt_stat[0].mf_err_add == mi_flt_stat[0].mf_err_add) && 18905080Swh31274 (((flt_stat[1].mf_cntl & MAC_CNTL_PTRL_ERRS) >> 18915080Swh31274 MAC_CNTL_PTRL_ERR_SHIFT) == ((mi_flt_stat[1].mf_cntl & 18925080Swh31274 MAC_CNTL_MI_ERRS) >> MAC_CNTL_MI_ERR_SHIFT)) && 18935080Swh31274 (flt_stat[1].mf_err_add == mi_flt_stat[1].mf_err_add)) { 18942214Sav145390 #ifdef DEBUG 18952214Sav145390 MC_LOG("discarding PTRL error because " 18962214Sav145390 "it is the same as MI\n"); 18972214Sav145390 #endif 18982662Shyw rsaddr->mi_valid = mi_valid; 18992214Sav145390 return; 19002214Sav145390 } 19011772Sjl139090 /* if not error mode, cntl1 is 0 */ 19021772Sjl139090 if ((flt_stat[0].mf_err_add & MAC_ERR_ADD_INVALID) || 19035080Swh31274 (flt_stat[0].mf_err_log & MAC_ERR_LOG_INVALID)) 19041772Sjl139090 flt_stat[0].mf_cntl = 0; 19051772Sjl139090 19061772Sjl139090 if ((flt_stat[1].mf_err_add & MAC_ERR_ADD_INVALID) || 19075080Swh31274 (flt_stat[1].mf_err_log & MAC_ERR_LOG_INVALID)) 19081772Sjl139090 flt_stat[1].mf_cntl = 0; 19091772Sjl139090 19101772Sjl139090 mc_aflt.mflt_is_ptrl = 1; 19112662Shyw rsaddr->mi_valid = mc_process_error_mir(mcp, &mc_aflt, &flt_stat[0]); 19121772Sjl139090 } 19131772Sjl139090 static int 19141772Sjl139090 mc_process_error(mc_opl_t *mcp, int bank, mc_aflt_t *mc_aflt, 19151772Sjl139090 mc_flt_stat_t *flt_stat) 19161772Sjl139090 { 19171772Sjl139090 int ptrl_error = mc_aflt->mflt_is_ptrl; 19181772Sjl139090 int rv = 0; 19191772Sjl139090 19201772Sjl139090 mc_aflt->mflt_erpt_class = NULL; 19211772Sjl139090 if (IS_UE(flt_stat->mf_cntl, ptrl_error)) { 19223152Sav145390 MC_LOG("UE detected\n"); 19231772Sjl139090 flt_stat->mf_type = FLT_TYPE_UE; 19241772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_UE; 19251772Sjl139090 mc_aflt->mflt_pr = PR_UE; 19261772Sjl139090 MAC_SET_ERRLOG_INFO(flt_stat); 19271772Sjl139090 rv = 1; 19281772Sjl139090 } else if (IS_CE(flt_stat->mf_cntl, ptrl_error)) { 19293152Sav145390 MC_LOG("CE detected\n"); 19301772Sjl139090 MAC_SET_ERRLOG_INFO(flt_stat); 19311772Sjl139090 19323152Sav145390 /* Error type can change after scrubbing */ 19331772Sjl139090 mc_scrub_ce(mcp, bank, flt_stat, ptrl_error); 19345310Sdhain if (MC_REWRITE_ACTIVE(mcp, bank)) { 19355310Sdhain return (0); 19365310Sdhain } 19371772Sjl139090 19385275Stsien if (flt_stat->mf_type == FLT_TYPE_INTERMITTENT_CE) { 19395275Stsien mc_aflt->mflt_erpt_class = MC_OPL_ICE; 19405275Stsien mc_aflt->mflt_pr = PR_MCE; 19415275Stsien } else if (flt_stat->mf_type == FLT_TYPE_PERMANENT_CE) { 19421772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_CE; 19431772Sjl139090 mc_aflt->mflt_pr = PR_MCE; 19441772Sjl139090 } else if (flt_stat->mf_type == FLT_TYPE_UE) { 19451772Sjl139090 mc_aflt->mflt_erpt_class = MC_OPL_UE; 19461772Sjl139090 mc_aflt->mflt_pr = PR_UE; 19471772Sjl139090 } 19481772Sjl139090 rv = 1; 19491772Sjl139090 } 19505080Swh31274 MC_LOG("mc_process_error: fault type %x erpt %s\n", flt_stat->mf_type, 19515080Swh31274 mc_aflt->mflt_erpt_class); 19521772Sjl139090 if (mc_aflt->mflt_erpt_class) { 19531772Sjl139090 mc_aflt->mflt_stat[0] = flt_stat; 19541772Sjl139090 mc_aflt->mflt_nflts = 1; 19551772Sjl139090 mc_err_drain(mc_aflt); 19561772Sjl139090 } 19571772Sjl139090 return (rv); 19581772Sjl139090 } 19591772Sjl139090 19601772Sjl139090 static void 19612662Shyw mc_error_handler(mc_opl_t *mcp, int bank, mc_rsaddr_info_t *rsaddr) 19621772Sjl139090 { 19631772Sjl139090 mc_aflt_t mc_aflt; 19641772Sjl139090 mc_flt_stat_t flt_stat, mi_flt_stat; 19652214Sav145390 int mi_valid; 19661772Sjl139090 19671772Sjl139090 bzero(&mc_aflt, sizeof (mc_aflt_t)); 19681772Sjl139090 bzero(&flt_stat, sizeof (mc_flt_stat_t)); 19691772Sjl139090 bzero(&mi_flt_stat, sizeof (mc_flt_stat_t)); 19701772Sjl139090 19711772Sjl139090 mc_aflt.mflt_mcp = mcp; 19721772Sjl139090 mc_aflt.mflt_id = gethrtime(); 19731772Sjl139090 19741772Sjl139090 /* patrol registers */ 19751772Sjl139090 mc_read_ptrl_reg(mcp, bank, &flt_stat); 19761772Sjl139090 19772662Shyw ASSERT(rsaddr); 19782662Shyw rsaddr->mi_restartaddr = flt_stat.mf_flt_maddr; 19791772Sjl139090 19805080Swh31274 MC_LOG("ptrl registers cntl %x add %x log %x\n", flt_stat.mf_cntl, 19815080Swh31274 flt_stat.mf_err_add, flt_stat.mf_err_log); 19821772Sjl139090 19831772Sjl139090 /* MI registers */ 19841772Sjl139090 mc_read_mi_reg(mcp, bank, &mi_flt_stat); 19851772Sjl139090 19862214Sav145390 19875080Swh31274 MC_LOG("MI registers cntl %x add %x log %x\n", mi_flt_stat.mf_cntl, 19885080Swh31274 mi_flt_stat.mf_err_add, mi_flt_stat.mf_err_log); 19891772Sjl139090 19901772Sjl139090 /* clear errors once we read all the registers */ 19911772Sjl139090 MAC_CLEAR_ERRS(mcp, bank, (MAC_CNTL_PTRL_ERRS|MAC_CNTL_MI_ERRS)); 19921772Sjl139090 19932214Sav145390 mc_aflt.mflt_is_ptrl = 0; 19942214Sav145390 if ((mi_flt_stat.mf_cntl & MAC_CNTL_MI_ERRS) && 19955080Swh31274 ((mi_flt_stat.mf_err_add & MAC_ERR_ADD_INVALID) == 0) && 19965080Swh31274 ((mi_flt_stat.mf_err_log & MAC_ERR_LOG_INVALID) == 0)) { 19972214Sav145390 mi_valid = mc_process_error(mcp, bank, &mc_aflt, &mi_flt_stat); 19982214Sav145390 } 19992214Sav145390 20002214Sav145390 if ((((flt_stat.mf_cntl & MAC_CNTL_PTRL_ERRS) >> 20015080Swh31274 MAC_CNTL_PTRL_ERR_SHIFT) == ((mi_flt_stat.mf_cntl & 20025080Swh31274 MAC_CNTL_MI_ERRS) >> MAC_CNTL_MI_ERR_SHIFT)) && 20035080Swh31274 (flt_stat.mf_err_add == mi_flt_stat.mf_err_add)) { 20042214Sav145390 #ifdef DEBUG 20052214Sav145390 MC_LOG("discarding PTRL error because " 20062214Sav145390 "it is the same as MI\n"); 20072214Sav145390 #endif 20082662Shyw rsaddr->mi_valid = mi_valid; 20092214Sav145390 return; 20102214Sav145390 } 20112214Sav145390 20121772Sjl139090 mc_aflt.mflt_is_ptrl = 1; 20131772Sjl139090 if ((flt_stat.mf_cntl & MAC_CNTL_PTRL_ERRS) && 20145080Swh31274 ((flt_stat.mf_err_add & MAC_ERR_ADD_INVALID) == 0) && 20155080Swh31274 ((flt_stat.mf_err_log & MAC_ERR_LOG_INVALID) == 0)) { 20165080Swh31274 rsaddr->mi_valid = mc_process_error(mcp, bank, &mc_aflt, 20175080Swh31274 &flt_stat); 20181772Sjl139090 } 20191772Sjl139090 } 20201772Sjl139090 /* 20211772Sjl139090 * memory patrol error handling algorithm: 20221772Sjl139090 * timeout() is used to do periodic polling 20231772Sjl139090 * This is the flow chart. 20241772Sjl139090 * timeout -> 20251772Sjl139090 * mc_check_errors() 20261772Sjl139090 * if memory bank is installed, read the status register 20271772Sjl139090 * if any error bit is set, 20281772Sjl139090 * -> mc_error_handler() 20293152Sav145390 * -> read all error registers 20301772Sjl139090 * -> mc_process_error() 20311772Sjl139090 * determine error type 20321772Sjl139090 * rewrite to clear error or scrub to determine CE type 20331772Sjl139090 * inform SCF on permanent CE 20341772Sjl139090 * -> mc_err_drain 20351772Sjl139090 * page offline processing 20361772Sjl139090 * -> mc_ereport_post() 20371772Sjl139090 */ 20381772Sjl139090 20391772Sjl139090 static void 20405310Sdhain mc_process_rewrite(mc_opl_t *mcp, int bank) 20415310Sdhain { 20425310Sdhain uint32_t rew_addr, cntl; 20435310Sdhain mc_retry_info_t *retry; 20445310Sdhain struct mc_bank *bankp; 20455310Sdhain 20465310Sdhain bankp = &(mcp->mc_bank[bank]); 20475310Sdhain retry = bankp->mcb_active; 20485310Sdhain if (retry == NULL) 20495310Sdhain return; 20505310Sdhain 20515310Sdhain if (retry->ri_state <= RETRY_STATE_ACTIVE) { 20525310Sdhain cntl = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)); 20535310Sdhain if (cntl & MAC_CNTL_PTRL_STATUS) 20545310Sdhain return; 20555310Sdhain rew_addr = retry->ri_addr; 20565310Sdhain ST_MAC_REG(MAC_REWRITE_ADD(mcp, bank), rew_addr); 20575310Sdhain MAC_REW_REQ(mcp, bank); 20585310Sdhain 20595310Sdhain retry->ri_state = RETRY_STATE_REWRITE; 20605310Sdhain } 20615310Sdhain 20625310Sdhain cntl = ldphysio(MAC_PTRL_CNTL(mcp, bank)); 20635310Sdhain 20645310Sdhain if (cntl & MAC_CNTL_REW_END) { 20655310Sdhain MAC_CLEAR_ERRS(mcp, bank, 20665310Sdhain MAC_CNTL_REW_ERRS); 20675310Sdhain mc_clear_rewrite(mcp, bank); 20685310Sdhain } else { 20695310Sdhain /* 20705310Sdhain * If the rewrite does not complete in 20715310Sdhain * 1 hour, we have to consider this a HW 20725310Sdhain * failure. However, there is no recovery 20735310Sdhain * mechanism. The only thing we can do 20745310Sdhain * to to print a warning message to the 20755310Sdhain * console. We continue to increment the 20765310Sdhain * counter but we only print the message 20775310Sdhain * once. It will take the counter a long 20785310Sdhain * time to wrap around and the user might 20795310Sdhain * see a second message. In practice, 20805310Sdhain * we have never hit this condition but 20815310Sdhain * we have to keep the code here just in case. 20825310Sdhain */ 20835310Sdhain if (++mcp->mc_bank[bank].mcb_rewrite_count 20845310Sdhain == mc_max_rewrite_retry) { 20855310Sdhain cmn_err(CE_WARN, "Memory patrol feature is" 20865310Sdhain " partly suspended on /LSB%d/B%d" 20875310Sdhain " due to heavy memory load," 20885310Sdhain " and it will restart" 20895310Sdhain " automatically.\n", mcp->mc_board_num, 20905310Sdhain bank); 20915310Sdhain } 20925310Sdhain } 20935310Sdhain } 20945310Sdhain 20955310Sdhain static void 20961772Sjl139090 mc_check_errors_func(mc_opl_t *mcp) 20971772Sjl139090 { 20982662Shyw mc_rsaddr_info_t rsaddr_info; 20991772Sjl139090 int i, error_count = 0; 21001772Sjl139090 uint32_t stat, cntl; 21012214Sav145390 int running; 21022494Shyw int wrapped; 21032867Shyw int ebk; 21041772Sjl139090 21051772Sjl139090 /* 21061772Sjl139090 * scan errors. 21071772Sjl139090 */ 21082214Sav145390 if (mcp->mc_status & MC_MEMORYLESS) 21092214Sav145390 return; 21102214Sav145390 21111772Sjl139090 for (i = 0; i < BANKNUM_PER_SB; i++) { 21121772Sjl139090 if (mcp->mc_bank[i].mcb_status & BANK_INSTALLED) { 21135310Sdhain if (MC_REWRITE_ACTIVE(mcp, i)) { 21145310Sdhain mc_process_rewrite(mcp, i); 21155310Sdhain } 21161772Sjl139090 stat = ldphysio(MAC_PTRL_STAT(mcp, i)); 21171772Sjl139090 cntl = ldphysio(MAC_PTRL_CNTL(mcp, i)); 21182214Sav145390 running = cntl & MAC_CNTL_PTRL_START; 21192494Shyw wrapped = cntl & MAC_CNTL_PTRL_ADD_MAX; 21202494Shyw 21212867Shyw /* Compute the effective bank idx */ 21222867Shyw ebk = (IS_MIRROR(mcp, i)) ? MIRROR_IDX(i) : i; 21232867Shyw 21242494Shyw if (mc_debug_show_all || stat) { 21252494Shyw MC_LOG("/LSB%d/B%d stat %x cntl %x\n", 21265080Swh31274 mcp->mc_board_num, i, stat, cntl); 21272494Shyw } 21282494Shyw 21292494Shyw /* 21302494Shyw * Update stats and reset flag if the HW patrol 21312494Shyw * wrapped around in its scan. 21322494Shyw */ 21332494Shyw if (wrapped) { 21341772Sjl139090 MAC_CLEAR_MAX(mcp, i); 21352867Shyw mcp->mc_period[ebk]++; 21362867Shyw if (IS_MIRROR(mcp, i)) 21375080Swh31274 MC_LOG("mirror mc period %ld on " 21385080Swh31274 "/LSB%d/B%d\n", mcp->mc_period[ebk], 21395080Swh31274 mcp->mc_board_num, i); 21402867Shyw else { 21415080Swh31274 MC_LOG("mc period %ld on " 21425080Swh31274 "/LSB%d/B%d\n", mcp->mc_period[ebk], 21435080Swh31274 mcp->mc_board_num, i); 21442867Shyw } 21452494Shyw } 21462494Shyw 21472494Shyw if (running) { 21482494Shyw /* 21492494Shyw * Mac patrol HW is still running. 21502494Shyw * Normally when an error is detected, 21512494Shyw * the HW patrol will stop so that we 21522494Shyw * can collect error data for reporting. 21532494Shyw * Certain errors (MI errors) detected may not 21542494Shyw * cause the HW patrol to stop which is a 21552494Shyw * problem since we cannot read error data while 21562494Shyw * the HW patrol is running. SW is not allowed 21572494Shyw * to stop the HW patrol while it is running 21582494Shyw * as it may cause HW inconsistency. This is 21592494Shyw * described in a HW errata. 21602494Shyw * In situations where we detected errors 21612494Shyw * that may not cause the HW patrol to stop. 21622494Shyw * We speed up the HW patrol scanning in 21632494Shyw * the hope that it will find the 'real' PTRL 21642494Shyw * errors associated with the previous errors 21652494Shyw * causing the HW to finally stop so that we 21662494Shyw * can do the reporting. 21672494Shyw */ 21682494Shyw /* 21692494Shyw * Check to see if we did speed up 21702494Shyw * the HW patrol due to previous errors 21712494Shyw * detected that did not cause the patrol 21722494Shyw * to stop. We only do it if HW patrol scan 21732494Shyw * wrapped (counted as completing a 'period'). 21742494Shyw */ 21752867Shyw if (mcp->mc_speedup_period[ebk] > 0) { 21765080Swh31274 if (wrapped && 21775080Swh31274 (--mcp->mc_speedup_period[ebk] == 21785080Swh31274 0)) { 21795080Swh31274 /* 21805080Swh31274 * We did try to speed up. 21815080Swh31274 * The speed up period has 21825080Swh31274 * expired and the HW patrol 21835080Swh31274 * is still running. The 21845080Swh31274 * errors must be intermittent. 21855080Swh31274 * We have no choice but to 21865080Swh31274 * ignore them, reset the scan 21875080Swh31274 * speed to normal and clear 21885080Swh31274 * the MI error bits. For 21895080Swh31274 * mirror mode, we need to 21905080Swh31274 * clear errors on both banks. 21915080Swh31274 */ 21925080Swh31274 MC_LOG("Clearing MI errors\n"); 21935080Swh31274 MAC_CLEAR_ERRS(mcp, i, 21945080Swh31274 MAC_CNTL_MI_ERRS); 21955080Swh31274 21965080Swh31274 if (IS_MIRROR(mcp, i)) { 21975080Swh31274 MC_LOG("Clearing " 21985080Swh31274 "Mirror MI errs\n"); 21995080Swh31274 MAC_CLEAR_ERRS(mcp, 22005080Swh31274 i^1, 22015080Swh31274 MAC_CNTL_MI_ERRS); 22025080Swh31274 } 22032867Shyw } 22042494Shyw } else if (stat & MAC_STAT_MI_ERRS) { 22052494Shyw /* 22062494Shyw * MI errors detected but we cannot 22072494Shyw * report them since the HW patrol 22082494Shyw * is still running. 22092494Shyw * We will attempt to speed up the 22102494Shyw * scanning and hopefully the HW 22112494Shyw * can detect PRTL errors at the same 22122494Shyw * location that cause the HW patrol 22132494Shyw * to stop. 22142494Shyw */ 22152867Shyw mcp->mc_speedup_period[ebk] = 2; 22162214Sav145390 MAC_CMD(mcp, i, 0); 22172214Sav145390 } 22182494Shyw } else if (stat & (MAC_STAT_PTRL_ERRS | 22192494Shyw MAC_STAT_MI_ERRS)) { 22202494Shyw /* 22212494Shyw * HW Patrol has stopped and we found errors. 22222494Shyw * Proceed to collect and report error info. 22232494Shyw */ 22242867Shyw mcp->mc_speedup_period[ebk] = 0; 22252662Shyw rsaddr_info.mi_valid = 0; 22262662Shyw rsaddr_info.mi_injectrestart = 0; 22272662Shyw if (IS_MIRROR(mcp, i)) { 22285080Swh31274 mc_error_handler_mir(mcp, i, 22295080Swh31274 &rsaddr_info); 22302662Shyw } else { 22315080Swh31274 mc_error_handler(mcp, i, &rsaddr_info); 22322662Shyw } 22332494Shyw 22342494Shyw error_count++; 22352662Shyw restart_patrol(mcp, i, &rsaddr_info); 22361772Sjl139090 } else { 22372494Shyw /* 22382494Shyw * HW patrol scan has apparently stopped 22392494Shyw * but no errors detected/flagged. 22402494Shyw * Restart the HW patrol just to be sure. 22412867Shyw * In mirror mode, the odd bank might have 22422867Shyw * reported errors that caused the patrol to 22432867Shyw * stop. We'll defer the restart to the odd 22442867Shyw * bank in this case. 22452494Shyw */ 22462867Shyw if (!IS_MIRROR(mcp, i) || (i & 0x1)) 22472867Shyw restart_patrol(mcp, i, NULL); 22481772Sjl139090 } 22491772Sjl139090 } 22501772Sjl139090 } 22511772Sjl139090 if (error_count > 0) 22521772Sjl139090 mcp->mc_last_error += error_count; 22531772Sjl139090 else 22541772Sjl139090 mcp->mc_last_error = 0; 22551772Sjl139090 } 22561772Sjl139090 22572214Sav145390 /* 22582214Sav145390 * mc_polling -- Check errors for only one instance, 22592214Sav145390 * but process errors for all instances to make sure we drain the errors 22602214Sav145390 * faster than they can be accumulated. 22612214Sav145390 * 22622214Sav145390 * Polling on each board should be done only once per each 22632214Sav145390 * mc_patrol_interval_sec. This is equivalent to setting mc_tick_left 22642214Sav145390 * to OPL_MAX_BOARDS and decrement by 1 on each timeout. 22652214Sav145390 * Once mc_tick_left becomes negative, the board becomes a candidate 22662214Sav145390 * for polling because it has waited for at least 22672214Sav145390 * mc_patrol_interval_sec's long. If mc_timeout_period is calculated 22683152Sav145390 * differently, this has to be updated accordingly. 22692214Sav145390 */ 22701772Sjl139090 22711772Sjl139090 static void 22722214Sav145390 mc_polling(void) 22731772Sjl139090 { 22742214Sav145390 int i, scan_error; 22752214Sav145390 mc_opl_t *mcp; 22762214Sav145390 22772214Sav145390 22782214Sav145390 scan_error = 1; 22792214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 22802214Sav145390 mutex_enter(&mcmutex); 22812214Sav145390 if ((mcp = mc_instances[i]) == NULL) { 22822214Sav145390 mutex_exit(&mcmutex); 22832214Sav145390 continue; 22842214Sav145390 } 22852214Sav145390 mutex_enter(&mcp->mc_lock); 22862214Sav145390 mutex_exit(&mcmutex); 22872662Shyw if (!(mcp->mc_status & MC_POLL_RUNNING)) { 22882662Shyw mutex_exit(&mcp->mc_lock); 22892662Shyw continue; 22902662Shyw } 22912214Sav145390 if (scan_error && mcp->mc_tick_left <= 0) { 22922214Sav145390 mc_check_errors_func((void *)mcp); 22932214Sav145390 mcp->mc_tick_left = OPL_MAX_BOARDS; 22942214Sav145390 scan_error = 0; 22952214Sav145390 } else { 22962214Sav145390 mcp->mc_tick_left--; 22972214Sav145390 } 22982214Sav145390 mc_process_scf_log(mcp); 22992214Sav145390 mutex_exit(&mcp->mc_lock); 23001772Sjl139090 } 23011772Sjl139090 } 23021772Sjl139090 23031772Sjl139090 static void 23041772Sjl139090 get_ptrl_start_address(mc_opl_t *mcp, int bank, mc_addr_t *maddr) 23051772Sjl139090 { 23061772Sjl139090 maddr->ma_bd = mcp->mc_board_num; 23071772Sjl139090 maddr->ma_bank = bank; 23081772Sjl139090 maddr->ma_dimm_addr = 0; 23091772Sjl139090 } 23101772Sjl139090 23111772Sjl139090 typedef struct mc_mem_range { 23121772Sjl139090 uint64_t addr; 23131772Sjl139090 uint64_t size; 23141772Sjl139090 } mc_mem_range_t; 23151772Sjl139090 23161772Sjl139090 static int 23171772Sjl139090 get_base_address(mc_opl_t *mcp) 23181772Sjl139090 { 23191772Sjl139090 mc_mem_range_t *mem_range; 23201772Sjl139090 int len; 23211772Sjl139090 23221772Sjl139090 if (ddi_getlongprop(DDI_DEV_T_ANY, mcp->mc_dip, DDI_PROP_DONTPASS, 23235080Swh31274 "sb-mem-ranges", (caddr_t)&mem_range, &len) != DDI_SUCCESS) { 23241772Sjl139090 return (DDI_FAILURE); 23251772Sjl139090 } 23261772Sjl139090 23271772Sjl139090 mcp->mc_start_address = mem_range->addr; 23281772Sjl139090 mcp->mc_size = mem_range->size; 23291772Sjl139090 23301772Sjl139090 kmem_free(mem_range, len); 23311772Sjl139090 return (DDI_SUCCESS); 23321772Sjl139090 } 23331772Sjl139090 23341772Sjl139090 struct mc_addr_spec { 23351772Sjl139090 uint32_t bank; 23361772Sjl139090 uint32_t phys_hi; 23371772Sjl139090 uint32_t phys_lo; 23381772Sjl139090 }; 23391772Sjl139090 23401772Sjl139090 #define REGS_PA(m, i) ((((uint64_t)m[i].phys_hi)<<32) | m[i].phys_lo) 23411772Sjl139090 23421772Sjl139090 static char *mc_tbl_name[] = { 23431772Sjl139090 "cs0-mc-pa-trans-table", 23441772Sjl139090 "cs1-mc-pa-trans-table" 23451772Sjl139090 }; 23461772Sjl139090 23472662Shyw /* 23482662Shyw * This routine performs a rangecheck for a given PA 23492662Shyw * to see if it belongs to the memory range for this board. 23502662Shyw * Return 1 if it is valid (within the range) and 0 otherwise 23512662Shyw */ 23521772Sjl139090 static int 23532662Shyw mc_rangecheck_pa(mc_opl_t *mcp, uint64_t pa) 23541772Sjl139090 { 23555080Swh31274 if ((pa < mcp->mc_start_address) || (mcp->mc_start_address + 23565080Swh31274 mcp->mc_size <= pa)) 23572662Shyw return (0); 23582662Shyw else 23592662Shyw return (1); 23601772Sjl139090 } 23611772Sjl139090 23621772Sjl139090 static void 23631772Sjl139090 mc_memlist_delete(struct memlist *mlist) 23641772Sjl139090 { 23651772Sjl139090 struct memlist *ml; 23661772Sjl139090 23671772Sjl139090 for (ml = mlist; ml; ml = mlist) { 23681772Sjl139090 mlist = ml->next; 23691772Sjl139090 kmem_free(ml, sizeof (struct memlist)); 23701772Sjl139090 } 23711772Sjl139090 } 23721772Sjl139090 23731772Sjl139090 static struct memlist * 23741772Sjl139090 mc_memlist_dup(struct memlist *mlist) 23751772Sjl139090 { 23761772Sjl139090 struct memlist *hl = NULL, *tl, **mlp; 23771772Sjl139090 23781772Sjl139090 if (mlist == NULL) 23791772Sjl139090 return (NULL); 23801772Sjl139090 23811772Sjl139090 mlp = &hl; 23821772Sjl139090 tl = *mlp; 23831772Sjl139090 for (; mlist; mlist = mlist->next) { 23841772Sjl139090 *mlp = kmem_alloc(sizeof (struct memlist), KM_SLEEP); 23851772Sjl139090 (*mlp)->address = mlist->address; 23861772Sjl139090 (*mlp)->size = mlist->size; 23871772Sjl139090 (*mlp)->prev = tl; 23881772Sjl139090 tl = *mlp; 23891772Sjl139090 mlp = &((*mlp)->next); 23901772Sjl139090 } 23911772Sjl139090 *mlp = NULL; 23921772Sjl139090 23931772Sjl139090 return (hl); 23941772Sjl139090 } 23951772Sjl139090 23961772Sjl139090 23971772Sjl139090 static struct memlist * 23981772Sjl139090 mc_memlist_del_span(struct memlist *mlist, uint64_t base, uint64_t len) 23991772Sjl139090 { 24001772Sjl139090 uint64_t end; 24011772Sjl139090 struct memlist *ml, *tl, *nlp; 24021772Sjl139090 24031772Sjl139090 if (mlist == NULL) 24041772Sjl139090 return (NULL); 24051772Sjl139090 24061772Sjl139090 end = base + len; 24071772Sjl139090 if ((end <= mlist->address) || (base == end)) 24081772Sjl139090 return (mlist); 24091772Sjl139090 24101772Sjl139090 for (tl = ml = mlist; ml; tl = ml, ml = nlp) { 24111772Sjl139090 uint64_t mend; 24121772Sjl139090 24131772Sjl139090 nlp = ml->next; 24141772Sjl139090 24151772Sjl139090 if (end <= ml->address) 24161772Sjl139090 break; 24171772Sjl139090 24181772Sjl139090 mend = ml->address + ml->size; 24191772Sjl139090 if (base < mend) { 24201772Sjl139090 if (base <= ml->address) { 24211772Sjl139090 ml->address = end; 24221772Sjl139090 if (end >= mend) 24231772Sjl139090 ml->size = 0ull; 24241772Sjl139090 else 24251772Sjl139090 ml->size = mend - ml->address; 24261772Sjl139090 } else { 24271772Sjl139090 ml->size = base - ml->address; 24281772Sjl139090 if (end < mend) { 24291772Sjl139090 struct memlist *nl; 24301772Sjl139090 /* 24311772Sjl139090 * splitting an memlist entry. 24321772Sjl139090 */ 24331772Sjl139090 nl = kmem_alloc(sizeof (struct memlist), 24345080Swh31274 KM_SLEEP); 24351772Sjl139090 nl->address = end; 24361772Sjl139090 nl->size = mend - nl->address; 24371772Sjl139090 if ((nl->next = nlp) != NULL) 24381772Sjl139090 nlp->prev = nl; 24391772Sjl139090 nl->prev = ml; 24401772Sjl139090 ml->next = nl; 24411772Sjl139090 nlp = nl; 24421772Sjl139090 } 24431772Sjl139090 } 24441772Sjl139090 if (ml->size == 0ull) { 24451772Sjl139090 if (ml == mlist) { 24461772Sjl139090 if ((mlist = nlp) != NULL) 24471772Sjl139090 nlp->prev = NULL; 24481772Sjl139090 kmem_free(ml, sizeof (struct memlist)); 24491772Sjl139090 if (mlist == NULL) 24501772Sjl139090 break; 24511772Sjl139090 ml = nlp; 24521772Sjl139090 } else { 24531772Sjl139090 if ((tl->next = nlp) != NULL) 24541772Sjl139090 nlp->prev = tl; 24551772Sjl139090 kmem_free(ml, sizeof (struct memlist)); 24561772Sjl139090 ml = tl; 24571772Sjl139090 } 24581772Sjl139090 } 24591772Sjl139090 } 24601772Sjl139090 } 24611772Sjl139090 24621772Sjl139090 return (mlist); 24631772Sjl139090 } 24641772Sjl139090 24651772Sjl139090 static void 24661772Sjl139090 mc_get_mlist(mc_opl_t *mcp) 24671772Sjl139090 { 24681772Sjl139090 struct memlist *mlist; 24691772Sjl139090 24701772Sjl139090 memlist_read_lock(); 24711772Sjl139090 mlist = mc_memlist_dup(phys_install); 24721772Sjl139090 memlist_read_unlock(); 24731772Sjl139090 24741772Sjl139090 if (mlist) { 24751772Sjl139090 mlist = mc_memlist_del_span(mlist, 0ull, mcp->mc_start_address); 24761772Sjl139090 } 24771772Sjl139090 24781772Sjl139090 if (mlist) { 24791772Sjl139090 uint64_t startpa, endpa; 24801772Sjl139090 24811772Sjl139090 startpa = mcp->mc_start_address + mcp->mc_size; 24821772Sjl139090 endpa = ptob(physmax + 1); 24831772Sjl139090 if (endpa > startpa) { 24845080Swh31274 mlist = mc_memlist_del_span(mlist, startpa, 24855080Swh31274 endpa - startpa); 24861772Sjl139090 } 24871772Sjl139090 } 24881772Sjl139090 24891772Sjl139090 if (mlist) { 24901772Sjl139090 mcp->mlist = mlist; 24911772Sjl139090 } 24921772Sjl139090 } 24931772Sjl139090 24941772Sjl139090 int 24951772Sjl139090 mc_board_add(mc_opl_t *mcp) 24961772Sjl139090 { 24971772Sjl139090 struct mc_addr_spec *macaddr; 24982214Sav145390 cs_status_t *cs_status; 24992214Sav145390 int len, len1, i, bk, cc; 25002662Shyw mc_rsaddr_info_t rsaddr; 25011772Sjl139090 uint32_t mirr; 25022214Sav145390 int nbanks = 0; 25032214Sav145390 uint64_t nbytes = 0; 25045080Swh31274 int mirror_mode = 0; 25055080Swh31274 int ret; 25061772Sjl139090 25071772Sjl139090 /* 25081772Sjl139090 * Get configurations from "pseudo-mc" node which includes: 25091772Sjl139090 * board# : LSB number 25101772Sjl139090 * mac-addr : physical base address of MAC registers 25111772Sjl139090 * csX-mac-pa-trans-table: translation table from DIMM address 25121772Sjl139090 * to physical address or vice versa. 25131772Sjl139090 */ 25141772Sjl139090 mcp->mc_board_num = (int)ddi_getprop(DDI_DEV_T_ANY, mcp->mc_dip, 25155080Swh31274 DDI_PROP_DONTPASS, "board#", -1); 25161772Sjl139090 25172214Sav145390 if (mcp->mc_board_num == -1) { 25182214Sav145390 return (DDI_FAILURE); 25192214Sav145390 } 25202214Sav145390 25211772Sjl139090 /* 25221772Sjl139090 * Get start address in this CAB. It can be gotten from 25231772Sjl139090 * "sb-mem-ranges" property. 25241772Sjl139090 */ 25251772Sjl139090 25261772Sjl139090 if (get_base_address(mcp) == DDI_FAILURE) { 25271772Sjl139090 return (DDI_FAILURE); 25281772Sjl139090 } 25291772Sjl139090 /* get mac-pa trans tables */ 25301772Sjl139090 for (i = 0; i < MC_TT_CS; i++) { 25311772Sjl139090 len = MC_TT_ENTRIES; 25321772Sjl139090 cc = ddi_getlongprop_buf(DDI_DEV_T_ANY, mcp->mc_dip, 25335080Swh31274 DDI_PROP_DONTPASS, mc_tbl_name[i], 25345080Swh31274 (caddr_t)mcp->mc_trans_table[i], &len); 25351772Sjl139090 25361772Sjl139090 if (cc != DDI_SUCCESS) { 25371772Sjl139090 bzero(mcp->mc_trans_table[i], MC_TT_ENTRIES); 25381772Sjl139090 } 25391772Sjl139090 } 25401772Sjl139090 mcp->mlist = NULL; 25411772Sjl139090 25421772Sjl139090 mc_get_mlist(mcp); 25431772Sjl139090 25441772Sjl139090 /* initialize bank informations */ 25451772Sjl139090 cc = ddi_getlongprop(DDI_DEV_T_ANY, mcp->mc_dip, DDI_PROP_DONTPASS, 25465080Swh31274 "mc-addr", (caddr_t)&macaddr, &len); 25471772Sjl139090 if (cc != DDI_SUCCESS) { 25481772Sjl139090 cmn_err(CE_WARN, "Cannot get mc-addr. err=%d\n", cc); 25492214Sav145390 return (DDI_FAILURE); 25502214Sav145390 } 25512214Sav145390 25522214Sav145390 cc = ddi_getlongprop(DDI_DEV_T_ANY, mcp->mc_dip, DDI_PROP_DONTPASS, 25535080Swh31274 "cs-status", (caddr_t)&cs_status, &len1); 25542214Sav145390 25552214Sav145390 if (cc != DDI_SUCCESS) { 25562214Sav145390 if (len > 0) 25572214Sav145390 kmem_free(macaddr, len); 25582214Sav145390 cmn_err(CE_WARN, "Cannot get cs-status. err=%d\n", cc); 25591772Sjl139090 return (DDI_FAILURE); 25601772Sjl139090 } 25613045Sav145390 /* get the physical board number for a given logical board number */ 25623045Sav145390 mcp->mc_phys_board_num = mc_opl_get_physical_board(mcp->mc_board_num); 25633045Sav145390 25643045Sav145390 if (mcp->mc_phys_board_num < 0) { 25653045Sav145390 if (len > 0) 25663045Sav145390 kmem_free(macaddr, len); 25673045Sav145390 cmn_err(CE_WARN, "Unable to obtain the physical board number"); 25683045Sav145390 return (DDI_FAILURE); 25693045Sav145390 } 25701772Sjl139090 25712214Sav145390 mutex_init(&mcp->mc_lock, NULL, MUTEX_DRIVER, NULL); 25722214Sav145390 25732214Sav145390 for (i = 0; i < len1 / sizeof (cs_status_t); i++) { 25742214Sav145390 nbytes += ((uint64_t)cs_status[i].cs_avail_hi << 32) | 25755080Swh31274 ((uint64_t)cs_status[i].cs_avail_low); 25762214Sav145390 } 25772214Sav145390 if (len1 > 0) 25782214Sav145390 kmem_free(cs_status, len1); 25792214Sav145390 nbanks = len / sizeof (struct mc_addr_spec); 25802214Sav145390 25812214Sav145390 if (nbanks > 0) 25822214Sav145390 nbytes /= nbanks; 25832214Sav145390 else { 25842214Sav145390 /* No need to free macaddr because len must be 0 */ 25852214Sav145390 mcp->mc_status |= MC_MEMORYLESS; 25862214Sav145390 return (DDI_SUCCESS); 25872214Sav145390 } 25882214Sav145390 25892214Sav145390 for (i = 0; i < BANKNUM_PER_SB; i++) { 25902214Sav145390 mcp->mc_scf_retry[i] = 0; 25912214Sav145390 mcp->mc_period[i] = 0; 25922214Sav145390 mcp->mc_speedup_period[i] = 0; 25932214Sav145390 } 25942214Sav145390 25952214Sav145390 /* 25962214Sav145390 * Get the memory size here. Let it be B (bytes). 25972214Sav145390 * Let T be the time in u.s. to scan 64 bytes. 25982214Sav145390 * If we want to complete 1 round of scanning in P seconds. 25992214Sav145390 * 26002214Sav145390 * B * T * 10^(-6) = P 26012214Sav145390 * --------------- 26022214Sav145390 * 64 26032214Sav145390 * 26042214Sav145390 * T = P * 64 * 10^6 26052214Sav145390 * ------------- 26062214Sav145390 * B 26072214Sav145390 * 26082214Sav145390 * = P * 64 * 10^6 26092214Sav145390 * ------------- 26102214Sav145390 * B 26112214Sav145390 * 26122214Sav145390 * The timing bits are set in PTRL_CNTL[28:26] where 26132214Sav145390 * 26142214Sav145390 * 0 - 1 m.s 26152214Sav145390 * 1 - 512 u.s. 26162214Sav145390 * 10 - 256 u.s. 26172214Sav145390 * 11 - 128 u.s. 26182214Sav145390 * 100 - 64 u.s. 26192214Sav145390 * 101 - 32 u.s. 26202214Sav145390 * 110 - 0 u.s. 26212214Sav145390 * 111 - reserved. 26222214Sav145390 * 26232214Sav145390 * 26242214Sav145390 * a[0] = 110, a[1] = 101, ... a[6] = 0 26252214Sav145390 * 26262214Sav145390 * cs-status property is int x 7 26272214Sav145390 * 0 - cs# 26282214Sav145390 * 1 - cs-status 26292214Sav145390 * 2 - cs-avail.hi 26302214Sav145390 * 3 - cs-avail.lo 26312214Sav145390 * 4 - dimm-capa.hi 26322214Sav145390 * 5 - dimm-capa.lo 26332214Sav145390 * 6 - #of dimms 26342214Sav145390 */ 26352214Sav145390 26362214Sav145390 if (nbytes > 0) { 26372214Sav145390 int i; 26382214Sav145390 uint64_t ms; 26392214Sav145390 ms = ((uint64_t)mc_scan_period * 64 * 1000000)/nbytes; 26402214Sav145390 mcp->mc_speed = mc_scan_speeds[MC_MAX_SPEEDS - 1].mc_speeds; 26412214Sav145390 for (i = 0; i < MC_MAX_SPEEDS - 1; i++) { 26422214Sav145390 if (ms < mc_scan_speeds[i + 1].mc_period) { 26432214Sav145390 mcp->mc_speed = mc_scan_speeds[i].mc_speeds; 26442214Sav145390 break; 26452214Sav145390 } 26462214Sav145390 } 26472214Sav145390 } else 26482214Sav145390 mcp->mc_speed = 0; 26492214Sav145390 26502214Sav145390 26511772Sjl139090 for (i = 0; i < len / sizeof (struct mc_addr_spec); i++) { 26521772Sjl139090 struct mc_bank *bankp; 26535310Sdhain mc_retry_info_t *retry; 26541772Sjl139090 uint32_t reg; 26555310Sdhain int k; 26561772Sjl139090 26571772Sjl139090 /* 26581772Sjl139090 * setup bank 26591772Sjl139090 */ 26601772Sjl139090 bk = macaddr[i].bank; 26611772Sjl139090 bankp = &(mcp->mc_bank[bk]); 26621772Sjl139090 bankp->mcb_status = BANK_INSTALLED; 26631772Sjl139090 bankp->mcb_reg_base = REGS_PA(macaddr, i); 26641772Sjl139090 26655310Sdhain bankp->mcb_retry_freelist = NULL; 26665310Sdhain bankp->mcb_retry_pending = NULL; 26675310Sdhain bankp->mcb_active = NULL; 26685310Sdhain retry = &bankp->mcb_retry_infos[0]; 26695310Sdhain for (k = 0; k < MC_RETRY_COUNT; k++, retry++) { 26705310Sdhain mc_retry_info_put(&bankp->mcb_retry_freelist, retry); 26715310Sdhain } 26725310Sdhain 26731772Sjl139090 reg = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bk)); 26741772Sjl139090 bankp->mcb_ptrl_cntl = (reg & MAC_CNTL_PTRL_PRESERVE_BITS); 26751772Sjl139090 26761772Sjl139090 /* 26771772Sjl139090 * check if mirror mode 26781772Sjl139090 */ 26791772Sjl139090 mirr = LD_MAC_REG(MAC_MIRR(mcp, bk)); 26801772Sjl139090 26811772Sjl139090 if (mirr & MAC_MIRR_MIRROR_MODE) { 26825080Swh31274 MC_LOG("Mirror -> /LSB%d/B%d\n", mcp->mc_board_num, 26835080Swh31274 bk); 26841772Sjl139090 bankp->mcb_status |= BANK_MIRROR_MODE; 26855080Swh31274 mirror_mode = 1; 26861772Sjl139090 /* 26871772Sjl139090 * The following bit is only used for 26881772Sjl139090 * error injection. We should clear it 26891772Sjl139090 */ 26901772Sjl139090 if (mirr & MAC_MIRR_BANK_EXCLUSIVE) 26915080Swh31274 ST_MAC_REG(MAC_MIRR(mcp, bk), 0); 26921772Sjl139090 } 26931772Sjl139090 26941772Sjl139090 /* 26951772Sjl139090 * restart if not mirror mode or the other bank 26961772Sjl139090 * of the mirror is not running 26971772Sjl139090 */ 26981772Sjl139090 if (!(mirr & MAC_MIRR_MIRROR_MODE) || 26995080Swh31274 !(mcp->mc_bank[bk^1].mcb_status & BANK_PTRL_RUNNING)) { 27005080Swh31274 MC_LOG("Starting up /LSB%d/B%d\n", mcp->mc_board_num, 27015080Swh31274 bk); 27022662Shyw get_ptrl_start_address(mcp, bk, &rsaddr.mi_restartaddr); 27032662Shyw rsaddr.mi_valid = 0; 27042662Shyw rsaddr.mi_injectrestart = 0; 27052662Shyw restart_patrol(mcp, bk, &rsaddr); 27061772Sjl139090 } else { 27071772Sjl139090 MC_LOG("Not starting up /LSB%d/B%d\n", 27085080Swh31274 mcp->mc_board_num, bk); 27091772Sjl139090 } 27101772Sjl139090 bankp->mcb_status |= BANK_PTRL_RUNNING; 27111772Sjl139090 } 27122214Sav145390 if (len > 0) 27132214Sav145390 kmem_free(macaddr, len); 27142214Sav145390 27155080Swh31274 ret = ndi_prop_update_int(DDI_DEV_T_NONE, mcp->mc_dip, "mirror-mode", 27165080Swh31274 mirror_mode); 27175080Swh31274 if (ret != DDI_PROP_SUCCESS) { 27185080Swh31274 cmn_err(CE_WARN, "Unable to update mirror-mode property"); 27195080Swh31274 } 27205080Swh31274 27212214Sav145390 mcp->mc_dimm_list = mc_get_dimm_list(mcp); 27221772Sjl139090 27231772Sjl139090 /* 27241772Sjl139090 * set interval in HZ. 27251772Sjl139090 */ 27261772Sjl139090 mcp->mc_last_error = 0; 27272214Sav145390 27281772Sjl139090 /* restart memory patrol checking */ 27291772Sjl139090 mcp->mc_status |= MC_POLL_RUNNING; 27301772Sjl139090 27311772Sjl139090 return (DDI_SUCCESS); 27321772Sjl139090 } 27331772Sjl139090 27341772Sjl139090 int 27351772Sjl139090 mc_board_del(mc_opl_t *mcp) 27361772Sjl139090 { 27371772Sjl139090 int i; 27381772Sjl139090 scf_log_t *p; 27391772Sjl139090 27401772Sjl139090 /* 27411772Sjl139090 * cleanup mac state 27421772Sjl139090 */ 27431772Sjl139090 mutex_enter(&mcp->mc_lock); 27442214Sav145390 if (mcp->mc_status & MC_MEMORYLESS) { 27452214Sav145390 mutex_exit(&mcp->mc_lock); 27462214Sav145390 mutex_destroy(&mcp->mc_lock); 27472214Sav145390 return (DDI_SUCCESS); 27482214Sav145390 } 27491772Sjl139090 for (i = 0; i < BANKNUM_PER_SB; i++) { 27501772Sjl139090 if (mcp->mc_bank[i].mcb_status & BANK_INSTALLED) { 27511772Sjl139090 mcp->mc_bank[i].mcb_status &= ~BANK_INSTALLED; 27521772Sjl139090 } 27531772Sjl139090 } 27541772Sjl139090 27551772Sjl139090 /* stop memory patrol checking */ 27562662Shyw mcp->mc_status &= ~MC_POLL_RUNNING; 27571772Sjl139090 27581772Sjl139090 /* just throw away all the scf logs */ 27592214Sav145390 for (i = 0; i < BANKNUM_PER_SB; i++) { 27605080Swh31274 while ((p = mcp->mc_scf_log[i]) != NULL) { 27615080Swh31274 mcp->mc_scf_log[i] = p->sl_next; 27625080Swh31274 mcp->mc_scf_total[i]--; 27635080Swh31274 kmem_free(p, sizeof (scf_log_t)); 27645080Swh31274 } 27651772Sjl139090 } 27661772Sjl139090 27671772Sjl139090 if (mcp->mlist) 27681772Sjl139090 mc_memlist_delete(mcp->mlist); 27691772Sjl139090 27702214Sav145390 if (mcp->mc_dimm_list) 27712214Sav145390 mc_free_dimm_list(mcp->mc_dimm_list); 27722214Sav145390 27731772Sjl139090 mutex_exit(&mcp->mc_lock); 27741772Sjl139090 27751772Sjl139090 mutex_destroy(&mcp->mc_lock); 27761772Sjl139090 return (DDI_SUCCESS); 27771772Sjl139090 } 27781772Sjl139090 27791772Sjl139090 int 27801772Sjl139090 mc_suspend(mc_opl_t *mcp, uint32_t flag) 27811772Sjl139090 { 27821772Sjl139090 /* stop memory patrol checking */ 27831772Sjl139090 mutex_enter(&mcp->mc_lock); 27842214Sav145390 if (mcp->mc_status & MC_MEMORYLESS) { 27852214Sav145390 mutex_exit(&mcp->mc_lock); 27862214Sav145390 return (DDI_SUCCESS); 27872214Sav145390 } 27882214Sav145390 27892662Shyw mcp->mc_status &= ~MC_POLL_RUNNING; 27902662Shyw 27911772Sjl139090 mcp->mc_status |= flag; 27921772Sjl139090 mutex_exit(&mcp->mc_lock); 27931772Sjl139090 27941772Sjl139090 return (DDI_SUCCESS); 27951772Sjl139090 } 27961772Sjl139090 27973354Sjl139090 void 27983354Sjl139090 opl_mc_update_mlist(void) 27993354Sjl139090 { 28003354Sjl139090 int i; 28013354Sjl139090 mc_opl_t *mcp; 28023354Sjl139090 28033354Sjl139090 /* 28043354Sjl139090 * memory information is not updated until 28053354Sjl139090 * the post attach/detach stage during DR. 28063354Sjl139090 * This interface is used by dr_mem to inform 28073354Sjl139090 * mc-opl to update the mlist. 28083354Sjl139090 */ 28093354Sjl139090 28103354Sjl139090 mutex_enter(&mcmutex); 28113354Sjl139090 for (i = 0; i < OPL_MAX_BOARDS; i++) { 28123354Sjl139090 if ((mcp = mc_instances[i]) == NULL) 28133354Sjl139090 continue; 28143354Sjl139090 mutex_enter(&mcp->mc_lock); 28153354Sjl139090 if (mcp->mlist) 28163354Sjl139090 mc_memlist_delete(mcp->mlist); 28173354Sjl139090 mcp->mlist = NULL; 28183354Sjl139090 mc_get_mlist(mcp); 28193354Sjl139090 mutex_exit(&mcp->mc_lock); 28203354Sjl139090 } 28213354Sjl139090 mutex_exit(&mcmutex); 28223354Sjl139090 } 28233354Sjl139090 28241772Sjl139090 /* caller must clear the SUSPEND bits or this will do nothing */ 28251772Sjl139090 28261772Sjl139090 int 28271772Sjl139090 mc_resume(mc_opl_t *mcp, uint32_t flag) 28281772Sjl139090 { 28291772Sjl139090 int i; 28301772Sjl139090 uint64_t basepa; 28311772Sjl139090 28321772Sjl139090 mutex_enter(&mcp->mc_lock); 28332214Sav145390 if (mcp->mc_status & MC_MEMORYLESS) { 28342214Sav145390 mutex_exit(&mcp->mc_lock); 28352214Sav145390 return (DDI_SUCCESS); 28362214Sav145390 } 28371772Sjl139090 basepa = mcp->mc_start_address; 28381772Sjl139090 if (get_base_address(mcp) == DDI_FAILURE) { 28391772Sjl139090 mutex_exit(&mcp->mc_lock); 28401772Sjl139090 return (DDI_FAILURE); 28411772Sjl139090 } 28421772Sjl139090 28431772Sjl139090 if (basepa != mcp->mc_start_address) { 28441772Sjl139090 if (mcp->mlist) 28451772Sjl139090 mc_memlist_delete(mcp->mlist); 28461772Sjl139090 mcp->mlist = NULL; 28471772Sjl139090 mc_get_mlist(mcp); 28481772Sjl139090 } 28491772Sjl139090 28501772Sjl139090 mcp->mc_status &= ~flag; 28511772Sjl139090 28521772Sjl139090 if (mcp->mc_status & (MC_SOFT_SUSPENDED | MC_DRIVER_SUSPENDED)) { 28531772Sjl139090 mutex_exit(&mcp->mc_lock); 28541772Sjl139090 return (DDI_SUCCESS); 28551772Sjl139090 } 28561772Sjl139090 28571772Sjl139090 if (!(mcp->mc_status & MC_POLL_RUNNING)) { 28581772Sjl139090 /* restart memory patrol checking */ 28591772Sjl139090 mcp->mc_status |= MC_POLL_RUNNING; 28601772Sjl139090 for (i = 0; i < BANKNUM_PER_SB; i++) { 28611772Sjl139090 if (mcp->mc_bank[i].mcb_status & BANK_INSTALLED) { 28625310Sdhain mc_check_errors_func(mcp); 28631772Sjl139090 } 28641772Sjl139090 } 28651772Sjl139090 } 28661772Sjl139090 mutex_exit(&mcp->mc_lock); 28671772Sjl139090 28681772Sjl139090 return (DDI_SUCCESS); 28691772Sjl139090 } 28701772Sjl139090 28711772Sjl139090 static mc_opl_t * 28721772Sjl139090 mc_pa_to_mcp(uint64_t pa) 28731772Sjl139090 { 28742214Sav145390 mc_opl_t *mcp; 28752214Sav145390 int i; 28762214Sav145390 28771772Sjl139090 ASSERT(MUTEX_HELD(&mcmutex)); 28782214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 28792214Sav145390 if ((mcp = mc_instances[i]) == NULL) 28802214Sav145390 continue; 28811772Sjl139090 /* if mac patrol is suspended, we cannot rely on it */ 28822214Sav145390 if (!(mcp->mc_status & MC_POLL_RUNNING) || 28835080Swh31274 (mcp->mc_status & MC_SOFT_SUSPENDED)) 28841772Sjl139090 continue; 28852662Shyw if (mc_rangecheck_pa(mcp, pa)) { 28862214Sav145390 return (mcp); 28871772Sjl139090 } 28881772Sjl139090 } 28891772Sjl139090 return (NULL); 28901772Sjl139090 } 28911772Sjl139090 28921772Sjl139090 /* 28931772Sjl139090 * Get Physical Board number from Logical one. 28941772Sjl139090 */ 28951772Sjl139090 static int 28961772Sjl139090 mc_opl_get_physical_board(int sb) 28971772Sjl139090 { 28981772Sjl139090 if (&opl_get_physical_board) { 28991772Sjl139090 return (opl_get_physical_board(sb)); 29001772Sjl139090 } 29011772Sjl139090 29021772Sjl139090 cmn_err(CE_NOTE, "!opl_get_physical_board() not loaded\n"); 29031772Sjl139090 return (-1); 29041772Sjl139090 } 29051772Sjl139090 29061772Sjl139090 /* ARGSUSED */ 29071772Sjl139090 int 29081772Sjl139090 mc_get_mem_unum(int synd_code, uint64_t flt_addr, char *buf, int buflen, 29091772Sjl139090 int *lenp) 29101772Sjl139090 { 29112214Sav145390 int i; 29123045Sav145390 int j; 29132214Sav145390 int sb; 29141772Sjl139090 int bank; 29153045Sav145390 int cs; 29162214Sav145390 mc_opl_t *mcp; 29172214Sav145390 char memb_num; 29181772Sjl139090 29191772Sjl139090 mutex_enter(&mcmutex); 29201772Sjl139090 29211772Sjl139090 if (((mcp = mc_pa_to_mcp(flt_addr)) == NULL) || 29225080Swh31274 (!pa_is_valid(mcp, flt_addr))) { 29231772Sjl139090 mutex_exit(&mcmutex); 29241772Sjl139090 if (snprintf(buf, buflen, "UNKNOWN") >= buflen) { 29251772Sjl139090 return (ENOSPC); 29261772Sjl139090 } else { 29271772Sjl139090 if (lenp) 29281772Sjl139090 *lenp = strlen(buf); 29291772Sjl139090 } 29301772Sjl139090 return (0); 29311772Sjl139090 } 29321772Sjl139090 29331772Sjl139090 bank = pa_to_bank(mcp, flt_addr - mcp->mc_start_address); 29343045Sav145390 sb = mcp->mc_phys_board_num; 29353045Sav145390 cs = pa_to_cs(mcp, flt_addr - mcp->mc_start_address); 29361772Sjl139090 29371772Sjl139090 if (sb == -1) { 29381772Sjl139090 mutex_exit(&mcmutex); 29391772Sjl139090 return (ENXIO); 29401772Sjl139090 } 29411772Sjl139090 29422214Sav145390 if (plat_model == MODEL_DC) { 29432214Sav145390 i = BD_BK_SLOT_TO_INDEX(0, bank, 0); 29443045Sav145390 j = (cs == 0) ? i : i + 2; 29453045Sav145390 snprintf(buf, buflen, "/%s%02d/MEM%s MEM%s", 29462214Sav145390 model_names[plat_model].unit_name, sb, 29473045Sav145390 mc_dc_dimm_unum_table[j], 29483045Sav145390 mc_dc_dimm_unum_table[j + 1]); 29491772Sjl139090 } else { 29502214Sav145390 i = BD_BK_SLOT_TO_INDEX(sb, bank, 0); 29513045Sav145390 j = (cs == 0) ? i : i + 2; 29522214Sav145390 memb_num = mc_ff_dimm_unum_table[i][0]; 29533045Sav145390 snprintf(buf, buflen, "/%s/%s%c/MEM%s MEM%s", 29542214Sav145390 model_names[plat_model].unit_name, 29552214Sav145390 model_names[plat_model].mem_name, memb_num, 29563045Sav145390 &mc_ff_dimm_unum_table[j][1], 29573045Sav145390 &mc_ff_dimm_unum_table[j + 1][1]); 29582214Sav145390 } 29592214Sav145390 if (lenp) { 29602214Sav145390 *lenp = strlen(buf); 29611772Sjl139090 } 29621772Sjl139090 mutex_exit(&mcmutex); 29631772Sjl139090 return (0); 29641772Sjl139090 } 29651772Sjl139090 29661772Sjl139090 int 29672214Sav145390 opl_mc_suspend(void) 29681772Sjl139090 { 29691772Sjl139090 mc_opl_t *mcp; 29702214Sav145390 int i; 29711772Sjl139090 29721772Sjl139090 mutex_enter(&mcmutex); 29732214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 29742214Sav145390 if ((mcp = mc_instances[i]) == NULL) 29752214Sav145390 continue; 29762214Sav145390 mc_suspend(mcp, MC_SOFT_SUSPENDED); 29771772Sjl139090 } 29781772Sjl139090 mutex_exit(&mcmutex); 29792214Sav145390 29801772Sjl139090 return (0); 29811772Sjl139090 } 29821772Sjl139090 29831772Sjl139090 int 29842214Sav145390 opl_mc_resume(void) 29851772Sjl139090 { 29861772Sjl139090 mc_opl_t *mcp; 29872214Sav145390 int i; 29881772Sjl139090 29891772Sjl139090 mutex_enter(&mcmutex); 29902214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 29912214Sav145390 if ((mcp = mc_instances[i]) == NULL) 29922214Sav145390 continue; 29932214Sav145390 mc_resume(mcp, MC_SOFT_SUSPENDED); 29941772Sjl139090 } 29951772Sjl139090 mutex_exit(&mcmutex); 29962214Sav145390 29971772Sjl139090 return (0); 29981772Sjl139090 } 29991772Sjl139090 static void 30001772Sjl139090 insert_mcp(mc_opl_t *mcp) 30011772Sjl139090 { 30021772Sjl139090 mutex_enter(&mcmutex); 30032214Sav145390 if (mc_instances[mcp->mc_board_num] != NULL) { 30042214Sav145390 MC_LOG("mc-opl instance for board# %d already exists\n", 30055080Swh31274 mcp->mc_board_num); 30062214Sav145390 } 30072214Sav145390 mc_instances[mcp->mc_board_num] = mcp; 30081772Sjl139090 mutex_exit(&mcmutex); 30091772Sjl139090 } 30101772Sjl139090 30111772Sjl139090 static void 30121772Sjl139090 delete_mcp(mc_opl_t *mcp) 30131772Sjl139090 { 30142214Sav145390 mutex_enter(&mcmutex); 30152214Sav145390 mc_instances[mcp->mc_board_num] = 0; 30162214Sav145390 mutex_exit(&mcmutex); 30171772Sjl139090 } 30181772Sjl139090 30191772Sjl139090 /* Error injection interface */ 30201772Sjl139090 30212494Shyw static void 30222494Shyw mc_lock_va(uint64_t pa, caddr_t new_va) 30232494Shyw { 30242494Shyw tte_t tte; 30252494Shyw 30262662Shyw vtag_flushpage(new_va, (uint64_t)ksfmmup); 30275080Swh31274 sfmmu_memtte(&tte, pa >> PAGESHIFT, PROC_DATA|HAT_NOSYNC, TTE8K); 30282494Shyw tte.tte_intlo |= TTE_LCK_INT; 30292494Shyw sfmmu_dtlb_ld_kva(new_va, &tte); 30302494Shyw } 30312494Shyw 30322494Shyw static void 30332494Shyw mc_unlock_va(caddr_t va) 30342494Shyw { 30352494Shyw vtag_flushpage(va, (uint64_t)ksfmmup); 30362494Shyw } 30372494Shyw 30381772Sjl139090 /* ARGSUSED */ 30391772Sjl139090 int 30401772Sjl139090 mc_inject_error(int error_type, uint64_t pa, uint32_t flags) 30411772Sjl139090 { 30421772Sjl139090 mc_opl_t *mcp; 30431772Sjl139090 int bank; 30441772Sjl139090 uint32_t dimm_addr; 30451772Sjl139090 uint32_t cntl; 30462662Shyw mc_rsaddr_info_t rsaddr; 30471772Sjl139090 uint32_t data, stat; 30481772Sjl139090 int both_sides = 0; 30491772Sjl139090 uint64_t pa0; 30502494Shyw int extra_injection_needed = 0; 30511772Sjl139090 extern void cpu_flush_ecache(void); 30521772Sjl139090 30531772Sjl139090 MC_LOG("HW mc_inject_error(%x, %lx, %x)\n", error_type, pa, flags); 30541772Sjl139090 30551772Sjl139090 mutex_enter(&mcmutex); 30561772Sjl139090 if ((mcp = mc_pa_to_mcp(pa)) == NULL) { 30571772Sjl139090 mutex_exit(&mcmutex); 30581772Sjl139090 MC_LOG("mc_inject_error: invalid pa\n"); 30591772Sjl139090 return (ENOTSUP); 30601772Sjl139090 } 30611772Sjl139090 30621772Sjl139090 mutex_enter(&mcp->mc_lock); 30631772Sjl139090 mutex_exit(&mcmutex); 30641772Sjl139090 30651772Sjl139090 if (mcp->mc_status & (MC_SOFT_SUSPENDED | MC_DRIVER_SUSPENDED)) { 30661772Sjl139090 mutex_exit(&mcp->mc_lock); 30671772Sjl139090 MC_LOG("mc-opl has been suspended. No error injection.\n"); 30681772Sjl139090 return (EBUSY); 30691772Sjl139090 } 30701772Sjl139090 30711772Sjl139090 /* convert pa to offset within the board */ 30721772Sjl139090 MC_LOG("pa %lx, offset %lx\n", pa, pa - mcp->mc_start_address); 30731772Sjl139090 30741772Sjl139090 if (!pa_is_valid(mcp, pa)) { 30751772Sjl139090 mutex_exit(&mcp->mc_lock); 30761772Sjl139090 return (EINVAL); 30771772Sjl139090 } 30781772Sjl139090 30791772Sjl139090 pa0 = pa - mcp->mc_start_address; 30801772Sjl139090 30811772Sjl139090 bank = pa_to_bank(mcp, pa0); 30821772Sjl139090 30831772Sjl139090 if (flags & MC_INJECT_FLAG_OTHER) 30841772Sjl139090 bank = bank ^ 1; 30851772Sjl139090 30861772Sjl139090 if (MC_INJECT_MIRROR(error_type) && !IS_MIRROR(mcp, bank)) { 30871772Sjl139090 mutex_exit(&mcp->mc_lock); 30881772Sjl139090 MC_LOG("Not mirror mode\n"); 30891772Sjl139090 return (EINVAL); 30901772Sjl139090 } 30911772Sjl139090 30921772Sjl139090 dimm_addr = pa_to_dimm(mcp, pa0); 30931772Sjl139090 30945080Swh31274 MC_LOG("injecting error to /LSB%d/B%d/%x\n", mcp->mc_board_num, bank, 30955080Swh31274 dimm_addr); 30961772Sjl139090 30971772Sjl139090 30981772Sjl139090 switch (error_type) { 30991772Sjl139090 case MC_INJECT_INTERMITTENT_MCE: 31001772Sjl139090 case MC_INJECT_PERMANENT_MCE: 31011772Sjl139090 case MC_INJECT_MUE: 31021772Sjl139090 both_sides = 1; 31031772Sjl139090 } 31041772Sjl139090 31051772Sjl139090 if (flags & MC_INJECT_FLAG_RESET) 31061772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank), 0); 31071772Sjl139090 31081772Sjl139090 ST_MAC_REG(MAC_EG_ADD(mcp, bank), dimm_addr & MAC_EG_ADD_MASK); 31091772Sjl139090 31101772Sjl139090 if (both_sides) { 31111772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank^1), 0); 31125080Swh31274 ST_MAC_REG(MAC_EG_ADD(mcp, bank^1), dimm_addr & 31135080Swh31274 MAC_EG_ADD_MASK); 31141772Sjl139090 } 31151772Sjl139090 31161772Sjl139090 switch (error_type) { 31172494Shyw case MC_INJECT_SUE: 31182494Shyw extra_injection_needed = 1; 31192494Shyw /*FALLTHROUGH*/ 31201772Sjl139090 case MC_INJECT_UE: 31211772Sjl139090 case MC_INJECT_MUE: 31221772Sjl139090 if (flags & MC_INJECT_FLAG_PATH) { 31235080Swh31274 cntl = MAC_EG_ADD_FIX | MAC_EG_FORCE_READ00 | 31245080Swh31274 MAC_EG_FORCE_READ16 | MAC_EG_RDERR_ONCE; 31251772Sjl139090 } else { 31265080Swh31274 cntl = MAC_EG_ADD_FIX | MAC_EG_FORCE_DERR00 | 31275080Swh31274 MAC_EG_FORCE_DERR16 | MAC_EG_DERR_ONCE; 31281772Sjl139090 } 31291772Sjl139090 flags |= MC_INJECT_FLAG_ST; 31301772Sjl139090 break; 31311772Sjl139090 case MC_INJECT_INTERMITTENT_CE: 31321772Sjl139090 case MC_INJECT_INTERMITTENT_MCE: 31331772Sjl139090 if (flags & MC_INJECT_FLAG_PATH) { 31345080Swh31274 cntl = MAC_EG_ADD_FIX |MAC_EG_FORCE_READ00 | 31355080Swh31274 MAC_EG_RDERR_ONCE; 31361772Sjl139090 } else { 31375080Swh31274 cntl = MAC_EG_ADD_FIX | MAC_EG_FORCE_DERR16 | 31385080Swh31274 MAC_EG_DERR_ONCE; 31391772Sjl139090 } 31402494Shyw extra_injection_needed = 1; 31411772Sjl139090 flags |= MC_INJECT_FLAG_ST; 31421772Sjl139090 break; 31431772Sjl139090 case MC_INJECT_PERMANENT_CE: 31441772Sjl139090 case MC_INJECT_PERMANENT_MCE: 31451772Sjl139090 if (flags & MC_INJECT_FLAG_PATH) { 31465080Swh31274 cntl = MAC_EG_ADD_FIX | MAC_EG_FORCE_READ00 | 31475080Swh31274 MAC_EG_RDERR_ALWAYS; 31481772Sjl139090 } else { 31495080Swh31274 cntl = MAC_EG_ADD_FIX | MAC_EG_FORCE_DERR16 | 31505080Swh31274 MAC_EG_DERR_ALWAYS; 31511772Sjl139090 } 31521772Sjl139090 flags |= MC_INJECT_FLAG_ST; 31531772Sjl139090 break; 31541772Sjl139090 case MC_INJECT_CMPE: 31551772Sjl139090 data = 0xabcdefab; 31561772Sjl139090 stphys(pa, data); 31571772Sjl139090 cpu_flush_ecache(); 31581772Sjl139090 MC_LOG("CMPE: writing data %x to %lx\n", data, pa); 31591772Sjl139090 ST_MAC_REG(MAC_MIRR(mcp, bank), MAC_MIRR_BANK_EXCLUSIVE); 31601772Sjl139090 stphys(pa, data ^ 0xffffffff); 31612662Shyw membar_sync(); 31621772Sjl139090 cpu_flush_ecache(); 31631772Sjl139090 ST_MAC_REG(MAC_MIRR(mcp, bank), 0); 31641772Sjl139090 MC_LOG("CMPE: write new data %xto %lx\n", data, pa); 31651772Sjl139090 cntl = 0; 31661772Sjl139090 break; 31671772Sjl139090 case MC_INJECT_NOP: 31681772Sjl139090 cntl = 0; 31691772Sjl139090 break; 31701772Sjl139090 default: 31711772Sjl139090 MC_LOG("mc_inject_error: invalid option\n"); 31721772Sjl139090 cntl = 0; 31731772Sjl139090 } 31741772Sjl139090 31751772Sjl139090 if (cntl) { 31761772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank), cntl & MAC_EG_SETUP_MASK); 31771772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank), cntl); 31781772Sjl139090 31791772Sjl139090 if (both_sides) { 31801772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank^1), cntl & 31815080Swh31274 MAC_EG_SETUP_MASK); 31821772Sjl139090 ST_MAC_REG(MAC_EG_CNTL(mcp, bank^1), cntl); 31831772Sjl139090 } 31841772Sjl139090 } 31851772Sjl139090 31861772Sjl139090 /* 31871772Sjl139090 * For all injection cases except compare error, we 31881772Sjl139090 * must write to the PA to trigger the error. 31891772Sjl139090 */ 31901772Sjl139090 31911772Sjl139090 if (flags & MC_INJECT_FLAG_ST) { 31921772Sjl139090 data = 0xf0e0d0c0; 31931772Sjl139090 MC_LOG("Writing %x to %lx\n", data, pa); 31941772Sjl139090 stphys(pa, data); 31951772Sjl139090 cpu_flush_ecache(); 31961772Sjl139090 } 31971772Sjl139090 31981772Sjl139090 31991772Sjl139090 if (flags & MC_INJECT_FLAG_LD) { 32002494Shyw if (flags & MC_INJECT_FLAG_PREFETCH) { 32012494Shyw /* 32022494Shyw * Use strong prefetch operation to 32032494Shyw * inject MI errors. 32042494Shyw */ 32052494Shyw page_t *pp; 32062494Shyw extern void mc_prefetch(caddr_t); 32072494Shyw 32082494Shyw MC_LOG("prefetch\n"); 32092494Shyw 32102494Shyw pp = page_numtopp_nolock(pa >> PAGESHIFT); 32112494Shyw if (pp != NULL) { 32122494Shyw caddr_t va, va1; 32132494Shyw 32142494Shyw va = ppmapin(pp, PROT_READ|PROT_WRITE, 32155080Swh31274 (caddr_t)-1); 32162494Shyw kpreempt_disable(); 32172494Shyw mc_lock_va((uint64_t)pa, va); 32182494Shyw va1 = va + (pa & (PAGESIZE - 1)); 32192494Shyw mc_prefetch(va1); 32202494Shyw mc_unlock_va(va); 32212494Shyw kpreempt_enable(); 32222494Shyw ppmapout(va); 32232494Shyw 32242494Shyw /* 32252494Shyw * For MI errors, we need one extra 32262494Shyw * injection for HW patrol to stop. 32272494Shyw */ 32282494Shyw extra_injection_needed = 1; 32291772Sjl139090 } else { 32302494Shyw cmn_err(CE_WARN, "Cannot find page structure" 32315080Swh31274 " for PA %lx\n", pa); 32321772Sjl139090 } 32331772Sjl139090 } else { 32341772Sjl139090 MC_LOG("Reading from %lx\n", pa); 32351772Sjl139090 data = ldphys(pa); 32361772Sjl139090 MC_LOG("data = %x\n", data); 32371772Sjl139090 } 32382494Shyw 32392494Shyw if (extra_injection_needed) { 32402494Shyw /* 32412494Shyw * These are the injection cases where the 32422494Shyw * requested injected errors will not cause the HW 32432494Shyw * patrol to stop. For these cases, we need to inject 32442494Shyw * an extra 'real' PTRL error to force the 32452494Shyw * HW patrol to stop so that we can report the 32462494Shyw * errors injected. Note that we cannot read 32472494Shyw * and report error status while the HW patrol 32482494Shyw * is running. 32492494Shyw */ 32502494Shyw ST_MAC_REG(MAC_EG_CNTL(mcp, bank), 32515080Swh31274 cntl & MAC_EG_SETUP_MASK); 32522494Shyw ST_MAC_REG(MAC_EG_CNTL(mcp, bank), cntl); 32532494Shyw 32542494Shyw if (both_sides) { 32555080Swh31274 ST_MAC_REG(MAC_EG_CNTL(mcp, bank^1), cntl & 32565080Swh31274 MAC_EG_SETUP_MASK); 32575080Swh31274 ST_MAC_REG(MAC_EG_CNTL(mcp, bank^1), cntl); 32582494Shyw } 32592494Shyw data = 0xf0e0d0c0; 32602494Shyw MC_LOG("Writing %x to %lx\n", data, pa); 32612494Shyw stphys(pa, data); 32622494Shyw cpu_flush_ecache(); 32632494Shyw } 32641772Sjl139090 } 32651772Sjl139090 32661772Sjl139090 if (flags & MC_INJECT_FLAG_RESTART) { 32671772Sjl139090 MC_LOG("Restart patrol\n"); 32682662Shyw rsaddr.mi_restartaddr.ma_bd = mcp->mc_board_num; 32692662Shyw rsaddr.mi_restartaddr.ma_bank = bank; 32702662Shyw rsaddr.mi_restartaddr.ma_dimm_addr = dimm_addr; 32712662Shyw rsaddr.mi_valid = 1; 32722662Shyw rsaddr.mi_injectrestart = 1; 32732662Shyw restart_patrol(mcp, bank, &rsaddr); 32741772Sjl139090 } 32751772Sjl139090 32761772Sjl139090 if (flags & MC_INJECT_FLAG_POLL) { 32772214Sav145390 int running; 32782867Shyw int ebank = (IS_MIRROR(mcp, bank)) ? MIRROR_IDX(bank) : bank; 32791772Sjl139090 32801772Sjl139090 MC_LOG("Poll patrol error\n"); 32811772Sjl139090 stat = LD_MAC_REG(MAC_PTRL_STAT(mcp, bank)); 32821772Sjl139090 cntl = LD_MAC_REG(MAC_PTRL_CNTL(mcp, bank)); 32832214Sav145390 running = cntl & MAC_CNTL_PTRL_START; 32842494Shyw 32852494Shyw if (!running && 32862494Shyw (stat & (MAC_STAT_PTRL_ERRS|MAC_STAT_MI_ERRS))) { 32872494Shyw /* 32882494Shyw * HW patrol stopped and we have errors to 32892494Shyw * report. Do it. 32902494Shyw */ 32912867Shyw mcp->mc_speedup_period[ebank] = 0; 32922662Shyw rsaddr.mi_valid = 0; 32932662Shyw rsaddr.mi_injectrestart = 0; 32942662Shyw if (IS_MIRROR(mcp, bank)) { 32952662Shyw mc_error_handler_mir(mcp, bank, &rsaddr); 32962662Shyw } else { 32972662Shyw mc_error_handler(mcp, bank, &rsaddr); 32982662Shyw } 32992662Shyw 33002662Shyw restart_patrol(mcp, bank, &rsaddr); 33012494Shyw } else { 33022494Shyw /* 33032494Shyw * We are expecting to report injected 33042494Shyw * errors but the HW patrol is still running. 33052494Shyw * Speed up the scanning 33062494Shyw */ 33072867Shyw mcp->mc_speedup_period[ebank] = 2; 33082494Shyw MAC_CMD(mcp, bank, 0); 33091772Sjl139090 restart_patrol(mcp, bank, NULL); 33102494Shyw } 33111772Sjl139090 } 33121772Sjl139090 33131772Sjl139090 mutex_exit(&mcp->mc_lock); 33141772Sjl139090 return (0); 33151772Sjl139090 } 33162494Shyw 33171772Sjl139090 void 33181772Sjl139090 mc_stphysio(uint64_t pa, uint32_t data) 33191772Sjl139090 { 33201772Sjl139090 MC_LOG("0x%x -> pa(%lx)\n", data, pa); 33211772Sjl139090 stphysio(pa, data); 33222214Sav145390 33232214Sav145390 /* force the above write to be processed by mac patrol */ 33242494Shyw data = ldphysio(pa); 33252494Shyw MC_LOG("pa(%lx) = 0x%x\n", pa, data); 33261772Sjl139090 } 33271772Sjl139090 33281772Sjl139090 uint32_t 33291772Sjl139090 mc_ldphysio(uint64_t pa) 33301772Sjl139090 { 33311772Sjl139090 uint32_t rv; 33321772Sjl139090 33331772Sjl139090 rv = ldphysio(pa); 33341772Sjl139090 MC_LOG("pa(%lx) = 0x%x\n", pa, rv); 33351772Sjl139090 return (rv); 33361772Sjl139090 } 33372214Sav145390 33382214Sav145390 #define isdigit(ch) ((ch) >= '0' && (ch) <= '9') 33392214Sav145390 33402214Sav145390 /* 33412214Sav145390 * parse_unum_memory -- extract the board number and the DIMM name from 33422214Sav145390 * the unum. 33432214Sav145390 * 33442214Sav145390 * Return 0 for success and non-zero for a failure. 33452214Sav145390 */ 33462214Sav145390 int 33472214Sav145390 parse_unum_memory(char *unum, int *board, char *dname) 33482214Sav145390 { 33492214Sav145390 char *c; 33502214Sav145390 char x, y, z; 33512214Sav145390 33522214Sav145390 if ((c = strstr(unum, "CMU")) != NULL) { 33532214Sav145390 /* DC Model */ 33542214Sav145390 c += 3; 33552214Sav145390 *board = (uint8_t)stoi(&c); 33562214Sav145390 if ((c = strstr(c, "MEM")) == NULL) { 33572214Sav145390 return (1); 33582214Sav145390 } 33592214Sav145390 c += 3; 33602214Sav145390 if (strlen(c) < 3) { 33612214Sav145390 return (2); 33622214Sav145390 } 33632214Sav145390 if ((!isdigit(c[0])) || (!(isdigit(c[1]))) || 33642214Sav145390 ((c[2] != 'A') && (c[2] != 'B'))) { 33652214Sav145390 return (3); 33662214Sav145390 } 33672214Sav145390 x = c[0]; 33682214Sav145390 y = c[1]; 33692214Sav145390 z = c[2]; 33702214Sav145390 } else if ((c = strstr(unum, "MBU_")) != NULL) { 33712214Sav145390 /* FF1/FF2 Model */ 33722214Sav145390 c += 4; 33732214Sav145390 if ((c[0] != 'A') && (c[0] != 'B')) { 33742214Sav145390 return (4); 33752214Sav145390 } 33762214Sav145390 if ((c = strstr(c, "MEMB")) == NULL) { 33772214Sav145390 return (5); 33782214Sav145390 } 33792214Sav145390 c += 4; 33802214Sav145390 33812214Sav145390 x = c[0]; 33822214Sav145390 *board = ((uint8_t)stoi(&c)) / 4; 33832214Sav145390 if ((c = strstr(c, "MEM")) == NULL) { 33842214Sav145390 return (6); 33852214Sav145390 } 33862214Sav145390 c += 3; 33872214Sav145390 if (strlen(c) < 2) { 33882214Sav145390 return (7); 33892214Sav145390 } 33902214Sav145390 if ((!isdigit(c[0])) || ((c[1] != 'A') && (c[1] != 'B'))) { 33912214Sav145390 return (8); 33922214Sav145390 } 33932214Sav145390 y = c[0]; 33942214Sav145390 z = c[1]; 33952214Sav145390 } else { 33962214Sav145390 return (9); 33972214Sav145390 } 33982214Sav145390 if (*board < 0) { 33992214Sav145390 return (10); 34002214Sav145390 } 34012214Sav145390 dname[0] = x; 34022214Sav145390 dname[1] = y; 34032214Sav145390 dname[2] = z; 34042214Sav145390 dname[3] = '\0'; 34052214Sav145390 return (0); 34062214Sav145390 } 34072214Sav145390 34082214Sav145390 /* 34092214Sav145390 * mc_get_mem_sid_dimm -- Get the serial-ID for a given board and 34102214Sav145390 * the DIMM name. 34112214Sav145390 */ 34122214Sav145390 int 34132214Sav145390 mc_get_mem_sid_dimm(mc_opl_t *mcp, char *dname, char *buf, 34142214Sav145390 int buflen, int *lenp) 34152214Sav145390 { 34162214Sav145390 int ret = ENODEV; 34172214Sav145390 mc_dimm_info_t *d = NULL; 34182214Sav145390 34192214Sav145390 if ((d = mcp->mc_dimm_list) == NULL) 34202214Sav145390 return (ENOTSUP); 34212214Sav145390 34222214Sav145390 for (; d != NULL; d = d->md_next) { 34232214Sav145390 if (strcmp(d->md_dimmname, dname) == 0) { 34242214Sav145390 break; 34252214Sav145390 } 34262214Sav145390 } 34272214Sav145390 if (d != NULL) { 34282214Sav145390 *lenp = strlen(d->md_serial) + strlen(d->md_partnum); 34292214Sav145390 if (buflen <= *lenp) { 34302214Sav145390 cmn_err(CE_WARN, "mc_get_mem_sid_dimm: " 34312214Sav145390 "buflen is smaller than %d\n", *lenp); 34322214Sav145390 ret = ENOSPC; 34332214Sav145390 } else { 34342214Sav145390 snprintf(buf, buflen, "%s:%s", 34352214Sav145390 d->md_serial, d->md_partnum); 34362214Sav145390 ret = 0; 34372214Sav145390 } 34382214Sav145390 } 34392214Sav145390 MC_LOG("mc_get_mem_sid_dimm: Ret=%d Name=%s Serial-ID=%s\n", 34402214Sav145390 ret, dname, (ret == 0) ? buf : ""); 34412214Sav145390 return (ret); 34422214Sav145390 } 34432214Sav145390 34442214Sav145390 int 34453045Sav145390 mc_set_mem_sid(mc_opl_t *mcp, char *buf, int buflen, int sb, 34462214Sav145390 int bank, uint32_t mf_type, uint32_t d_slot) 34472214Sav145390 { 34482214Sav145390 int lenp = buflen; 34492214Sav145390 int id; 34502214Sav145390 int ret; 34512214Sav145390 char *dimmnm; 34522214Sav145390 34535275Stsien if (mf_type == FLT_TYPE_INTERMITTENT_CE || 34545275Stsien mf_type == FLT_TYPE_PERMANENT_CE) { 34552214Sav145390 if (plat_model == MODEL_DC) { 34562214Sav145390 id = BD_BK_SLOT_TO_INDEX(0, bank, d_slot); 34573045Sav145390 dimmnm = mc_dc_dimm_unum_table[id]; 34582214Sav145390 } else { 34592214Sav145390 id = BD_BK_SLOT_TO_INDEX(sb, bank, d_slot); 34603045Sav145390 dimmnm = mc_ff_dimm_unum_table[id]; 34612214Sav145390 } 34622214Sav145390 if ((ret = mc_get_mem_sid_dimm(mcp, dimmnm, buf, buflen, 34632214Sav145390 &lenp)) != 0) { 34642214Sav145390 return (ret); 34652214Sav145390 } 34662214Sav145390 } else { 34672214Sav145390 return (1); 34682214Sav145390 } 34692214Sav145390 34702214Sav145390 return (0); 34712214Sav145390 } 34722214Sav145390 34732214Sav145390 /* 34742214Sav145390 * mc_get_mem_sid -- get the DIMM serial-ID corresponding to the unum. 34752214Sav145390 */ 34762214Sav145390 int 34772214Sav145390 mc_get_mem_sid(char *unum, char *buf, int buflen, int *lenp) 34782214Sav145390 { 34792214Sav145390 int i; 34802214Sav145390 int ret = ENODEV; 34812214Sav145390 int board; 34822214Sav145390 char dname[MCOPL_MAX_DIMMNAME + 1]; 34832214Sav145390 mc_opl_t *mcp; 34842214Sav145390 34852214Sav145390 MC_LOG("mc_get_mem_sid: unum=%s buflen=%d\n", unum, buflen); 34862214Sav145390 if ((ret = parse_unum_memory(unum, &board, dname)) != 0) { 34872214Sav145390 MC_LOG("mc_get_mem_sid: unum(%s) parsing failed ret=%d\n", 34882214Sav145390 unum, ret); 34892214Sav145390 return (EINVAL); 34902214Sav145390 } 34912214Sav145390 34922214Sav145390 if (board < 0) { 34932214Sav145390 MC_LOG("mc_get_mem_sid: Invalid board=%d dimm=%s\n", 34942214Sav145390 board, dname); 34952214Sav145390 return (EINVAL); 34962214Sav145390 } 34972214Sav145390 34982214Sav145390 mutex_enter(&mcmutex); 34993152Sav145390 /* 35003152Sav145390 * return ENOENT if we can not find the matching board. 35013152Sav145390 */ 35023152Sav145390 ret = ENOENT; 35032214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 35042214Sav145390 if ((mcp = mc_instances[i]) == NULL) 35052214Sav145390 continue; 35062214Sav145390 mutex_enter(&mcp->mc_lock); 35073045Sav145390 if (mcp->mc_phys_board_num != board) { 35083045Sav145390 mutex_exit(&mcp->mc_lock); 35093045Sav145390 continue; 35103045Sav145390 } 35113045Sav145390 ret = mc_get_mem_sid_dimm(mcp, dname, buf, buflen, lenp); 35123045Sav145390 if (ret == 0) { 35132214Sav145390 mutex_exit(&mcp->mc_lock); 35142214Sav145390 break; 35152214Sav145390 } 35162214Sav145390 mutex_exit(&mcp->mc_lock); 35172214Sav145390 } 35182214Sav145390 mutex_exit(&mcmutex); 35192214Sav145390 return (ret); 35202214Sav145390 } 35212214Sav145390 35222214Sav145390 /* 35232214Sav145390 * mc_get_mem_offset -- get the offset in a DIMM for a given physical address. 35242214Sav145390 */ 35252214Sav145390 int 35262214Sav145390 mc_get_mem_offset(uint64_t paddr, uint64_t *offp) 35272214Sav145390 { 35282214Sav145390 int i; 35292214Sav145390 int ret = ENODEV; 35302214Sav145390 mc_addr_t maddr; 35312214Sav145390 mc_opl_t *mcp; 35322214Sav145390 35332214Sav145390 mutex_enter(&mcmutex); 35342501Sraghuram for (i = 0; ((i < OPL_MAX_BOARDS) && (ret != 0)); i++) { 35352214Sav145390 if ((mcp = mc_instances[i]) == NULL) 35362214Sav145390 continue; 35372214Sav145390 mutex_enter(&mcp->mc_lock); 35382214Sav145390 if (!pa_is_valid(mcp, paddr)) { 35392214Sav145390 mutex_exit(&mcp->mc_lock); 35402214Sav145390 continue; 35412214Sav145390 } 35422214Sav145390 if (pa_to_maddr(mcp, paddr, &maddr) == 0) { 35432214Sav145390 *offp = maddr.ma_dimm_addr; 35442214Sav145390 ret = 0; 35452214Sav145390 } 35462214Sav145390 mutex_exit(&mcp->mc_lock); 35472214Sav145390 } 35482214Sav145390 mutex_exit(&mcmutex); 35492214Sav145390 MC_LOG("mc_get_mem_offset: Ret=%d paddr=0x%lx offset=0x%lx\n", 35502214Sav145390 ret, paddr, *offp); 35512214Sav145390 return (ret); 35522214Sav145390 } 35532214Sav145390 35542214Sav145390 /* 35552214Sav145390 * dname_to_bankslot - Get the bank and slot number from the DIMM name. 35562214Sav145390 */ 35572214Sav145390 int 35582214Sav145390 dname_to_bankslot(char *dname, int *bank, int *slot) 35592214Sav145390 { 35602214Sav145390 int i; 35612214Sav145390 int tsz; 35622214Sav145390 char **tbl; 35632214Sav145390 35642214Sav145390 if (plat_model == MODEL_DC) { /* DC */ 35652214Sav145390 tbl = mc_dc_dimm_unum_table; 35662214Sav145390 tsz = OPL_MAX_DIMMS; 35672214Sav145390 } else { 35682214Sav145390 tbl = mc_ff_dimm_unum_table; 35692214Sav145390 tsz = 2 * OPL_MAX_DIMMS; 35702214Sav145390 } 35712214Sav145390 35722214Sav145390 for (i = 0; i < tsz; i++) { 35732214Sav145390 if (strcmp(dname, tbl[i]) == 0) { 35742214Sav145390 break; 35752214Sav145390 } 35762214Sav145390 } 35772214Sav145390 if (i == tsz) { 35782214Sav145390 return (1); 35792214Sav145390 } 35802214Sav145390 *bank = INDEX_TO_BANK(i); 35812214Sav145390 *slot = INDEX_TO_SLOT(i); 35822214Sav145390 return (0); 35832214Sav145390 } 35842214Sav145390 35852214Sav145390 /* 35862214Sav145390 * mc_get_mem_addr -- get the physical address of a DIMM corresponding 35872214Sav145390 * to the unum and sid. 35882214Sav145390 */ 35892214Sav145390 int 35902214Sav145390 mc_get_mem_addr(char *unum, char *sid, uint64_t offset, uint64_t *paddr) 35912214Sav145390 { 35922214Sav145390 int board; 35932214Sav145390 int bank; 35942214Sav145390 int slot; 35952214Sav145390 int i; 35962214Sav145390 int ret = ENODEV; 35972214Sav145390 char dname[MCOPL_MAX_DIMMNAME + 1]; 35982214Sav145390 mc_addr_t maddr; 35992214Sav145390 mc_opl_t *mcp; 36002214Sav145390 36012214Sav145390 MC_LOG("mc_get_mem_addr: unum=%s sid=%s offset=0x%lx\n", 36022214Sav145390 unum, sid, offset); 36032214Sav145390 if (parse_unum_memory(unum, &board, dname) != 0) { 36042214Sav145390 MC_LOG("mc_get_mem_sid: unum(%s) parsing failed ret=%d\n", 36052214Sav145390 unum, ret); 36062214Sav145390 return (EINVAL); 36072214Sav145390 } 36082214Sav145390 36092214Sav145390 if (board < 0) { 36102214Sav145390 MC_LOG("mc_get_mem_addr: Invalid board=%d dimm=%s\n", 36112214Sav145390 board, dname); 36122214Sav145390 return (EINVAL); 36132214Sav145390 } 36142214Sav145390 36152214Sav145390 mutex_enter(&mcmutex); 36162214Sav145390 for (i = 0; i < OPL_MAX_BOARDS; i++) { 36172214Sav145390 if ((mcp = mc_instances[i]) == NULL) 36182214Sav145390 continue; 36192214Sav145390 mutex_enter(&mcp->mc_lock); 36203045Sav145390 if (mcp->mc_phys_board_num != board) { 36212214Sav145390 mutex_exit(&mcp->mc_lock); 36222214Sav145390 continue; 36232214Sav145390 } 36242214Sav145390 36252214Sav145390 ret = dname_to_bankslot(dname, &bank, &slot); 36262214Sav145390 MC_LOG("mc_get_mem_addr: bank=%d slot=%d\n", bank, slot); 36272214Sav145390 if (ret != 0) { 36282214Sav145390 MC_LOG("mc_get_mem_addr: dname_to_bankslot failed\n"); 36292214Sav145390 ret = ENODEV; 36302214Sav145390 } else { 36313045Sav145390 maddr.ma_bd = mcp->mc_board_num; 36322214Sav145390 maddr.ma_bank = bank; 36332214Sav145390 maddr.ma_dimm_addr = offset; 36342214Sav145390 ret = mcaddr_to_pa(mcp, &maddr, paddr); 36352214Sav145390 if (ret != 0) { 36362214Sav145390 MC_LOG("mc_get_mem_addr: " 36372214Sav145390 "mcaddr_to_pa failed\n"); 36382214Sav145390 ret = ENODEV; 36392214Sav145390 } 36403045Sav145390 mutex_exit(&mcp->mc_lock); 36413045Sav145390 break; 36422214Sav145390 } 36432214Sav145390 mutex_exit(&mcp->mc_lock); 36442214Sav145390 } 36452214Sav145390 mutex_exit(&mcmutex); 36462214Sav145390 MC_LOG("mc_get_mem_addr: Ret=%d, Paddr=0x%lx\n", ret, *paddr); 36472214Sav145390 return (ret); 36482214Sav145390 } 36492214Sav145390 36502214Sav145390 static void 36512214Sav145390 mc_free_dimm_list(mc_dimm_info_t *d) 36522214Sav145390 { 36532214Sav145390 mc_dimm_info_t *next; 36542214Sav145390 36552214Sav145390 while (d != NULL) { 36562214Sav145390 next = d->md_next; 36572214Sav145390 kmem_free(d, sizeof (mc_dimm_info_t)); 36582214Sav145390 d = next; 36592214Sav145390 } 36602214Sav145390 } 36612214Sav145390 36622214Sav145390 /* 36632214Sav145390 * mc_get_dimm_list -- get the list of dimms with serial-id info 36642214Sav145390 * from the SP. 36652214Sav145390 */ 36662214Sav145390 mc_dimm_info_t * 36672214Sav145390 mc_get_dimm_list(mc_opl_t *mcp) 36682214Sav145390 { 36692214Sav145390 uint32_t bufsz; 36702214Sav145390 uint32_t maxbufsz; 36712214Sav145390 int ret; 36722214Sav145390 int sexp; 36732214Sav145390 board_dimm_info_t *bd_dimmp; 36742214Sav145390 mc_dimm_info_t *dimm_list = NULL; 36752214Sav145390 36762214Sav145390 maxbufsz = bufsz = sizeof (board_dimm_info_t) + 36772214Sav145390 ((MCOPL_MAX_DIMMNAME + MCOPL_MAX_SERIAL + 36782214Sav145390 MCOPL_MAX_PARTNUM) * OPL_MAX_DIMMS); 36792214Sav145390 36802214Sav145390 bd_dimmp = (board_dimm_info_t *)kmem_alloc(bufsz, KM_SLEEP); 36812214Sav145390 ret = scf_get_dimminfo(mcp->mc_board_num, (void *)bd_dimmp, &bufsz); 36822214Sav145390 36832214Sav145390 MC_LOG("mc_get_dimm_list: scf_service_getinfo returned=%d\n", ret); 36842214Sav145390 if (ret == 0) { 36852214Sav145390 sexp = sizeof (board_dimm_info_t) + 36862214Sav145390 ((bd_dimmp->bd_dnamesz + bd_dimmp->bd_serialsz + 36872214Sav145390 bd_dimmp->bd_partnumsz) * bd_dimmp->bd_numdimms); 36882214Sav145390 36892214Sav145390 if ((bd_dimmp->bd_version == OPL_DIMM_INFO_VERSION) && 36902214Sav145390 (bd_dimmp->bd_dnamesz <= MCOPL_MAX_DIMMNAME) && 36912214Sav145390 (bd_dimmp->bd_serialsz <= MCOPL_MAX_SERIAL) && 36922214Sav145390 (bd_dimmp->bd_partnumsz <= MCOPL_MAX_PARTNUM) && 36932214Sav145390 (sexp <= bufsz)) { 36942214Sav145390 36952214Sav145390 #ifdef DEBUG 36962214Sav145390 if (oplmc_debug) 36972214Sav145390 mc_dump_dimm_info(bd_dimmp); 36982214Sav145390 #endif 36992214Sav145390 dimm_list = mc_prepare_dimmlist(bd_dimmp); 37002214Sav145390 37012214Sav145390 } else { 37022214Sav145390 cmn_err(CE_WARN, "DIMM info version mismatch\n"); 37032214Sav145390 } 37042214Sav145390 } 37052214Sav145390 kmem_free(bd_dimmp, maxbufsz); 37062214Sav145390 MC_LOG("mc_get_dimm_list: dimmlist=0x%p\n", dimm_list); 37072214Sav145390 return (dimm_list); 37082214Sav145390 } 37092214Sav145390 37102214Sav145390 /* 37113152Sav145390 * mc_prepare_dimmlist - Prepare the dimm list from the information 37123152Sav145390 * received from the SP. 37132214Sav145390 */ 37142214Sav145390 mc_dimm_info_t * 37152214Sav145390 mc_prepare_dimmlist(board_dimm_info_t *bd_dimmp) 37162214Sav145390 { 37172214Sav145390 char *dimm_name; 37182214Sav145390 char *serial; 37192214Sav145390 char *part; 37202214Sav145390 int dimm; 37212214Sav145390 int dnamesz = bd_dimmp->bd_dnamesz; 37222214Sav145390 int sersz = bd_dimmp->bd_serialsz; 37232214Sav145390 int partsz = bd_dimmp->bd_partnumsz; 37242214Sav145390 mc_dimm_info_t *dimm_list = NULL; 37252214Sav145390 mc_dimm_info_t *d; 37262214Sav145390 37272214Sav145390 dimm_name = (char *)(bd_dimmp + 1); 37282214Sav145390 for (dimm = 0; dimm < bd_dimmp->bd_numdimms; dimm++) { 37292214Sav145390 37302214Sav145390 d = (mc_dimm_info_t *)kmem_alloc(sizeof (mc_dimm_info_t), 37312214Sav145390 KM_SLEEP); 37323373Sbm42561 37333373Sbm42561 bcopy(dimm_name, d->md_dimmname, dnamesz); 37343373Sbm42561 d->md_dimmname[dnamesz] = 0; 37353373Sbm42561 37362214Sav145390 serial = dimm_name + dnamesz; 37373373Sbm42561 bcopy(serial, d->md_serial, sersz); 37383373Sbm42561 d->md_serial[sersz] = 0; 37393373Sbm42561 37402214Sav145390 part = serial + sersz; 37413373Sbm42561 bcopy(part, d->md_partnum, partsz); 37423373Sbm42561 d->md_partnum[partsz] = 0; 37432214Sav145390 37442214Sav145390 d->md_next = dimm_list; 37452214Sav145390 dimm_list = d; 37462214Sav145390 dimm_name = part + partsz; 37472214Sav145390 } 37482214Sav145390 return (dimm_list); 37492214Sav145390 } 37502214Sav145390 37512214Sav145390 #ifdef DEBUG 37522214Sav145390 void 37532214Sav145390 mc_dump_dimm(char *buf, int dnamesz, int serialsz, int partnumsz) 37542214Sav145390 { 37552214Sav145390 char dname[MCOPL_MAX_DIMMNAME + 1]; 37562214Sav145390 char serial[MCOPL_MAX_SERIAL + 1]; 37572214Sav145390 char part[ MCOPL_MAX_PARTNUM + 1]; 37582214Sav145390 char *b; 37592214Sav145390 37602214Sav145390 b = buf; 37613373Sbm42561 bcopy(b, dname, dnamesz); 37623373Sbm42561 dname[dnamesz] = 0; 37633373Sbm42561 37642214Sav145390 b += dnamesz; 37653373Sbm42561 bcopy(b, serial, serialsz); 37663373Sbm42561 serial[serialsz] = 0; 37673373Sbm42561 37682214Sav145390 b += serialsz; 37693373Sbm42561 bcopy(b, part, partnumsz); 37703373Sbm42561 part[partnumsz] = 0; 37713373Sbm42561 37722214Sav145390 printf("DIMM=%s Serial=%s PartNum=%s\n", dname, serial, part); 37732214Sav145390 } 37742214Sav145390 37752214Sav145390 void 37762214Sav145390 mc_dump_dimm_info(board_dimm_info_t *bd_dimmp) 37772214Sav145390 { 37782214Sav145390 int dimm; 37792214Sav145390 int dnamesz = bd_dimmp->bd_dnamesz; 37802214Sav145390 int sersz = bd_dimmp->bd_serialsz; 37812214Sav145390 int partsz = bd_dimmp->bd_partnumsz; 37822214Sav145390 char *buf; 37832214Sav145390 37842214Sav145390 printf("Version=%d Board=%02d DIMMs=%d NameSize=%d " 37852214Sav145390 "SerialSize=%d PartnumSize=%d\n", bd_dimmp->bd_version, 37862214Sav145390 bd_dimmp->bd_boardnum, bd_dimmp->bd_numdimms, bd_dimmp->bd_dnamesz, 37872214Sav145390 bd_dimmp->bd_serialsz, bd_dimmp->bd_partnumsz); 37882214Sav145390 printf("======================================================\n"); 37892214Sav145390 37902214Sav145390 buf = (char *)(bd_dimmp + 1); 37912214Sav145390 for (dimm = 0; dimm < bd_dimmp->bd_numdimms; dimm++) { 37922214Sav145390 mc_dump_dimm(buf, dnamesz, sersz, partsz); 37932214Sav145390 buf += dnamesz + sersz + partsz; 37942214Sav145390 } 37952214Sav145390 printf("======================================================\n"); 37962214Sav145390 } 37972214Sav145390 37982214Sav145390 37992214Sav145390 /* ARGSUSED */ 38002214Sav145390 static int 38012214Sav145390 mc_ioctl_debug(dev_t dev, int cmd, intptr_t arg, int mode, cred_t *credp, 38022214Sav145390 int *rvalp) 38032214Sav145390 { 38042214Sav145390 caddr_t buf; 38052214Sav145390 uint64_t pa; 38062214Sav145390 int rv = 0; 38072214Sav145390 int i; 38082214Sav145390 uint32_t flags; 38092214Sav145390 static uint32_t offset = 0; 38102214Sav145390 38112214Sav145390 38122214Sav145390 flags = (cmd >> 4) & 0xfffffff; 38132214Sav145390 38142214Sav145390 cmd &= 0xf; 38152214Sav145390 38162214Sav145390 MC_LOG("mc_ioctl(cmd = %x, flags = %x)\n", cmd, flags); 38172214Sav145390 38182214Sav145390 if (arg != NULL) { 38192214Sav145390 if (ddi_copyin((const void *)arg, (void *)&pa, 38205080Swh31274 sizeof (uint64_t), 0) < 0) { 38212214Sav145390 rv = EFAULT; 38222214Sav145390 return (rv); 38232214Sav145390 } 38242214Sav145390 buf = NULL; 38252214Sav145390 } else { 38262214Sav145390 buf = (caddr_t)kmem_alloc(PAGESIZE, KM_SLEEP); 38272214Sav145390 38282214Sav145390 pa = va_to_pa(buf); 38292214Sav145390 pa += offset; 38302214Sav145390 38312214Sav145390 offset += 64; 38322214Sav145390 if (offset >= PAGESIZE) 38332214Sav145390 offset = 0; 38342214Sav145390 } 38352214Sav145390 38362214Sav145390 switch (cmd) { 38372214Sav145390 case MCI_CE: 38385080Swh31274 mc_inject_error(MC_INJECT_INTERMITTENT_CE, pa, flags); 38392214Sav145390 break; 38402214Sav145390 case MCI_PERM_CE: 38415080Swh31274 mc_inject_error(MC_INJECT_PERMANENT_CE, pa, flags); 38422214Sav145390 break; 38432214Sav145390 case MCI_UE: 38445080Swh31274 mc_inject_error(MC_INJECT_UE, pa, flags); 38452214Sav145390 break; 38462214Sav145390 case MCI_M_CE: 38475080Swh31274 mc_inject_error(MC_INJECT_INTERMITTENT_MCE, pa, flags); 38482214Sav145390 break; 38492214Sav145390 case MCI_M_PCE: 38505080Swh31274 mc_inject_error(MC_INJECT_PERMANENT_MCE, pa, flags); 38512214Sav145390 break; 38522214Sav145390 case MCI_M_UE: 38535080Swh31274 mc_inject_error(MC_INJECT_MUE, pa, flags); 38542214Sav145390 break; 38552214Sav145390 case MCI_CMP: 38565080Swh31274 mc_inject_error(MC_INJECT_CMPE, pa, flags); 38572214Sav145390 break; 38582214Sav145390 case MCI_NOP: 38595080Swh31274 mc_inject_error(MC_INJECT_NOP, pa, flags); break; 38602214Sav145390 case MCI_SHOW_ALL: 38612214Sav145390 mc_debug_show_all = 1; 38622214Sav145390 break; 38632214Sav145390 case MCI_SHOW_NONE: 38642214Sav145390 mc_debug_show_all = 0; 38652214Sav145390 break; 38662214Sav145390 case MCI_ALLOC: 38672214Sav145390 /* 38682214Sav145390 * just allocate some kernel memory and never free it 38692214Sav145390 * 512 MB seems to be the maximum size supported. 38702214Sav145390 */ 38712214Sav145390 cmn_err(CE_NOTE, "Allocating kmem %d MB\n", flags * 512); 38722214Sav145390 for (i = 0; i < flags; i++) { 38732214Sav145390 buf = kmem_alloc(512 * 1024 * 1024, KM_SLEEP); 38742214Sav145390 cmn_err(CE_NOTE, "kmem buf %llx PA %llx\n", 38755080Swh31274 (u_longlong_t)buf, (u_longlong_t)va_to_pa(buf)); 38762214Sav145390 } 38772214Sav145390 break; 38782214Sav145390 case MCI_SUSPEND: 38792214Sav145390 (void) opl_mc_suspend(); 38802214Sav145390 break; 38812214Sav145390 case MCI_RESUME: 38822214Sav145390 (void) opl_mc_resume(); 38832214Sav145390 break; 38842214Sav145390 default: 38852214Sav145390 rv = ENXIO; 38862214Sav145390 } 38872214Sav145390 return (rv); 38882214Sav145390 } 38892214Sav145390 38902214Sav145390 #endif /* DEBUG */ 3891