11772Sjl139090 /*
21772Sjl139090 * CDDL HEADER START
31772Sjl139090 *
41772Sjl139090 * The contents of this file are subject to the terms of the
51772Sjl139090 * Common Development and Distribution License (the "License").
61772Sjl139090 * You may not use this file except in compliance with the License.
71772Sjl139090 *
81772Sjl139090 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
91772Sjl139090 * or http://www.opensolaris.org/os/licensing.
101772Sjl139090 * See the License for the specific language governing permissions
111772Sjl139090 * and limitations under the License.
121772Sjl139090 *
131772Sjl139090 * When distributing Covered Code, include this CDDL HEADER in each
141772Sjl139090 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
151772Sjl139090 * If applicable, add the following below this CDDL HEADER, with the
161772Sjl139090 * fields enclosed by brackets "[]" replaced with your own identifying
171772Sjl139090 * information: Portions Copyright [yyyy] [name of copyright owner]
181772Sjl139090 *
191772Sjl139090 * CDDL HEADER END
201772Sjl139090 */
211772Sjl139090 /*
22*12931SDave.Plauger@Sun.COM * Copyright (c) 2006, 2010, Oracle and/or its affiliates. All rights reserved.
231772Sjl139090 */
241772Sjl139090
251772Sjl139090 #include <sys/cpuvar.h>
261772Sjl139090 #include <sys/systm.h>
271772Sjl139090 #include <sys/sysmacros.h>
281772Sjl139090 #include <sys/promif.h>
291772Sjl139090 #include <sys/platform_module.h>
301772Sjl139090 #include <sys/cmn_err.h>
311772Sjl139090 #include <sys/errno.h>
321772Sjl139090 #include <sys/machsystm.h>
331772Sjl139090 #include <sys/bootconf.h>
341772Sjl139090 #include <sys/nvpair.h>
351772Sjl139090 #include <sys/kobj.h>
361772Sjl139090 #include <sys/mem_cage.h>
371772Sjl139090 #include <sys/opl.h>
381772Sjl139090 #include <sys/scfd/scfostoescf.h>
391772Sjl139090 #include <sys/cpu_sgnblk_defs.h>
401772Sjl139090 #include <sys/utsname.h>
411772Sjl139090 #include <sys/ddi.h>
421772Sjl139090 #include <sys/sunndi.h>
431772Sjl139090 #include <sys/lgrp.h>
441772Sjl139090 #include <sys/memnode.h>
451772Sjl139090 #include <sys/sysmacros.h>
463914Spm145316 #include <sys/time.h>
473914Spm145316 #include <sys/cpu.h>
4810843SDave.Plauger@Sun.COM #include <sys/dumphdr.h>
491772Sjl139090 #include <vm/vm_dep.h>
501772Sjl139090
511772Sjl139090 int (*opl_get_mem_unum)(int, uint64_t, char *, int, int *);
522214Sav145390 int (*opl_get_mem_sid)(char *unum, char *buf, int buflen, int *lenp);
532214Sav145390 int (*opl_get_mem_offset)(uint64_t paddr, uint64_t *offp);
542214Sav145390 int (*opl_get_mem_addr)(char *unum, char *sid,
552214Sav145390 uint64_t offset, uint64_t *paddr);
561772Sjl139090
571772Sjl139090 /* Memory for fcode claims. 16k times # maximum possible IO units */
581772Sjl139090 #define EFCODE_SIZE (OPL_MAX_BOARDS * OPL_MAX_IO_UNITS_PER_BOARD * 0x4000)
591772Sjl139090 int efcode_size = EFCODE_SIZE;
601772Sjl139090
611772Sjl139090 #define OPL_MC_MEMBOARD_SHIFT 38 /* Boards on 256BG boundary */
621772Sjl139090
631772Sjl139090 /* Set the maximum number of boards for DR */
641772Sjl139090 int opl_boards = OPL_MAX_BOARDS;
651772Sjl139090
661772Sjl139090 void sgn_update_all_cpus(ushort_t, uchar_t, uchar_t);
671772Sjl139090
681772Sjl139090 extern int tsb_lgrp_affinity;
691772Sjl139090
701772Sjl139090 int opl_tsb_spares = (OPL_MAX_BOARDS) * (OPL_MAX_PCICH_UNITS_PER_BOARD) *
711772Sjl139090 (OPL_MAX_TSBS_PER_PCICH);
721772Sjl139090
731772Sjl139090 pgcnt_t opl_startup_cage_size = 0;
741772Sjl139090
755347Sjfrank /*
765347Sjfrank * The length of the delay in seconds in communication with XSCF after
775347Sjfrank * which the warning message will be logged.
785347Sjfrank */
795347Sjfrank uint_t xscf_connect_delay = 60 * 15;
805347Sjfrank
812241Shuah static opl_model_info_t opl_models[] = {
823123Ssubhan { "FF1", OPL_MAX_BOARDS_FF1, FF1, STD_DISPATCH_TABLE },
833123Ssubhan { "FF2", OPL_MAX_BOARDS_FF2, FF2, STD_DISPATCH_TABLE },
843123Ssubhan { "DC1", OPL_MAX_BOARDS_DC1, DC1, STD_DISPATCH_TABLE },
853123Ssubhan { "DC2", OPL_MAX_BOARDS_DC2, DC2, EXT_DISPATCH_TABLE },
863123Ssubhan { "DC3", OPL_MAX_BOARDS_DC3, DC3, EXT_DISPATCH_TABLE },
876297Sjl139090 { "IKKAKU", OPL_MAX_BOARDS_IKKAKU, IKKAKU, STD_DISPATCH_TABLE },
882241Shuah };
892241Shuah static int opl_num_models = sizeof (opl_models)/sizeof (opl_model_info_t);
902241Shuah
913123Ssubhan /*
923627Ssubhan * opl_cur_model
933123Ssubhan */
943627Ssubhan static opl_model_info_t *opl_cur_model = NULL;
952241Shuah
961772Sjl139090 static struct memlist *opl_memlist_per_board(struct memlist *ml);
975347Sjfrank static void post_xscf_msg(char *, int);
985347Sjfrank static void pass2xscf_thread();
991772Sjl139090
1003914Spm145316 /*
1013914Spm145316 * Note FF/DC out-of-order instruction engine takes only a
1023914Spm145316 * single cycle to execute each spin loop
1033914Spm145316 * for comparison, Panther takes 6 cycles for same loop
1045834Spt157919 * OPL_BOFF_SPIN = base spin loop, roughly one memory reference time
1055834Spt157919 * OPL_BOFF_TM = approx nsec for OPL sleep instruction (1600 for OPL-C)
1065834Spt157919 * OPL_BOFF_SLEEP = approx number of SPIN iterations to equal one sleep
1075834Spt157919 * OPL_BOFF_MAX_SCALE - scaling factor for max backoff based on active cpus
1085834Spt157919 * Listed values tuned for 2.15GHz to 2.64GHz systems
1093914Spm145316 * Value may change for future systems
1103914Spm145316 */
1115834Spt157919 #define OPL_BOFF_SPIN 7
1125834Spt157919 #define OPL_BOFF_SLEEP 4
1135834Spt157919 #define OPL_BOFF_TM 1600
1145834Spt157919 #define OPL_BOFF_MAX_SCALE 8
1153914Spm145316
1165788Smv143129 #define OPL_CLOCK_TICK_THRESHOLD 128
1175788Smv143129 #define OPL_CLOCK_TICK_NCPUS 64
1185788Smv143129
1195788Smv143129 extern int clock_tick_threshold;
1205788Smv143129 extern int clock_tick_ncpus;
1215788Smv143129
1221772Sjl139090 int
set_platform_max_ncpus(void)1231772Sjl139090 set_platform_max_ncpus(void)
1241772Sjl139090 {
1251772Sjl139090 return (OPL_MAX_CPU_PER_BOARD * OPL_MAX_BOARDS);
1261772Sjl139090 }
1271772Sjl139090
1281772Sjl139090 int
set_platform_tsb_spares(void)1291772Sjl139090 set_platform_tsb_spares(void)
1301772Sjl139090 {
1311772Sjl139090 return (MIN(opl_tsb_spares, MAX_UPA));
1321772Sjl139090 }
1331772Sjl139090
1342241Shuah static void
set_model_info()1352241Shuah set_model_info()
1362241Shuah {
1373123Ssubhan extern int ts_dispatch_extended;
1382241Shuah char name[MAXSYSNAME];
1392241Shuah int i;
1402241Shuah
1412241Shuah /*
1422241Shuah * Get model name from the root node.
1432241Shuah *
1442241Shuah * We are using the prom device tree since, at this point,
1452241Shuah * the Solaris device tree is not yet setup.
1462241Shuah */
1472241Shuah (void) prom_getprop(prom_rootnode(), "model", (caddr_t)name);
1482241Shuah
1492241Shuah for (i = 0; i < opl_num_models; i++) {
1502241Shuah if (strncmp(name, opl_models[i].model_name, MAXSYSNAME) == 0) {
1512241Shuah opl_cur_model = &opl_models[i];
1522241Shuah break;
1532241Shuah }
1542241Shuah }
1553123Ssubhan
1565539Swh31274 /*
1575539Swh31274 * If model not matched, it's an unknown model.
1586297Sjl139090 * Just return. It will default to standard dispatch tables.
1595539Swh31274 */
1602241Shuah if (i == opl_num_models)
1615539Swh31274 return;
1623123Ssubhan
1633123Ssubhan if ((opl_cur_model->model_cmds & EXT_DISPATCH_TABLE) &&
1645037Sjl139090 (ts_dispatch_extended == -1)) {
1653123Ssubhan /*
1663123Ssubhan * Based on a platform model, select a dispatch table.
1673123Ssubhan * Only DC2 and DC3 systems uses the alternate/extended
1683123Ssubhan * TS dispatch table.
1696297Sjl139090 * IKKAKU, FF1, FF2 and DC1 systems use standard dispatch
1706297Sjl139090 * tables.
1713123Ssubhan */
1723123Ssubhan ts_dispatch_extended = 1;
1733123Ssubhan }
1743123Ssubhan
1752241Shuah }
1762241Shuah
1772241Shuah static void
set_max_mmu_ctxdoms()1782241Shuah set_max_mmu_ctxdoms()
1792241Shuah {
1802241Shuah extern uint_t max_mmu_ctxdoms;
1812241Shuah int max_boards;
1822241Shuah
1832241Shuah /*
1842241Shuah * From the model, get the maximum number of boards
1852241Shuah * supported and set the value accordingly. If the model
1862241Shuah * could not be determined or recognized, we assume the max value.
1872241Shuah */
1882241Shuah if (opl_cur_model == NULL)
1892241Shuah max_boards = OPL_MAX_BOARDS;
1902241Shuah else
1912241Shuah max_boards = opl_cur_model->model_max_boards;
1922241Shuah
1932241Shuah /*
1942241Shuah * On OPL, cores and MMUs are one-to-one.
1952241Shuah */
1962241Shuah max_mmu_ctxdoms = OPL_MAX_CORE_UNITS_PER_BOARD * max_boards;
1972241Shuah }
1982241Shuah
1991772Sjl139090 #pragma weak mmu_init_large_pages
2001772Sjl139090
2011772Sjl139090 void
set_platform_defaults(void)2021772Sjl139090 set_platform_defaults(void)
2031772Sjl139090 {
2041772Sjl139090 extern char *tod_module_name;
2051772Sjl139090 extern void cpu_sgn_update(ushort_t, uchar_t, uchar_t, int);
2061772Sjl139090 extern void mmu_init_large_pages(size_t);
2071772Sjl139090
2081772Sjl139090 /* Set the CPU signature function pointer */
2091772Sjl139090 cpu_sgn_func = cpu_sgn_update;
2101772Sjl139090
2111772Sjl139090 /* Set appropriate tod module for OPL platform */
2121772Sjl139090 ASSERT(tod_module_name == NULL);
2131772Sjl139090 tod_module_name = "todopl";
2141772Sjl139090
2151772Sjl139090 if ((mmu_page_sizes == max_mmu_page_sizes) &&
2162659Ssusans (mmu_ism_pagesize != DEFAULT_ISM_PAGESIZE)) {
2171772Sjl139090 if (&mmu_init_large_pages)
2181772Sjl139090 mmu_init_large_pages(mmu_ism_pagesize);
2191772Sjl139090 }
2201772Sjl139090
2211772Sjl139090 tsb_lgrp_affinity = 1;
2222241Shuah
2232241Shuah set_max_mmu_ctxdoms();
22410843SDave.Plauger@Sun.COM
22510843SDave.Plauger@Sun.COM /* set OPL threshold for compressed dumps */
226*12931SDave.Plauger@Sun.COM dump_plat_mincpu_default = DUMP_PLAT_SUN4U_OPL_MINCPU;
2271772Sjl139090 }
2281772Sjl139090
2291772Sjl139090 /*
2301772Sjl139090 * Convert logical a board number to a physical one.
2311772Sjl139090 */
2321772Sjl139090
2331772Sjl139090 #define LSBPROP "board#"
2341772Sjl139090 #define PSBPROP "physical-board#"
2351772Sjl139090
2361772Sjl139090 int
opl_get_physical_board(int id)2371772Sjl139090 opl_get_physical_board(int id)
2381772Sjl139090 {
2391772Sjl139090 dev_info_t *root_dip, *dip = NULL;
2401772Sjl139090 char *dname = NULL;
2411772Sjl139090 int circ;
2421772Sjl139090
2431772Sjl139090 pnode_t pnode;
2441772Sjl139090 char pname[MAXSYSNAME] = {0};
2451772Sjl139090
2461772Sjl139090 int lsb_id; /* Logical System Board ID */
2471772Sjl139090 int psb_id; /* Physical System Board ID */
2481772Sjl139090
2491772Sjl139090
2501772Sjl139090 /*
2511772Sjl139090 * This function is called on early stage of bootup when the
2521772Sjl139090 * kernel device tree is not initialized yet, and also
2531772Sjl139090 * later on when the device tree is up. We want to try
2541772Sjl139090 * the fast track first.
2551772Sjl139090 */
2561772Sjl139090 root_dip = ddi_root_node();
2571772Sjl139090 if (root_dip) {
2581772Sjl139090 /* Get from devinfo node */
2591772Sjl139090 ndi_devi_enter(root_dip, &circ);
2601772Sjl139090 for (dip = ddi_get_child(root_dip); dip;
2611772Sjl139090 dip = ddi_get_next_sibling(dip)) {
2621772Sjl139090
2631772Sjl139090 dname = ddi_node_name(dip);
2641772Sjl139090 if (strncmp(dname, "pseudo-mc", 9) != 0)
2651772Sjl139090 continue;
2661772Sjl139090
2671772Sjl139090 if ((lsb_id = (int)ddi_getprop(DDI_DEV_T_ANY, dip,
2681772Sjl139090 DDI_PROP_DONTPASS, LSBPROP, -1)) == -1)
2691772Sjl139090 continue;
2701772Sjl139090
2711772Sjl139090 if (id == lsb_id) {
2721772Sjl139090 if ((psb_id = (int)ddi_getprop(DDI_DEV_T_ANY,
2731772Sjl139090 dip, DDI_PROP_DONTPASS, PSBPROP, -1))
2741772Sjl139090 == -1) {
2751772Sjl139090 ndi_devi_exit(root_dip, circ);
2761772Sjl139090 return (-1);
2771772Sjl139090 } else {
2781772Sjl139090 ndi_devi_exit(root_dip, circ);
2791772Sjl139090 return (psb_id);
2801772Sjl139090 }
2811772Sjl139090 }
2821772Sjl139090 }
2831772Sjl139090 ndi_devi_exit(root_dip, circ);
2841772Sjl139090 }
2851772Sjl139090
2861772Sjl139090 /*
2871772Sjl139090 * We do not have the kernel device tree, or we did not
2881772Sjl139090 * find the node for some reason (let's say the kernel
2891772Sjl139090 * device tree was modified), let's try the OBP tree.
2901772Sjl139090 */
2911772Sjl139090 pnode = prom_rootnode();
2921772Sjl139090 for (pnode = prom_childnode(pnode); pnode;
2931772Sjl139090 pnode = prom_nextnode(pnode)) {
2941772Sjl139090
2951772Sjl139090 if ((prom_getprop(pnode, "name", (caddr_t)pname) == -1) ||
2961772Sjl139090 (strncmp(pname, "pseudo-mc", 9) != 0))
2971772Sjl139090 continue;
2981772Sjl139090
2991772Sjl139090 if (prom_getprop(pnode, LSBPROP, (caddr_t)&lsb_id) == -1)
3001772Sjl139090 continue;
3011772Sjl139090
3021772Sjl139090 if (id == lsb_id) {
3031772Sjl139090 if (prom_getprop(pnode, PSBPROP,
3041772Sjl139090 (caddr_t)&psb_id) == -1) {
3051772Sjl139090 return (-1);
3061772Sjl139090 } else {
3071772Sjl139090 return (psb_id);
3081772Sjl139090 }
3091772Sjl139090 }
3101772Sjl139090 }
3111772Sjl139090
3121772Sjl139090 return (-1);
3131772Sjl139090 }
3141772Sjl139090
3151772Sjl139090 /*
3161772Sjl139090 * For OPL it's possible that memory from two or more successive boards
3171772Sjl139090 * will be contiguous across the boards, and therefore represented as a
3181772Sjl139090 * single chunk.
3191772Sjl139090 * This function splits such chunks down the board boundaries.
3201772Sjl139090 */
3211772Sjl139090 static struct memlist *
opl_memlist_per_board(struct memlist * ml)3221772Sjl139090 opl_memlist_per_board(struct memlist *ml)
3231772Sjl139090 {
3241772Sjl139090 uint64_t ssize, low, high, boundary;
3251772Sjl139090 struct memlist *head, *tail, *new;
3261772Sjl139090
3271772Sjl139090 ssize = (1ull << OPL_MC_MEMBOARD_SHIFT);
3281772Sjl139090
3291772Sjl139090 head = tail = NULL;
3301772Sjl139090
33111474SJonathan.Adams@Sun.COM for (; ml; ml = ml->ml_next) {
33211474SJonathan.Adams@Sun.COM low = (uint64_t)ml->ml_address;
33311474SJonathan.Adams@Sun.COM high = low+(uint64_t)(ml->ml_size);
3341772Sjl139090 while (low < high) {
3351772Sjl139090 boundary = roundup(low+1, ssize);
3361772Sjl139090 boundary = MIN(high, boundary);
3371772Sjl139090 new = kmem_zalloc(sizeof (struct memlist), KM_SLEEP);
33811474SJonathan.Adams@Sun.COM new->ml_address = low;
33911474SJonathan.Adams@Sun.COM new->ml_size = boundary - low;
3401772Sjl139090 if (head == NULL)
3411772Sjl139090 head = new;
3421772Sjl139090 if (tail) {
34311474SJonathan.Adams@Sun.COM tail->ml_next = new;
34411474SJonathan.Adams@Sun.COM new->ml_prev = tail;
3451772Sjl139090 }
3461772Sjl139090 tail = new;
3471772Sjl139090 low = boundary;
3481772Sjl139090 }
3491772Sjl139090 }
3501772Sjl139090 return (head);
3511772Sjl139090 }
3521772Sjl139090
3531772Sjl139090 void
set_platform_cage_params(void)3541772Sjl139090 set_platform_cage_params(void)
3551772Sjl139090 {
3561772Sjl139090 extern pgcnt_t total_pages;
3571772Sjl139090 extern struct memlist *phys_avail;
3581772Sjl139090 struct memlist *ml, *tml;
3591772Sjl139090
3601772Sjl139090 if (kernel_cage_enable) {
3611772Sjl139090 pgcnt_t preferred_cage_size;
3621772Sjl139090
3635037Sjl139090 preferred_cage_size = MAX(opl_startup_cage_size,
3645037Sjl139090 total_pages / 256);
3651772Sjl139090
3661772Sjl139090 ml = opl_memlist_per_board(phys_avail);
3671772Sjl139090
3681772Sjl139090 /*
3691772Sjl139090 * Note: we are assuming that post has load the
3701772Sjl139090 * whole show in to the high end of memory. Having
3711772Sjl139090 * taken this leap, we copy the whole of phys_avail
3721772Sjl139090 * the glist and arrange for the cage to grow
3731772Sjl139090 * downward (descending pfns).
3741772Sjl139090 */
3754266Sdp78419 kcage_range_init(ml, KCAGE_DOWN, preferred_cage_size);
3761772Sjl139090
3771772Sjl139090 /* free the memlist */
3781772Sjl139090 do {
37911474SJonathan.Adams@Sun.COM tml = ml->ml_next;
3801772Sjl139090 kmem_free(ml, sizeof (struct memlist));
3811772Sjl139090 ml = tml;
3821772Sjl139090 } while (ml != NULL);
3831772Sjl139090 }
3841772Sjl139090
3851772Sjl139090 if (kcage_on)
3861772Sjl139090 cmn_err(CE_NOTE, "!DR Kernel Cage is ENABLED");
3871772Sjl139090 else
3881772Sjl139090 cmn_err(CE_NOTE, "!DR Kernel Cage is DISABLED");
3891772Sjl139090 }
3901772Sjl139090
3911772Sjl139090 /*ARGSUSED*/
3921772Sjl139090 int
plat_cpu_poweron(struct cpu * cp)3931772Sjl139090 plat_cpu_poweron(struct cpu *cp)
3941772Sjl139090 {
3951772Sjl139090 int (*opl_cpu_poweron)(struct cpu *) = NULL;
3961772Sjl139090
3971772Sjl139090 opl_cpu_poweron =
3981772Sjl139090 (int (*)(struct cpu *))kobj_getsymvalue("drmach_cpu_poweron", 0);
3991772Sjl139090
4001772Sjl139090 if (opl_cpu_poweron == NULL)
4011772Sjl139090 return (ENOTSUP);
4021772Sjl139090 else
4031772Sjl139090 return ((opl_cpu_poweron)(cp));
4041772Sjl139090
4051772Sjl139090 }
4061772Sjl139090
4071772Sjl139090 /*ARGSUSED*/
4081772Sjl139090 int
plat_cpu_poweroff(struct cpu * cp)4091772Sjl139090 plat_cpu_poweroff(struct cpu *cp)
4101772Sjl139090 {
4111772Sjl139090 int (*opl_cpu_poweroff)(struct cpu *) = NULL;
4121772Sjl139090
4131772Sjl139090 opl_cpu_poweroff =
4141772Sjl139090 (int (*)(struct cpu *))kobj_getsymvalue("drmach_cpu_poweroff", 0);
4151772Sjl139090
4161772Sjl139090 if (opl_cpu_poweroff == NULL)
4171772Sjl139090 return (ENOTSUP);
4181772Sjl139090 else
4191772Sjl139090 return ((opl_cpu_poweroff)(cp));
4201772Sjl139090
4211772Sjl139090 }
4221772Sjl139090
4231772Sjl139090 int
plat_max_boards(void)4241772Sjl139090 plat_max_boards(void)
4251772Sjl139090 {
4267206Swh31274 /*
4277206Swh31274 * If the model cannot be determined, default to the max value.
4287206Swh31274 * Otherwise, Ikkaku model only supports 1 system board.
4297206Swh31274 */
4307206Swh31274 if ((opl_cur_model != NULL) && (opl_cur_model->model_type == IKKAKU))
4317206Swh31274 return (OPL_MAX_BOARDS_IKKAKU);
4327206Swh31274 else
4337206Swh31274 return (OPL_MAX_BOARDS);
4341772Sjl139090 }
4351772Sjl139090
4361772Sjl139090 int
plat_max_cpu_units_per_board(void)4371772Sjl139090 plat_max_cpu_units_per_board(void)
4381772Sjl139090 {
4391772Sjl139090 return (OPL_MAX_CPU_PER_BOARD);
4401772Sjl139090 }
4411772Sjl139090
4421772Sjl139090 int
plat_max_mem_units_per_board(void)4431772Sjl139090 plat_max_mem_units_per_board(void)
4441772Sjl139090 {
4451772Sjl139090 return (OPL_MAX_MEM_UNITS_PER_BOARD);
4461772Sjl139090 }
4471772Sjl139090
4481772Sjl139090 int
plat_max_io_units_per_board(void)4491772Sjl139090 plat_max_io_units_per_board(void)
4501772Sjl139090 {
4511772Sjl139090 return (OPL_MAX_IO_UNITS_PER_BOARD);
4521772Sjl139090 }
4531772Sjl139090
4541772Sjl139090 int
plat_max_cmp_units_per_board(void)4551772Sjl139090 plat_max_cmp_units_per_board(void)
4561772Sjl139090 {
4571772Sjl139090 return (OPL_MAX_CMP_UNITS_PER_BOARD);
4581772Sjl139090 }
4591772Sjl139090
4601772Sjl139090 int
plat_max_core_units_per_board(void)4611772Sjl139090 plat_max_core_units_per_board(void)
4621772Sjl139090 {
4631772Sjl139090 return (OPL_MAX_CORE_UNITS_PER_BOARD);
4641772Sjl139090 }
4651772Sjl139090
4661772Sjl139090 int
plat_pfn_to_mem_node(pfn_t pfn)4671772Sjl139090 plat_pfn_to_mem_node(pfn_t pfn)
4681772Sjl139090 {
4691772Sjl139090 return (pfn >> mem_node_pfn_shift);
4701772Sjl139090 }
4711772Sjl139090
4721772Sjl139090 /* ARGSUSED */
4731772Sjl139090 void
plat_build_mem_nodes(prom_memlist_t * list,size_t nelems)4745648Ssetje plat_build_mem_nodes(prom_memlist_t *list, size_t nelems)
4751772Sjl139090 {
4761772Sjl139090 size_t elem;
4771772Sjl139090 pfn_t basepfn;
4781772Sjl139090 pgcnt_t npgs;
4791772Sjl139090 uint64_t boundary, ssize;
4801772Sjl139090 uint64_t low, high;
4811772Sjl139090
4821772Sjl139090 /*
4831772Sjl139090 * OPL mem slices are always aligned on a 256GB boundary.
4841772Sjl139090 */
4851772Sjl139090 mem_node_pfn_shift = OPL_MC_MEMBOARD_SHIFT - MMU_PAGESHIFT;
4861772Sjl139090 mem_node_physalign = 0;
4871772Sjl139090
4881772Sjl139090 /*
4891772Sjl139090 * Boot install lists are arranged <addr, len>, <addr, len>, ...
4901772Sjl139090 */
4911772Sjl139090 ssize = (1ull << OPL_MC_MEMBOARD_SHIFT);
4925648Ssetje for (elem = 0; elem < nelems; list++, elem++) {
4935648Ssetje low = list->addr;
4945648Ssetje high = low + list->size;
4951772Sjl139090 while (low < high) {
4961772Sjl139090 boundary = roundup(low+1, ssize);
4971772Sjl139090 boundary = MIN(high, boundary);
4981772Sjl139090 basepfn = btop(low);
4991772Sjl139090 npgs = btop(boundary - low);
5001772Sjl139090 mem_node_add_slice(basepfn, basepfn + npgs - 1);
5011772Sjl139090 low = boundary;
5021772Sjl139090 }
5031772Sjl139090 }
5041772Sjl139090 }
5051772Sjl139090
5061772Sjl139090 /*
5071772Sjl139090 * Find the CPU associated with a slice at boot-time.
5081772Sjl139090 */
5091772Sjl139090 void
plat_fill_mc(pnode_t nodeid)5101772Sjl139090 plat_fill_mc(pnode_t nodeid)
5111772Sjl139090 {
5121772Sjl139090 int board;
5131772Sjl139090 int memnode;
5141772Sjl139090 struct {
5151772Sjl139090 uint64_t addr;
5161772Sjl139090 uint64_t size;
5171772Sjl139090 } mem_range;
5181772Sjl139090
5191772Sjl139090 if (prom_getprop(nodeid, "board#", (caddr_t)&board) < 0) {
5201772Sjl139090 panic("Can not find board# property in mc node %x", nodeid);
5211772Sjl139090 }
5221772Sjl139090 if (prom_getprop(nodeid, "sb-mem-ranges", (caddr_t)&mem_range) < 0) {
5231772Sjl139090 panic("Can not find sb-mem-ranges property in mc node %x",
5245037Sjl139090 nodeid);
5251772Sjl139090 }
5261772Sjl139090 memnode = mem_range.addr >> OPL_MC_MEMBOARD_SHIFT;
5271772Sjl139090 plat_assign_lgrphand_to_mem_node(board, memnode);
5281772Sjl139090 }
5291772Sjl139090
5301772Sjl139090 /*
5311772Sjl139090 * Return the platform handle for the lgroup containing the given CPU
5321772Sjl139090 *
5331772Sjl139090 * For OPL, lgroup platform handle == board #.
5341772Sjl139090 */
5351772Sjl139090
5361772Sjl139090 extern int mpo_disabled;
5371772Sjl139090 extern lgrp_handle_t lgrp_default_handle;
5381772Sjl139090
5391772Sjl139090 lgrp_handle_t
plat_lgrp_cpu_to_hand(processorid_t id)5401772Sjl139090 plat_lgrp_cpu_to_hand(processorid_t id)
5411772Sjl139090 {
5421772Sjl139090 lgrp_handle_t plathand;
5431772Sjl139090
5441772Sjl139090 /*
5451772Sjl139090 * Return the real platform handle for the CPU until
5461772Sjl139090 * such time as we know that MPO should be disabled.
5471772Sjl139090 * At that point, we set the "mpo_disabled" flag to true,
5481772Sjl139090 * and from that point on, return the default handle.
5491772Sjl139090 *
5501772Sjl139090 * By the time we know that MPO should be disabled, the
5511772Sjl139090 * first CPU will have already been added to a leaf
5521772Sjl139090 * lgroup, but that's ok. The common lgroup code will
5531772Sjl139090 * double check that the boot CPU is in the correct place,
5541772Sjl139090 * and in the case where mpo should be disabled, will move
5551772Sjl139090 * it to the root if necessary.
5561772Sjl139090 */
5571772Sjl139090 if (mpo_disabled) {
5581772Sjl139090 /* If MPO is disabled, return the default (UMA) handle */
5591772Sjl139090 plathand = lgrp_default_handle;
5601772Sjl139090 } else
5611772Sjl139090 plathand = (lgrp_handle_t)LSB_ID(id);
5621772Sjl139090 return (plathand);
5631772Sjl139090 }
5641772Sjl139090
5651772Sjl139090 /*
5661772Sjl139090 * Platform specific lgroup initialization
5671772Sjl139090 */
5681772Sjl139090 void
plat_lgrp_init(void)5691772Sjl139090 plat_lgrp_init(void)
5701772Sjl139090 {
5711772Sjl139090 extern uint32_t lgrp_expand_proc_thresh;
5721772Sjl139090 extern uint32_t lgrp_expand_proc_diff;
5736641Spm145316 const uint_t m = LGRP_LOADAVG_THREAD_MAX;
5741772Sjl139090
5751772Sjl139090 /*
5761772Sjl139090 * Set tuneables for the OPL architecture
5771772Sjl139090 *
5786641Spm145316 * lgrp_expand_proc_thresh is the threshold load on the set of
5796641Spm145316 * lgroups a process is currently using on before considering
5806641Spm145316 * adding another lgroup to the set. For Oly-C and Jupiter
5816641Spm145316 * systems, there are four sockets per lgroup. Setting
5826641Spm145316 * lgrp_expand_proc_thresh to add lgroups when the load reaches
5836641Spm145316 * four threads will spread the load when it exceeds one thread
5846641Spm145316 * per socket, optimizing memory bandwidth and L2 cache space.
5856641Spm145316 *
5866641Spm145316 * lgrp_expand_proc_diff determines how much less another lgroup
5876641Spm145316 * must be loaded before shifting the start location of a thread
5886641Spm145316 * to it.
5896641Spm145316 *
5906641Spm145316 * lgrp_loadavg_tolerance is the threshold where two lgroups are
5916641Spm145316 * considered to have different loads. It is set to be less than
5926641Spm145316 * 1% so that even a small residual load will be considered different
5936641Spm145316 * from no residual load.
5941772Sjl139090 *
5956641Spm145316 * We note loadavg values are not precise.
5966641Spm145316 * Every 1/10 of a second loadavg values are reduced by 5%.
5976641Spm145316 * This adjustment can come in the middle of the lgroup selection
5986641Spm145316 * process, and for larger parallel apps with many threads can
5996641Spm145316 * frequently occur between the start of the second thread
6006641Spm145316 * placement and the finish of the last thread placement.
6016641Spm145316 * We also must be careful to not use too small of a threshold
6026641Spm145316 * since the cumulative decay for 1 second idle time is 40%.
6036641Spm145316 * That is, the residual load from completed threads will still
6046641Spm145316 * be 60% one second after the proc goes idle or 8% after 5 seconds.
6051772Sjl139090 *
6066641Spm145316 * To allow for lag time in loadavg calculations
6076641Spm145316 * remote thresh = 3.75 * LGRP_LOADAVG_THREAD_MAX
6086641Spm145316 * local thresh = 0.75 * LGRP_LOADAVG_THREAD_MAX
6096641Spm145316 * tolerance = 0.0078 * LGRP_LOADAVG_THREAD_MAX
6106641Spm145316 *
6116641Spm145316 * The load placement algorithms consider LGRP_LOADAVG_THREAD_MAX
6126641Spm145316 * as the equivalent of a load of 1. To make the code more compact,
6136641Spm145316 * we set m = LGRP_LOADAVG_THREAD_MAX.
6141772Sjl139090 */
6156641Spm145316 lgrp_expand_proc_thresh = (m * 3) + (m >> 1) + (m >> 2);
6166641Spm145316 lgrp_expand_proc_diff = (m >> 1) + (m >> 2);
6176641Spm145316 lgrp_loadavg_tolerance = (m >> 7);
6181772Sjl139090 }
6191772Sjl139090
6201772Sjl139090 /*
6211772Sjl139090 * Platform notification of lgroup (re)configuration changes
6221772Sjl139090 */
6231772Sjl139090 /*ARGSUSED*/
6241772Sjl139090 void
plat_lgrp_config(lgrp_config_flag_t evt,uintptr_t arg)6251772Sjl139090 plat_lgrp_config(lgrp_config_flag_t evt, uintptr_t arg)
6261772Sjl139090 {
6271772Sjl139090 update_membounds_t *umb;
6281772Sjl139090 lgrp_config_mem_rename_t lmr;
6291772Sjl139090 int sbd, tbd;
6301772Sjl139090 lgrp_handle_t hand, shand, thand;
6311772Sjl139090 int mnode, snode, tnode;
6321772Sjl139090 pfn_t start, end;
6331772Sjl139090
6341772Sjl139090 if (mpo_disabled)
6351772Sjl139090 return;
6361772Sjl139090
6371772Sjl139090 switch (evt) {
6381772Sjl139090
6391772Sjl139090 case LGRP_CONFIG_MEM_ADD:
6401772Sjl139090 /*
6411772Sjl139090 * Establish the lgroup handle to memnode translation.
6421772Sjl139090 */
6431772Sjl139090 umb = (update_membounds_t *)arg;
6441772Sjl139090
6451772Sjl139090 hand = umb->u_board;
6461772Sjl139090 mnode = plat_pfn_to_mem_node(umb->u_base >> MMU_PAGESHIFT);
6471772Sjl139090 plat_assign_lgrphand_to_mem_node(hand, mnode);
6481772Sjl139090
6491772Sjl139090 break;
6501772Sjl139090
6511772Sjl139090 case LGRP_CONFIG_MEM_DEL:
6521772Sjl139090 /*
6531772Sjl139090 * Special handling for possible memory holes.
6541772Sjl139090 */
6551772Sjl139090 umb = (update_membounds_t *)arg;
6561772Sjl139090 hand = umb->u_board;
6571772Sjl139090 if ((mnode = plat_lgrphand_to_mem_node(hand)) != -1) {
6581772Sjl139090 if (mem_node_config[mnode].exists) {
6591772Sjl139090 start = mem_node_config[mnode].physbase;
6601772Sjl139090 end = mem_node_config[mnode].physmax;
66110106SJason.Beloro@Sun.COM mem_node_del_slice(start, end);
6621772Sjl139090 }
6631772Sjl139090 }
6641772Sjl139090
6651772Sjl139090 break;
6661772Sjl139090
6671772Sjl139090 case LGRP_CONFIG_MEM_RENAME:
6681772Sjl139090 /*
6691772Sjl139090 * During a DR copy-rename operation, all of the memory
6701772Sjl139090 * on one board is moved to another board -- but the
6711772Sjl139090 * addresses/pfns and memnodes don't change. This means
6721772Sjl139090 * the memory has changed locations without changing identity.
6731772Sjl139090 *
6741772Sjl139090 * Source is where we are copying from and target is where we
6751772Sjl139090 * are copying to. After source memnode is copied to target
6761772Sjl139090 * memnode, the physical addresses of the target memnode are
6771772Sjl139090 * renamed to match what the source memnode had. Then target
6781772Sjl139090 * memnode can be removed and source memnode can take its
6791772Sjl139090 * place.
6801772Sjl139090 *
6811772Sjl139090 * To do this, swap the lgroup handle to memnode mappings for
6821772Sjl139090 * the boards, so target lgroup will have source memnode and
6831772Sjl139090 * source lgroup will have empty target memnode which is where
6841772Sjl139090 * its memory will go (if any is added to it later).
6851772Sjl139090 *
6861772Sjl139090 * Then source memnode needs to be removed from its lgroup
6871772Sjl139090 * and added to the target lgroup where the memory was living
6881772Sjl139090 * but under a different name/memnode. The memory was in the
6891772Sjl139090 * target memnode and now lives in the source memnode with
6901772Sjl139090 * different physical addresses even though it is the same
6911772Sjl139090 * memory.
6921772Sjl139090 */
6931772Sjl139090 sbd = arg & 0xffff;
6941772Sjl139090 tbd = (arg & 0xffff0000) >> 16;
6951772Sjl139090 shand = sbd;
6961772Sjl139090 thand = tbd;
6971772Sjl139090 snode = plat_lgrphand_to_mem_node(shand);
6981772Sjl139090 tnode = plat_lgrphand_to_mem_node(thand);
6991772Sjl139090
7001772Sjl139090 /*
7011772Sjl139090 * Special handling for possible memory holes.
7021772Sjl139090 */
7031772Sjl139090 if (tnode != -1 && mem_node_config[tnode].exists) {
7043354Sjl139090 start = mem_node_config[tnode].physbase;
7053354Sjl139090 end = mem_node_config[tnode].physmax;
70610106SJason.Beloro@Sun.COM mem_node_del_slice(start, end);
7071772Sjl139090 }
7081772Sjl139090
7091772Sjl139090 plat_assign_lgrphand_to_mem_node(thand, snode);
7101772Sjl139090 plat_assign_lgrphand_to_mem_node(shand, tnode);
7111772Sjl139090
7121772Sjl139090 lmr.lmem_rename_from = shand;
7131772Sjl139090 lmr.lmem_rename_to = thand;
7141772Sjl139090
7151772Sjl139090 /*
7161772Sjl139090 * Remove source memnode of copy rename from its lgroup
7171772Sjl139090 * and add it to its new target lgroup
7181772Sjl139090 */
7191772Sjl139090 lgrp_config(LGRP_CONFIG_MEM_RENAME, (uintptr_t)snode,
7201772Sjl139090 (uintptr_t)&lmr);
7211772Sjl139090
7221772Sjl139090 break;
7231772Sjl139090
7241772Sjl139090 default:
7251772Sjl139090 break;
7261772Sjl139090 }
7271772Sjl139090 }
7281772Sjl139090
7291772Sjl139090 /*
7301772Sjl139090 * Return latency between "from" and "to" lgroups
7311772Sjl139090 *
7321772Sjl139090 * This latency number can only be used for relative comparison
7331772Sjl139090 * between lgroups on the running system, cannot be used across platforms,
7341772Sjl139090 * and may not reflect the actual latency. It is platform and implementation
7351772Sjl139090 * specific, so platform gets to decide its value. It would be nice if the
7361772Sjl139090 * number was at least proportional to make comparisons more meaningful though.
7371772Sjl139090 * NOTE: The numbers below are supposed to be load latencies for uncached
7381772Sjl139090 * memory divided by 10.
7391772Sjl139090 *
7401772Sjl139090 */
7411772Sjl139090 int
plat_lgrp_latency(lgrp_handle_t from,lgrp_handle_t to)7421772Sjl139090 plat_lgrp_latency(lgrp_handle_t from, lgrp_handle_t to)
7431772Sjl139090 {
7441772Sjl139090 /*
7451772Sjl139090 * Return min remote latency when there are more than two lgroups
7461772Sjl139090 * (root and child) and getting latency between two different lgroups
7471772Sjl139090 * or root is involved
7481772Sjl139090 */
7491772Sjl139090 if (lgrp_optimizations() && (from != to ||
7501772Sjl139090 from == LGRP_DEFAULT_HANDLE || to == LGRP_DEFAULT_HANDLE))
7512491Shyw return (42);
7521772Sjl139090 else
7532491Shyw return (35);
7541772Sjl139090 }
7551772Sjl139090
7561772Sjl139090 /*
7571772Sjl139090 * Return platform handle for root lgroup
7581772Sjl139090 */
7591772Sjl139090 lgrp_handle_t
plat_lgrp_root_hand(void)7601772Sjl139090 plat_lgrp_root_hand(void)
7611772Sjl139090 {
7621772Sjl139090 if (mpo_disabled)
7631772Sjl139090 return (lgrp_default_handle);
7641772Sjl139090
7651772Sjl139090 return (LGRP_DEFAULT_HANDLE);
7661772Sjl139090 }
7671772Sjl139090
7681772Sjl139090 /*ARGSUSED*/
7691772Sjl139090 void
plat_freelist_process(int mnode)7701772Sjl139090 plat_freelist_process(int mnode)
7711772Sjl139090 {
7721772Sjl139090 }
7731772Sjl139090
7741772Sjl139090 void
load_platform_drivers(void)7751772Sjl139090 load_platform_drivers(void)
7761772Sjl139090 {
7771772Sjl139090 (void) i_ddi_attach_pseudo_node("dr");
7781772Sjl139090 }
7791772Sjl139090
7801772Sjl139090 /*
7811772Sjl139090 * No platform drivers on this platform
7821772Sjl139090 */
7831772Sjl139090 char *platform_module_list[] = {
7841772Sjl139090 (char *)0
7851772Sjl139090 };
7861772Sjl139090
7871772Sjl139090 /*ARGSUSED*/
7881772Sjl139090 void
plat_tod_fault(enum tod_fault_type tod_bad)7891772Sjl139090 plat_tod_fault(enum tod_fault_type tod_bad)
7901772Sjl139090 {
7911772Sjl139090 }
7921772Sjl139090
7931772Sjl139090 /*ARGSUSED*/
7941772Sjl139090 void
cpu_sgn_update(ushort_t sgn,uchar_t state,uchar_t sub_state,int cpuid)7951772Sjl139090 cpu_sgn_update(ushort_t sgn, uchar_t state, uchar_t sub_state, int cpuid)
7961772Sjl139090 {
7971772Sjl139090 static void (*scf_panic_callback)(int);
7981772Sjl139090 static void (*scf_shutdown_callback)(int);
7991772Sjl139090
8001772Sjl139090 /*
8011772Sjl139090 * This is for notifing system panic/shutdown to SCF.
8021772Sjl139090 * In case of shutdown and panic, SCF call back
8031772Sjl139090 * function should be called.
8041772Sjl139090 * <SCF call back functions>
8051772Sjl139090 * scf_panic_callb() : panicsys()->panic_quiesce_hw()
8061772Sjl139090 * scf_shutdown_callb(): halt() or power_down() or reboot_machine()
8071772Sjl139090 * cpuid should be -1 and state should be SIGST_EXIT.
8081772Sjl139090 */
8091772Sjl139090 if (state == SIGST_EXIT && cpuid == -1) {
8101772Sjl139090
8111772Sjl139090 /*
8121772Sjl139090 * find the symbol for the SCF panic callback routine in driver
8131772Sjl139090 */
8141772Sjl139090 if (scf_panic_callback == NULL)
8151772Sjl139090 scf_panic_callback = (void (*)(int))
8165037Sjl139090 modgetsymvalue("scf_panic_callb", 0);
8171772Sjl139090 if (scf_shutdown_callback == NULL)
8181772Sjl139090 scf_shutdown_callback = (void (*)(int))
8195037Sjl139090 modgetsymvalue("scf_shutdown_callb", 0);
8201772Sjl139090
8211772Sjl139090 switch (sub_state) {
8221772Sjl139090 case SIGSUBST_PANIC:
8231772Sjl139090 if (scf_panic_callback == NULL) {
8241772Sjl139090 cmn_err(CE_NOTE, "!cpu_sgn_update: "
8251772Sjl139090 "scf_panic_callb not found\n");
8261772Sjl139090 return;
8271772Sjl139090 }
8281772Sjl139090 scf_panic_callback(SIGSUBST_PANIC);
8291772Sjl139090 break;
8301772Sjl139090
8311772Sjl139090 case SIGSUBST_HALT:
8321772Sjl139090 if (scf_shutdown_callback == NULL) {
8331772Sjl139090 cmn_err(CE_NOTE, "!cpu_sgn_update: "
8341772Sjl139090 "scf_shutdown_callb not found\n");
8351772Sjl139090 return;
8361772Sjl139090 }
8371772Sjl139090 scf_shutdown_callback(SIGSUBST_HALT);
8381772Sjl139090 break;
8391772Sjl139090
8401772Sjl139090 case SIGSUBST_ENVIRON:
8411772Sjl139090 if (scf_shutdown_callback == NULL) {
8421772Sjl139090 cmn_err(CE_NOTE, "!cpu_sgn_update: "
8431772Sjl139090 "scf_shutdown_callb not found\n");
8441772Sjl139090 return;
8451772Sjl139090 }
8461772Sjl139090 scf_shutdown_callback(SIGSUBST_ENVIRON);
8471772Sjl139090 break;
8481772Sjl139090
8491772Sjl139090 case SIGSUBST_REBOOT:
8501772Sjl139090 if (scf_shutdown_callback == NULL) {
8511772Sjl139090 cmn_err(CE_NOTE, "!cpu_sgn_update: "
8521772Sjl139090 "scf_shutdown_callb not found\n");
8531772Sjl139090 return;
8541772Sjl139090 }
8551772Sjl139090 scf_shutdown_callback(SIGSUBST_REBOOT);
8561772Sjl139090 break;
8571772Sjl139090 }
8581772Sjl139090 }
8591772Sjl139090 }
8601772Sjl139090
8611772Sjl139090 /*ARGSUSED*/
8621772Sjl139090 int
plat_get_mem_unum(int synd_code,uint64_t flt_addr,int flt_bus_id,int flt_in_memory,ushort_t flt_status,char * buf,int buflen,int * lenp)8631772Sjl139090 plat_get_mem_unum(int synd_code, uint64_t flt_addr, int flt_bus_id,
8641772Sjl139090 int flt_in_memory, ushort_t flt_status,
8651772Sjl139090 char *buf, int buflen, int *lenp)
8661772Sjl139090 {
8671772Sjl139090 /*
8681772Sjl139090 * check if it's a Memory error.
8691772Sjl139090 */
8701772Sjl139090 if (flt_in_memory) {
8711772Sjl139090 if (opl_get_mem_unum != NULL) {
8725037Sjl139090 return (opl_get_mem_unum(synd_code, flt_addr, buf,
8735037Sjl139090 buflen, lenp));
8741772Sjl139090 } else {
8751772Sjl139090 return (ENOTSUP);
8761772Sjl139090 }
8771772Sjl139090 } else {
8781772Sjl139090 return (ENOTSUP);
8791772Sjl139090 }
8801772Sjl139090 }
8811772Sjl139090
8821772Sjl139090 /*ARGSUSED*/
8831772Sjl139090 int
plat_get_cpu_unum(int cpuid,char * buf,int buflen,int * lenp)8841772Sjl139090 plat_get_cpu_unum(int cpuid, char *buf, int buflen, int *lenp)
8851772Sjl139090 {
8862214Sav145390 int ret = 0;
8875347Sjfrank int sb;
8883123Ssubhan int plen;
8891772Sjl139090
8901772Sjl139090 sb = opl_get_physical_board(LSB_ID(cpuid));
8911772Sjl139090 if (sb == -1) {
8921772Sjl139090 return (ENXIO);
8931772Sjl139090 }
8941772Sjl139090
8953627Ssubhan /*
8963627Ssubhan * opl_cur_model is assigned here
8973627Ssubhan */
8983627Ssubhan if (opl_cur_model == NULL) {
8993627Ssubhan set_model_info();
9005539Swh31274
9015539Swh31274 /*
9025539Swh31274 * if not matched, return
9035539Swh31274 */
9045539Swh31274 if (opl_cur_model == NULL)
9055539Swh31274 return (ENODEV);
9063627Ssubhan }
9073627Ssubhan
9083123Ssubhan ASSERT((opl_cur_model - opl_models) == (opl_cur_model->model_type));
9093123Ssubhan
9103123Ssubhan switch (opl_cur_model->model_type) {
9113123Ssubhan case FF1:
9122214Sav145390 plen = snprintf(buf, buflen, "/%s/CPUM%d", "MBU_A",
9132214Sav145390 CHIP_ID(cpuid) / 2);
9142214Sav145390 break;
9152214Sav145390
9163123Ssubhan case FF2:
9172214Sav145390 plen = snprintf(buf, buflen, "/%s/CPUM%d", "MBU_B",
9182808Sav145390 (CHIP_ID(cpuid) / 2) + (sb * 2));
9192214Sav145390 break;
9202214Sav145390
9213123Ssubhan case DC1:
9223123Ssubhan case DC2:
9233123Ssubhan case DC3:
9242214Sav145390 plen = snprintf(buf, buflen, "/%s%02d/CPUM%d", "CMU", sb,
9252214Sav145390 CHIP_ID(cpuid));
9262214Sav145390 break;
9272214Sav145390
9286297Sjl139090 case IKKAKU:
9296297Sjl139090 plen = snprintf(buf, buflen, "/%s", "MBU_A");
9306297Sjl139090 break;
9316297Sjl139090
9322214Sav145390 default:
9332214Sav145390 /* This should never happen */
9342214Sav145390 return (ENODEV);
9352214Sav145390 }
9362214Sav145390
9372214Sav145390 if (plen >= buflen) {
9382214Sav145390 ret = ENOSPC;
9391772Sjl139090 } else {
9401772Sjl139090 if (lenp)
9411772Sjl139090 *lenp = strlen(buf);
9421772Sjl139090 }
9432214Sav145390 return (ret);
9441772Sjl139090 }
9451772Sjl139090
9461772Sjl139090 void
plat_nodename_set(void)9471772Sjl139090 plat_nodename_set(void)
9481772Sjl139090 {
9495347Sjfrank post_xscf_msg((char *)&utsname, sizeof (struct utsname));
9501772Sjl139090 }
9511772Sjl139090
9521772Sjl139090 caddr_t efcode_vaddr = NULL;
9531772Sjl139090
9541772Sjl139090 /*
9551772Sjl139090 * Preallocate enough memory for fcode claims.
9561772Sjl139090 */
9571772Sjl139090
9581772Sjl139090 caddr_t
efcode_alloc(caddr_t alloc_base)9591772Sjl139090 efcode_alloc(caddr_t alloc_base)
9601772Sjl139090 {
9611772Sjl139090 caddr_t efcode_alloc_base = (caddr_t)roundup((uintptr_t)alloc_base,
9621772Sjl139090 MMU_PAGESIZE);
9631772Sjl139090 caddr_t vaddr;
9641772Sjl139090
9651772Sjl139090 /*
9661772Sjl139090 * allocate the physical memory for the Oberon fcode.
9671772Sjl139090 */
9681772Sjl139090 if ((vaddr = (caddr_t)BOP_ALLOC(bootops, efcode_alloc_base,
9691772Sjl139090 efcode_size, MMU_PAGESIZE)) == NULL)
9701772Sjl139090 cmn_err(CE_PANIC, "Cannot allocate Efcode Memory");
9711772Sjl139090
9721772Sjl139090 efcode_vaddr = vaddr;
9731772Sjl139090
9741772Sjl139090 return (efcode_alloc_base + efcode_size);
9751772Sjl139090 }
9761772Sjl139090
9771772Sjl139090 caddr_t
plat_startup_memlist(caddr_t alloc_base)9781772Sjl139090 plat_startup_memlist(caddr_t alloc_base)
9791772Sjl139090 {
9801772Sjl139090 caddr_t tmp_alloc_base;
9811772Sjl139090
9821772Sjl139090 tmp_alloc_base = efcode_alloc(alloc_base);
9831772Sjl139090 tmp_alloc_base =
9841772Sjl139090 (caddr_t)roundup((uintptr_t)tmp_alloc_base, ecache_alignsize);
9851772Sjl139090 return (tmp_alloc_base);
9861772Sjl139090 }
9871772Sjl139090
9885834Spt157919 /* need to forward declare these */
9895834Spt157919 static void plat_lock_delay(uint_t);
9905834Spt157919
9911772Sjl139090 void
startup_platform(void)9921772Sjl139090 startup_platform(void)
9931772Sjl139090 {
9945788Smv143129 if (clock_tick_threshold == 0)
9955788Smv143129 clock_tick_threshold = OPL_CLOCK_TICK_THRESHOLD;
9965788Smv143129 if (clock_tick_ncpus == 0)
9975788Smv143129 clock_tick_ncpus = OPL_CLOCK_TICK_NCPUS;
9985834Spt157919 mutex_lock_delay = plat_lock_delay;
9995834Spt157919 mutex_cap_factor = OPL_BOFF_MAX_SCALE;
10001772Sjl139090 }
10012214Sav145390
10025923Sjfrank static uint_t
get_mmu_id(processorid_t cpuid)10035923Sjfrank get_mmu_id(processorid_t cpuid)
10045923Sjfrank {
10055923Sjfrank int pb = opl_get_physical_board(LSB_ID(cpuid));
10065923Sjfrank
10075923Sjfrank if (pb == -1) {
10085923Sjfrank cmn_err(CE_PANIC,
10095923Sjfrank "opl_get_physical_board failed (cpu %d LSB %u)",
10105923Sjfrank cpuid, LSB_ID(cpuid));
10115923Sjfrank }
10125923Sjfrank return (pb * OPL_MAX_COREID_PER_BOARD) + (CHIP_ID(cpuid) *
10135923Sjfrank OPL_MAX_COREID_PER_CMP) + CORE_ID(cpuid);
10145923Sjfrank }
10155923Sjfrank
10162241Shuah void
plat_cpuid_to_mmu_ctx_info(processorid_t cpuid,mmu_ctx_info_t * info)10172241Shuah plat_cpuid_to_mmu_ctx_info(processorid_t cpuid, mmu_ctx_info_t *info)
10182241Shuah {
10192241Shuah int impl;
10202241Shuah
10212241Shuah impl = cpunodes[cpuid].implementation;
10225037Sjl139090 if (IS_OLYMPUS_C(impl) || IS_JUPITER(impl)) {
10235923Sjfrank info->mmu_idx = get_mmu_id(cpuid);
10242241Shuah info->mmu_nctxs = 8192;
10252241Shuah } else {
10262241Shuah cmn_err(CE_PANIC, "Unknown processor %d", impl);
10272241Shuah }
10282241Shuah }
10292241Shuah
10302214Sav145390 int
plat_get_mem_sid(char * unum,char * buf,int buflen,int * lenp)10312214Sav145390 plat_get_mem_sid(char *unum, char *buf, int buflen, int *lenp)
10322214Sav145390 {
10332214Sav145390 if (opl_get_mem_sid == NULL) {
10342214Sav145390 return (ENOTSUP);
10352214Sav145390 }
10362214Sav145390 return (opl_get_mem_sid(unum, buf, buflen, lenp));
10372214Sav145390 }
10382214Sav145390
10392214Sav145390 int
plat_get_mem_offset(uint64_t paddr,uint64_t * offp)10402214Sav145390 plat_get_mem_offset(uint64_t paddr, uint64_t *offp)
10412214Sav145390 {
10422214Sav145390 if (opl_get_mem_offset == NULL) {
10432214Sav145390 return (ENOTSUP);
10442214Sav145390 }
10452214Sav145390 return (opl_get_mem_offset(paddr, offp));
10462214Sav145390 }
10472214Sav145390
10482214Sav145390 int
plat_get_mem_addr(char * unum,char * sid,uint64_t offset,uint64_t * addrp)10492214Sav145390 plat_get_mem_addr(char *unum, char *sid, uint64_t offset, uint64_t *addrp)
10502214Sav145390 {
10512214Sav145390 if (opl_get_mem_addr == NULL) {
10522214Sav145390 return (ENOTSUP);
10532214Sav145390 }
10542214Sav145390 return (opl_get_mem_addr(unum, sid, offset, addrp));
10552214Sav145390 }
10563914Spm145316
10573914Spm145316 void
plat_lock_delay(uint_t backoff)10585834Spt157919 plat_lock_delay(uint_t backoff)
10593914Spm145316 {
10603914Spm145316 int i;
10615834Spt157919 uint_t cnt, remcnt;
10623914Spm145316 int ctr;
10635834Spt157919 hrtime_t delay_start, rem_delay;
10643914Spm145316 /*
10653914Spm145316 * Platform specific lock delay code for OPL
10663914Spm145316 *
10673914Spm145316 * Using staged linear increases in the delay.
10683914Spm145316 * The sleep instruction is the preferred method of delay,
10693914Spm145316 * but is too large of granularity for the initial backoff.
10703914Spm145316 */
10713914Spm145316
10725834Spt157919 if (backoff < 100) {
10733914Spm145316 /*
10743914Spm145316 * If desired backoff is long enough,
10753914Spm145316 * use sleep for most of it
10763914Spm145316 */
10775834Spt157919 for (cnt = backoff;
10785834Spt157919 cnt >= OPL_BOFF_SLEEP;
10795037Sjl139090 cnt -= OPL_BOFF_SLEEP) {
10803914Spm145316 cpu_smt_pause();
10813914Spm145316 }
10823914Spm145316 /*
10833914Spm145316 * spin for small remainder of backoff
10843914Spm145316 */
10853914Spm145316 for (ctr = cnt * OPL_BOFF_SPIN; ctr; ctr--) {
10865834Spt157919 mutex_delay_default();
10873914Spm145316 }
10883914Spm145316 } else {
10895834Spt157919 /* backoff is large. Fill it by sleeping */
10906592Sck142721 delay_start = gethrtime_waitfree();
10915834Spt157919 cnt = backoff / OPL_BOFF_SLEEP;
10923914Spm145316 /*
10933914Spm145316 * use sleep instructions for delay
10943914Spm145316 */
10953914Spm145316 for (i = 0; i < cnt; i++) {
10963914Spm145316 cpu_smt_pause();
10973914Spm145316 }
10983914Spm145316
10993914Spm145316 /*
11003914Spm145316 * Note: if the other strand executes a sleep instruction,
11013914Spm145316 * then the sleep ends immediately with a minimum time of
11023914Spm145316 * 42 clocks. We check gethrtime to insure we have
11033914Spm145316 * waited long enough. And we include both a short
11045834Spt157919 * spin loop and a sleep for repeated delay times.
11053914Spm145316 */
11063914Spm145316
11076592Sck142721 rem_delay = gethrtime_waitfree() - delay_start;
11085834Spt157919 while (rem_delay < cnt * OPL_BOFF_TM) {
11095834Spt157919 remcnt = cnt - (rem_delay / OPL_BOFF_TM);
11105834Spt157919 for (i = 0; i < remcnt; i++) {
11115834Spt157919 cpu_smt_pause();
11125834Spt157919 for (ctr = OPL_BOFF_SPIN; ctr; ctr--) {
11135834Spt157919 mutex_delay_default();
11145834Spt157919 }
11153914Spm145316 }
11166592Sck142721 rem_delay = gethrtime_waitfree() - delay_start;
11173914Spm145316 }
11183914Spm145316 }
11193914Spm145316 }
11205347Sjfrank
11215347Sjfrank /*
11225347Sjfrank * The following code implements asynchronous call to XSCF to setup the
11235347Sjfrank * domain node name.
11245347Sjfrank */
11255347Sjfrank
11265347Sjfrank #define FREE_MSG(m) kmem_free((m), NM_LEN((m)->len))
11275347Sjfrank
11285347Sjfrank /*
11295347Sjfrank * The following three macros define the all operations on the request
11305347Sjfrank * list we are using here, and hide the details of the list
11315347Sjfrank * implementation from the code.
11325347Sjfrank */
11335347Sjfrank #define PUSH(m) \
11345347Sjfrank { \
11355347Sjfrank (m)->next = ctl_msg.head; \
11365347Sjfrank (m)->prev = NULL; \
11375347Sjfrank if ((m)->next != NULL) \
11385347Sjfrank (m)->next->prev = (m); \
11395347Sjfrank ctl_msg.head = (m); \
11405347Sjfrank }
11415347Sjfrank
11425347Sjfrank #define REMOVE(m) \
11435347Sjfrank { \
11445347Sjfrank if ((m)->prev != NULL) \
11455347Sjfrank (m)->prev->next = (m)->next; \
11465347Sjfrank else \
11475347Sjfrank ctl_msg.head = (m)->next; \
11485347Sjfrank if ((m)->next != NULL) \
11495347Sjfrank (m)->next->prev = (m)->prev; \
11505347Sjfrank }
11515347Sjfrank
11525347Sjfrank #define FREE_THE_TAIL(head) \
11535347Sjfrank { \
11545347Sjfrank nm_msg_t *n_msg, *m; \
11555347Sjfrank m = (head)->next; \
11565347Sjfrank (head)->next = NULL; \
11575347Sjfrank while (m != NULL) { \
11585347Sjfrank n_msg = m->next; \
11595347Sjfrank FREE_MSG(m); \
11605347Sjfrank m = n_msg; \
11615347Sjfrank } \
11625347Sjfrank }
11635347Sjfrank
11645347Sjfrank #define SCF_PUTINFO(f, s, p) \
11655347Sjfrank f(KEY_ESCF, 0x01, 0, s, p)
11665347Sjfrank
11675347Sjfrank #define PASS2XSCF(m, r) ((r = SCF_PUTINFO(ctl_msg.scf_service_function, \
11685347Sjfrank (m)->len, (m)->data)) == 0)
11695347Sjfrank
11705347Sjfrank /*
11715347Sjfrank * The value of the following macro loosely depends on the
11725347Sjfrank * value of the "device busy" timeout used in the SCF driver.
11735347Sjfrank * (See pass2xscf_thread()).
11745347Sjfrank */
11755347Sjfrank #define SCF_DEVBUSY_DELAY 10
11765347Sjfrank
11775347Sjfrank /*
11785347Sjfrank * The default number of attempts to contact the scf driver
11795347Sjfrank * if we cannot fetch any information about the timeout value
11805347Sjfrank * it uses.
11815347Sjfrank */
11825347Sjfrank
11835347Sjfrank #define REPEATS 4
11845347Sjfrank
11855347Sjfrank typedef struct nm_msg {
11865347Sjfrank struct nm_msg *next;
11875347Sjfrank struct nm_msg *prev;
11885347Sjfrank int len;
11895347Sjfrank char data[1];
11905347Sjfrank } nm_msg_t;
11915347Sjfrank
11925347Sjfrank #define NM_LEN(len) (sizeof (nm_msg_t) + (len) - 1)
11935347Sjfrank
11945347Sjfrank static struct ctlmsg {
11955347Sjfrank nm_msg_t *head;
11965347Sjfrank nm_msg_t *now_serving;
11975347Sjfrank kmutex_t nm_lock;
11985347Sjfrank kthread_t *nmt;
11995347Sjfrank int cnt;
12005347Sjfrank int (*scf_service_function)(uint32_t, uint8_t,
12015347Sjfrank uint32_t, uint32_t, void *);
12025347Sjfrank } ctl_msg;
12035347Sjfrank
12045347Sjfrank static void
post_xscf_msg(char * dp,int len)12055347Sjfrank post_xscf_msg(char *dp, int len)
12065347Sjfrank {
12075347Sjfrank nm_msg_t *msg;
12085347Sjfrank
12095347Sjfrank msg = (nm_msg_t *)kmem_zalloc(NM_LEN(len), KM_SLEEP);
12105347Sjfrank
12115347Sjfrank bcopy(dp, msg->data, len);
12125347Sjfrank msg->len = len;
12135347Sjfrank
12145347Sjfrank mutex_enter(&ctl_msg.nm_lock);
12155347Sjfrank if (ctl_msg.nmt == NULL) {
12165347Sjfrank ctl_msg.nmt = thread_create(NULL, 0, pass2xscf_thread,
12175347Sjfrank NULL, 0, &p0, TS_RUN, minclsyspri);
12185347Sjfrank }
12195347Sjfrank
12205347Sjfrank PUSH(msg);
12215347Sjfrank ctl_msg.cnt++;
12225347Sjfrank mutex_exit(&ctl_msg.nm_lock);
12235347Sjfrank }
12245347Sjfrank
12255347Sjfrank static void
pass2xscf_thread()12265347Sjfrank pass2xscf_thread()
12275347Sjfrank {
12285347Sjfrank nm_msg_t *msg;
12295347Sjfrank int ret;
12305347Sjfrank uint_t i, msg_sent, xscf_driver_delay;
12315347Sjfrank static uint_t repeat_cnt;
12325347Sjfrank uint_t *scf_wait_cnt;
12335347Sjfrank
12345347Sjfrank mutex_enter(&ctl_msg.nm_lock);
12355347Sjfrank
12365347Sjfrank /*
12375347Sjfrank * Find the address of the SCF put routine if it's not done yet.
12385347Sjfrank */
12395347Sjfrank if (ctl_msg.scf_service_function == NULL) {
12405347Sjfrank if ((ctl_msg.scf_service_function =
12415347Sjfrank (int (*)(uint32_t, uint8_t, uint32_t, uint32_t, void *))
12425347Sjfrank modgetsymvalue("scf_service_putinfo", 0)) == NULL) {
12435347Sjfrank cmn_err(CE_NOTE, "pass2xscf_thread: "
12445347Sjfrank "scf_service_putinfo not found\n");
12455347Sjfrank ctl_msg.nmt = NULL;
12465347Sjfrank mutex_exit(&ctl_msg.nm_lock);
12475347Sjfrank return;
12485347Sjfrank }
12495347Sjfrank }
12505347Sjfrank
12515347Sjfrank /*
12525347Sjfrank * Calculate the number of attempts to connect XSCF based on the
12535347Sjfrank * scf driver delay (which is
12545347Sjfrank * SCF_DEVBUSY_DELAY*scf_online_wait_rcnt seconds) and the value
12555347Sjfrank * of xscf_connect_delay (the total number of seconds to wait
12565347Sjfrank * till xscf get ready.)
12575347Sjfrank */
12585347Sjfrank if (repeat_cnt == 0) {
12595347Sjfrank if ((scf_wait_cnt =
12605347Sjfrank (uint_t *)
12615347Sjfrank modgetsymvalue("scf_online_wait_rcnt", 0)) == NULL) {
12625347Sjfrank repeat_cnt = REPEATS;
12635347Sjfrank } else {
12645347Sjfrank
12655347Sjfrank xscf_driver_delay = *scf_wait_cnt *
12665347Sjfrank SCF_DEVBUSY_DELAY;
12675347Sjfrank repeat_cnt = (xscf_connect_delay/xscf_driver_delay) + 1;
12685347Sjfrank }
12695347Sjfrank }
12705347Sjfrank
12715347Sjfrank while (ctl_msg.cnt != 0) {
12725347Sjfrank
12735347Sjfrank /*
12745347Sjfrank * Take the very last request from the queue,
12755347Sjfrank */
12765347Sjfrank ctl_msg.now_serving = ctl_msg.head;
12775347Sjfrank ASSERT(ctl_msg.now_serving != NULL);
12785347Sjfrank
12795347Sjfrank /*
12805347Sjfrank * and discard all the others if any.
12815347Sjfrank */
12825347Sjfrank FREE_THE_TAIL(ctl_msg.now_serving);
12835347Sjfrank ctl_msg.cnt = 1;
12845347Sjfrank mutex_exit(&ctl_msg.nm_lock);
12855347Sjfrank
12865347Sjfrank /*
12875347Sjfrank * Pass the name to XSCF. Note please, we do not hold the
12885347Sjfrank * mutex while we are doing this.
12895347Sjfrank */
12905347Sjfrank msg_sent = 0;
12915347Sjfrank for (i = 0; i < repeat_cnt; i++) {
12925347Sjfrank if (PASS2XSCF(ctl_msg.now_serving, ret)) {
12935347Sjfrank msg_sent = 1;
12945347Sjfrank break;
12955347Sjfrank } else {
12965347Sjfrank if (ret != EBUSY) {
12975347Sjfrank cmn_err(CE_NOTE, "pass2xscf_thread:"
12985347Sjfrank " unexpected return code"
12995347Sjfrank " from scf_service_putinfo():"
13005347Sjfrank " %d\n", ret);
13015347Sjfrank }
13025347Sjfrank }
13035347Sjfrank }
13045347Sjfrank
13055347Sjfrank if (msg_sent) {
13065347Sjfrank
13075347Sjfrank /*
13085347Sjfrank * Remove the request from the list
13095347Sjfrank */
13105347Sjfrank mutex_enter(&ctl_msg.nm_lock);
13115347Sjfrank msg = ctl_msg.now_serving;
13125347Sjfrank ctl_msg.now_serving = NULL;
13135347Sjfrank REMOVE(msg);
13145347Sjfrank ctl_msg.cnt--;
13155347Sjfrank mutex_exit(&ctl_msg.nm_lock);
13165347Sjfrank FREE_MSG(msg);
13175347Sjfrank } else {
13185347Sjfrank
13195347Sjfrank /*
13205347Sjfrank * If while we have tried to communicate with
13215347Sjfrank * XSCF there were any other requests we are
13225347Sjfrank * going to drop this one and take the latest
13235347Sjfrank * one. Otherwise we will try to pass this one
13245347Sjfrank * again.
13255347Sjfrank */
13265347Sjfrank cmn_err(CE_NOTE,
13275347Sjfrank "pass2xscf_thread: "
13285347Sjfrank "scf_service_putinfo "
13295347Sjfrank "not responding\n");
13305347Sjfrank }
13315347Sjfrank mutex_enter(&ctl_msg.nm_lock);
13325347Sjfrank }
13335347Sjfrank
13345347Sjfrank /*
13355347Sjfrank * The request queue is empty, exit.
13365347Sjfrank */
13375347Sjfrank ctl_msg.nmt = NULL;
13385347Sjfrank mutex_exit(&ctl_msg.nm_lock);
13395347Sjfrank }
1340