xref: /onnv-gate/usr/src/uts/i86pc/os/fastboot.c (revision 10970:53b2abb98d0f)
17656SSherry.Moore@Sun.COM /*
27656SSherry.Moore@Sun.COM  * CDDL HEADER START
37656SSherry.Moore@Sun.COM  *
47656SSherry.Moore@Sun.COM  * The contents of this file are subject to the terms of the
57656SSherry.Moore@Sun.COM  * Common Development and Distribution License (the "License").
67656SSherry.Moore@Sun.COM  * You may not use this file except in compliance with the License.
77656SSherry.Moore@Sun.COM  *
87656SSherry.Moore@Sun.COM  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97656SSherry.Moore@Sun.COM  * or http://www.opensolaris.org/os/licensing.
107656SSherry.Moore@Sun.COM  * See the License for the specific language governing permissions
117656SSherry.Moore@Sun.COM  * and limitations under the License.
127656SSherry.Moore@Sun.COM  *
137656SSherry.Moore@Sun.COM  * When distributing Covered Code, include this CDDL HEADER in each
147656SSherry.Moore@Sun.COM  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157656SSherry.Moore@Sun.COM  * If applicable, add the following below this CDDL HEADER, with the
167656SSherry.Moore@Sun.COM  * fields enclosed by brackets "[]" replaced with your own identifying
177656SSherry.Moore@Sun.COM  * information: Portions Copyright [yyyy] [name of copyright owner]
187656SSherry.Moore@Sun.COM  *
197656SSherry.Moore@Sun.COM  * CDDL HEADER END
207656SSherry.Moore@Sun.COM  */
217656SSherry.Moore@Sun.COM 
227656SSherry.Moore@Sun.COM /*
239160SSherry.Moore@Sun.COM  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
247656SSherry.Moore@Sun.COM  * Use is subject to license terms.
257656SSherry.Moore@Sun.COM  */
267656SSherry.Moore@Sun.COM 
/*
 * This file contains the functions for performing Fast Reboot -- a
 * reboot which bypasses the firmware and bootloader, considerably
 * reducing downtime.
 *
 * fastboot_load_kernel(): This function is invoked by mdpreboot() in the
 * reboot path.  It loads the new kernel and boot archive into memory, and
 * builds the data structure containing sufficient information about the new
 * kernel and boot archive to be passed to the fast reboot switcher
 * (see fb_swtch_src.s for details).  When invoked, the switcher relocates
 * the new kernel and boot archive to physically contiguous low memory,
 * similar to where the boot loader would have loaded them, and jumps to
 * the new kernel.
 *
 * If fastreboot_onpanic is enabled, fastboot_load_kernel() is called
 * by fastreboot_post_startup() to load the backup kernel in case of
 * panic.
 *
 * The physical addresses of the memory allocated for the new kernel, boot
 * archive and their page tables must be above where the boot archive ends
 * after it has been relocated by the switcher; otherwise the new files
 * and their page tables could be overwritten during relocation.
 *
 * fast_reboot(): This function is invoked by mdboot() once it's determined
 * that the system is capable of fast reboot.  It jumps to the fast reboot
 * switcher with the data structure built by fastboot_load_kernel() as the
 * argument.
 */
557656SSherry.Moore@Sun.COM 
567656SSherry.Moore@Sun.COM #include <sys/types.h>
577656SSherry.Moore@Sun.COM #include <sys/param.h>
587656SSherry.Moore@Sun.COM #include <sys/segments.h>
597656SSherry.Moore@Sun.COM #include <sys/sysmacros.h>
607656SSherry.Moore@Sun.COM #include <sys/vm.h>
617656SSherry.Moore@Sun.COM 
627656SSherry.Moore@Sun.COM #include <sys/proc.h>
637656SSherry.Moore@Sun.COM #include <sys/buf.h>
647656SSherry.Moore@Sun.COM #include <sys/kmem.h>
657656SSherry.Moore@Sun.COM 
667656SSherry.Moore@Sun.COM #include <sys/reboot.h>
677656SSherry.Moore@Sun.COM #include <sys/uadmin.h>
687656SSherry.Moore@Sun.COM 
697656SSherry.Moore@Sun.COM #include <sys/cred.h>
707656SSherry.Moore@Sun.COM #include <sys/vnode.h>
717656SSherry.Moore@Sun.COM #include <sys/file.h>
727656SSherry.Moore@Sun.COM 
737656SSherry.Moore@Sun.COM #include <sys/cmn_err.h>
747656SSherry.Moore@Sun.COM #include <sys/dumphdr.h>
757656SSherry.Moore@Sun.COM #include <sys/bootconf.h>
767656SSherry.Moore@Sun.COM #include <sys/ddidmareq.h>
777656SSherry.Moore@Sun.COM #include <sys/varargs.h>
787656SSherry.Moore@Sun.COM #include <sys/promif.h>
797656SSherry.Moore@Sun.COM #include <sys/modctl.h>
807656SSherry.Moore@Sun.COM 
817656SSherry.Moore@Sun.COM #include <vm/hat.h>
827656SSherry.Moore@Sun.COM #include <vm/as.h>
837656SSherry.Moore@Sun.COM #include <vm/page.h>
847656SSherry.Moore@Sun.COM #include <vm/seg.h>
857656SSherry.Moore@Sun.COM #include <vm/hat_i86.h>
867656SSherry.Moore@Sun.COM #include <sys/vm_machparam.h>
877656SSherry.Moore@Sun.COM #include <sys/archsystm.h>
887656SSherry.Moore@Sun.COM #include <sys/machsystm.h>
897656SSherry.Moore@Sun.COM #include <sys/mman.h>
907656SSherry.Moore@Sun.COM #include <sys/x86_archext.h>
919160SSherry.Moore@Sun.COM #include <sys/smp_impldefs.h>
929160SSherry.Moore@Sun.COM #include <sys/spl.h>
937656SSherry.Moore@Sun.COM 
947656SSherry.Moore@Sun.COM #include <sys/fastboot.h>
957656SSherry.Moore@Sun.COM #include <sys/machelf.h>
967656SSherry.Moore@Sun.COM #include <sys/kobj.h>
977656SSherry.Moore@Sun.COM #include <sys/multiboot.h>
989160SSherry.Moore@Sun.COM #include <sys/kobj_lex.h>
999160SSherry.Moore@Sun.COM 
/*
 * Size in bytes of the PTE list needed to map a file of `fsize' bytes:
 * one x86pte_t per page of the file (fsize >> PAGESHIFT), plus one extra
 * entry for terminating the list, with the total rounded up via P2ROUNDUP
 * to PAGESIZE.
 *
 * The whole expansion is parenthesised so the macro can be used safely
 * inside a larger expression.
 */
#define	FASTBOOT_PTE_LIST_SIZE(fsize)	\
	(P2ROUNDUP((((fsize) >> PAGESHIFT) + 1) * sizeof (x86pte_t), PAGESIZE))
1067656SSherry.Moore@Sun.COM 
/*
 * Data structure containing necessary information for the fast reboot
 * switcher to jump to the new kernel.
 */
fastboot_info_t newkernel = { 0 };

/* Buffer for fast reboot boot arguments (OBP_MAXPATHLEN bytes). */
char		fastboot_args[OBP_MAXPATHLEN];

/*
 * Two path name buffers.  fastboot_build_mbi() uses the
 * FASTBOOT_NAME_BOOTARCHIVE entry as the multiboot module name; the other
 * entry presumably holds the kernel (unix) path -- confirm against the code
 * that fills these in.
 */
static char fastboot_filename[2][OBP_MAXPATHLEN] = { { 0 }, { 0 }};

/*
 * Attribute bits OR-ed into page table entries by fastboot_map_with_size():
 * ptp_bits for entries that point at a lower-level page table, pte_bits for
 * the final (leaf) mappings.
 */
static x86pte_t ptp_bits = PT_VALID | PT_REF | PT_USER | PT_WRITABLE;
static x86pte_t pte_bits =
    PT_VALID | PT_REF | PT_MOD | PT_NOCONSIST | PT_WRITABLE;

/*
 * Virtual address shift amount for each page table level, lowest level
 * first.  Presumably installed as nk->fi_shift_amt when PAE-style paging is
 * used -- the assignment is not in this part of the file.
 */
static uint_t fastboot_shift_amt_pae[] = {12, 21, 30, 39};

/* Non-zero enables output from dprintf(). */
int fastboot_debug = 0;

/* NOTE(review): not referenced in this part of the file; purpose unverified. */
int fastboot_contig = 0;
1227656SSherry.Moore@Sun.COM 
/*
 * Fake starting va for new kernel and boot archive.
 * fastboot_build_pagetables() aligns this down to nk->fi_lpagesize before
 * using it.
 */
static uintptr_t fake_va = FASTBOOT_FAKE_VA;

/*
 * Reserve memory below PA 1G in preparation of fast reboot.
 *
 * This variable is only checked when fastreboot_capable is set, but
 * fastreboot_onpanic is not set.  The amount of memory reserved
 * is negligible, but just in case we are really short of low memory,
 * this variable will give us a backdoor to not consume memory at all.
 */
int reserve_mem_enabled = 1;

/*
 * Mutex to protect fastreboot_onpanic.
 */
kmutex_t fastreboot_config_mutex;

/*
 * Amount of memory below PA 1G to reserve for constructing the multiboot
 * data structure and the page tables as we tend to run out of those
 * when more drivers are loaded.
 */
static size_t fastboot_mbi_size = 0x2000;	/* 8K */
static size_t fastboot_pagetable_size = 0x5000;	/* 20K */

/*
 * Minimum system uptime in clock_t before Fast Reboot should be used
 * on panic.  Will be initialized in fastboot_post_startup().
 */
clock_t fastreboot_onpanic_uptime = LONG_MAX;

/*
 * lbolt value when the system booted.  This value will be used if the system
 * panics to calculate how long the system has been up.  If the uptime is less
 * than fastreboot_onpanic_uptime, a reboot through BIOS will be performed to
 * avoid a potential panic/reboot loop.
 */
clock_t lbolt_at_boot = LONG_MAX;
16410916SSherry.Moore@Sun.COM 
/*
 * Use below 1G for page tables as
 *	1. we are only doing 1:1 mapping of the bottom 1G of physical memory.
 *	2. we are using 2G as the fake virtual address for the new kernel and
 *	boot archive.
 *
 * This attribute restricts allocations to physical addresses from 128MB up
 * to (but not including) 1G.  fastboot_build_mbi() passes it to
 * contig_alloc() for the multiboot info structure.
 */
static ddi_dma_attr_t fastboot_below_1G_dma_attr = {
	DMA_ATTR_V0,		/* dma_attr_version */
	0x0000000008000000ULL,	/* dma_attr_addr_lo: 128MB */
	0x000000003FFFFFFFULL,	/* dma_attr_addr_hi: 1G - 1 */
	0x00000000FFFFFFFFULL,	/* dma_attr_count_max */
	0x0000000000001000ULL,	/* dma_attr_align: 4KB */
	1,			/* dma_attr_burstsizes */
	1,			/* dma_attr_minxfer */
	0x00000000FFFFFFFFULL,	/* dma_attr_maxxfer */
	0x00000000FFFFFFFFULL,	/* dma_attr_seg */
	1,			/* dma_attr_sgllen */
	0x1000ULL,		/* dma_attr_granular */
	0,			/* dma_attr_flags */
};

/*
 * Same as fastboot_below_1G_dma_attr except for the upper address limit:
 * the full 64-bit range on amd64, 64GB - 1 otherwise.
 */
static ddi_dma_attr_t fastboot_dma_attr = {
	DMA_ATTR_V0,		/* dma_attr_version */
	0x0000000008000000ULL,	/* dma_attr_addr_lo: 128MB */
#ifdef	__amd64
	0xFFFFFFFFFFFFFFFFULL,	/* dma_attr_addr_hi: 2^64 - 1 */
#else
	0x0000000FFFFFFFFFULL,	/* dma_attr_addr_hi: 64GB - 1 */
#endif	/* __amd64 */
	0x00000000FFFFFFFFULL,	/* dma_attr_count_max */
	0x0000000000001000ULL,	/* dma_attr_align: 4KB */
	1,			/* dma_attr_burstsizes */
	1,			/* dma_attr_minxfer */
	0x00000000FFFFFFFFULL,	/* dma_attr_maxxfer */
	0x00000000FFFFFFFFULL,	/* dma_attr_seg */
	1,			/* dma_attr_sgllen */
	0x1000ULL,		/* dma_attr_granular */
	0,			/* dma_attr_flags */
};
2047656SSherry.Moore@Sun.COM 
/*
 * Various information saved from the previous boot to reconstruct
 * multiboot_info.  These are defined elsewhere; fastboot_build_mbi()
 * copies from them into the newly built multiboot info structure.
 */
extern multiboot_info_t saved_mbi;
extern mb_memory_map_t saved_mmap[FASTBOOT_SAVED_MMAP_COUNT];
extern uint8_t saved_drives[FASTBOOT_SAVED_DRIVES_SIZE];
extern char saved_cmdline[FASTBOOT_SAVED_CMDLINE_LEN];
extern int saved_cmdline_len;
extern size_t saved_file_size[];

/*
 * Allocator for memory constrained by a DMA attribute, and its matching
 * free routine.  contig_free() must be given the size that was allocated.
 */
extern void* contig_alloc(size_t size, ddi_dma_attr_t *attr,
    uintptr_t align, int cansleep);
extern void contig_free(void *addr, size_t size);


/* PRINTLIKE */
extern void vprintf(const char *, va_list);
2237656SSherry.Moore@Sun.COM 
2247656SSherry.Moore@Sun.COM 
/*
 * Default paths of the boot archives and of the failsafe archives/kernels,
 * for 32-bit and 64-bit.
 *
 * Need to be able to get boot_archives from other places
 */
#define	BOOTARCHIVE64	"/platform/i86pc/amd64/boot_archive"
#define	BOOTARCHIVE32	"/platform/i86pc/boot_archive"
#define	BOOTARCHIVE32_FAILSAFE	"/boot/x86.miniroot-safe"
#define	BOOTARCHIVE64_FAILSAFE	"/boot/amd64/x86.miniroot-safe"
#define	FAILSAFE_BOOTFILE32	"/boot/platform/i86pc/kernel/unix"
#define	FAILSAFE_BOOTFILE64	"/boot/platform/i86pc/kernel/amd64/unix"
2347656SSherry.Moore@Sun.COM 
/* Forward declarations of file-local helpers. */
static uint_t fastboot_vatoindex(fastboot_info_t *, uintptr_t, int);
static void fastboot_map_with_size(fastboot_info_t *, uintptr_t,
    paddr_t, size_t, int);
static void fastboot_build_pagetables(fastboot_info_t *);
static int fastboot_build_mbi(char *, fastboot_info_t *);
static void fastboot_free_file(fastboot_file_t *);

/*
 * cmn_err() format used when a low-memory allocation fails.  Arguments are
 * the requested size as a uint64_t and a string naming the address limit
 * (e.g. "1G").  Per cmn_err(9F), the leading '!' sends the message to the
 * system log only, not to the console.
 */
static const char fastboot_enomem_msg[] = "!Fastboot: Couldn't allocate 0x%"
	PRIx64" bytes below %s to do fast reboot";
2447656SSherry.Moore@Sun.COM 
2457656SSherry.Moore@Sun.COM static void
2467656SSherry.Moore@Sun.COM dprintf(char *fmt, ...)
2477656SSherry.Moore@Sun.COM {
2487656SSherry.Moore@Sun.COM 	va_list adx;
2497656SSherry.Moore@Sun.COM 
2507656SSherry.Moore@Sun.COM 	if (!fastboot_debug)
2517656SSherry.Moore@Sun.COM 		return;
2527656SSherry.Moore@Sun.COM 
2537656SSherry.Moore@Sun.COM 	va_start(adx, fmt);
2547656SSherry.Moore@Sun.COM 	vprintf(fmt, adx);
2557656SSherry.Moore@Sun.COM 	va_end(adx);
2567656SSherry.Moore@Sun.COM }
2577656SSherry.Moore@Sun.COM 
2587656SSherry.Moore@Sun.COM 
2597656SSherry.Moore@Sun.COM /*
2607656SSherry.Moore@Sun.COM  * Return the index corresponding to a virt address at a given page table level.
2617656SSherry.Moore@Sun.COM  */
2627656SSherry.Moore@Sun.COM static uint_t
2637656SSherry.Moore@Sun.COM fastboot_vatoindex(fastboot_info_t *nk, uintptr_t va, int level)
2647656SSherry.Moore@Sun.COM {
2657656SSherry.Moore@Sun.COM 	return ((va >> nk->fi_shift_amt[level]) & (nk->fi_ptes_per_table - 1));
2667656SSherry.Moore@Sun.COM }
2677656SSherry.Moore@Sun.COM 
2687656SSherry.Moore@Sun.COM 
2697656SSherry.Moore@Sun.COM /*
2707656SSherry.Moore@Sun.COM  * Add mapping from vstart to pstart for the specified size.
2718151SKonstantin.Ananyev@Sun.COM  * vstart, pstart and size should all have been aligned at 2M boundaries.
2727656SSherry.Moore@Sun.COM  */
2737656SSherry.Moore@Sun.COM static void
2747656SSherry.Moore@Sun.COM fastboot_map_with_size(fastboot_info_t *nk, uintptr_t vstart, paddr_t pstart,
2757656SSherry.Moore@Sun.COM     size_t size, int level)
2767656SSherry.Moore@Sun.COM {
2777656SSherry.Moore@Sun.COM 	x86pte_t	pteval, *table;
2787656SSherry.Moore@Sun.COM 	uintptr_t	vaddr;
2797656SSherry.Moore@Sun.COM 	paddr_t		paddr;
2807656SSherry.Moore@Sun.COM 	int		index, l;
2817656SSherry.Moore@Sun.COM 
2827656SSherry.Moore@Sun.COM 	table = (x86pte_t *)(nk->fi_pagetable_va);
2837656SSherry.Moore@Sun.COM 
2847656SSherry.Moore@Sun.COM 	for (l = nk->fi_top_level; l >= level; l--) {
2857656SSherry.Moore@Sun.COM 
2867656SSherry.Moore@Sun.COM 		index = fastboot_vatoindex(nk, vstart, l);
2877656SSherry.Moore@Sun.COM 
2887656SSherry.Moore@Sun.COM 		if (l == level) {
2897656SSherry.Moore@Sun.COM 			/*
2907656SSherry.Moore@Sun.COM 			 * Last level.  Program the page table entries.
2917656SSherry.Moore@Sun.COM 			 */
2927656SSherry.Moore@Sun.COM 			for (vaddr = vstart, paddr = pstart;
2937656SSherry.Moore@Sun.COM 			    vaddr < vstart + size;
2947656SSherry.Moore@Sun.COM 			    vaddr += (1ULL << nk->fi_shift_amt[l]),
2957656SSherry.Moore@Sun.COM 			    paddr += (1ULL << nk->fi_shift_amt[l])) {
2967656SSherry.Moore@Sun.COM 
2977656SSherry.Moore@Sun.COM 				uint_t index = fastboot_vatoindex(nk, vaddr, l);
2987656SSherry.Moore@Sun.COM 
2997656SSherry.Moore@Sun.COM 				if (l > 0)
3007656SSherry.Moore@Sun.COM 					pteval = paddr | pte_bits | PT_PAGESIZE;
3017656SSherry.Moore@Sun.COM 				else
3027656SSherry.Moore@Sun.COM 					pteval = paddr | pte_bits;
3037656SSherry.Moore@Sun.COM 
3047656SSherry.Moore@Sun.COM 				table[index] = pteval;
3057656SSherry.Moore@Sun.COM 			}
3067656SSherry.Moore@Sun.COM 		} else if (table[index] & PT_VALID) {
3077656SSherry.Moore@Sun.COM 
3087656SSherry.Moore@Sun.COM 			table = (x86pte_t *)
3097656SSherry.Moore@Sun.COM 			    ((uintptr_t)(((paddr_t)table[index] & MMU_PAGEMASK)
3107656SSherry.Moore@Sun.COM 			    - nk->fi_pagetable_pa) + nk->fi_pagetable_va);
3117656SSherry.Moore@Sun.COM 		} else {
3127656SSherry.Moore@Sun.COM 			/*
3138151SKonstantin.Ananyev@Sun.COM 			 * Intermediate levels.
3148151SKonstantin.Ananyev@Sun.COM 			 * Program with either valid bit or PTP bits.
3157656SSherry.Moore@Sun.COM 			 */
3167656SSherry.Moore@Sun.COM 			if (l == nk->fi_top_level) {
3178151SKonstantin.Ananyev@Sun.COM #ifdef	__amd64
3188151SKonstantin.Ananyev@Sun.COM 				ASSERT(nk->fi_top_level == 3);
3198151SKonstantin.Ananyev@Sun.COM 				table[index] = nk->fi_next_table_pa | ptp_bits;
3208151SKonstantin.Ananyev@Sun.COM #else
3217656SSherry.Moore@Sun.COM 				table[index] = nk->fi_next_table_pa | PT_VALID;
3228151SKonstantin.Ananyev@Sun.COM #endif	/* __amd64 */
3237656SSherry.Moore@Sun.COM 			} else {
3247656SSherry.Moore@Sun.COM 				table[index] = nk->fi_next_table_pa | ptp_bits;
3257656SSherry.Moore@Sun.COM 			}
3267656SSherry.Moore@Sun.COM 			table = (x86pte_t *)(nk->fi_next_table_va);
3277656SSherry.Moore@Sun.COM 			nk->fi_next_table_va += MMU_PAGESIZE;
3287656SSherry.Moore@Sun.COM 			nk->fi_next_table_pa += MMU_PAGESIZE;
3297656SSherry.Moore@Sun.COM 		}
3307656SSherry.Moore@Sun.COM 	}
3317656SSherry.Moore@Sun.COM }
3327656SSherry.Moore@Sun.COM 
3337656SSherry.Moore@Sun.COM /*
3347656SSherry.Moore@Sun.COM  * Build page tables for the lower 1G of physical memory using 2M
3357656SSherry.Moore@Sun.COM  * pages, and prepare page tables for mapping new kernel and boot
3367656SSherry.Moore@Sun.COM  * archive pages using 4K pages.
3377656SSherry.Moore@Sun.COM  */
3387656SSherry.Moore@Sun.COM static void
3397656SSherry.Moore@Sun.COM fastboot_build_pagetables(fastboot_info_t *nk)
3407656SSherry.Moore@Sun.COM {
3417656SSherry.Moore@Sun.COM 	/*
3427656SSherry.Moore@Sun.COM 	 * Map lower 1G physical memory.  Use large pages.
3437656SSherry.Moore@Sun.COM 	 */
3447656SSherry.Moore@Sun.COM 	fastboot_map_with_size(nk, 0, 0, ONE_GIG, 1);
3457656SSherry.Moore@Sun.COM 
3467656SSherry.Moore@Sun.COM 	/*
3477656SSherry.Moore@Sun.COM 	 * Map one 4K page to get the middle page tables set up.
3487656SSherry.Moore@Sun.COM 	 */
3497656SSherry.Moore@Sun.COM 	fake_va = P2ALIGN_TYPED(fake_va, nk->fi_lpagesize, uintptr_t);
3507656SSherry.Moore@Sun.COM 	fastboot_map_with_size(nk, fake_va,
3517656SSherry.Moore@Sun.COM 	    nk->fi_files[0].fb_pte_list_va[0] & MMU_PAGEMASK, PAGESIZE, 0);
3527656SSherry.Moore@Sun.COM }
3537656SSherry.Moore@Sun.COM 
3547656SSherry.Moore@Sun.COM 
3557656SSherry.Moore@Sun.COM /*
3567656SSherry.Moore@Sun.COM  * Sanity check.  Look for dboot offset.
3577656SSherry.Moore@Sun.COM  */
3587656SSherry.Moore@Sun.COM static int
3597656SSherry.Moore@Sun.COM fastboot_elf64_find_dboot_load_offset(void *img, off_t imgsz, uint32_t *offp)
3607656SSherry.Moore@Sun.COM {
3617656SSherry.Moore@Sun.COM 	Elf64_Ehdr	*ehdr = (Elf64_Ehdr *)img;
3627656SSherry.Moore@Sun.COM 	Elf64_Phdr	*phdr;
3637656SSherry.Moore@Sun.COM 	uint8_t		*phdrbase;
3647656SSherry.Moore@Sun.COM 	int		i;
3657656SSherry.Moore@Sun.COM 
3667656SSherry.Moore@Sun.COM 	if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz)
3677656SSherry.Moore@Sun.COM 		return (-1);
3687656SSherry.Moore@Sun.COM 
3697656SSherry.Moore@Sun.COM 	phdrbase = (uint8_t *)img + ehdr->e_phoff;
3707656SSherry.Moore@Sun.COM 
3717656SSherry.Moore@Sun.COM 	for (i = 0; i < ehdr->e_phnum; i++) {
3727656SSherry.Moore@Sun.COM 		phdr = (Elf64_Phdr *)(phdrbase + ehdr->e_phentsize * i);
3737656SSherry.Moore@Sun.COM 
3747656SSherry.Moore@Sun.COM 		if (phdr->p_type == PT_LOAD) {
3757656SSherry.Moore@Sun.COM 			if (phdr->p_vaddr == phdr->p_paddr &&
3767656SSherry.Moore@Sun.COM 			    phdr->p_vaddr == DBOOT_ENTRY_ADDRESS) {
3777656SSherry.Moore@Sun.COM 				ASSERT(phdr->p_offset <= UINT32_MAX);
3787656SSherry.Moore@Sun.COM 				*offp = (uint32_t)phdr->p_offset;
3797656SSherry.Moore@Sun.COM 				return (0);
3807656SSherry.Moore@Sun.COM 			}
3817656SSherry.Moore@Sun.COM 		}
3827656SSherry.Moore@Sun.COM 	}
3837656SSherry.Moore@Sun.COM 
3847656SSherry.Moore@Sun.COM 	return (-1);
3857656SSherry.Moore@Sun.COM }
3867656SSherry.Moore@Sun.COM 
3877656SSherry.Moore@Sun.COM 
3887656SSherry.Moore@Sun.COM /*
3897656SSherry.Moore@Sun.COM  * Initialize text and data section information for 32-bit kernel.
3908151SKonstantin.Ananyev@Sun.COM  * sectcntp - is both input/output parameter.
3918151SKonstantin.Ananyev@Sun.COM  * On entry, *sectcntp contains maximum allowable number of sections;
3928151SKonstantin.Ananyev@Sun.COM  * on return, it contains the actual number of sections filled.
3937656SSherry.Moore@Sun.COM  */
3947656SSherry.Moore@Sun.COM static int
3957656SSherry.Moore@Sun.COM fastboot_elf32_find_loadables(void *img, off_t imgsz, fastboot_section_t *sectp,
3967656SSherry.Moore@Sun.COM     int *sectcntp, uint32_t *offp)
3977656SSherry.Moore@Sun.COM {
3987656SSherry.Moore@Sun.COM 	Elf32_Ehdr	*ehdr = (Elf32_Ehdr *)img;
3997656SSherry.Moore@Sun.COM 	Elf32_Phdr	*phdr;
4007656SSherry.Moore@Sun.COM 	uint8_t		*phdrbase;
4017656SSherry.Moore@Sun.COM 	int		i;
4027656SSherry.Moore@Sun.COM 	int		used_sections = 0;
4038151SKonstantin.Ananyev@Sun.COM 	const int	max_sectcnt = *sectcntp;
4047656SSherry.Moore@Sun.COM 
4057656SSherry.Moore@Sun.COM 	if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz)
4067656SSherry.Moore@Sun.COM 		return (-1);
4077656SSherry.Moore@Sun.COM 
4087656SSherry.Moore@Sun.COM 	phdrbase = (uint8_t *)img + ehdr->e_phoff;
4097656SSherry.Moore@Sun.COM 
4107656SSherry.Moore@Sun.COM 	for (i = 0; i < ehdr->e_phnum; i++) {
4117656SSherry.Moore@Sun.COM 		phdr = (Elf32_Phdr *)(phdrbase + ehdr->e_phentsize * i);
4127656SSherry.Moore@Sun.COM 
4137656SSherry.Moore@Sun.COM 		if (phdr->p_type == PT_INTERP)
4147656SSherry.Moore@Sun.COM 			return (-1);
4157656SSherry.Moore@Sun.COM 
4167656SSherry.Moore@Sun.COM 		if (phdr->p_type != PT_LOAD)
4177656SSherry.Moore@Sun.COM 			continue;
4187656SSherry.Moore@Sun.COM 
4197656SSherry.Moore@Sun.COM 		if (phdr->p_vaddr == phdr->p_paddr &&
4207656SSherry.Moore@Sun.COM 		    phdr->p_paddr == DBOOT_ENTRY_ADDRESS) {
4217656SSherry.Moore@Sun.COM 			*offp = (uint32_t)phdr->p_offset;
4227656SSherry.Moore@Sun.COM 		} else {
4238151SKonstantin.Ananyev@Sun.COM 			if (max_sectcnt <= used_sections)
4248151SKonstantin.Ananyev@Sun.COM 				return (-1);
4258151SKonstantin.Ananyev@Sun.COM 
4267656SSherry.Moore@Sun.COM 			sectp[used_sections].fb_sec_offset = phdr->p_offset;
4277656SSherry.Moore@Sun.COM 			sectp[used_sections].fb_sec_paddr = phdr->p_paddr;
4287656SSherry.Moore@Sun.COM 			sectp[used_sections].fb_sec_size = phdr->p_filesz;
4297656SSherry.Moore@Sun.COM 			sectp[used_sections].fb_sec_bss_size =
4307656SSherry.Moore@Sun.COM 			    (phdr->p_filesz < phdr->p_memsz) ?
4317656SSherry.Moore@Sun.COM 			    (phdr->p_memsz - phdr->p_filesz) : 0;
4327656SSherry.Moore@Sun.COM 
4338151SKonstantin.Ananyev@Sun.COM 			/* Extra sanity check for the input object file */
4348151SKonstantin.Ananyev@Sun.COM 			if (sectp[used_sections].fb_sec_paddr +
4358151SKonstantin.Ananyev@Sun.COM 			    sectp[used_sections].fb_sec_size +
4368151SKonstantin.Ananyev@Sun.COM 			    sectp[used_sections].fb_sec_bss_size >=
4378151SKonstantin.Ananyev@Sun.COM 			    DBOOT_ENTRY_ADDRESS)
4388151SKonstantin.Ananyev@Sun.COM 				return (-1);
4398151SKonstantin.Ananyev@Sun.COM 
4407656SSherry.Moore@Sun.COM 			used_sections++;
4417656SSherry.Moore@Sun.COM 		}
4427656SSherry.Moore@Sun.COM 	}
4437656SSherry.Moore@Sun.COM 
4447656SSherry.Moore@Sun.COM 	*sectcntp = used_sections;
4457656SSherry.Moore@Sun.COM 	return (0);
4467656SSherry.Moore@Sun.COM }
4477656SSherry.Moore@Sun.COM 
/*
 * Create multiboot info structure (mbi) based on the saved mbi.
 * Recalculate values of the pointer type fields in the data
 * structure based on the new starting physical address of the
 * data structure.
 */
4547656SSherry.Moore@Sun.COM static int
4557656SSherry.Moore@Sun.COM fastboot_build_mbi(char *mdep, fastboot_info_t *nk)
4567656SSherry.Moore@Sun.COM {
4577656SSherry.Moore@Sun.COM 	mb_module_t	*mbp;
4589219SKonstantin.Ananyev@Sun.COM 	multiboot_info_t	*mbi;	/* pointer to multiboot structure */
4599219SKonstantin.Ananyev@Sun.COM 	uintptr_t	start_addr_va;	/* starting VA of mbi */
4609219SKonstantin.Ananyev@Sun.COM 	uintptr_t	start_addr_pa;	/* starting PA of mbi */
4619219SKonstantin.Ananyev@Sun.COM 	size_t		offs = 0;	/* offset from the starting address */
4629219SKonstantin.Ananyev@Sun.COM 	size_t		arglen;		/* length of the command line arg */
4639219SKonstantin.Ananyev@Sun.COM 	size_t		size;	/* size of the memory reserved for mbi */
4649219SKonstantin.Ananyev@Sun.COM 	size_t		mdnsz;	/* length of the boot archive name */
4657656SSherry.Moore@Sun.COM 
4669219SKonstantin.Ananyev@Sun.COM 	/*
4679219SKonstantin.Ananyev@Sun.COM 	 * If mdep is not NULL or empty, use the length of mdep + 1
4689219SKonstantin.Ananyev@Sun.COM 	 * (for NULL terminating) as the length of the new command
4699219SKonstantin.Ananyev@Sun.COM 	 * line; else use the saved command line length as the
4709219SKonstantin.Ananyev@Sun.COM 	 * length for the new command line.
4719219SKonstantin.Ananyev@Sun.COM 	 */
4727750SSherry.Moore@Sun.COM 	if (mdep != NULL && strlen(mdep) != 0) {
4737656SSherry.Moore@Sun.COM 		arglen = strlen(mdep) + 1;
4747656SSherry.Moore@Sun.COM 	} else {
4757656SSherry.Moore@Sun.COM 		arglen = saved_cmdline_len;
4767656SSherry.Moore@Sun.COM 	}
4777656SSherry.Moore@Sun.COM 
4789219SKonstantin.Ananyev@Sun.COM 	/*
4799219SKonstantin.Ananyev@Sun.COM 	 * Allocate memory for the new multiboot info structure (mbi).
4809219SKonstantin.Ananyev@Sun.COM 	 * If we have reserved memory for mbi but it's not enough,
4819219SKonstantin.Ananyev@Sun.COM 	 * free it and reallocate.
4829219SKonstantin.Ananyev@Sun.COM 	 */
4837656SSherry.Moore@Sun.COM 	size = PAGESIZE + P2ROUNDUP(arglen, PAGESIZE);
4849160SSherry.Moore@Sun.COM 	if (nk->fi_mbi_size && nk->fi_mbi_size < size) {
4859160SSherry.Moore@Sun.COM 		contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
4869160SSherry.Moore@Sun.COM 		nk->fi_mbi_size = 0;
4879160SSherry.Moore@Sun.COM 	}
4889160SSherry.Moore@Sun.COM 
4899160SSherry.Moore@Sun.COM 	if (nk->fi_mbi_size == 0) {
4909160SSherry.Moore@Sun.COM 		if ((nk->fi_new_mbi_va =
4919160SSherry.Moore@Sun.COM 		    (uintptr_t)contig_alloc(size, &fastboot_below_1G_dma_attr,
4929160SSherry.Moore@Sun.COM 		    PAGESIZE, 0)) == NULL) {
493*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE, fastboot_enomem_msg,
4949160SSherry.Moore@Sun.COM 			    (uint64_t)size, "1G");
4959160SSherry.Moore@Sun.COM 			return (-1);
4969160SSherry.Moore@Sun.COM 		}
4979160SSherry.Moore@Sun.COM 		/*
4989160SSherry.Moore@Sun.COM 		 * fi_mbi_size must be set after the allocation succeeds
4999160SSherry.Moore@Sun.COM 		 * as it's used to determine how much memory to free.
5009160SSherry.Moore@Sun.COM 		 */
5019160SSherry.Moore@Sun.COM 		nk->fi_mbi_size = size;
5027656SSherry.Moore@Sun.COM 	}
5037656SSherry.Moore@Sun.COM 
	/*
	 * Initialize memory
	 */
5079160SSherry.Moore@Sun.COM 	bzero((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
5089160SSherry.Moore@Sun.COM 
5099219SKonstantin.Ananyev@Sun.COM 	/*
5109219SKonstantin.Ananyev@Sun.COM 	 * Get PA for the new mbi
5119219SKonstantin.Ananyev@Sun.COM 	 */
5129219SKonstantin.Ananyev@Sun.COM 	start_addr_va = nk->fi_new_mbi_va;
5139219SKonstantin.Ananyev@Sun.COM 	start_addr_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
5149219SKonstantin.Ananyev@Sun.COM 	    (caddr_t)start_addr_va));
5159219SKonstantin.Ananyev@Sun.COM 	nk->fi_new_mbi_pa = (paddr_t)start_addr_pa;
5167656SSherry.Moore@Sun.COM 
5179160SSherry.Moore@Sun.COM 	/*
5189219SKonstantin.Ananyev@Sun.COM 	 * Populate the rest of the fields in the data structure
5199160SSherry.Moore@Sun.COM 	 */
5209219SKonstantin.Ananyev@Sun.COM 
5219219SKonstantin.Ananyev@Sun.COM 	/*
5229219SKonstantin.Ananyev@Sun.COM 	 * Copy from the saved mbi to preserve all non-pointer type fields.
5239219SKonstantin.Ananyev@Sun.COM 	 */
5249219SKonstantin.Ananyev@Sun.COM 	mbi = (multiboot_info_t *)start_addr_va;
5259219SKonstantin.Ananyev@Sun.COM 	bcopy(&saved_mbi, mbi, sizeof (*mbi));
5267656SSherry.Moore@Sun.COM 
	/*
	 * Recalculate mods_addr.  Set mod_start and mod_end based on
	 * the physical address of the new boot archive.  Set mod_name
	 * to the name of the new boot archive.
	 */
5329219SKonstantin.Ananyev@Sun.COM 	offs += sizeof (multiboot_info_t);
5339219SKonstantin.Ananyev@Sun.COM 	mbi->mods_addr = start_addr_pa + offs;
5349219SKonstantin.Ananyev@Sun.COM 	mbp = (mb_module_t *)(start_addr_va + offs);
5359160SSherry.Moore@Sun.COM 	mbp->mod_start = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_dest_pa;
5369160SSherry.Moore@Sun.COM 	mbp->mod_end = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_next_pa;
5377656SSherry.Moore@Sun.COM 
5389219SKonstantin.Ananyev@Sun.COM 	offs += sizeof (mb_module_t);
5399219SKonstantin.Ananyev@Sun.COM 	mdnsz = strlen(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE]) + 1;
5409219SKonstantin.Ananyev@Sun.COM 	bcopy(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE],
5419219SKonstantin.Ananyev@Sun.COM 	    (void *)(start_addr_va + offs), mdnsz);
5429219SKonstantin.Ananyev@Sun.COM 	mbp->mod_name = start_addr_pa + offs;
5439219SKonstantin.Ananyev@Sun.COM 	mbp->reserved = 0;
5447656SSherry.Moore@Sun.COM 
5459219SKonstantin.Ananyev@Sun.COM 	/*
5469219SKonstantin.Ananyev@Sun.COM 	 * Make sure the offset is 16-byte aligned to avoid unaligned access.
5479219SKonstantin.Ananyev@Sun.COM 	 */
5489219SKonstantin.Ananyev@Sun.COM 	offs += mdnsz;
5499219SKonstantin.Ananyev@Sun.COM 	offs = P2ROUNDUP_TYPED(offs, 16, size_t);
5507656SSherry.Moore@Sun.COM 
5519219SKonstantin.Ananyev@Sun.COM 	/*
5529219SKonstantin.Ananyev@Sun.COM 	 * Recalculate mmap_addr
5539219SKonstantin.Ananyev@Sun.COM 	 */
5549219SKonstantin.Ananyev@Sun.COM 	mbi->mmap_addr = start_addr_pa + offs;
5559219SKonstantin.Ananyev@Sun.COM 	bcopy((void *)(uintptr_t)saved_mmap, (void *)(start_addr_va + offs),
5567656SSherry.Moore@Sun.COM 	    saved_mbi.mmap_length);
5579219SKonstantin.Ananyev@Sun.COM 	offs += saved_mbi.mmap_length;
5587656SSherry.Moore@Sun.COM 
5599219SKonstantin.Ananyev@Sun.COM 	/*
5609219SKonstantin.Ananyev@Sun.COM 	 * Recalculate drives_addr
5619219SKonstantin.Ananyev@Sun.COM 	 */
5629219SKonstantin.Ananyev@Sun.COM 	mbi->drives_addr = start_addr_pa + offs;
5639219SKonstantin.Ananyev@Sun.COM 	bcopy((void *)(uintptr_t)saved_drives, (void *)(start_addr_va + offs),
5647656SSherry.Moore@Sun.COM 	    saved_mbi.drives_length);
5659219SKonstantin.Ananyev@Sun.COM 	offs += saved_mbi.drives_length;
5667656SSherry.Moore@Sun.COM 
5679219SKonstantin.Ananyev@Sun.COM 	/*
5689219SKonstantin.Ananyev@Sun.COM 	 * Recalculate the address of cmdline.  Set cmdline to contain the
5699219SKonstantin.Ananyev@Sun.COM 	 * new boot argument.
5709219SKonstantin.Ananyev@Sun.COM 	 */
5719219SKonstantin.Ananyev@Sun.COM 	mbi->cmdline = start_addr_pa + offs;
5727656SSherry.Moore@Sun.COM 
5737750SSherry.Moore@Sun.COM 	if (mdep != NULL && strlen(mdep) != 0) {
5749219SKonstantin.Ananyev@Sun.COM 		bcopy(mdep, (void *)(start_addr_va + offs), arglen);
5757656SSherry.Moore@Sun.COM 	} else {
5769219SKonstantin.Ananyev@Sun.COM 		bcopy((void *)saved_cmdline, (void *)(start_addr_va + offs),
5779219SKonstantin.Ananyev@Sun.COM 		    arglen);
5787656SSherry.Moore@Sun.COM 	}
5797656SSherry.Moore@Sun.COM 
58010525SKonstantin.Ananyev@Sun.COM 	/* clear fields and flags that are not copied */
58110525SKonstantin.Ananyev@Sun.COM 	bzero(&mbi->config_table,
58210525SKonstantin.Ananyev@Sun.COM 	    sizeof (*mbi) - offsetof(multiboot_info_t, config_table));
58310525SKonstantin.Ananyev@Sun.COM 	mbi->flags &= ~(MB_INFO_CONFIG_TABLE | MB_INFO_BOOT_LOADER_NAME |
58410525SKonstantin.Ananyev@Sun.COM 	    MB_INFO_APM_TABLE | MB_INFO_VIDEO_INFO);
58510525SKonstantin.Ananyev@Sun.COM 
5867656SSherry.Moore@Sun.COM 	return (0);
5877656SSherry.Moore@Sun.COM }
5887656SSherry.Moore@Sun.COM 
5897750SSherry.Moore@Sun.COM /*
5907750SSherry.Moore@Sun.COM  * Initialize HAT related fields
5917750SSherry.Moore@Sun.COM  */
5927750SSherry.Moore@Sun.COM static void
5937750SSherry.Moore@Sun.COM fastboot_init_fields(fastboot_info_t *nk)
5947656SSherry.Moore@Sun.COM {
5957750SSherry.Moore@Sun.COM 	if (x86_feature & X86_PAE) {
5967750SSherry.Moore@Sun.COM 		nk->fi_has_pae = 1;
5977750SSherry.Moore@Sun.COM 		nk->fi_shift_amt = fastboot_shift_amt_pae;
5987750SSherry.Moore@Sun.COM 		nk->fi_ptes_per_table = 512;
5997750SSherry.Moore@Sun.COM 		nk->fi_lpagesize = (2 << 20);	/* 2M */
6008151SKonstantin.Ananyev@Sun.COM #ifdef	__amd64
6018151SKonstantin.Ananyev@Sun.COM 		nk->fi_top_level = 3;
6028151SKonstantin.Ananyev@Sun.COM #else
6037750SSherry.Moore@Sun.COM 		nk->fi_top_level = 2;
6048151SKonstantin.Ananyev@Sun.COM #endif	/* __amd64 */
6057750SSherry.Moore@Sun.COM 	}
6067750SSherry.Moore@Sun.COM }
6077656SSherry.Moore@Sun.COM 
6087750SSherry.Moore@Sun.COM /*
6097750SSherry.Moore@Sun.COM  * Process boot argument
6107750SSherry.Moore@Sun.COM  */
6117750SSherry.Moore@Sun.COM static void
6127750SSherry.Moore@Sun.COM fastboot_parse_mdep(char *mdep, char *kern_bootpath, int *bootpath_len,
6137750SSherry.Moore@Sun.COM     char *bootargs)
6147750SSherry.Moore@Sun.COM {
6157750SSherry.Moore@Sun.COM 	int	i;
6167656SSherry.Moore@Sun.COM 
6177656SSherry.Moore@Sun.COM 	/*
6187656SSherry.Moore@Sun.COM 	 * If mdep is not NULL, it comes in the format of
6197656SSherry.Moore@Sun.COM 	 *	mountpoint unix args
6207656SSherry.Moore@Sun.COM 	 */
6217750SSherry.Moore@Sun.COM 	if (mdep != NULL && strlen(mdep) != 0) {
6227656SSherry.Moore@Sun.COM 		if (mdep[0] != '-') {
6237656SSherry.Moore@Sun.COM 			/* First get the root argument */
6247656SSherry.Moore@Sun.COM 			i = 0;
6257656SSherry.Moore@Sun.COM 			while (mdep[i] != '\0' && mdep[i] != ' ') {
6267656SSherry.Moore@Sun.COM 				i++;
6277656SSherry.Moore@Sun.COM 			}
6287656SSherry.Moore@Sun.COM 
6297656SSherry.Moore@Sun.COM 			if (i < 4 || strncmp(&mdep[i-4], "unix", 4) != 0) {
6307656SSherry.Moore@Sun.COM 				/* mount point */
6317656SSherry.Moore@Sun.COM 				bcopy(mdep, kern_bootpath, i);
6327656SSherry.Moore@Sun.COM 				kern_bootpath[i] = '\0';
6337750SSherry.Moore@Sun.COM 				*bootpath_len = i;
6347656SSherry.Moore@Sun.COM 
6357656SSherry.Moore@Sun.COM 				/*
6367656SSherry.Moore@Sun.COM 				 * Get the next argument. It should be unix as
6377656SSherry.Moore@Sun.COM 				 * we have validated in in halt.c.
6387656SSherry.Moore@Sun.COM 				 */
6397656SSherry.Moore@Sun.COM 				if (strlen(mdep) > i) {
6407656SSherry.Moore@Sun.COM 					mdep += (i + 1);
6417656SSherry.Moore@Sun.COM 					i = 0;
6427656SSherry.Moore@Sun.COM 					while (mdep[i] != '\0' &&
6437656SSherry.Moore@Sun.COM 					    mdep[i] != ' ') {
6447656SSherry.Moore@Sun.COM 						i++;
6457656SSherry.Moore@Sun.COM 					}
6467656SSherry.Moore@Sun.COM 				}
6477656SSherry.Moore@Sun.COM 
6487656SSherry.Moore@Sun.COM 			}
6497656SSherry.Moore@Sun.COM 			bcopy(mdep, kern_bootfile, i);
6507656SSherry.Moore@Sun.COM 			kern_bootfile[i] = '\0';
6517750SSherry.Moore@Sun.COM 			bcopy(mdep, bootargs, strlen(mdep));
6527656SSherry.Moore@Sun.COM 		} else {
6537656SSherry.Moore@Sun.COM 			int off = strlen(kern_bootfile);
6547656SSherry.Moore@Sun.COM 			bcopy(kern_bootfile, bootargs, off);
6557656SSherry.Moore@Sun.COM 			bcopy(" ", &bootargs[off++], 1);
6567656SSherry.Moore@Sun.COM 			bcopy(mdep, &bootargs[off], strlen(mdep));
6577656SSherry.Moore@Sun.COM 			off += strlen(mdep);
6587656SSherry.Moore@Sun.COM 			bootargs[off] = '\0';
6597656SSherry.Moore@Sun.COM 		}
6607656SSherry.Moore@Sun.COM 	}
6617750SSherry.Moore@Sun.COM }
6627750SSherry.Moore@Sun.COM 
6637750SSherry.Moore@Sun.COM /*
6649160SSherry.Moore@Sun.COM  * Reserve memory under PA 1G for mapping the new kernel and boot archive.
6659160SSherry.Moore@Sun.COM  * This function is only called if fastreboot_onpanic is *not* set.
6669160SSherry.Moore@Sun.COM  */
6679160SSherry.Moore@Sun.COM static void
6689160SSherry.Moore@Sun.COM fastboot_reserve_mem(fastboot_info_t *nk)
6699160SSherry.Moore@Sun.COM {
6709160SSherry.Moore@Sun.COM 	int i;
6719160SSherry.Moore@Sun.COM 
6729160SSherry.Moore@Sun.COM 	/*
6739160SSherry.Moore@Sun.COM 	 * A valid kernel is in place.  No need to reserve any memory.
6749160SSherry.Moore@Sun.COM 	 */
6759160SSherry.Moore@Sun.COM 	if (nk->fi_valid)
6769160SSherry.Moore@Sun.COM 		return;
6779160SSherry.Moore@Sun.COM 
6789160SSherry.Moore@Sun.COM 	/*
6799160SSherry.Moore@Sun.COM 	 * Reserve memory under PA 1G for PTE lists.
6809160SSherry.Moore@Sun.COM 	 */
6819160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
6829160SSherry.Moore@Sun.COM 		fastboot_file_t *fb = &nk->fi_files[i];
6839160SSherry.Moore@Sun.COM 		size_t fsize_roundup, size;
6849160SSherry.Moore@Sun.COM 
6859160SSherry.Moore@Sun.COM 		fsize_roundup = P2ROUNDUP_TYPED(saved_file_size[i],
6869160SSherry.Moore@Sun.COM 		    PAGESIZE, size_t);
6879160SSherry.Moore@Sun.COM 		size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup);
6889160SSherry.Moore@Sun.COM 		if ((fb->fb_pte_list_va = contig_alloc(size,
6899160SSherry.Moore@Sun.COM 		    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
6909160SSherry.Moore@Sun.COM 			return;
6919160SSherry.Moore@Sun.COM 		}
6929160SSherry.Moore@Sun.COM 		fb->fb_pte_list_size = size;
6939160SSherry.Moore@Sun.COM 	}
6949160SSherry.Moore@Sun.COM 
6959160SSherry.Moore@Sun.COM 	/*
6969160SSherry.Moore@Sun.COM 	 * Reserve memory under PA 1G for page tables.
6979160SSherry.Moore@Sun.COM 	 */
6989160SSherry.Moore@Sun.COM 	if ((nk->fi_pagetable_va =
6999160SSherry.Moore@Sun.COM 	    (uintptr_t)contig_alloc(fastboot_pagetable_size,
7009160SSherry.Moore@Sun.COM 	    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
7019160SSherry.Moore@Sun.COM 		return;
7029160SSherry.Moore@Sun.COM 	}
7039160SSherry.Moore@Sun.COM 	nk->fi_pagetable_size = fastboot_pagetable_size;
7049160SSherry.Moore@Sun.COM 
7059160SSherry.Moore@Sun.COM 	/*
7069160SSherry.Moore@Sun.COM 	 * Reserve memory under PA 1G for multiboot structure.
7079160SSherry.Moore@Sun.COM 	 */
7089160SSherry.Moore@Sun.COM 	if ((nk->fi_new_mbi_va = (uintptr_t)contig_alloc(fastboot_mbi_size,
7099160SSherry.Moore@Sun.COM 	    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
7109160SSherry.Moore@Sun.COM 		return;
7119160SSherry.Moore@Sun.COM 	}
7129160SSherry.Moore@Sun.COM 	nk->fi_mbi_size = fastboot_mbi_size;
7139160SSherry.Moore@Sun.COM }
7149160SSherry.Moore@Sun.COM 
7159160SSherry.Moore@Sun.COM /*
7169160SSherry.Moore@Sun.COM  * Calculate MD5 digest for the given fastboot_file.
7179160SSherry.Moore@Sun.COM  * Assumes that the file is allready loaded properly.
7189160SSherry.Moore@Sun.COM  */
7199160SSherry.Moore@Sun.COM static void
7209160SSherry.Moore@Sun.COM fastboot_cksum_file(fastboot_file_t *fb, uchar_t *md5_hash)
7219160SSherry.Moore@Sun.COM {
7229160SSherry.Moore@Sun.COM 	MD5_CTX md5_ctx;
7239160SSherry.Moore@Sun.COM 
7249160SSherry.Moore@Sun.COM 	MD5Init(&md5_ctx);
7259160SSherry.Moore@Sun.COM 	MD5Update(&md5_ctx, (void *)fb->fb_va, fb->fb_size);
7269160SSherry.Moore@Sun.COM 	MD5Final(md5_hash, &md5_ctx);
7279160SSherry.Moore@Sun.COM }
7289160SSherry.Moore@Sun.COM 
7299160SSherry.Moore@Sun.COM /*
7309160SSherry.Moore@Sun.COM  * Free up the memory we have allocated for a file
7317750SSherry.Moore@Sun.COM  */
7327750SSherry.Moore@Sun.COM static void
7337750SSherry.Moore@Sun.COM fastboot_free_file(fastboot_file_t *fb)
7347750SSherry.Moore@Sun.COM {
7359160SSherry.Moore@Sun.COM 	size_t	fsize_roundup;
7367750SSherry.Moore@Sun.COM 
7377750SSherry.Moore@Sun.COM 	fsize_roundup = P2ROUNDUP_TYPED(fb->fb_size, PAGESIZE, size_t);
7389160SSherry.Moore@Sun.COM 	if (fsize_roundup) {
7399160SSherry.Moore@Sun.COM 		contig_free((void *)fb->fb_va, fsize_roundup);
7409160SSherry.Moore@Sun.COM 		fb->fb_va = NULL;
7419160SSherry.Moore@Sun.COM 		fb->fb_size = 0;
7429160SSherry.Moore@Sun.COM 	}
7439160SSherry.Moore@Sun.COM }
7449160SSherry.Moore@Sun.COM 
7459160SSherry.Moore@Sun.COM /*
7469160SSherry.Moore@Sun.COM  * Free up memory used by the PTEs for a file.
7479160SSherry.Moore@Sun.COM  */
7489160SSherry.Moore@Sun.COM static void
7499160SSherry.Moore@Sun.COM fastboot_free_file_pte(fastboot_file_t *fb, uint64_t endaddr)
7509160SSherry.Moore@Sun.COM {
7519160SSherry.Moore@Sun.COM 	if (fb->fb_pte_list_size && fb->fb_pte_list_pa < endaddr) {
7529160SSherry.Moore@Sun.COM 		contig_free((void *)fb->fb_pte_list_va, fb->fb_pte_list_size);
7539160SSherry.Moore@Sun.COM 		fb->fb_pte_list_va = 0;
7549160SSherry.Moore@Sun.COM 		fb->fb_pte_list_pa = 0;
7559160SSherry.Moore@Sun.COM 		fb->fb_pte_list_size = 0;
7569160SSherry.Moore@Sun.COM 	}
7579160SSherry.Moore@Sun.COM }
7589160SSherry.Moore@Sun.COM 
7599160SSherry.Moore@Sun.COM /*
7609160SSherry.Moore@Sun.COM  * Free up all the memory used for representing a kernel with
7619160SSherry.Moore@Sun.COM  * fastboot_info_t.
7629160SSherry.Moore@Sun.COM  */
7639160SSherry.Moore@Sun.COM static void
7649160SSherry.Moore@Sun.COM fastboot_free_mem(fastboot_info_t *nk, uint64_t endaddr)
7659160SSherry.Moore@Sun.COM {
7669160SSherry.Moore@Sun.COM 	int i;
7679160SSherry.Moore@Sun.COM 
7689160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
7699160SSherry.Moore@Sun.COM 		fastboot_free_file(nk->fi_files + i);
7709160SSherry.Moore@Sun.COM 		fastboot_free_file_pte(nk->fi_files + i, endaddr);
7719160SSherry.Moore@Sun.COM 	}
7729160SSherry.Moore@Sun.COM 
7739160SSherry.Moore@Sun.COM 	if (nk->fi_pagetable_size && nk->fi_pagetable_pa < endaddr) {
7749160SSherry.Moore@Sun.COM 		contig_free((void *)nk->fi_pagetable_va, nk->fi_pagetable_size);
7759160SSherry.Moore@Sun.COM 		nk->fi_pagetable_va = 0;
7769160SSherry.Moore@Sun.COM 		nk->fi_pagetable_pa = 0;
7779160SSherry.Moore@Sun.COM 		nk->fi_pagetable_size = 0;
7789160SSherry.Moore@Sun.COM 	}
7799160SSherry.Moore@Sun.COM 
7809160SSherry.Moore@Sun.COM 	if (nk->fi_mbi_size && nk->fi_new_mbi_pa < endaddr) {
7819160SSherry.Moore@Sun.COM 		contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
7829160SSherry.Moore@Sun.COM 		nk->fi_new_mbi_va = 0;
7839160SSherry.Moore@Sun.COM 		nk->fi_new_mbi_pa = 0;
7849160SSherry.Moore@Sun.COM 		nk->fi_mbi_size = 0;
7859160SSherry.Moore@Sun.COM 	}
7869160SSherry.Moore@Sun.COM }
7879160SSherry.Moore@Sun.COM 
7889160SSherry.Moore@Sun.COM /*
7899160SSherry.Moore@Sun.COM  * Only free up the memory allocated for the kernel and boot archive,
7909160SSherry.Moore@Sun.COM  * but not for the page tables.
7919160SSherry.Moore@Sun.COM  */
7929160SSherry.Moore@Sun.COM void
7939160SSherry.Moore@Sun.COM fastboot_free_newkernel(fastboot_info_t *nk)
7949160SSherry.Moore@Sun.COM {
7959160SSherry.Moore@Sun.COM 	int i;
7967750SSherry.Moore@Sun.COM 
7979160SSherry.Moore@Sun.COM 	nk->fi_valid = 0;
7989160SSherry.Moore@Sun.COM 	/*
7999160SSherry.Moore@Sun.COM 	 * Free the memory we have allocated
8009160SSherry.Moore@Sun.COM 	 */
8019160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
8029160SSherry.Moore@Sun.COM 		fastboot_free_file(&(nk->fi_files[i]));
8039160SSherry.Moore@Sun.COM 	}
8049160SSherry.Moore@Sun.COM }
8059160SSherry.Moore@Sun.COM 
8069160SSherry.Moore@Sun.COM static void
8079160SSherry.Moore@Sun.COM fastboot_cksum_cdata(fastboot_info_t *nk, uchar_t *md5_hash)
8089160SSherry.Moore@Sun.COM {
8099160SSherry.Moore@Sun.COM 	int i;
8109160SSherry.Moore@Sun.COM 	MD5_CTX md5_ctx;
8119160SSherry.Moore@Sun.COM 
8129160SSherry.Moore@Sun.COM 	MD5Init(&md5_ctx);
8139160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
8149160SSherry.Moore@Sun.COM 		MD5Update(&md5_ctx, nk->fi_files[i].fb_pte_list_va,
8159160SSherry.Moore@Sun.COM 		    nk->fi_files[i].fb_pte_list_size);
8169160SSherry.Moore@Sun.COM 	}
8179160SSherry.Moore@Sun.COM 	MD5Update(&md5_ctx, (void *)nk->fi_pagetable_va, nk->fi_pagetable_size);
8189160SSherry.Moore@Sun.COM 	MD5Update(&md5_ctx, (void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
8199160SSherry.Moore@Sun.COM 
8209160SSherry.Moore@Sun.COM 	MD5Final(md5_hash, &md5_ctx);
8219160SSherry.Moore@Sun.COM }
8229160SSherry.Moore@Sun.COM 
8239160SSherry.Moore@Sun.COM /*
8249160SSherry.Moore@Sun.COM  * Generate MD5 checksum of the given kernel.
8259160SSherry.Moore@Sun.COM  */
8269160SSherry.Moore@Sun.COM static void
8279160SSherry.Moore@Sun.COM fastboot_cksum_generate(fastboot_info_t *nk)
8289160SSherry.Moore@Sun.COM {
8299160SSherry.Moore@Sun.COM 	int i;
8309160SSherry.Moore@Sun.COM 
8319160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
8329160SSherry.Moore@Sun.COM 		fastboot_cksum_file(nk->fi_files + i, nk->fi_md5_hash[i]);
8339160SSherry.Moore@Sun.COM 	}
8349160SSherry.Moore@Sun.COM 	fastboot_cksum_cdata(nk, nk->fi_md5_hash[i]);
8359160SSherry.Moore@Sun.COM }
8369160SSherry.Moore@Sun.COM 
8379160SSherry.Moore@Sun.COM /*
8389160SSherry.Moore@Sun.COM  * Calculate MD5 checksum of the given kernel and verify that
8399160SSherry.Moore@Sun.COM  * it matches with what was calculated before.
8409160SSherry.Moore@Sun.COM  */
8419160SSherry.Moore@Sun.COM int
8429160SSherry.Moore@Sun.COM fastboot_cksum_verify(fastboot_info_t *nk)
8439160SSherry.Moore@Sun.COM {
8449160SSherry.Moore@Sun.COM 	int i;
8459160SSherry.Moore@Sun.COM 	uchar_t md5_hash[MD5_DIGEST_LENGTH];
8469160SSherry.Moore@Sun.COM 
8479160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
8489160SSherry.Moore@Sun.COM 		fastboot_cksum_file(nk->fi_files + i, md5_hash);
8499160SSherry.Moore@Sun.COM 		if (bcmp(nk->fi_md5_hash[i], md5_hash,
8509160SSherry.Moore@Sun.COM 		    sizeof (nk->fi_md5_hash[i])) != 0)
8519160SSherry.Moore@Sun.COM 			return (i + 1);
8529160SSherry.Moore@Sun.COM 	}
8539160SSherry.Moore@Sun.COM 
8549160SSherry.Moore@Sun.COM 	fastboot_cksum_cdata(nk, md5_hash);
8559160SSherry.Moore@Sun.COM 	if (bcmp(nk->fi_md5_hash[i], md5_hash,
8569160SSherry.Moore@Sun.COM 	    sizeof (nk->fi_md5_hash[i])) != 0)
8579160SSherry.Moore@Sun.COM 		return (i + 1);
8589160SSherry.Moore@Sun.COM 
8599160SSherry.Moore@Sun.COM 	return (0);
8607750SSherry.Moore@Sun.COM }
8617750SSherry.Moore@Sun.COM 
8627750SSherry.Moore@Sun.COM /*
8637750SSherry.Moore@Sun.COM  * This function performs the following tasks:
8647750SSherry.Moore@Sun.COM  * - Read the sizes of the new kernel and boot archive.
8657750SSherry.Moore@Sun.COM  * - Allocate memory for the new kernel and boot archive.
8667750SSherry.Moore@Sun.COM  * - Allocate memory for page tables necessary for mapping the memory
8677750SSherry.Moore@Sun.COM  *   allocated for the files.
8687750SSherry.Moore@Sun.COM  * - Read the new kernel and boot archive into memory.
8697750SSherry.Moore@Sun.COM  * - Map in the fast reboot switcher.
8707750SSherry.Moore@Sun.COM  * - Load the fast reboot switcher to FASTBOOT_SWTCH_PA.
8717750SSherry.Moore@Sun.COM  * - Build the new multiboot_info structure
8727750SSherry.Moore@Sun.COM  * - Build page tables for the low 1G of physical memory.
8737750SSherry.Moore@Sun.COM  * - Mark the data structure as valid if all steps have succeeded.
8747750SSherry.Moore@Sun.COM  */
8757750SSherry.Moore@Sun.COM void
8769160SSherry.Moore@Sun.COM fastboot_load_kernel(char *mdep)
8777750SSherry.Moore@Sun.COM {
8787750SSherry.Moore@Sun.COM 	void		*buf = NULL;
8797750SSherry.Moore@Sun.COM 	int		i;
8807750SSherry.Moore@Sun.COM 	fastboot_file_t	*fb;
8817750SSherry.Moore@Sun.COM 	uint32_t	dboot_start_offset;
8827750SSherry.Moore@Sun.COM 	char		kern_bootpath[OBP_MAXPATHLEN];
8837750SSherry.Moore@Sun.COM 	extern uintptr_t postbootkernelbase;
8849160SSherry.Moore@Sun.COM 	uintptr_t	saved_kernelbase;
8857750SSherry.Moore@Sun.COM 	int		bootpath_len = 0;
8867750SSherry.Moore@Sun.COM 	int		is_failsafe = 0;
8877750SSherry.Moore@Sun.COM 	int		is_retry = 0;
8887750SSherry.Moore@Sun.COM 	uint64_t	end_addr;
8897750SSherry.Moore@Sun.COM 
89010559SSherry.Moore@Sun.COM 	if (!fastreboot_capable)
89110559SSherry.Moore@Sun.COM 		return;
8927750SSherry.Moore@Sun.COM 
8939160SSherry.Moore@Sun.COM 	if (newkernel.fi_valid)
8949160SSherry.Moore@Sun.COM 		fastboot_free_newkernel(&newkernel);
8959160SSherry.Moore@Sun.COM 
8969160SSherry.Moore@Sun.COM 	saved_kernelbase = postbootkernelbase;
8979160SSherry.Moore@Sun.COM 
8987750SSherry.Moore@Sun.COM 	postbootkernelbase = 0;
8997750SSherry.Moore@Sun.COM 
9007750SSherry.Moore@Sun.COM 	/*
9017750SSherry.Moore@Sun.COM 	 * Initialize various HAT related fields in the data structure
9027750SSherry.Moore@Sun.COM 	 */
9037750SSherry.Moore@Sun.COM 	fastboot_init_fields(&newkernel);
9047750SSherry.Moore@Sun.COM 
9057750SSherry.Moore@Sun.COM 	bzero(kern_bootpath, OBP_MAXPATHLEN);
9067750SSherry.Moore@Sun.COM 
9077750SSherry.Moore@Sun.COM 	/*
9087750SSherry.Moore@Sun.COM 	 * Process the boot argument
9097750SSherry.Moore@Sun.COM 	 */
9109160SSherry.Moore@Sun.COM 	bzero(fastboot_args, OBP_MAXPATHLEN);
9119160SSherry.Moore@Sun.COM 	fastboot_parse_mdep(mdep, kern_bootpath, &bootpath_len, fastboot_args);
9127656SSherry.Moore@Sun.COM 
9137656SSherry.Moore@Sun.COM 	/*
9147656SSherry.Moore@Sun.COM 	 * Make sure we get the null character
9157656SSherry.Moore@Sun.COM 	 */
9167656SSherry.Moore@Sun.COM 	bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_UNIX],
9177656SSherry.Moore@Sun.COM 	    bootpath_len);
9187656SSherry.Moore@Sun.COM 	bcopy(kern_bootfile,
9197656SSherry.Moore@Sun.COM 	    &fastboot_filename[FASTBOOT_NAME_UNIX][bootpath_len],
9207656SSherry.Moore@Sun.COM 	    strlen(kern_bootfile) + 1);
9217656SSherry.Moore@Sun.COM 
9227656SSherry.Moore@Sun.COM 	bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE],
9237656SSherry.Moore@Sun.COM 	    bootpath_len);
9247656SSherry.Moore@Sun.COM 
9259160SSherry.Moore@Sun.COM 	if (bcmp(kern_bootfile, FAILSAFE_BOOTFILE32,
9269160SSherry.Moore@Sun.COM 	    (sizeof (FAILSAFE_BOOTFILE32) - 1)) == 0 ||
9279160SSherry.Moore@Sun.COM 	    bcmp(kern_bootfile, FAILSAFE_BOOTFILE64,
9289160SSherry.Moore@Sun.COM 	    (sizeof (FAILSAFE_BOOTFILE64) - 1)) == 0) {
9297656SSherry.Moore@Sun.COM 		is_failsafe = 1;
9307656SSherry.Moore@Sun.COM 	}
9317656SSherry.Moore@Sun.COM 
9327750SSherry.Moore@Sun.COM load_kernel_retry:
9337656SSherry.Moore@Sun.COM 	/*
9347656SSherry.Moore@Sun.COM 	 * Read in unix and boot_archive
9357656SSherry.Moore@Sun.COM 	 */
9367750SSherry.Moore@Sun.COM 	end_addr = DBOOT_ENTRY_ADDRESS;
9377656SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
9387750SSherry.Moore@Sun.COM 		struct _buf	*file;
9397750SSherry.Moore@Sun.COM 		uintptr_t	va;
9407750SSherry.Moore@Sun.COM 		uint64_t	fsize;
9417750SSherry.Moore@Sun.COM 		size_t		fsize_roundup, pt_size;
9427750SSherry.Moore@Sun.COM 		int		page_index;
9437750SSherry.Moore@Sun.COM 		uintptr_t	offset;
9447656SSherry.Moore@Sun.COM 		ddi_dma_attr_t dma_attr = fastboot_dma_attr;
9457656SSherry.Moore@Sun.COM 
9467750SSherry.Moore@Sun.COM 
9477656SSherry.Moore@Sun.COM 		dprintf("fastboot_filename[%d] = %s\n",
9487656SSherry.Moore@Sun.COM 		    i, fastboot_filename[i]);
9497656SSherry.Moore@Sun.COM 
9507656SSherry.Moore@Sun.COM 		if ((file = kobj_open_file(fastboot_filename[i])) ==
9517656SSherry.Moore@Sun.COM 		    (struct _buf *)-1) {
952*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE, "!Fastboot: Couldn't open %s",
9537656SSherry.Moore@Sun.COM 			    fastboot_filename[i]);
9547656SSherry.Moore@Sun.COM 			goto err_out;
9557656SSherry.Moore@Sun.COM 		}
9567656SSherry.Moore@Sun.COM 
9577656SSherry.Moore@Sun.COM 		if (kobj_get_filesize(file, &fsize) != 0) {
958*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE,
959*10970SSherry.Moore@Sun.COM 			    "!Fastboot: Couldn't get filesize for %s",
9607656SSherry.Moore@Sun.COM 			    fastboot_filename[i]);
9617656SSherry.Moore@Sun.COM 			goto err_out;
9627656SSherry.Moore@Sun.COM 		}
9637656SSherry.Moore@Sun.COM 
9647750SSherry.Moore@Sun.COM 		fsize_roundup = P2ROUNDUP_TYPED(fsize, PAGESIZE, size_t);
9657750SSherry.Moore@Sun.COM 
9667750SSherry.Moore@Sun.COM 		/*
9677750SSherry.Moore@Sun.COM 		 * Where the files end in physical memory after being
9687750SSherry.Moore@Sun.COM 		 * relocated by the fast boot switcher.
9697750SSherry.Moore@Sun.COM 		 */
9707750SSherry.Moore@Sun.COM 		end_addr += fsize_roundup;
9717750SSherry.Moore@Sun.COM 		if (end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_hi) {
972*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE, "!Fastboot: boot archive is too big");
9737750SSherry.Moore@Sun.COM 			goto err_out;
9747656SSherry.Moore@Sun.COM 		}
9757656SSherry.Moore@Sun.COM 
9767750SSherry.Moore@Sun.COM 		/*
9777750SSherry.Moore@Sun.COM 		 * Adjust dma_attr_addr_lo so that the new kernel and boot
9787750SSherry.Moore@Sun.COM 		 * archive will not be overridden during relocation.
9797750SSherry.Moore@Sun.COM 		 */
9807750SSherry.Moore@Sun.COM 		if (end_addr > fastboot_dma_attr.dma_attr_addr_lo ||
9817750SSherry.Moore@Sun.COM 		    end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_lo) {
9827750SSherry.Moore@Sun.COM 
9837750SSherry.Moore@Sun.COM 			if (is_retry) {
9847750SSherry.Moore@Sun.COM 				/*
9857750SSherry.Moore@Sun.COM 				 * If we have already tried and didn't succeed,
9867750SSherry.Moore@Sun.COM 				 * just give up.
9877750SSherry.Moore@Sun.COM 				 */
988*10970SSherry.Moore@Sun.COM 				cmn_err(CE_NOTE,
989*10970SSherry.Moore@Sun.COM 				    "!Fastboot: boot archive is too big");
9907750SSherry.Moore@Sun.COM 				goto err_out;
9917750SSherry.Moore@Sun.COM 			} else {
9927750SSherry.Moore@Sun.COM 				/* Set the flag so we don't keep retrying */
9937750SSherry.Moore@Sun.COM 				is_retry++;
9947750SSherry.Moore@Sun.COM 
9957750SSherry.Moore@Sun.COM 				/* Adjust dma_attr_addr_lo */
9967750SSherry.Moore@Sun.COM 				fastboot_dma_attr.dma_attr_addr_lo = end_addr;
9977750SSherry.Moore@Sun.COM 				fastboot_below_1G_dma_attr.dma_attr_addr_lo =
9987750SSherry.Moore@Sun.COM 				    end_addr;
9997750SSherry.Moore@Sun.COM 
10007750SSherry.Moore@Sun.COM 				/*
10017750SSherry.Moore@Sun.COM 				 * Free the memory we have already allocated
10027750SSherry.Moore@Sun.COM 				 * whose physical addresses might not fit
10037750SSherry.Moore@Sun.COM 				 * the new lo and hi constraints.
10047750SSherry.Moore@Sun.COM 				 */
10059160SSherry.Moore@Sun.COM 				fastboot_free_mem(&newkernel, end_addr);
10067750SSherry.Moore@Sun.COM 				goto load_kernel_retry;
10077750SSherry.Moore@Sun.COM 			}
10087750SSherry.Moore@Sun.COM 		}
10097750SSherry.Moore@Sun.COM 
10107750SSherry.Moore@Sun.COM 
10117656SSherry.Moore@Sun.COM 		if (!fastboot_contig)
10127656SSherry.Moore@Sun.COM 			dma_attr.dma_attr_sgllen = (fsize / PAGESIZE) +
10137656SSherry.Moore@Sun.COM 			    (((fsize % PAGESIZE) == 0) ? 0 : 1);
10147656SSherry.Moore@Sun.COM 
10157656SSherry.Moore@Sun.COM 		if ((buf = contig_alloc(fsize, &dma_attr, PAGESIZE, 0))
10167656SSherry.Moore@Sun.COM 		    == NULL) {
1017*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE, fastboot_enomem_msg, fsize, "64G");
10187656SSherry.Moore@Sun.COM 			goto err_out;
10197656SSherry.Moore@Sun.COM 		}
10207656SSherry.Moore@Sun.COM 
10217656SSherry.Moore@Sun.COM 		va = P2ROUNDUP_TYPED((uintptr_t)buf, PAGESIZE, uintptr_t);
10227656SSherry.Moore@Sun.COM 
10237656SSherry.Moore@Sun.COM 		if (kobj_read_file(file, (char *)va, fsize, 0) < 0) {
1024*10970SSherry.Moore@Sun.COM 			cmn_err(CE_NOTE, "!Fastboot: Couldn't read %s",
10257656SSherry.Moore@Sun.COM 			    fastboot_filename[i]);
10267656SSherry.Moore@Sun.COM 			goto err_out;
10277656SSherry.Moore@Sun.COM 		}
10287656SSherry.Moore@Sun.COM 
10297656SSherry.Moore@Sun.COM 		fb = &newkernel.fi_files[i];
10307656SSherry.Moore@Sun.COM 		fb->fb_va = va;
10317656SSherry.Moore@Sun.COM 		fb->fb_size = fsize;
10327656SSherry.Moore@Sun.COM 		fb->fb_sectcnt = 0;
10337656SSherry.Moore@Sun.COM 
10349160SSherry.Moore@Sun.COM 		pt_size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup);
10357656SSherry.Moore@Sun.COM 
10369160SSherry.Moore@Sun.COM 		/*
10379160SSherry.Moore@Sun.COM 		 * If we have reserved memory but it is not enough, free it.
10389160SSherry.Moore@Sun.COM 		 */
10399160SSherry.Moore@Sun.COM 		if (fb->fb_pte_list_size && fb->fb_pte_list_size < pt_size) {
10409160SSherry.Moore@Sun.COM 			contig_free((void *)fb->fb_pte_list_va,
10419160SSherry.Moore@Sun.COM 			    fb->fb_pte_list_size);
10429160SSherry.Moore@Sun.COM 			fb->fb_pte_list_size = 0;
10437656SSherry.Moore@Sun.COM 		}
10447656SSherry.Moore@Sun.COM 
10459160SSherry.Moore@Sun.COM 		if (fb->fb_pte_list_size == 0) {
10469160SSherry.Moore@Sun.COM 			if ((fb->fb_pte_list_va =
10479160SSherry.Moore@Sun.COM 			    (x86pte_t *)contig_alloc(pt_size,
10489160SSherry.Moore@Sun.COM 			    &fastboot_below_1G_dma_attr, PAGESIZE, 0))
10499160SSherry.Moore@Sun.COM 			    == NULL) {
1050*10970SSherry.Moore@Sun.COM 				cmn_err(CE_NOTE, fastboot_enomem_msg,
10519160SSherry.Moore@Sun.COM 				    (uint64_t)pt_size, "1G");
10529160SSherry.Moore@Sun.COM 				goto err_out;
10539160SSherry.Moore@Sun.COM 			}
10549160SSherry.Moore@Sun.COM 			/*
10559160SSherry.Moore@Sun.COM 			 * fb_pte_list_size must be set after the allocation
10569160SSherry.Moore@Sun.COM 			 * succeeds as it's used to determine how much memory to
10579160SSherry.Moore@Sun.COM 			 * free.
10589160SSherry.Moore@Sun.COM 			 */
10599160SSherry.Moore@Sun.COM 			fb->fb_pte_list_size = pt_size;
10609160SSherry.Moore@Sun.COM 		}
10619160SSherry.Moore@Sun.COM 
10629160SSherry.Moore@Sun.COM 		bzero((void *)(fb->fb_pte_list_va), fb->fb_pte_list_size);
10637656SSherry.Moore@Sun.COM 
10647656SSherry.Moore@Sun.COM 		fb->fb_pte_list_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
10657656SSherry.Moore@Sun.COM 		    (caddr_t)fb->fb_pte_list_va));
10667656SSherry.Moore@Sun.COM 
10677656SSherry.Moore@Sun.COM 		for (page_index = 0, offset = 0; offset < fb->fb_size;
10687656SSherry.Moore@Sun.COM 		    offset += PAGESIZE) {
10697656SSherry.Moore@Sun.COM 			uint64_t paddr;
10707656SSherry.Moore@Sun.COM 
10717656SSherry.Moore@Sun.COM 			paddr = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
10727656SSherry.Moore@Sun.COM 			    (caddr_t)fb->fb_va + offset));
10737656SSherry.Moore@Sun.COM 
10747656SSherry.Moore@Sun.COM 			ASSERT(paddr >= fastboot_dma_attr.dma_attr_addr_lo);
10757656SSherry.Moore@Sun.COM 
10767656SSherry.Moore@Sun.COM 			/*
10777656SSherry.Moore@Sun.COM 			 * Include the pte_bits so we don't have to make
10787656SSherry.Moore@Sun.COM 			 * it in assembly.
10797656SSherry.Moore@Sun.COM 			 */
10807656SSherry.Moore@Sun.COM 			fb->fb_pte_list_va[page_index++] = (x86pte_t)
10817656SSherry.Moore@Sun.COM 			    (paddr | pte_bits);
10827656SSherry.Moore@Sun.COM 		}
10837656SSherry.Moore@Sun.COM 
10847656SSherry.Moore@Sun.COM 		fb->fb_pte_list_va[page_index] = FASTBOOT_TERMINATE;
10857656SSherry.Moore@Sun.COM 
10867656SSherry.Moore@Sun.COM 		if (i == FASTBOOT_UNIX) {
10877750SSherry.Moore@Sun.COM 			Ehdr	*ehdr = (Ehdr *)va;
10887750SSherry.Moore@Sun.COM 			int	j;
10897656SSherry.Moore@Sun.COM 
10907656SSherry.Moore@Sun.COM 			/*
10917656SSherry.Moore@Sun.COM 			 * Sanity checks:
10927656SSherry.Moore@Sun.COM 			 */
10937656SSherry.Moore@Sun.COM 			for (j = 0; j < SELFMAG; j++) {
10947656SSherry.Moore@Sun.COM 				if (ehdr->e_ident[j] != ELFMAG[j]) {
1095*10970SSherry.Moore@Sun.COM 					cmn_err(CE_NOTE, "!Fastboot: Bad ELF "
10967656SSherry.Moore@Sun.COM 					    "signature");
10977656SSherry.Moore@Sun.COM 					goto err_out;
10987656SSherry.Moore@Sun.COM 				}
10997656SSherry.Moore@Sun.COM 			}
11007656SSherry.Moore@Sun.COM 
11017656SSherry.Moore@Sun.COM 			if (ehdr->e_ident[EI_CLASS] == ELFCLASS32 &&
11027656SSherry.Moore@Sun.COM 			    ehdr->e_ident[EI_DATA] == ELFDATA2LSB &&
11037656SSherry.Moore@Sun.COM 			    ehdr->e_machine == EM_386) {
11047656SSherry.Moore@Sun.COM 
11058151SKonstantin.Ananyev@Sun.COM 				fb->fb_sectcnt = sizeof (fb->fb_sections) /
11068151SKonstantin.Ananyev@Sun.COM 				    sizeof (fb->fb_sections[0]);
11078151SKonstantin.Ananyev@Sun.COM 
11087656SSherry.Moore@Sun.COM 				if (fastboot_elf32_find_loadables((void *)va,
11097656SSherry.Moore@Sun.COM 				    fsize, &fb->fb_sections[0],
11107656SSherry.Moore@Sun.COM 				    &fb->fb_sectcnt, &dboot_start_offset) < 0) {
1111*10970SSherry.Moore@Sun.COM 					cmn_err(CE_NOTE, "!Fastboot: ELF32 "
11127656SSherry.Moore@Sun.COM 					    "program section failure");
11137656SSherry.Moore@Sun.COM 					goto err_out;
11147656SSherry.Moore@Sun.COM 				}
11157656SSherry.Moore@Sun.COM 
11167656SSherry.Moore@Sun.COM 				if (fb->fb_sectcnt == 0) {
1117*10970SSherry.Moore@Sun.COM 					cmn_err(CE_NOTE, "!Fastboot: No ELF32 "
11187656SSherry.Moore@Sun.COM 					    "program sections found");
11197656SSherry.Moore@Sun.COM 					goto err_out;
11207656SSherry.Moore@Sun.COM 				}
11217656SSherry.Moore@Sun.COM 
11227656SSherry.Moore@Sun.COM 				if (is_failsafe) {
11237656SSherry.Moore@Sun.COM 					/* Failsafe boot_archive */
11249160SSherry.Moore@Sun.COM 					bcopy(BOOTARCHIVE32_FAILSAFE,
11257656SSherry.Moore@Sun.COM 					    &fastboot_filename
11267656SSherry.Moore@Sun.COM 					    [FASTBOOT_NAME_BOOTARCHIVE]
11277656SSherry.Moore@Sun.COM 					    [bootpath_len],
11289160SSherry.Moore@Sun.COM 					    sizeof (BOOTARCHIVE32_FAILSAFE));
11297656SSherry.Moore@Sun.COM 				} else {
11307656SSherry.Moore@Sun.COM 					bcopy(BOOTARCHIVE32,
11317656SSherry.Moore@Sun.COM 					    &fastboot_filename
11327656SSherry.Moore@Sun.COM 					    [FASTBOOT_NAME_BOOTARCHIVE]
11337656SSherry.Moore@Sun.COM 					    [bootpath_len],
11347656SSherry.Moore@Sun.COM 					    sizeof (BOOTARCHIVE32));
11357656SSherry.Moore@Sun.COM 				}
11367656SSherry.Moore@Sun.COM 
11377656SSherry.Moore@Sun.COM 			} else if (ehdr->e_ident[EI_CLASS] == ELFCLASS64 &&
11387656SSherry.Moore@Sun.COM 			    ehdr->e_ident[EI_DATA] == ELFDATA2LSB &&
11397656SSherry.Moore@Sun.COM 			    ehdr->e_machine == EM_AMD64) {
11407656SSherry.Moore@Sun.COM 
11417656SSherry.Moore@Sun.COM 				if (fastboot_elf64_find_dboot_load_offset(
11427656SSherry.Moore@Sun.COM 				    (void *)va, fsize, &dboot_start_offset)
11437656SSherry.Moore@Sun.COM 				    != 0) {
1144*10970SSherry.Moore@Sun.COM 					cmn_err(CE_NOTE, "!Fastboot: Couldn't "
11457656SSherry.Moore@Sun.COM 					    "find ELF64 dboot entry offset");
11467656SSherry.Moore@Sun.COM 					goto err_out;
11477656SSherry.Moore@Sun.COM 				}
11487656SSherry.Moore@Sun.COM 
11497656SSherry.Moore@Sun.COM 				if ((x86_feature & X86_64) == 0 ||
11508151SKonstantin.Ananyev@Sun.COM 				    (x86_feature & X86_PAE) == 0) {
1151*10970SSherry.Moore@Sun.COM 					cmn_err(CE_NOTE, "!Fastboot: Cannot "
11527656SSherry.Moore@Sun.COM 					    "reboot to %s: "
11537656SSherry.Moore@Sun.COM 					    "not a 64-bit capable system",
11547656SSherry.Moore@Sun.COM 					    kern_bootfile);
11557656SSherry.Moore@Sun.COM 					goto err_out;
11567656SSherry.Moore@Sun.COM 				}
11577656SSherry.Moore@Sun.COM 
11589160SSherry.Moore@Sun.COM 				if (is_failsafe) {
11599160SSherry.Moore@Sun.COM 					/* Failsafe boot_archive */
11609160SSherry.Moore@Sun.COM 					bcopy(BOOTARCHIVE64_FAILSAFE,
11619160SSherry.Moore@Sun.COM 					    &fastboot_filename
11629160SSherry.Moore@Sun.COM 					    [FASTBOOT_NAME_BOOTARCHIVE]
11639160SSherry.Moore@Sun.COM 					    [bootpath_len],
11649160SSherry.Moore@Sun.COM 					    sizeof (BOOTARCHIVE64_FAILSAFE));
11659160SSherry.Moore@Sun.COM 				} else {
11669160SSherry.Moore@Sun.COM 					bcopy(BOOTARCHIVE64,
11679160SSherry.Moore@Sun.COM 					    &fastboot_filename
11689160SSherry.Moore@Sun.COM 					    [FASTBOOT_NAME_BOOTARCHIVE]
11699160SSherry.Moore@Sun.COM 					    [bootpath_len],
11709160SSherry.Moore@Sun.COM 					    sizeof (BOOTARCHIVE64));
11719160SSherry.Moore@Sun.COM 				}
11727656SSherry.Moore@Sun.COM 			} else {
1173*10970SSherry.Moore@Sun.COM 				cmn_err(CE_NOTE, "!Fastboot: Unknown ELF type");
11747656SSherry.Moore@Sun.COM 				goto err_out;
11757656SSherry.Moore@Sun.COM 			}
11767656SSherry.Moore@Sun.COM 
11777656SSherry.Moore@Sun.COM 			fb->fb_dest_pa = DBOOT_ENTRY_ADDRESS -
11787656SSherry.Moore@Sun.COM 			    dboot_start_offset;
11797656SSherry.Moore@Sun.COM 
11807656SSherry.Moore@Sun.COM 			fb->fb_next_pa = DBOOT_ENTRY_ADDRESS + fsize_roundup;
11817656SSherry.Moore@Sun.COM 		} else {
11827656SSherry.Moore@Sun.COM 			fb->fb_dest_pa = newkernel.fi_files[i - 1].fb_next_pa;
11837656SSherry.Moore@Sun.COM 			fb->fb_next_pa = fb->fb_dest_pa + fsize_roundup;
11847656SSherry.Moore@Sun.COM 		}
11857656SSherry.Moore@Sun.COM 
11867656SSherry.Moore@Sun.COM 		kobj_close_file(file);
11877656SSherry.Moore@Sun.COM 
11887656SSherry.Moore@Sun.COM 	}
11897656SSherry.Moore@Sun.COM 
11907750SSherry.Moore@Sun.COM 	/*
11917656SSherry.Moore@Sun.COM 	 * Add the function that will switch us to 32-bit protected mode
11927656SSherry.Moore@Sun.COM 	 */
11937656SSherry.Moore@Sun.COM 	fb = &newkernel.fi_files[FASTBOOT_SWTCH];
11947656SSherry.Moore@Sun.COM 	fb->fb_va = fb->fb_dest_pa = FASTBOOT_SWTCH_PA;
11958151SKonstantin.Ananyev@Sun.COM 	fb->fb_size = MMU_PAGESIZE;
11967656SSherry.Moore@Sun.COM 
11979160SSherry.Moore@Sun.COM 	hat_devload(kas.a_hat, (caddr_t)fb->fb_va,
11989160SSherry.Moore@Sun.COM 	    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
11999160SSherry.Moore@Sun.COM 	    PROT_READ | PROT_WRITE | PROT_EXEC,
12009160SSherry.Moore@Sun.COM 	    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
12017656SSherry.Moore@Sun.COM 
12027656SSherry.Moore@Sun.COM 	/*
12037656SSherry.Moore@Sun.COM 	 * Build the new multiboot_info structure
12047656SSherry.Moore@Sun.COM 	 */
12059160SSherry.Moore@Sun.COM 	if (fastboot_build_mbi(fastboot_args, &newkernel) != 0) {
12067656SSherry.Moore@Sun.COM 		goto err_out;
12077656SSherry.Moore@Sun.COM 	}
12087656SSherry.Moore@Sun.COM 
12097656SSherry.Moore@Sun.COM 	/*
12107656SSherry.Moore@Sun.COM 	 * Build page table for low 1G physical memory. Use big pages.
12118151SKonstantin.Ananyev@Sun.COM 	 * Allocate 4 (5 for amd64) pages for the page tables.
12128151SKonstantin.Ananyev@Sun.COM 	 *    1 page for PML4 (amd64)
12137656SSherry.Moore@Sun.COM 	 *    1 page for Page-Directory-Pointer Table
12148151SKonstantin.Ananyev@Sun.COM 	 *    2 pages for Page Directory
12157656SSherry.Moore@Sun.COM 	 *    1 page for Page Table.
12167656SSherry.Moore@Sun.COM 	 * The page table entry will be rewritten to map the physical
12177656SSherry.Moore@Sun.COM 	 * address as we do the copying.
12187656SSherry.Moore@Sun.COM 	 */
12197656SSherry.Moore@Sun.COM 	if (newkernel.fi_has_pae) {
12208151SKonstantin.Ananyev@Sun.COM #ifdef	__amd64
12218151SKonstantin.Ananyev@Sun.COM 		size_t size = MMU_PAGESIZE * 5;
12228151SKonstantin.Ananyev@Sun.COM #else
12237656SSherry.Moore@Sun.COM 		size_t size = MMU_PAGESIZE * 4;
12248151SKonstantin.Ananyev@Sun.COM #endif	/* __amd64 */
12257656SSherry.Moore@Sun.COM 
12269160SSherry.Moore@Sun.COM 		if (newkernel.fi_pagetable_size && newkernel.fi_pagetable_size
12279160SSherry.Moore@Sun.COM 		    < size) {
12289160SSherry.Moore@Sun.COM 			contig_free((void *)newkernel.fi_pagetable_va,
12299160SSherry.Moore@Sun.COM 			    newkernel.fi_pagetable_size);
12309160SSherry.Moore@Sun.COM 			newkernel.fi_pagetable_size = 0;
12319160SSherry.Moore@Sun.COM 		}
12329160SSherry.Moore@Sun.COM 
12339160SSherry.Moore@Sun.COM 		if (newkernel.fi_pagetable_size == 0) {
12349160SSherry.Moore@Sun.COM 			if ((newkernel.fi_pagetable_va = (uintptr_t)
12359160SSherry.Moore@Sun.COM 			    contig_alloc(size, &fastboot_below_1G_dma_attr,
12369160SSherry.Moore@Sun.COM 			    MMU_PAGESIZE, 0)) == NULL) {
1237*10970SSherry.Moore@Sun.COM 				cmn_err(CE_NOTE, fastboot_enomem_msg,
12389160SSherry.Moore@Sun.COM 				    (uint64_t)size, "1G");
12399160SSherry.Moore@Sun.COM 				goto err_out;
12409160SSherry.Moore@Sun.COM 			}
12419160SSherry.Moore@Sun.COM 			/*
12429160SSherry.Moore@Sun.COM 			 * fi_pagetable_size must be set after the allocation
12439160SSherry.Moore@Sun.COM 			 * succeeds as it's used to determine how much memory to
12449160SSherry.Moore@Sun.COM 			 * free.
12459160SSherry.Moore@Sun.COM 			 */
12469160SSherry.Moore@Sun.COM 			newkernel.fi_pagetable_size = size;
12477656SSherry.Moore@Sun.COM 		}
12487656SSherry.Moore@Sun.COM 
12497656SSherry.Moore@Sun.COM 		bzero((void *)(newkernel.fi_pagetable_va), size);
12507656SSherry.Moore@Sun.COM 
12517656SSherry.Moore@Sun.COM 		newkernel.fi_pagetable_pa =
12527656SSherry.Moore@Sun.COM 		    mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
12537656SSherry.Moore@Sun.COM 		    (caddr_t)newkernel.fi_pagetable_va));
12547656SSherry.Moore@Sun.COM 
12557656SSherry.Moore@Sun.COM 		newkernel.fi_last_table_pa = newkernel.fi_pagetable_pa +
12568151SKonstantin.Ananyev@Sun.COM 		    size - MMU_PAGESIZE;
12577656SSherry.Moore@Sun.COM 
12587656SSherry.Moore@Sun.COM 		newkernel.fi_next_table_va = newkernel.fi_pagetable_va +
12597656SSherry.Moore@Sun.COM 		    MMU_PAGESIZE;
12607656SSherry.Moore@Sun.COM 		newkernel.fi_next_table_pa = newkernel.fi_pagetable_pa +
12617656SSherry.Moore@Sun.COM 		    MMU_PAGESIZE;
12627656SSherry.Moore@Sun.COM 
12637656SSherry.Moore@Sun.COM 		fastboot_build_pagetables(&newkernel);
12647656SSherry.Moore@Sun.COM 	}
12657656SSherry.Moore@Sun.COM 
12667656SSherry.Moore@Sun.COM 
12679160SSherry.Moore@Sun.COM 	/* Generate MD5 checksums */
12689160SSherry.Moore@Sun.COM 	fastboot_cksum_generate(&newkernel);
12699160SSherry.Moore@Sun.COM 
12707656SSherry.Moore@Sun.COM 	/* Mark it as valid */
12717656SSherry.Moore@Sun.COM 	newkernel.fi_valid = 1;
12727656SSherry.Moore@Sun.COM 	newkernel.fi_magic = FASTBOOT_MAGIC;
12737656SSherry.Moore@Sun.COM 
12749160SSherry.Moore@Sun.COM 	postbootkernelbase = saved_kernelbase;
12757656SSherry.Moore@Sun.COM 	return;
12767656SSherry.Moore@Sun.COM 
12777656SSherry.Moore@Sun.COM err_out:
12789160SSherry.Moore@Sun.COM 	postbootkernelbase = saved_kernelbase;
12797656SSherry.Moore@Sun.COM 	newkernel.fi_valid = 0;
12809160SSherry.Moore@Sun.COM 	fastboot_free_newkernel(&newkernel);
12819160SSherry.Moore@Sun.COM }
12829160SSherry.Moore@Sun.COM 
12839160SSherry.Moore@Sun.COM 
12849160SSherry.Moore@Sun.COM /* ARGSUSED */
12859160SSherry.Moore@Sun.COM static int
12869160SSherry.Moore@Sun.COM fastboot_xc_func(fastboot_info_t *nk, xc_arg_t unused2, xc_arg_t unused3)
12879160SSherry.Moore@Sun.COM {
12889160SSherry.Moore@Sun.COM 	void (*fastboot_func)(fastboot_info_t *);
12899160SSherry.Moore@Sun.COM 	fastboot_file_t	*fb = &nk->fi_files[FASTBOOT_SWTCH];
12909160SSherry.Moore@Sun.COM 	fastboot_func = (void (*)())(fb->fb_va);
12919160SSherry.Moore@Sun.COM 	kthread_t *t_intr = curthread->t_intr;
12929160SSherry.Moore@Sun.COM 
12939160SSherry.Moore@Sun.COM 	if (&kas != curproc->p_as) {
12949160SSherry.Moore@Sun.COM 		hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va,
12959160SSherry.Moore@Sun.COM 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
12969160SSherry.Moore@Sun.COM 		    PROT_READ | PROT_WRITE | PROT_EXEC,
12979160SSherry.Moore@Sun.COM 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
12989160SSherry.Moore@Sun.COM 	}
12999160SSherry.Moore@Sun.COM 
13009160SSherry.Moore@Sun.COM 	/*
13019160SSherry.Moore@Sun.COM 	 * If we have pinned a thread, make sure the address is mapped
13029160SSherry.Moore@Sun.COM 	 * in the address space of the pinned thread.
13039160SSherry.Moore@Sun.COM 	 */
13049160SSherry.Moore@Sun.COM 	if (t_intr && t_intr->t_procp->p_as->a_hat != curproc->p_as->a_hat &&
13059160SSherry.Moore@Sun.COM 	    t_intr->t_procp->p_as != &kas)
13069160SSherry.Moore@Sun.COM 		hat_devload(t_intr->t_procp->p_as->a_hat, (caddr_t)fb->fb_va,
13079160SSherry.Moore@Sun.COM 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
13089160SSherry.Moore@Sun.COM 		    PROT_READ | PROT_WRITE | PROT_EXEC,
13099160SSherry.Moore@Sun.COM 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
13109160SSherry.Moore@Sun.COM 
13119160SSherry.Moore@Sun.COM 	(*psm_shutdownf)(A_SHUTDOWN, AD_FASTREBOOT);
13129160SSherry.Moore@Sun.COM 	(*fastboot_func)(nk);
13139160SSherry.Moore@Sun.COM 
13149160SSherry.Moore@Sun.COM 	/*NOTREACHED*/
13159160SSherry.Moore@Sun.COM 	return (0);
13167656SSherry.Moore@Sun.COM }
13177656SSherry.Moore@Sun.COM 
13187750SSherry.Moore@Sun.COM /*
13197750SSherry.Moore@Sun.COM  * Jump to the fast reboot switcher.  This function never returns.
13207750SSherry.Moore@Sun.COM  */
13217656SSherry.Moore@Sun.COM void
13227656SSherry.Moore@Sun.COM fast_reboot()
13237656SSherry.Moore@Sun.COM {
13249160SSherry.Moore@Sun.COM 	processorid_t bootcpuid = 0;
13259160SSherry.Moore@Sun.COM 	extern uintptr_t postbootkernelbase;
13269160SSherry.Moore@Sun.COM 	extern char	fb_swtch_image[];
13279160SSherry.Moore@Sun.COM 	fastboot_file_t	*fb;
13289160SSherry.Moore@Sun.COM 	int i;
13299160SSherry.Moore@Sun.COM 
13309160SSherry.Moore@Sun.COM 	postbootkernelbase = 0;
13319160SSherry.Moore@Sun.COM 
13329160SSherry.Moore@Sun.COM 	fb = &newkernel.fi_files[FASTBOOT_SWTCH];
13339160SSherry.Moore@Sun.COM 
13349160SSherry.Moore@Sun.COM 	/*
13359160SSherry.Moore@Sun.COM 	 * Map the address into both the current proc's address
13369160SSherry.Moore@Sun.COM 	 * space and the kernel's address space in case the panic
13379160SSherry.Moore@Sun.COM 	 * is forced by kmdb.
13389160SSherry.Moore@Sun.COM 	 */
13399160SSherry.Moore@Sun.COM 	if (&kas != curproc->p_as) {
13409160SSherry.Moore@Sun.COM 		hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va,
13419160SSherry.Moore@Sun.COM 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
13429160SSherry.Moore@Sun.COM 		    PROT_READ | PROT_WRITE | PROT_EXEC,
13439160SSherry.Moore@Sun.COM 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
13449160SSherry.Moore@Sun.COM 	}
13459160SSherry.Moore@Sun.COM 
13469160SSherry.Moore@Sun.COM 	bcopy((void *)fb_swtch_image, (void *)fb->fb_va, fb->fb_size);
13479160SSherry.Moore@Sun.COM 
13489160SSherry.Moore@Sun.COM 
13499160SSherry.Moore@Sun.COM 	/*
13509160SSherry.Moore@Sun.COM 	 * Set fb_va to fake_va
13519160SSherry.Moore@Sun.COM 	 */
13529160SSherry.Moore@Sun.COM 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
13539160SSherry.Moore@Sun.COM 		newkernel.fi_files[i].fb_va = fake_va;
13549160SSherry.Moore@Sun.COM 
13559160SSherry.Moore@Sun.COM 	}
13569160SSherry.Moore@Sun.COM 
13579160SSherry.Moore@Sun.COM 	if (panicstr && CPU->cpu_id != bootcpuid &&
13589160SSherry.Moore@Sun.COM 	    CPU_ACTIVE(cpu_get(bootcpuid))) {
13599489SJoe.Bonasera@sun.com 		extern void panic_idle(void);
13609160SSherry.Moore@Sun.COM 		cpuset_t cpuset;
13619160SSherry.Moore@Sun.COM 
13629160SSherry.Moore@Sun.COM 		CPUSET_ZERO(cpuset);
13639160SSherry.Moore@Sun.COM 		CPUSET_ADD(cpuset, bootcpuid);
13649489SJoe.Bonasera@sun.com 		xc_priority((xc_arg_t)&newkernel, 0, 0, CPUSET2BV(cpuset),
13659160SSherry.Moore@Sun.COM 		    (xc_func_t)fastboot_xc_func);
13669160SSherry.Moore@Sun.COM 
13679489SJoe.Bonasera@sun.com 		panic_idle();
13689160SSherry.Moore@Sun.COM 	} else
13699160SSherry.Moore@Sun.COM 		(void) fastboot_xc_func(&newkernel, 0, 0);
13709160SSherry.Moore@Sun.COM }
13719160SSherry.Moore@Sun.COM 
13729160SSherry.Moore@Sun.COM 
13739160SSherry.Moore@Sun.COM /*
13749160SSherry.Moore@Sun.COM  * Get boot property value for fastreboot_onpanic.
13759160SSherry.Moore@Sun.COM  *
13769160SSherry.Moore@Sun.COM  * NOTE: If fastreboot_onpanic is set to non-zero in /etc/system,
13779160SSherry.Moore@Sun.COM  * new setting passed in via "-B fastreboot_onpanic" is ignored.
13789160SSherry.Moore@Sun.COM  * This order of precedence is to enable developers debugging panics
13799160SSherry.Moore@Sun.COM  * that occur early in boot to utilize Fast Reboot on panic.
13809160SSherry.Moore@Sun.COM  */
13819160SSherry.Moore@Sun.COM static void
13829160SSherry.Moore@Sun.COM fastboot_get_bootprop(void)
13839160SSherry.Moore@Sun.COM {
13849160SSherry.Moore@Sun.COM 	int		val = 0xaa, len, ret;
13859160SSherry.Moore@Sun.COM 	dev_info_t	*devi;
13869160SSherry.Moore@Sun.COM 	char		*propstr = NULL;
13879160SSherry.Moore@Sun.COM 
13889160SSherry.Moore@Sun.COM 	devi = ddi_root_node();
13897656SSherry.Moore@Sun.COM 
13909160SSherry.Moore@Sun.COM 	ret = ddi_prop_lookup_string(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
13919160SSherry.Moore@Sun.COM 	    FASTREBOOT_ONPANIC, &propstr);
13929160SSherry.Moore@Sun.COM 
13939160SSherry.Moore@Sun.COM 	if (ret == DDI_PROP_SUCCESS) {
13949160SSherry.Moore@Sun.COM 		if (FASTREBOOT_ONPANIC_NOTSET(propstr))
13959160SSherry.Moore@Sun.COM 			val = 0;
13969160SSherry.Moore@Sun.COM 		else if (FASTREBOOT_ONPANIC_ISSET(propstr))
13979160SSherry.Moore@Sun.COM 			val = UA_FASTREBOOT_ONPANIC;
13989160SSherry.Moore@Sun.COM 
13999160SSherry.Moore@Sun.COM 		/*
14009160SSherry.Moore@Sun.COM 		 * Only set fastreboot_onpanic to the value passed in
14019160SSherry.Moore@Sun.COM 		 * if it's not already set to non-zero, and the value
14029160SSherry.Moore@Sun.COM 		 * has indeed been passed in via command line.
14039160SSherry.Moore@Sun.COM 		 */
14049160SSherry.Moore@Sun.COM 		if (!fastreboot_onpanic && val != 0xaa)
14059160SSherry.Moore@Sun.COM 			fastreboot_onpanic = val;
14069160SSherry.Moore@Sun.COM 		ddi_prop_free(propstr);
14079160SSherry.Moore@Sun.COM 	} else if (ret != DDI_PROP_NOT_FOUND && ret != DDI_PROP_UNDEFINED) {
1408*10970SSherry.Moore@Sun.COM 		cmn_err(CE_NOTE, "!%s value is invalid, will be ignored",
14099160SSherry.Moore@Sun.COM 		    FASTREBOOT_ONPANIC);
14109160SSherry.Moore@Sun.COM 	}
14119160SSherry.Moore@Sun.COM 
14129160SSherry.Moore@Sun.COM 	len = sizeof (fastreboot_onpanic_cmdline);
14139160SSherry.Moore@Sun.COM 	ret = ddi_getlongprop_buf(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
14149160SSherry.Moore@Sun.COM 	    FASTREBOOT_ONPANIC_CMDLINE, fastreboot_onpanic_cmdline, &len);
14159160SSherry.Moore@Sun.COM 
14169160SSherry.Moore@Sun.COM 	if (ret == DDI_PROP_BUF_TOO_SMALL)
1417*10970SSherry.Moore@Sun.COM 		cmn_err(CE_NOTE, "!%s value is too long, will be ignored",
14189160SSherry.Moore@Sun.COM 		    FASTREBOOT_ONPANIC_CMDLINE);
14197656SSherry.Moore@Sun.COM }
14209160SSherry.Moore@Sun.COM 
14219160SSherry.Moore@Sun.COM /*
14229160SSherry.Moore@Sun.COM  * This function is called by main() to either load the backup kernel for panic
14239160SSherry.Moore@Sun.COM  * fast reboot, or to reserve low physical memory for fast reboot.
14249160SSherry.Moore@Sun.COM  */
14259160SSherry.Moore@Sun.COM void
14269160SSherry.Moore@Sun.COM fastboot_post_startup()
14279160SSherry.Moore@Sun.COM {
142810916SSherry.Moore@Sun.COM 	lbolt_at_boot = ddi_get_lbolt();
142910916SSherry.Moore@Sun.COM 
143010916SSherry.Moore@Sun.COM 	/* Default to 10 minutes */
143110916SSherry.Moore@Sun.COM 	if (fastreboot_onpanic_uptime == LONG_MAX)
143210916SSherry.Moore@Sun.COM 		fastreboot_onpanic_uptime = SEC_TO_TICK(10 * 60);
143310916SSherry.Moore@Sun.COM 
14349160SSherry.Moore@Sun.COM 	if (!fastreboot_capable)
14359160SSherry.Moore@Sun.COM 		return;
14369160SSherry.Moore@Sun.COM 
143710559SSherry.Moore@Sun.COM 	mutex_enter(&fastreboot_config_mutex);
143810559SSherry.Moore@Sun.COM 
14399160SSherry.Moore@Sun.COM 	fastboot_get_bootprop();
14409160SSherry.Moore@Sun.COM 
14419160SSherry.Moore@Sun.COM 	if (fastreboot_onpanic)
14429160SSherry.Moore@Sun.COM 		fastboot_load_kernel(fastreboot_onpanic_cmdline);
14439160SSherry.Moore@Sun.COM 	else if (reserve_mem_enabled)
14449160SSherry.Moore@Sun.COM 		fastboot_reserve_mem(&newkernel);
144510559SSherry.Moore@Sun.COM 
144610559SSherry.Moore@Sun.COM 	mutex_exit(&fastreboot_config_mutex);
14479160SSherry.Moore@Sun.COM }
14489160SSherry.Moore@Sun.COM 
14499160SSherry.Moore@Sun.COM /*
14509160SSherry.Moore@Sun.COM  * Update boot configuration settings.
14519160SSherry.Moore@Sun.COM  * If the new fastreboot_onpanic setting is false, and a kernel has
14529160SSherry.Moore@Sun.COM  * been preloaded, free the memory;
14539160SSherry.Moore@Sun.COM  * if the new fastreboot_onpanic setting is true and newkernel is
14549160SSherry.Moore@Sun.COM  * not valid, load the new kernel.
14559160SSherry.Moore@Sun.COM  */
14569160SSherry.Moore@Sun.COM void
14579160SSherry.Moore@Sun.COM fastboot_update_config(const char *mdep)
14589160SSherry.Moore@Sun.COM {
14599160SSherry.Moore@Sun.COM 	uint8_t boot_config = (uint8_t)*mdep;
146010559SSherry.Moore@Sun.COM 	int cur_fastreboot_onpanic;
14619160SSherry.Moore@Sun.COM 
14629160SSherry.Moore@Sun.COM 	if (!fastreboot_capable)
14639160SSherry.Moore@Sun.COM 		return;
14649160SSherry.Moore@Sun.COM 
146510559SSherry.Moore@Sun.COM 	mutex_enter(&fastreboot_config_mutex);
146610559SSherry.Moore@Sun.COM 
146710559SSherry.Moore@Sun.COM 	cur_fastreboot_onpanic = fastreboot_onpanic;
14689160SSherry.Moore@Sun.COM 	fastreboot_onpanic = boot_config & UA_FASTREBOOT_ONPANIC;
146910559SSherry.Moore@Sun.COM 
14709160SSherry.Moore@Sun.COM 	if (fastreboot_onpanic && (!cur_fastreboot_onpanic ||
14719160SSherry.Moore@Sun.COM 	    !newkernel.fi_valid))
14729160SSherry.Moore@Sun.COM 		fastboot_load_kernel(fastreboot_onpanic_cmdline);
14739160SSherry.Moore@Sun.COM 	if (cur_fastreboot_onpanic && !fastreboot_onpanic)
14749160SSherry.Moore@Sun.COM 		fastboot_free_newkernel(&newkernel);
147510559SSherry.Moore@Sun.COM 
147610559SSherry.Moore@Sun.COM 	mutex_exit(&fastreboot_config_mutex);
14779160SSherry.Moore@Sun.COM }
147810559SSherry.Moore@Sun.COM 
147910559SSherry.Moore@Sun.COM /*
148010559SSherry.Moore@Sun.COM  * This is the interface to be called by other kernel components to
148110559SSherry.Moore@Sun.COM  * disable fastreboot_onpanic.
148210559SSherry.Moore@Sun.COM  */
148310559SSherry.Moore@Sun.COM void
148410559SSherry.Moore@Sun.COM fastreboot_disable()
148510559SSherry.Moore@Sun.COM {
148610559SSherry.Moore@Sun.COM 	uint8_t boot_config = (uint8_t)(~UA_FASTREBOOT_ONPANIC);
148710559SSherry.Moore@Sun.COM 	fastboot_update_config((const char *)&boot_config);
148810559SSherry.Moore@Sun.COM }
148910559SSherry.Moore@Sun.COM 
149010559SSherry.Moore@Sun.COM /*
149110559SSherry.Moore@Sun.COM  * This is the interface to be called by fm_panic() in case FMA has diagnosed
149210559SSherry.Moore@Sun.COM  * a terminal machine check exception.  It does not free up memory allocated
149310559SSherry.Moore@Sun.COM  * for the backup kernel.  General disabling fastreboot_onpanic in a
149410559SSherry.Moore@Sun.COM  * non-panicking situation must go through fastboot_update_config().
149510559SSherry.Moore@Sun.COM  */
149610559SSherry.Moore@Sun.COM void
149710559SSherry.Moore@Sun.COM fastreboot_disable_highpil()
149810559SSherry.Moore@Sun.COM {
149910559SSherry.Moore@Sun.COM 	fastreboot_onpanic = 0;
150010559SSherry.Moore@Sun.COM }
150110559SSherry.Moore@Sun.COM 
150210559SSherry.Moore@Sun.COM 
150310559SSherry.Moore@Sun.COM /*
150410559SSherry.Moore@Sun.COM  * A simplified interface for uadmin to call to update the configuration
150510559SSherry.Moore@Sun.COM  * setting and load a new kernel if necessary.
150610559SSherry.Moore@Sun.COM  */
150710559SSherry.Moore@Sun.COM void
150810559SSherry.Moore@Sun.COM fastboot_update_and_load(int fcn, char *mdep)
150910559SSherry.Moore@Sun.COM {
151010559SSherry.Moore@Sun.COM 	if (fcn != AD_FASTREBOOT) {
151110559SSherry.Moore@Sun.COM 		/*
151210559SSherry.Moore@Sun.COM 		 * If user has explicitly requested reboot to prom,
151310559SSherry.Moore@Sun.COM 		 * or uadmin(1M) was invoked with other functions,
151410559SSherry.Moore@Sun.COM 		 * don't try to fast reboot after dumping.
151510559SSherry.Moore@Sun.COM 		 */
151610559SSherry.Moore@Sun.COM 		fastreboot_disable();
151710559SSherry.Moore@Sun.COM 	}
151810559SSherry.Moore@Sun.COM 
151910559SSherry.Moore@Sun.COM 	mutex_enter(&fastreboot_config_mutex);
152010559SSherry.Moore@Sun.COM 
152110559SSherry.Moore@Sun.COM 	if (fastreboot_onpanic)
152210559SSherry.Moore@Sun.COM 		fastboot_load_kernel(mdep);
152310559SSherry.Moore@Sun.COM 
152410559SSherry.Moore@Sun.COM 	mutex_exit(&fastreboot_config_mutex);
152510559SSherry.Moore@Sun.COM }
1526