xref: /netbsd-src/sys/dev/kloader.c (revision 949b8d92b90e49ecf844f4376cb15fe53667f695)
1*949b8d92Srin /*	$NetBSD: kloader.c,v 1.32 2021/10/11 14:25:05 rin Exp $	*/
23a292b1bSuch 
33a292b1bSuch /*-
43a292b1bSuch  * Copyright (c) 2001, 2002, 2004 The NetBSD Foundation, Inc.
53a292b1bSuch  * All rights reserved.
63a292b1bSuch  *
73a292b1bSuch  * Redistribution and use in source and binary forms, with or without
83a292b1bSuch  * modification, are permitted provided that the following conditions
93a292b1bSuch  * are met:
103a292b1bSuch  * 1. Redistributions of source code must retain the above copyright
113a292b1bSuch  *    notice, this list of conditions and the following disclaimer.
123a292b1bSuch  * 2. Redistributions in binary form must reproduce the above copyright
133a292b1bSuch  *    notice, this list of conditions and the following disclaimer in the
143a292b1bSuch  *    documentation and/or other materials provided with the distribution.
153a292b1bSuch  *
163a292b1bSuch  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
173a292b1bSuch  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
183a292b1bSuch  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
193a292b1bSuch  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
203a292b1bSuch  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
213a292b1bSuch  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
223a292b1bSuch  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
233a292b1bSuch  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
243a292b1bSuch  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
253a292b1bSuch  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
263a292b1bSuch  * POSSIBILITY OF SUCH DAMAGE.
273a292b1bSuch  */
283a292b1bSuch 
293a292b1bSuch #include <sys/cdefs.h>
30*949b8d92Srin __KERNEL_RCSID(0, "$NetBSD: kloader.c,v 1.32 2021/10/11 14:25:05 rin Exp $");
313a292b1bSuch 
323a292b1bSuch #include "debug_kloader.h"
333a292b1bSuch 
343a292b1bSuch #include <sys/param.h>
353a292b1bSuch #include <sys/fcntl.h>
36*949b8d92Srin #include <sys/kmem.h>
37b9693fbfSrin #include <sys/namei.h>
38b9693fbfSrin #include <sys/proc.h>
39b9693fbfSrin #include <sys/systm.h>
40b9693fbfSrin #include <sys/vnode.h>
41b9693fbfSrin 
423a292b1bSuch #define	ELFSIZE	32
433a292b1bSuch #include <sys/exec_elf.h>
443a292b1bSuch 
459fc45356Sriastradh #include <uvm/uvm_extern.h>
463a292b1bSuch 
473a292b1bSuch #include <machine/kloader.h>
483a292b1bSuch 
/* Unconditional console message, prefixed with the subsystem name. */
#define	PRINTF(fmt, args...)	printf("kloader: " fmt, ##args)

/*
 * Debug output helpers.
 *
 * With KLOADER_DEBUG, output is gated at run time by kloader_debug:
 * DPRINTF/_DPRINTF print when it is non-zero, DPRINTFN/_DPRINTFN print
 * when it is greater than (n).  The variants without a leading underscore
 * prefix the message with the calling function's name.  STATIC expands to
 * nothing so that the file-local symbols stay externally visible.
 *
 * Without KLOADER_DEBUG, all of them expand to a no-op expression and
 * STATIC expands to "static".
 *
 * The debug variants are wrapped in do { } while (0) so that each use is
 * a single statement and cannot capture a following "else".
 */
#ifdef KLOADER_DEBUG
int	kloader_debug = 1;
#define	DPRINTF(fmt, args...)						\
	do {								\
		if (kloader_debug)					\
			printf("%s: " fmt, __func__ , ##args);		\
	} while (/*CONSTCOND*/0)
#define	_DPRINTF(fmt, args...)						\
	do {								\
		if (kloader_debug)					\
			printf(fmt, ##args);				\
	} while (/*CONSTCOND*/0)
#define	DPRINTFN(n, fmt, args...)					\
	do {								\
		if (kloader_debug > (n))				\
			printf("%s: " fmt, __func__ , ##args);		\
	} while (/*CONSTCOND*/0)
#define	_DPRINTFN(n, fmt, args...)					\
	do {								\
		if (kloader_debug > (n))				\
			printf(fmt, ##args);				\
	} while (/*CONSTCOND*/0)
#define	STATIC
#else
#define	DPRINTF(fmt, args...)		((void)0)
#define	_DPRINTF(fmt, args...)		((void)0)
#define	DPRINTFN(n, fmt, args...)	((void)0)
#define	_DPRINTFN(n, fmt, args...)	((void)0)
#define	STATIC	static
#endif
733a292b1bSuch 
743a292b1bSuch struct kloader {
753a292b1bSuch 	struct pglist pg_head;
765b83bdc8Suebayasi 	struct vm_page *cur_pg;		/* XXX use bus_dma(9) */
773a292b1bSuch 	struct kloader_page_tag *cur_tag;
783a292b1bSuch 	struct vnode *vp;
793a292b1bSuch 	struct kloader_page_tag *tagstart;
803a292b1bSuch 	struct kloader_bootinfo *bootinfo;
813a292b1bSuch 	struct kloader_bootinfo *rebootinfo;
823a292b1bSuch 	vaddr_t loader_sp;
833a292b1bSuch 	kloader_bootfunc_t *loader;
843a292b1bSuch 	int setuped;
853a292b1bSuch 	int called;
863a292b1bSuch 	struct kloader_ops *ops;
873a292b1bSuch };
883a292b1bSuch 
893a292b1bSuch #define	BUCKET_SIZE	(PAGE_SIZE - sizeof(struct kloader_page_tag))
9095e1ffb1Schristos #define	KLOADER_LWP	(&lwp0)
913a292b1bSuch STATIC struct kloader kloader;
923a292b1bSuch 
933a292b1bSuch #define	ROUND4(x)	(((x) + 3) & ~3)
943a292b1bSuch 
953a292b1bSuch STATIC int kloader_load(void);
963a292b1bSuch 
973a292b1bSuch STATIC int kloader_alloc_memory(size_t);
983a292b1bSuch STATIC struct kloader_page_tag *kloader_get_tag(vaddr_t);
993a292b1bSuch STATIC void kloader_from_file(vaddr_t, off_t, size_t);
1003a292b1bSuch STATIC void kloader_copy(vaddr_t, const void *, size_t);
1013a292b1bSuch STATIC void kloader_zero(vaddr_t, size_t);
1023a292b1bSuch 
1033a292b1bSuch STATIC void kloader_load_segment(Elf_Phdr *);
1043a292b1bSuch 
1053a292b1bSuch STATIC struct vnode *kloader_open(const char *);
1063a292b1bSuch STATIC void kloader_close(void);
1073a292b1bSuch STATIC int kloader_read(size_t, size_t, void *);
1083a292b1bSuch 
1093a292b1bSuch #ifdef KLOADER_DEBUG
1103a292b1bSuch STATIC void kloader_pagetag_dump(void);
1113a292b1bSuch #endif
1123a292b1bSuch 
1133a292b1bSuch void
__kloader_reboot_setup(struct kloader_ops * ops,const char * filename)1143a292b1bSuch __kloader_reboot_setup(struct kloader_ops *ops, const char *filename)
1153a292b1bSuch {
1163a292b1bSuch 
1173a292b1bSuch 	if (kloader.bootinfo == NULL) {
1183a292b1bSuch 		PRINTF("No bootinfo.\n");
1193a292b1bSuch 		return;
1203a292b1bSuch 	}
1213a292b1bSuch 
1223a292b1bSuch 	if (ops == NULL || ops->jump == NULL || ops->boot == NULL) {
1233a292b1bSuch 		PRINTF("No boot operations.\n");
1243a292b1bSuch 		return;
1253a292b1bSuch 	}
1263a292b1bSuch 	kloader.ops = ops;
1273a292b1bSuch 
1283a292b1bSuch 	if (kloader.called++ == 0) {
1293a292b1bSuch 		PRINTF("kernel file name: %s\n", filename);
1303a292b1bSuch 		kloader.vp = kloader_open(filename);
1313a292b1bSuch 		if (kloader.vp == NULL)
1323a292b1bSuch 			return;
1333a292b1bSuch 
1343a292b1bSuch 		if (kloader_load() == 0) {
1353a292b1bSuch 			kloader.setuped = TRUE;
1363a292b1bSuch #ifdef KLOADER_DEBUG
1373a292b1bSuch 			kloader_pagetag_dump();
1383a292b1bSuch #endif
1393a292b1bSuch 		}
1403a292b1bSuch 		kloader_close();
1413a292b1bSuch 	} else {
1423a292b1bSuch 		/* Fatal case. reboot from DDB etc. */
1433a292b1bSuch 		kloader_reboot();
1443a292b1bSuch 	}
1453a292b1bSuch }
1463a292b1bSuch 
1473a292b1bSuch 
1483a292b1bSuch void
kloader_reboot(void)149df7f595eScegger kloader_reboot(void)
1503a292b1bSuch {
1513a292b1bSuch 
1523a292b1bSuch 	if (kloader.setuped) {
1533a292b1bSuch 		PRINTF("Rebooting...\n");
1543a292b1bSuch 		(*kloader.ops->jump)(kloader.loader, kloader.loader_sp,
1553a292b1bSuch 		    kloader.rebootinfo, kloader.tagstart);
1563a292b1bSuch 	}
1573a292b1bSuch 
1583a292b1bSuch 	if (kloader.ops->reset != NULL) {
15984ba0cabSpeter 		PRINTF("Resetting...\n");
1603a292b1bSuch 		(*kloader.ops->reset)();
1613a292b1bSuch 	}
1623a292b1bSuch 	while (/*CONSTCOND*/1)
1635b83bdc8Suebayasi 		continue;
1643a292b1bSuch 	/* NOTREACHED */
1653a292b1bSuch }
1663a292b1bSuch 
1673a292b1bSuch 
1683a292b1bSuch int
kloader_load(void)169df7f595eScegger kloader_load(void)
1703a292b1bSuch {
1713a292b1bSuch 	Elf_Ehdr eh;
1723a292b1bSuch 	Elf_Phdr *ph, *p;
1733a292b1bSuch 	Elf_Shdr *sh;
1743a292b1bSuch 	Elf_Addr entry;
1753a292b1bSuch 	vaddr_t kv;
1763a292b1bSuch 	size_t sz;
177*949b8d92Srin 	size_t phsz, shsz, shstrsz;
1783a292b1bSuch 	char *shstrtab;
1793a292b1bSuch 	int symndx, strndx;
1803a292b1bSuch 	size_t ksymsz;
1813a292b1bSuch 	struct kloader_bootinfo nbi; /* new boot info */
1823a292b1bSuch 	char *oldbuf, *newbuf;
1833a292b1bSuch 	char **ap;
1843a292b1bSuch 	int i;
1853a292b1bSuch 
1863a292b1bSuch 	ph = NULL;
1873a292b1bSuch 	sh = NULL;
1883a292b1bSuch 	shstrtab = NULL;
1893a292b1bSuch 
1903a292b1bSuch 	/* read kernel's ELF header */
1913a292b1bSuch 	kloader_read(0, sizeof(Elf_Ehdr), &eh);
1923a292b1bSuch 
1933a292b1bSuch 	if (eh.e_ident[EI_MAG0] != ELFMAG0 ||
1943a292b1bSuch 	    eh.e_ident[EI_MAG1] != ELFMAG1 ||
1953a292b1bSuch 	    eh.e_ident[EI_MAG2] != ELFMAG2 ||
1963a292b1bSuch 	    eh.e_ident[EI_MAG3] != ELFMAG3) {
1973a292b1bSuch 		PRINTF("not an ELF file\n");
1983a292b1bSuch 		goto err;
1993a292b1bSuch 	}
2003a292b1bSuch 
2013a292b1bSuch 	/* read program headers */
202*949b8d92Srin 	phsz = eh.e_phentsize * eh.e_phnum;
203*949b8d92Srin 	if ((ph = kmem_alloc(phsz, KM_NOSLEEP)) == NULL) {
2043a292b1bSuch 		PRINTF("can't allocate program header table.\n");
2053a292b1bSuch 		goto err;
2063a292b1bSuch 	}
207*949b8d92Srin 	if (kloader_read(eh.e_phoff, phsz, ph) != 0) {
2083a292b1bSuch 		PRINTF("program header read error.\n");
2093a292b1bSuch 		goto err;
2103a292b1bSuch 	}
2113a292b1bSuch 
2123a292b1bSuch 	/* read section headers */
213*949b8d92Srin 	shsz = eh.e_shentsize * eh.e_shnum;
214*949b8d92Srin 	if ((sh = kmem_alloc(shsz, KM_NOSLEEP)) == NULL) {
2153a292b1bSuch 		PRINTF("can't allocate section header table.\n");
2163a292b1bSuch 		goto err;
2173a292b1bSuch 	}
218*949b8d92Srin 	if (kloader_read(eh.e_shoff, shsz, sh) != 0) {
2193a292b1bSuch 		PRINTF("section header read error.\n");
2203a292b1bSuch 		goto err;
2213a292b1bSuch 	}
2223a292b1bSuch 
2233a292b1bSuch 	/* read section names */
2243a292b1bSuch 	shstrsz = ROUND4(sh[eh.e_shstrndx].sh_size);
225*949b8d92Srin 	shstrtab = kmem_alloc(shstrsz, KM_NOSLEEP);
2263a292b1bSuch 	if (shstrtab == NULL) {
2273a292b1bSuch 		PRINTF("unable to allocate memory for .shstrtab\n");
2283a292b1bSuch 		goto err;
2293a292b1bSuch 	}
2303a292b1bSuch 	DPRINTF("reading 0x%x bytes of .shstrtab at 0x%x\n",
2313a292b1bSuch 	    sh[eh.e_shstrndx].sh_size, sh[eh.e_shstrndx].sh_offset);
2323a292b1bSuch 	kloader_read(sh[eh.e_shstrndx].sh_offset, sh[eh.e_shstrndx].sh_size,
2333a292b1bSuch 	    shstrtab);
2343a292b1bSuch 
2353a292b1bSuch 	/* save entry point, code to construct symbol table overwrites it */
2363a292b1bSuch 	entry = eh.e_entry;
2373a292b1bSuch 
2383a292b1bSuch 	/*
23984ba0cabSpeter 	 * Calculate memory size
2403a292b1bSuch 	 */
2413a292b1bSuch 	sz = 0;
2423a292b1bSuch 
2433a292b1bSuch 	/* loadable segments */
2443a292b1bSuch 	for (i = 0; i < eh.e_phnum; i++) {
2453a292b1bSuch 		if (ph[i].p_type == PT_LOAD) {
2463a292b1bSuch 			DPRINTF("segment %d size = file 0x%x memory 0x%x\n",
2473a292b1bSuch 			    i, ph[i].p_filesz, ph[i].p_memsz);
2483a292b1bSuch #ifdef KLOADER_ZERO_BSS
2493a292b1bSuch 			sz += round_page(ph[i].p_memsz);
2503a292b1bSuch #else
2513a292b1bSuch 			sz += round_page(ph[i].p_filesz);
2523a292b1bSuch #endif
2533a292b1bSuch 			sz += PAGE_SIZE; /* compensate for partial last tag */
2543a292b1bSuch 		}
2553a292b1bSuch 	}
2563a292b1bSuch 
2573a292b1bSuch 	if (sz == 0)		/* nothing to load? */
2583a292b1bSuch 		goto err;
2593a292b1bSuch 
2603a292b1bSuch 	/* symbols/strings sections */
2613a292b1bSuch 	symndx = strndx = -1;
2623a292b1bSuch 	for (i = 0; i < eh.e_shnum; i++) {
2633a292b1bSuch 		if (strcmp(shstrtab + sh[i].sh_name, ".symtab") == 0)
2643a292b1bSuch 			symndx = i;
2653a292b1bSuch 		else if (strcmp(shstrtab + sh[i].sh_name, ".strtab") == 0)
2663a292b1bSuch 			strndx = i;
267fffdc5e0Srin 		else if (i != eh.e_shstrndx) {
2683a292b1bSuch 			/* while here, mark all other sections as unused */
2693a292b1bSuch 			sh[i].sh_type = SHT_NULL;
270fffdc5e0Srin 			sh[i].sh_offset = 0;
271fffdc5e0Srin 		}
2723a292b1bSuch 	}
2733a292b1bSuch 
2743a292b1bSuch 	if (symndx < 0 || strndx < 0) {
2753a292b1bSuch 		if (symndx < 0)
2763a292b1bSuch 			PRINTF("no .symtab section\n");
2773a292b1bSuch 		if (strndx < 0)
2783a292b1bSuch 			PRINTF("no .strtab section\n");
2793a292b1bSuch 		ksymsz = SELFMAG; /* just a bad magic */
2803a292b1bSuch 	} else {
2813a292b1bSuch 		ksymsz = sizeof(Elf_Ehdr)
2823a292b1bSuch 		    + eh.e_shentsize * eh.e_shnum
2833a292b1bSuch 		    + shstrsz		/* rounded to 4 bytes */
2843a292b1bSuch 		    + sh[symndx].sh_size
2853a292b1bSuch 		    + sh[strndx].sh_size;
28666d780dbSpeter 		DPRINTF("ksyms size = 0x%zx\n", ksymsz);
2873a292b1bSuch 	}
2883a292b1bSuch 	sz += ROUND4(ksymsz);
2893a292b1bSuch 
2903a292b1bSuch 	/* boot info for the new kernel */
2913a292b1bSuch 	sz += sizeof(struct kloader_bootinfo);
2923a292b1bSuch 
2933a292b1bSuch 	/* get memory for new kernel */
2943a292b1bSuch 	if (kloader_alloc_memory(sz) != 0)
2953a292b1bSuch 		goto err;
2963a292b1bSuch 
2973a292b1bSuch 	/*
2983a292b1bSuch 	 * Copy new kernel in.
2993a292b1bSuch 	 */
3003a292b1bSuch 	kv = 0;			/* XXX: -Wuninitialized */
3013a292b1bSuch 	for (i = 0, p = ph; i < eh.e_phnum; i++, p++) {
3023a292b1bSuch 		if (p->p_type == PT_LOAD) {
3033a292b1bSuch 			kloader_load_segment(p);
3043a292b1bSuch 			kv = p->p_vaddr + ROUND4(p->p_memsz);
3053a292b1bSuch 		}
3063a292b1bSuch 	}
3073a292b1bSuch 
3083a292b1bSuch 	/*
3093a292b1bSuch 	 * Construct symbol table for ksyms.
3103a292b1bSuch 	 */
3113a292b1bSuch 	if (symndx < 0 || strndx < 0) {
3123a292b1bSuch 		kloader_zero(kv, SELFMAG);
3133a292b1bSuch 		kv += SELFMAG;
3143a292b1bSuch 	} else {
3153a292b1bSuch 		Elf_Off eoff;
3163a292b1bSuch 		off_t symoff, stroff;
3173a292b1bSuch 
3183a292b1bSuch 		/* save offsets of .symtab and .strtab before we change them */
3193a292b1bSuch 		symoff = sh[symndx].sh_offset;
3203a292b1bSuch 		stroff = sh[strndx].sh_offset;
3213a292b1bSuch 
3223a292b1bSuch 		/* no loadable segments */
3233a292b1bSuch 		eh.e_entry = 0;
3243a292b1bSuch 		eh.e_phnum = 0;
3253a292b1bSuch 		eh.e_phoff = 0;
3263a292b1bSuch 
3273a292b1bSuch 		/* change offsets to reflect new layout */
3283a292b1bSuch 		eoff = sizeof(Elf_Ehdr);
3293a292b1bSuch 		eh.e_shoff = eoff;
3303a292b1bSuch 
3313a292b1bSuch 		eoff += eh.e_shentsize * eh.e_shnum;
3323a292b1bSuch 		sh[eh.e_shstrndx].sh_offset = eoff;
3333a292b1bSuch 
3343a292b1bSuch 		eoff += shstrsz;
3353a292b1bSuch 		sh[symndx].sh_offset = eoff;
3363a292b1bSuch 
3373a292b1bSuch 		eoff += sh[symndx].sh_size;
3383a292b1bSuch 		sh[strndx].sh_offset = eoff;
3393a292b1bSuch 
3403a292b1bSuch 		/* local copies massaged, can serve them now */
3413a292b1bSuch 		DPRINTF("ksyms ELF header\n");
3423a292b1bSuch 		kloader_copy(kv, &eh, sizeof(Elf_Ehdr));
3433a292b1bSuch 		kv += sizeof(Elf_Ehdr);
3443a292b1bSuch 
3453a292b1bSuch 		DPRINTF("ksyms section headers\n");
3463a292b1bSuch 		kloader_copy(kv, sh, eh.e_shentsize * eh.e_shnum);
3473a292b1bSuch 		kv += eh.e_shentsize * eh.e_shnum;
3483a292b1bSuch 
3493a292b1bSuch 		DPRINTF("ksyms .shstrtab\n");
3503a292b1bSuch 		kloader_copy(kv, shstrtab, shstrsz);
3513a292b1bSuch 		kv += shstrsz;
3523a292b1bSuch 
3533a292b1bSuch 		DPRINTF("ksyms .symtab\n");
3543a292b1bSuch 		kloader_from_file(kv, symoff, sh[symndx].sh_size);
3553a292b1bSuch 		kv += sh[symndx].sh_size;
3563a292b1bSuch 
3573a292b1bSuch 		DPRINTF("ksyms .strtab\n");
3583a292b1bSuch 		kloader_from_file(kv, stroff, ROUND4(sh[strndx].sh_size));
3593a292b1bSuch 		kv += ROUND4(sh[strndx].sh_size);
3603a292b1bSuch 	}
3613a292b1bSuch 
3623a292b1bSuch 	/*
3633a292b1bSuch 	 * Create boot info to pass to the new kernel.
3643a292b1bSuch 	 * All pointers in it are *not* valid until the new kernel runs!
3653a292b1bSuch 	 */
3663a292b1bSuch 
3673a292b1bSuch 	/* get a private copy of current bootinfo to vivisect */
3685b83bdc8Suebayasi 	memcpy(&nbi, kloader.bootinfo, sizeof(struct kloader_bootinfo));
3693a292b1bSuch 
3703a292b1bSuch 	/* new kernel entry point */
3713a292b1bSuch 	nbi.entry = entry;
3723a292b1bSuch 
3733a292b1bSuch 	/* where args currently are, see kloader_bootinfo_set() */
3743a292b1bSuch 	oldbuf = &kloader.bootinfo->_argbuf[0];
3753a292b1bSuch 
3763a292b1bSuch 	/* where args *will* be after boot code copied them */
3773a292b1bSuch 	newbuf = (char *)(void *)kv
3783a292b1bSuch 	    + offsetof(struct kloader_bootinfo, _argbuf);
3793a292b1bSuch 
3803a292b1bSuch 	DPRINTF("argv: old %p -> new %p\n", oldbuf, newbuf);
3813a292b1bSuch 
3823a292b1bSuch 	/* not a valid pointer in this kernel! */
3833a292b1bSuch 	nbi.argv = (void *)newbuf;
3843a292b1bSuch 
3853a292b1bSuch 	/* local copy that we populate with new (not yet valid) pointers */
3863a292b1bSuch 	ap = (char **)(void *)nbi._argbuf;
3873a292b1bSuch 
3883a292b1bSuch 	for (i = 0; i < kloader.bootinfo->argc; ++i) {
3893a292b1bSuch 		DPRINTFN(1, " [%d]: %p -> ", i, kloader.bootinfo->argv[i]);
3903a292b1bSuch 		ap[i] = newbuf +
3913a292b1bSuch 		    (kloader.bootinfo->argv[i] - oldbuf);
3923a292b1bSuch 		_DPRINTFN(1, "%p\n", ap[i]);
3933a292b1bSuch 	}
3943a292b1bSuch 
3953a292b1bSuch 	/* arrange for the new bootinfo to get copied */
3963a292b1bSuch 	DPRINTF("bootinfo\n");
3973a292b1bSuch 	kloader_copy(kv, &nbi, sizeof(struct kloader_bootinfo));
3983a292b1bSuch 
3993a292b1bSuch 	/* will be valid by the time the new kernel starts */
4003a292b1bSuch 	kloader.rebootinfo = (void *)kv;
4013a292b1bSuch 	/* kv += sizeof(struct kloader_bootinfo); */
4023a292b1bSuch 
4033a292b1bSuch 	/*
4043a292b1bSuch 	 * Copy loader code
4053a292b1bSuch 	 */
4063a292b1bSuch 	KDASSERT(kloader.cur_pg);
4073a292b1bSuch 	kloader.loader = (void *)PG_VADDR(kloader.cur_pg);
4083a292b1bSuch 	memcpy(kloader.loader, kloader.ops->boot, PAGE_SIZE);
4093a292b1bSuch 
4103a292b1bSuch 	/* loader stack starts at the bottom of that page */
4113a292b1bSuch 	kloader.loader_sp = (vaddr_t)kloader.loader + PAGE_SIZE;
4123a292b1bSuch 
4133a292b1bSuch 	DPRINTF("[loader] addr=%p sp=%p [kernel] entry=%p\n",
4143a292b1bSuch 	    kloader.loader, (void *)kloader.loader_sp, (void *)nbi.entry);
4153a292b1bSuch 
4163a292b1bSuch 	return (0);
4173a292b1bSuch  err:
4183a292b1bSuch 	if (ph != NULL)
419*949b8d92Srin 		kmem_free(ph, phsz);
4203a292b1bSuch 	if (sh != NULL)
421*949b8d92Srin 		kmem_free(sh, shsz);
4223a292b1bSuch 	if (shstrtab != NULL)
423*949b8d92Srin 		kmem_free(shstrtab, shstrsz);
4243a292b1bSuch 
4253a292b1bSuch 	return 1;
4263a292b1bSuch }
4273a292b1bSuch 
4283a292b1bSuch 
4293a292b1bSuch int
kloader_alloc_memory(size_t sz)4303a292b1bSuch kloader_alloc_memory(size_t sz)
4313a292b1bSuch {
4323a292b1bSuch 	int n, error;
4333a292b1bSuch 
4343a292b1bSuch 	n = (sz + BUCKET_SIZE - 1) / BUCKET_SIZE	/* kernel &co */
4353a292b1bSuch 	    + 1;					/* 2nd loader */
4363a292b1bSuch 
4373a292b1bSuch 	error = uvm_pglistalloc(n * PAGE_SIZE, avail_start, avail_end,
4383a292b1bSuch 	    PAGE_SIZE, 0, &kloader.pg_head, n, 0);
4393a292b1bSuch 	if (error) {
4403a292b1bSuch 		PRINTF("can't allocate memory.\n");
4413a292b1bSuch 		return (1);
4423a292b1bSuch 	}
4433a292b1bSuch 	DPRINTF("allocated %d pages.\n", n);
4443a292b1bSuch 
4453a292b1bSuch 	kloader.cur_pg = TAILQ_FIRST(&kloader.pg_head);
4463a292b1bSuch 	kloader.tagstart = (void *)PG_VADDR(kloader.cur_pg);
4473a292b1bSuch 	kloader.cur_tag = NULL;
4483a292b1bSuch 
4493a292b1bSuch 	return (0);
4503a292b1bSuch }
4513a292b1bSuch 
4523a292b1bSuch 
4533a292b1bSuch struct kloader_page_tag *
kloader_get_tag(vaddr_t dst)4543a292b1bSuch kloader_get_tag(vaddr_t dst)
4553a292b1bSuch {
4563a292b1bSuch 	struct vm_page *pg;
4573a292b1bSuch 	vaddr_t addr;
4583a292b1bSuch 	struct kloader_page_tag *tag;
4593a292b1bSuch 
4603a292b1bSuch 	tag = kloader.cur_tag;
4613a292b1bSuch 	if (tag != NULL		/* has tag */
4623a292b1bSuch 	    && tag->sz < BUCKET_SIZE /* that has free space */
4633a292b1bSuch 	    && tag->dst + tag->sz == dst) /* and new data are contiguous */
4643a292b1bSuch 	{
4653a292b1bSuch 		DPRINTFN(1, "current tag %x/%x ok\n", tag->dst, tag->sz);
4663a292b1bSuch 		return (tag);
4673a292b1bSuch 	}
4683a292b1bSuch 
4693a292b1bSuch 	pg = kloader.cur_pg;
4703a292b1bSuch 	KDASSERT(pg != NULL);
47106c343acSad 	kloader.cur_pg = TAILQ_NEXT(pg, pageq.queue);
4723a292b1bSuch 
4733a292b1bSuch 	addr = PG_VADDR(pg);
4743a292b1bSuch 	tag = (void *)addr;
4753a292b1bSuch 
4763a292b1bSuch 	/*
4773a292b1bSuch 	 * 2nd loader uses simple word-by-word copy, so destination
4783a292b1bSuch 	 * address of a tag must be properly aligned.
4793a292b1bSuch 	 */
4803a292b1bSuch 	KASSERT(ALIGNED_POINTER(dst, register_t));
4813a292b1bSuch 
4823a292b1bSuch 	tag->src = addr + sizeof(struct kloader_page_tag);
4833a292b1bSuch 	tag->dst = dst;
4843a292b1bSuch 	tag->sz = 0;
4853a292b1bSuch 	tag->next = 0;	/* Terminate. this member may overwrite after. */
4863a292b1bSuch 	if (kloader.cur_tag)
4873a292b1bSuch 		kloader.cur_tag->next = addr;
4883a292b1bSuch 	kloader.cur_tag = tag;
4893a292b1bSuch 
4903a292b1bSuch 	return (tag);
4913a292b1bSuch }
4923a292b1bSuch 
4933a292b1bSuch 
4943a292b1bSuch /*
4953a292b1bSuch  * Operations to populate kloader_page_tag's with data.
4963a292b1bSuch  */
4973a292b1bSuch 
4983a292b1bSuch void
kloader_from_file(vaddr_t dst,off_t ofs,size_t sz)4993a292b1bSuch kloader_from_file(vaddr_t dst, off_t ofs, size_t sz)
5003a292b1bSuch {
5013a292b1bSuch 	struct kloader_page_tag *tag;
5023a292b1bSuch 	size_t freesz;
5033a292b1bSuch 
5043a292b1bSuch 	while (sz > 0) {
5053a292b1bSuch 		tag = kloader_get_tag(dst);
5063a292b1bSuch 		KDASSERT(tag != NULL);
5073a292b1bSuch 		freesz = BUCKET_SIZE - tag->sz;
5083a292b1bSuch 		if (freesz > sz)
5093a292b1bSuch 			freesz = sz;
5103a292b1bSuch 
5111d8b3e46Smatt 		DPRINTFN(1, "0x%08"PRIxVADDR" + 0x%zx <- 0x%lx\n", dst, freesz,
51266d780dbSpeter 		    (unsigned long)ofs);
5133a292b1bSuch 		kloader_read(ofs, freesz, (void *)(tag->src + tag->sz));
5143a292b1bSuch 
5153a292b1bSuch 		tag->sz += freesz;
5163a292b1bSuch 		sz -= freesz;
5173a292b1bSuch 		ofs += freesz;
5183a292b1bSuch 		dst += freesz;
5193a292b1bSuch 	}
5203a292b1bSuch }
5213a292b1bSuch 
5223a292b1bSuch 
5233a292b1bSuch void
kloader_copy(vaddr_t dst,const void * src,size_t sz)5243a292b1bSuch kloader_copy(vaddr_t dst, const void *src, size_t sz)
5253a292b1bSuch {
5263a292b1bSuch 	struct kloader_page_tag *tag;
5273a292b1bSuch 	size_t freesz;
5283a292b1bSuch 
5293a292b1bSuch 	while (sz > 0) {
5303a292b1bSuch 		tag = kloader_get_tag(dst);
5313a292b1bSuch 		KDASSERT(tag != NULL);
5323a292b1bSuch 		freesz = BUCKET_SIZE - tag->sz;
5333a292b1bSuch 		if (freesz > sz)
5343a292b1bSuch 			freesz = sz;
5353a292b1bSuch 
5361d8b3e46Smatt 		DPRINTFN(1, "0x%08"PRIxVADDR" + 0x%zx <- %p\n", dst, freesz, src);
5373a292b1bSuch 		memcpy((void *)(tag->src + tag->sz), src, freesz);
5383a292b1bSuch 
5393a292b1bSuch 		tag->sz += freesz;
5403a292b1bSuch 		sz -= freesz;
5419af1a3ffSuwe 		src = (const char *)src + freesz;
5423a292b1bSuch 		dst += freesz;
5433a292b1bSuch 	}
5443a292b1bSuch }
5453a292b1bSuch 
5463a292b1bSuch 
5473a292b1bSuch void
kloader_zero(vaddr_t dst,size_t sz)5483a292b1bSuch kloader_zero(vaddr_t dst, size_t sz)
5493a292b1bSuch {
5503a292b1bSuch 	struct kloader_page_tag *tag;
5513a292b1bSuch 	size_t freesz;
5523a292b1bSuch 
5533a292b1bSuch 	while (sz > 0) {
5543a292b1bSuch 		tag = kloader_get_tag(dst);
5553a292b1bSuch 		KDASSERT(tag != NULL);
5563a292b1bSuch 		freesz = BUCKET_SIZE - tag->sz;
5573a292b1bSuch 		if (freesz > sz)
5583a292b1bSuch 			freesz = sz;
5593a292b1bSuch 
5601d8b3e46Smatt 		DPRINTFN(1, "0x%08"PRIxVADDR" + 0x%zx\n", dst, freesz);
5613a292b1bSuch 		memset((void *)(tag->src + tag->sz), 0, freesz);
5623a292b1bSuch 
5633a292b1bSuch 		tag->sz += freesz;
5643a292b1bSuch 		sz -= freesz;
5653a292b1bSuch 		dst += freesz;
5663a292b1bSuch 	}
5673a292b1bSuch }
5683a292b1bSuch 
5693a292b1bSuch 
5703a292b1bSuch void
kloader_load_segment(Elf_Phdr * p)5713a292b1bSuch kloader_load_segment(Elf_Phdr *p)
5723a292b1bSuch {
5733a292b1bSuch 
5743a292b1bSuch 	DPRINTF("memory 0x%08x 0x%x <- file 0x%x 0x%x\n",
5753a292b1bSuch 	    p->p_vaddr, p->p_memsz, p->p_offset, p->p_filesz);
5763a292b1bSuch 
5773a292b1bSuch 	kloader_from_file(p->p_vaddr, p->p_offset, p->p_filesz);
5783a292b1bSuch #ifdef KLOADER_ZERO_BSS
5793a292b1bSuch 	kloader_zero(p->p_vaddr + p->p_filesz, p->p_memsz - p->p_filesz);
5803a292b1bSuch #endif
5813a292b1bSuch }
5823a292b1bSuch 
5833a292b1bSuch 
5843a292b1bSuch /*
5853a292b1bSuch  * file access
5863a292b1bSuch  */
5873a292b1bSuch struct vnode *
kloader_open(const char * filename)5883a292b1bSuch kloader_open(const char *filename)
5893a292b1bSuch {
5908f6ed30dSdholland 	struct pathbuf *pb;
5913a292b1bSuch 	struct nameidata nid;
592723d09ceSdholland 	struct vnode *vp;
593ba474401Suwe 	int error;
5943a292b1bSuch 
5958f6ed30dSdholland 	pb = pathbuf_create(filename);
5968f6ed30dSdholland 	if (pb == NULL) {
5978f6ed30dSdholland 		PRINTF("%s: pathbuf_create failed\n", filename);
5988f6ed30dSdholland 		return (NULL);
5998f6ed30dSdholland 	}
6008f6ed30dSdholland 
601723d09ceSdholland 	/*
602723d09ceSdholland 	 * XXX why does this call both namei and vn_open?
603723d09ceSdholland 	 */
6043a292b1bSuch 
605723d09ceSdholland 	NDINIT(&nid, LOOKUP, FOLLOW, pb);
606ba474401Suwe 	error = namei(&nid);
607ba474401Suwe 	if (error != 0) {
608ba474401Suwe 		PRINTF("%s: namei failed, errno=%d\n", filename, error);
6098f6ed30dSdholland 		pathbuf_destroy(pb);
610ba474401Suwe 		return (NULL);
6113a292b1bSuch 	}
6123a292b1bSuch 
613723d09ceSdholland 	error = vn_open(NULL, pb, 0, FREAD, 0, &vp, NULL, NULL);
614ba474401Suwe 	if (error != 0) {
615ba474401Suwe 		PRINTF("%s: open failed, errno=%d\n", filename, error);
6165fcd084dSdholland 		pathbuf_destroy(pb);
617ba474401Suwe 		return (NULL);
6183a292b1bSuch 	}
6193a292b1bSuch 
6208f6ed30dSdholland 	pathbuf_destroy(pb);
621723d09ceSdholland 	return vp;
6223a292b1bSuch }
6233a292b1bSuch 
6243a292b1bSuch void
kloader_close(void)625df7f595eScegger kloader_close(void)
6263a292b1bSuch {
62795e1ffb1Schristos 	struct lwp *l = KLOADER_LWP;
6283a292b1bSuch 	struct vnode *vp = kloader.vp;
6293a292b1bSuch 
6301423e65bShannken 	VOP_UNLOCK(vp);
631a9ca7a37Sad 	vn_close(vp, FREAD, l->l_cred);
6323a292b1bSuch }
6333a292b1bSuch 
6343a292b1bSuch int
kloader_read(size_t ofs,size_t size,void * buf)6353a292b1bSuch kloader_read(size_t ofs, size_t size, void *buf)
6363a292b1bSuch {
63795e1ffb1Schristos 	struct lwp *l = KLOADER_LWP;
6383a292b1bSuch 	struct vnode *vp = kloader.vp;
6393a292b1bSuch 	size_t resid;
6403a292b1bSuch 	int error;
6413a292b1bSuch 
6423a292b1bSuch 	error = vn_rdwr(UIO_READ, vp, buf, size, ofs, UIO_SYSSPACE,
6433029ac48Sad 	    IO_NODELOCKED | IO_SYNC, l->l_cred, &resid, NULL);
6443a292b1bSuch 
6453a292b1bSuch 	if (error)
6463a292b1bSuch 		PRINTF("read error.\n");
6473a292b1bSuch 
6483a292b1bSuch 	return (error);
6493a292b1bSuch }
6503a292b1bSuch 
6513a292b1bSuch 
6523a292b1bSuch /*
6533a292b1bSuch  * bootinfo
6543a292b1bSuch  */
6553a292b1bSuch void
kloader_bootinfo_set(struct kloader_bootinfo * kbi,int argc,char * argv[],struct bootinfo * bi,int printok)6563a292b1bSuch kloader_bootinfo_set(struct kloader_bootinfo *kbi, int argc, char *argv[],
6573a292b1bSuch     struct bootinfo *bi, int printok)
6583a292b1bSuch {
6593a292b1bSuch 	char *p, *pend, *buf;
6603a292b1bSuch 	int i;
6613a292b1bSuch 
6623a292b1bSuch 	kloader.bootinfo = kbi;
6633a292b1bSuch 	buf = kbi->_argbuf;
6643a292b1bSuch 	if (bi != NULL)
6653a292b1bSuch 		memcpy(&kbi->bootinfo, bi, sizeof(struct bootinfo));
6663a292b1bSuch 	kbi->argc = argc;
6673a292b1bSuch 	kbi->argv = (char **)buf;
6683a292b1bSuch 
6693a292b1bSuch 	p = &buf[argc * sizeof(char **)];
6703a292b1bSuch 	pend = &buf[KLOADER_KERNELARGS_MAX - 1];
6713a292b1bSuch 
6723a292b1bSuch 	for (i = 0; i < argc; i++) {
6733a292b1bSuch 		char *q = argv[i];
6743a292b1bSuch 		int len = strlen(q) + 1;
6753a292b1bSuch 		if ((p + len) > pend) {
6763a292b1bSuch 			kloader.bootinfo = NULL;
6773a292b1bSuch 			if (printok)
6783a292b1bSuch 				PRINTF("buffer insufficient.\n");
6793a292b1bSuch 			return;
6803a292b1bSuch 		}
6813a292b1bSuch 		kbi->argv[i] = p;
6823a292b1bSuch 		memcpy(p, q, len);
6833a292b1bSuch 		p += len;
6843a292b1bSuch 	}
6853a292b1bSuch }
6863a292b1bSuch 
6873a292b1bSuch 
#ifdef KLOADER_DEBUG
/*
 * Print the page tag chain starting at kloader.tagstart.
 *
 * The first 15 tags are printed in full, later ones only if their source
 * or destination address is not 4-byte aligned.  The walk stops early at
 * a tag whose own address is misaligned.  The last tag visited is always
 * printed once more at the end.
 */
void
kloader_pagetag_dump(void)
{
	struct kloader_page_tag *cur, *last;
	bool show;
	int idx, limit;

	cur = kloader.tagstart;
	last = NULL;
	idx = 0;
	limit = 15;

	PRINTF("[page tag chain]\n");
	for (;;) {
		show = (idx < limit) ? TRUE : FALSE;
		if ((uint32_t)cur & 3) {
			printf("tag alignment error\n");
			break;
		}
		if ((cur->src & 3) || (cur->dst & 3)) {
			printf("data alignment error.\n");
			show = TRUE;
		}

		if (show) {
			printf("[%2d] next 0x%08x src 0x%08x dst 0x%08x"
			    " sz 0x%x\n", idx, cur->next, cur->src, cur->dst,
			    cur->sz);
		} else if (idx == limit) {
			printf("[...]\n");
		}
		last = cur;
		idx++;

		/* a zero "next" terminates the chain */
		cur = (struct kloader_page_tag *)(cur->next);
		if (cur == NULL)
			break;
	}

	if (last != NULL)
		printf("[%d(last)] next 0x%08x src 0x%08x dst 0x%08x sz 0x%x\n",
		    idx - 1, last->next, last->src, last->dst, last->sz);
}

#endif /* KLOADER_DEBUG */
731