xref: /netbsd-src/sys/dev/dkwedge/dk.c (revision 7f21db1c0118155e0dd40b75182e30c589d9f63e)
1 /*	$NetBSD: dk.c,v 1.55 2010/02/07 16:04:31 mlelstv Exp $	*/
2 
3 /*-
4  * Copyright (c) 2004, 2005, 2006, 2007 The NetBSD Foundation, Inc.
5  * All rights reserved.
6  *
7  * This code is derived from software contributed to The NetBSD Foundation
8  * by Jason R. Thorpe.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29  * POSSIBILITY OF SUCH DAMAGE.
30  */
31 
32 #include <sys/cdefs.h>
33 __KERNEL_RCSID(0, "$NetBSD: dk.c,v 1.55 2010/02/07 16:04:31 mlelstv Exp $");
34 
35 #ifdef _KERNEL_OPT
36 #include "opt_dkwedge.h"
37 #endif
38 
39 #include <sys/param.h>
40 #include <sys/systm.h>
41 #include <sys/proc.h>
42 #include <sys/errno.h>
43 #include <sys/pool.h>
44 #include <sys/ioctl.h>
45 #include <sys/disklabel.h>
46 #include <sys/disk.h>
47 #include <sys/fcntl.h>
48 #include <sys/buf.h>
49 #include <sys/bufq.h>
50 #include <sys/vnode.h>
51 #include <sys/stat.h>
52 #include <sys/conf.h>
53 #include <sys/callout.h>
54 #include <sys/kernel.h>
55 #include <sys/malloc.h>
56 #include <sys/device.h>
57 #include <sys/kauth.h>
58 
59 #include <miscfs/specfs/specdev.h>
60 
61 MALLOC_DEFINE(M_DKWEDGE, "dkwedge", "Disk wedge structures");
62 
63 typedef enum {
64 	DKW_STATE_LARVAL	= 0,
65 	DKW_STATE_RUNNING	= 1,
66 	DKW_STATE_DYING		= 2,
67 	DKW_STATE_DEAD		= 666
68 } dkwedge_state_t;
69 
70 struct dkwedge_softc {
71 	struct device	*sc_dev;	/* pointer to our pseudo-device */
72 	struct cfdata	sc_cfdata;	/* our cfdata structure */
73 	uint8_t		sc_wname[128];	/* wedge name (Unicode, UTF-8) */
74 
75 	dkwedge_state_t sc_state;	/* state this wedge is in */
76 
77 	struct disk	*sc_parent;	/* parent disk */
78 	daddr_t		sc_offset;	/* LBA offset of wedge in parent */
79 	uint64_t	sc_size;	/* size of wedge in blocks */
80 	char		sc_ptype[32];	/* partition type */
81 	dev_t		sc_pdev;	/* cached parent's dev_t */
82 					/* link on parent's wedge list */
83 	LIST_ENTRY(dkwedge_softc) sc_plink;
84 
85 	struct disk	sc_dk;		/* our own disk structure */
86 	struct bufq_state *sc_bufq;	/* buffer queue */
87 	struct callout	sc_restart_ch;	/* callout to restart I/O */
88 
89 	u_int		sc_iopend;	/* I/Os pending */
90 	int		sc_flags;	/* flags (splbio) */
91 };
92 
93 #define	DK_F_WAIT_DRAIN		0x0001	/* waiting for I/O to drain */
94 
95 static void	dkstart(struct dkwedge_softc *);
96 static void	dkiodone(struct buf *);
97 static void	dkrestart(void *);
98 static void	dkminphys(struct buf *);
99 
100 static int	dklastclose(struct dkwedge_softc *);
101 static int	dkwedge_detach(device_t, int);
102 
103 static dev_type_open(dkopen);
104 static dev_type_close(dkclose);
105 static dev_type_read(dkread);
106 static dev_type_write(dkwrite);
107 static dev_type_ioctl(dkioctl);
108 static dev_type_strategy(dkstrategy);
109 static dev_type_dump(dkdump);
110 static dev_type_size(dksize);
111 
112 const struct bdevsw dk_bdevsw = {
113 	dkopen, dkclose, dkstrategy, dkioctl, dkdump, dksize, D_DISK
114 };
115 
116 const struct cdevsw dk_cdevsw = {
117 	dkopen, dkclose, dkread, dkwrite, dkioctl,
118 	    nostop, notty, nopoll, nommap, nokqfilter, D_DISK
119 };
120 
121 static struct dkwedge_softc **dkwedges;
122 static u_int ndkwedges;
123 static krwlock_t dkwedges_lock;
124 
125 static LIST_HEAD(, dkwedge_discovery_method) dkwedge_discovery_methods;
126 static krwlock_t dkwedge_discovery_methods_lock;
127 
128 /*
129  * dkwedge_match:
130  *
131  *	Autoconfiguration match function for pseudo-device glue.
132  */
133 static int
134 dkwedge_match(device_t parent, cfdata_t match,
135     void *aux)
136 {
137 
138 	/* Pseudo-device; always present. */
139 	return (1);
140 }
141 
142 /*
143  * dkwedge_attach:
144  *
145  *	Autoconfiguration attach function for pseudo-device glue.
146  */
147 static void
148 dkwedge_attach(device_t parent, device_t self,
149     void *aux)
150 {
151 
152 	if (!pmf_device_register(self, NULL, NULL))
153 		aprint_error_dev(self, "couldn't establish power handler\n");
154 }
155 
156 CFDRIVER_DECL(dk, DV_DISK, NULL);
157 CFATTACH_DECL3_NEW(dk, 0,
158     dkwedge_match, dkwedge_attach, dkwedge_detach, NULL, NULL, NULL,
159     DVF_DETACH_SHUTDOWN);
160 
161 /*
162  * dkwedge_wait_drain:
163  *
164  *	Wait for I/O on the wedge to drain.
165  *	NOTE: Must be called at splbio()!
166  */
167 static void
168 dkwedge_wait_drain(struct dkwedge_softc *sc)
169 {
170 
171 	while (sc->sc_iopend != 0) {
172 		sc->sc_flags |= DK_F_WAIT_DRAIN;
173 		(void) tsleep(&sc->sc_iopend, PRIBIO, "dkdrn", 0);
174 	}
175 }
176 
177 /*
178  * dkwedge_compute_pdev:
179  *
180  *	Compute the parent disk's dev_t.
181  */
182 static int
183 dkwedge_compute_pdev(const char *pname, dev_t *pdevp)
184 {
185 	const char *name, *cp;
186 	int punit, pmaj;
187 	char devname[16];
188 
189 	name = pname;
190 	if ((pmaj = devsw_name2blk(name, devname, sizeof(devname))) == -1)
191 		return (ENODEV);
192 
193 	name += strlen(devname);
194 	for (cp = name, punit = 0; *cp >= '0' && *cp <= '9'; cp++)
195 		punit = (punit * 10) + (*cp - '0');
196 	if (cp == name) {
197 		/* Invalid parent disk name. */
198 		return (ENODEV);
199 	}
200 
201 	*pdevp = MAKEDISKDEV(pmaj, punit, RAW_PART);
202 
203 	return (0);
204 }
205 
206 /*
207  * dkwedge_array_expand:
208  *
209  *	Expand the dkwedges array.
210  */
211 static void
212 dkwedge_array_expand(void)
213 {
214 	int newcnt = ndkwedges + 16;
215 	struct dkwedge_softc **newarray, **oldarray;
216 
217 	newarray = malloc(newcnt * sizeof(*newarray), M_DKWEDGE,
218 	    M_WAITOK|M_ZERO);
219 	if ((oldarray = dkwedges) != NULL)
220 		memcpy(newarray, dkwedges, ndkwedges * sizeof(*newarray));
221 	dkwedges = newarray;
222 	ndkwedges = newcnt;
223 	if (oldarray != NULL)
224 		free(oldarray, M_DKWEDGE);
225 }
226 
227 static void
228 dkgetproperties(struct disk *disk, struct dkwedge_info *dkw)
229 {
230 	prop_dictionary_t disk_info, odisk_info, geom;
231 
232 	disk_info = prop_dictionary_create();
233 
234 	prop_dictionary_set_cstring_nocopy(disk_info, "type", "ESDI");
235 
236 	geom = prop_dictionary_create();
237 
238 	prop_dictionary_set_uint64(geom, "sectors-per-unit", dkw->dkw_size);
239 
240 	prop_dictionary_set_uint32(geom, "sector-size",
241 	    DEV_BSIZE /* XXX 512? */);
242 
243 	prop_dictionary_set_uint32(geom, "sectors-per-track", 32);
244 
245 	prop_dictionary_set_uint32(geom, "tracks-per-cylinder", 64);
246 
247 	prop_dictionary_set_uint32(geom, "cylinders-per-unit", dkw->dkw_size / 2048);
248 
249 	prop_dictionary_set(disk_info, "geometry", geom);
250 	prop_object_release(geom);
251 
252 	odisk_info = disk->dk_info;
253 
254 	disk->dk_info = disk_info;
255 
256 	if (odisk_info != NULL)
257 		prop_object_release(odisk_info);
258 }
259 
260 /*
261  * dkwedge_add:		[exported function]
262  *
263  *	Add a disk wedge based on the provided information.
264  *
265  *	The incoming dkw_devname[] is ignored, instead being
266  *	filled in and returned to the caller.
267  */
268 int
269 dkwedge_add(struct dkwedge_info *dkw)
270 {
271 	struct dkwedge_softc *sc, *lsc;
272 	struct disk *pdk;
273 	u_int unit;
274 	int error;
275 	dev_t pdev;
276 
277 	dkw->dkw_parent[sizeof(dkw->dkw_parent) - 1] = '\0';
278 	pdk = disk_find(dkw->dkw_parent);
279 	if (pdk == NULL)
280 		return (ENODEV);
281 
282 	error = dkwedge_compute_pdev(pdk->dk_name, &pdev);
283 	if (error)
284 		return (error);
285 
286 	if (dkw->dkw_offset < 0)
287 		return (EINVAL);
288 
289 	sc = malloc(sizeof(*sc), M_DKWEDGE, M_WAITOK|M_ZERO);
290 	sc->sc_state = DKW_STATE_LARVAL;
291 	sc->sc_parent = pdk;
292 	sc->sc_pdev = pdev;
293 	sc->sc_offset = dkw->dkw_offset;
294 	sc->sc_size = dkw->dkw_size;
295 
296 	memcpy(sc->sc_wname, dkw->dkw_wname, sizeof(sc->sc_wname));
297 	sc->sc_wname[sizeof(sc->sc_wname) - 1] = '\0';
298 
299 	memcpy(sc->sc_ptype, dkw->dkw_ptype, sizeof(sc->sc_ptype));
300 	sc->sc_ptype[sizeof(sc->sc_ptype) - 1] = '\0';
301 
302 	bufq_alloc(&sc->sc_bufq, "fcfs", 0);
303 
304 	callout_init(&sc->sc_restart_ch, 0);
305 	callout_setfunc(&sc->sc_restart_ch, dkrestart, sc);
306 
307 	/*
308 	 * Wedge will be added; increment the wedge count for the parent.
309 	 * Only allow this to happend if RAW_PART is the only thing open.
310 	 */
311 	mutex_enter(&pdk->dk_openlock);
312 	if (pdk->dk_openmask & ~(1 << RAW_PART))
313 		error = EBUSY;
314 	else {
315 		/* Check for wedge overlap. */
316 		LIST_FOREACH(lsc, &pdk->dk_wedges, sc_plink) {
317 			daddr_t lastblk = sc->sc_offset + sc->sc_size - 1;
318 			daddr_t llastblk = lsc->sc_offset + lsc->sc_size - 1;
319 
320 			if (sc->sc_offset >= lsc->sc_offset &&
321 			    sc->sc_offset <= llastblk) {
322 				/* Overlaps the tail of the exsiting wedge. */
323 				break;
324 			}
325 			if (lastblk >= lsc->sc_offset &&
326 			    lastblk <= llastblk) {
327 				/* Overlaps the head of the existing wedge. */
328 			    	break;
329 			}
330 		}
331 		if (lsc != NULL)
332 			error = EINVAL;
333 		else {
334 			pdk->dk_nwedges++;
335 			LIST_INSERT_HEAD(&pdk->dk_wedges, sc, sc_plink);
336 		}
337 	}
338 	mutex_exit(&pdk->dk_openlock);
339 	if (error) {
340 		bufq_free(sc->sc_bufq);
341 		free(sc, M_DKWEDGE);
342 		return (error);
343 	}
344 
345 	/* Fill in our cfdata for the pseudo-device glue. */
346 	sc->sc_cfdata.cf_name = dk_cd.cd_name;
347 	sc->sc_cfdata.cf_atname = dk_ca.ca_name;
348 	/* sc->sc_cfdata.cf_unit set below */
349 	sc->sc_cfdata.cf_fstate = FSTATE_STAR;
350 
351 	/* Insert the larval wedge into the array. */
352 	rw_enter(&dkwedges_lock, RW_WRITER);
353 	for (error = 0;;) {
354 		struct dkwedge_softc **scpp;
355 
356 		/*
357 		 * Check for a duplicate wname while searching for
358 		 * a slot.
359 		 */
360 		for (scpp = NULL, unit = 0; unit < ndkwedges; unit++) {
361 			if (dkwedges[unit] == NULL) {
362 				if (scpp == NULL) {
363 					scpp = &dkwedges[unit];
364 					sc->sc_cfdata.cf_unit = unit;
365 				}
366 			} else {
367 				/* XXX Unicode. */
368 				if (strcmp(dkwedges[unit]->sc_wname,
369 					   sc->sc_wname) == 0) {
370 					error = EEXIST;
371 					break;
372 				}
373 			}
374 		}
375 		if (error)
376 			break;
377 		KASSERT(unit == ndkwedges);
378 		if (scpp == NULL)
379 			dkwedge_array_expand();
380 		else {
381 			KASSERT(scpp == &dkwedges[sc->sc_cfdata.cf_unit]);
382 			*scpp = sc;
383 			break;
384 		}
385 	}
386 	rw_exit(&dkwedges_lock);
387 	if (error) {
388 		mutex_enter(&pdk->dk_openlock);
389 		pdk->dk_nwedges--;
390 		LIST_REMOVE(sc, sc_plink);
391 		mutex_exit(&pdk->dk_openlock);
392 
393 		bufq_free(sc->sc_bufq);
394 		free(sc, M_DKWEDGE);
395 		return (error);
396 	}
397 
398 	/*
399 	 * Now that we know the unit #, attach a pseudo-device for
400 	 * this wedge instance.  This will provide us with the
401 	 * "struct device" necessary for glue to other parts of the
402 	 * system.
403 	 *
404 	 * This should never fail, unless we're almost totally out of
405 	 * memory.
406 	 */
407 	if ((sc->sc_dev = config_attach_pseudo(&sc->sc_cfdata)) == NULL) {
408 		aprint_error("%s%u: unable to attach pseudo-device\n",
409 		    sc->sc_cfdata.cf_name, sc->sc_cfdata.cf_unit);
410 
411 		rw_enter(&dkwedges_lock, RW_WRITER);
412 		dkwedges[sc->sc_cfdata.cf_unit] = NULL;
413 		rw_exit(&dkwedges_lock);
414 
415 		mutex_enter(&pdk->dk_openlock);
416 		pdk->dk_nwedges--;
417 		LIST_REMOVE(sc, sc_plink);
418 		mutex_exit(&pdk->dk_openlock);
419 
420 		bufq_free(sc->sc_bufq);
421 		free(sc, M_DKWEDGE);
422 		return (ENOMEM);
423 	}
424 
425 	/* Return the devname to the caller. */
426 	strlcpy(dkw->dkw_devname, device_xname(sc->sc_dev),
427 		sizeof(dkw->dkw_devname));
428 
429 	/*
430 	 * XXX Really ought to make the disk_attach() and the changing
431 	 * of state to RUNNING atomic.
432 	 */
433 
434 	disk_init(&sc->sc_dk, device_xname(sc->sc_dev), NULL);
435 	dkgetproperties(&sc->sc_dk, dkw);
436 	disk_attach(&sc->sc_dk);
437 
438 	/* Disk wedge is ready for use! */
439 	sc->sc_state = DKW_STATE_RUNNING;
440 
441 	/* Announce our arrival. */
442 	aprint_normal("%s at %s: %s\n", device_xname(sc->sc_dev), pdk->dk_name,
443 	    sc->sc_wname);	/* XXX Unicode */
444 	aprint_normal("%s: %"PRIu64" blocks at %"PRId64", type: %s\n",
445 	    device_xname(sc->sc_dev), sc->sc_size, sc->sc_offset, sc->sc_ptype);
446 
447 	return (0);
448 }
449 
450 /*
451  * dkwedge_find:
452  *
453  *	Lookup a disk wedge based on the provided information.
454  *	NOTE: We look up the wedge based on the wedge devname,
455  *	not wname.
456  *
457  *	Return NULL if the wedge is not found, otherwise return
458  *	the wedge's softc.  Assign the wedge's unit number to unitp
459  *	if unitp is not NULL.
460  */
461 static struct dkwedge_softc *
462 dkwedge_find(struct dkwedge_info *dkw, u_int *unitp)
463 {
464 	struct dkwedge_softc *sc = NULL;
465 	u_int unit;
466 
467 	/* Find our softc. */
468 	dkw->dkw_devname[sizeof(dkw->dkw_devname) - 1] = '\0';
469 	rw_enter(&dkwedges_lock, RW_READER);
470 	for (unit = 0; unit < ndkwedges; unit++) {
471 		if ((sc = dkwedges[unit]) != NULL &&
472 		    strcmp(device_xname(sc->sc_dev), dkw->dkw_devname) == 0 &&
473 		    strcmp(sc->sc_parent->dk_name, dkw->dkw_parent) == 0) {
474 			break;
475 		}
476 	}
477 	rw_exit(&dkwedges_lock);
478 	if (unit == ndkwedges)
479 		return NULL;
480 
481 	if (unitp != NULL)
482 		*unitp = unit;
483 
484 	return sc;
485 }
486 
487 /*
488  * dkwedge_del:		[exported function]
489  *
490  *	Delete a disk wedge based on the provided information.
491  *	NOTE: We look up the wedge based on the wedge devname,
492  *	not wname.
493  */
494 int
495 dkwedge_del(struct dkwedge_info *dkw)
496 {
497 	struct dkwedge_softc *sc = NULL;
498 
499 	/* Find our softc. */
500 	if ((sc = dkwedge_find(dkw, NULL)) == NULL)
501 		return (ESRCH);
502 
503 	return config_detach(sc->sc_dev, DETACH_FORCE | DETACH_QUIET);
504 }
505 
506 static int
507 dkwedge_begindetach(struct dkwedge_softc *sc, int flags)
508 {
509 	struct disk *dk = &sc->sc_dk;
510 	int rc;
511 
512 	rc = 0;
513 	mutex_enter(&dk->dk_openlock);
514 	mutex_enter(&sc->sc_parent->dk_rawlock);
515 	if (dk->dk_openmask == 0)
516 		;	/* nothing to do */
517 	else if ((flags & DETACH_FORCE) == 0)
518 		rc = EBUSY;
519 	else
520 		rc = dklastclose(sc);
521 	mutex_exit(&sc->sc_parent->dk_rawlock);
522 	mutex_exit(&dk->dk_openlock);
523 
524 	return rc;
525 }
526 
527 /*
528  * dkwedge_detach:
529  *
530  *	Autoconfiguration detach function for pseudo-device glue.
531  */
532 static int
533 dkwedge_detach(device_t self, int flags)
534 {
535 	struct dkwedge_softc *sc = NULL;
536 	u_int unit;
537 	int bmaj, cmaj, rc, s;
538 
539 	rw_enter(&dkwedges_lock, RW_WRITER);
540 	for (unit = 0; unit < ndkwedges; unit++) {
541 		if ((sc = dkwedges[unit]) != NULL && sc->sc_dev == self)
542 			break;
543 	}
544 	if (unit == ndkwedges)
545 		rc = ENXIO;
546 	else if ((rc = dkwedge_begindetach(sc, flags)) == 0) {
547 		/* Mark the wedge as dying. */
548 		sc->sc_state = DKW_STATE_DYING;
549 	}
550 	rw_exit(&dkwedges_lock);
551 
552 	if (rc != 0)
553 		return rc;
554 
555 	pmf_device_deregister(self);
556 
557 	/* Locate the wedge major numbers. */
558 	bmaj = bdevsw_lookup_major(&dk_bdevsw);
559 	cmaj = cdevsw_lookup_major(&dk_cdevsw);
560 
561 	/* Kill any pending restart. */
562 	callout_stop(&sc->sc_restart_ch);
563 
564 	/*
565 	 * dkstart() will kill any queued buffers now that the
566 	 * state of the wedge is not RUNNING.  Once we've done
567 	 * that, wait for any other pending I/O to complete.
568 	 */
569 	s = splbio();
570 	dkstart(sc);
571 	dkwedge_wait_drain(sc);
572 	splx(s);
573 
574 	/* Nuke the vnodes for any open instances. */
575 	vdevgone(bmaj, unit, unit, VBLK);
576 	vdevgone(cmaj, unit, unit, VCHR);
577 
578 	/* Clean up the parent. */
579 	mutex_enter(&sc->sc_dk.dk_openlock);
580 	mutex_enter(&sc->sc_parent->dk_rawlock);
581 	if (sc->sc_dk.dk_openmask) {
582 		if (sc->sc_parent->dk_rawopens-- == 1) {
583 			KASSERT(sc->sc_parent->dk_rawvp != NULL);
584 			(void) vn_close(sc->sc_parent->dk_rawvp, FREAD | FWRITE,
585 			    NOCRED);
586 			sc->sc_parent->dk_rawvp = NULL;
587 		}
588 		sc->sc_dk.dk_openmask = 0;
589 	}
590 	mutex_exit(&sc->sc_parent->dk_rawlock);
591 	mutex_exit(&sc->sc_dk.dk_openlock);
592 
593 	/* Announce our departure. */
594 	aprint_normal("%s at %s (%s) deleted\n", device_xname(sc->sc_dev),
595 	    sc->sc_parent->dk_name,
596 	    sc->sc_wname);	/* XXX Unicode */
597 
598 	mutex_enter(&sc->sc_parent->dk_openlock);
599 	sc->sc_parent->dk_nwedges--;
600 	LIST_REMOVE(sc, sc_plink);
601 	mutex_exit(&sc->sc_parent->dk_openlock);
602 
603 	/* Delete our buffer queue. */
604 	bufq_free(sc->sc_bufq);
605 
606 	/* Detach from the disk list. */
607 	disk_detach(&sc->sc_dk);
608 	disk_destroy(&sc->sc_dk);
609 
610 	/* Poof. */
611 	rw_enter(&dkwedges_lock, RW_WRITER);
612 	dkwedges[unit] = NULL;
613 	sc->sc_state = DKW_STATE_DEAD;
614 	rw_exit(&dkwedges_lock);
615 
616 	free(sc, M_DKWEDGE);
617 
618 	return 0;
619 }
620 
621 /*
622  * dkwedge_delall:	[exported function]
623  *
624  *	Delete all of the wedges on the specified disk.  Used when
625  *	a disk is being detached.
626  */
627 void
628 dkwedge_delall(struct disk *pdk)
629 {
630 	struct dkwedge_info dkw;
631 	struct dkwedge_softc *sc;
632 
633 	for (;;) {
634 		mutex_enter(&pdk->dk_openlock);
635 		if ((sc = LIST_FIRST(&pdk->dk_wedges)) == NULL) {
636 			KASSERT(pdk->dk_nwedges == 0);
637 			mutex_exit(&pdk->dk_openlock);
638 			return;
639 		}
640 		strcpy(dkw.dkw_parent, pdk->dk_name);
641 		strlcpy(dkw.dkw_devname, device_xname(sc->sc_dev),
642 			sizeof(dkw.dkw_devname));
643 		mutex_exit(&pdk->dk_openlock);
644 		(void) dkwedge_del(&dkw);
645 	}
646 }
647 
648 /*
649  * dkwedge_list:	[exported function]
650  *
651  *	List all of the wedges on a particular disk.
652  *	If p == NULL, the buffer is in kernel space.  Otherwise, it is
653  *	in user space of the specified process.
654  */
655 int
656 dkwedge_list(struct disk *pdk, struct dkwedge_list *dkwl, struct lwp *l)
657 {
658 	struct uio uio;
659 	struct iovec iov;
660 	struct dkwedge_softc *sc;
661 	struct dkwedge_info dkw;
662 	int error = 0;
663 
664 	iov.iov_base = dkwl->dkwl_buf;
665 	iov.iov_len = dkwl->dkwl_bufsize;
666 
667 	uio.uio_iov = &iov;
668 	uio.uio_iovcnt = 1;
669 	uio.uio_offset = 0;
670 	uio.uio_resid = dkwl->dkwl_bufsize;
671 	uio.uio_rw = UIO_READ;
672 	KASSERT(l == curlwp);
673 	uio.uio_vmspace = l->l_proc->p_vmspace;
674 
675 	dkwl->dkwl_ncopied = 0;
676 
677 	mutex_enter(&pdk->dk_openlock);
678 	LIST_FOREACH(sc, &pdk->dk_wedges, sc_plink) {
679 		if (uio.uio_resid < sizeof(dkw))
680 			break;
681 
682 		if (sc->sc_state != DKW_STATE_RUNNING)
683 			continue;
684 
685 		strlcpy(dkw.dkw_devname, device_xname(sc->sc_dev),
686 			sizeof(dkw.dkw_devname));
687 		memcpy(dkw.dkw_wname, sc->sc_wname, sizeof(dkw.dkw_wname));
688 		dkw.dkw_wname[sizeof(dkw.dkw_wname) - 1] = '\0';
689 		strcpy(dkw.dkw_parent, sc->sc_parent->dk_name);
690 		dkw.dkw_offset = sc->sc_offset;
691 		dkw.dkw_size = sc->sc_size;
692 		strcpy(dkw.dkw_ptype, sc->sc_ptype);
693 
694 		error = uiomove(&dkw, sizeof(dkw), &uio);
695 		if (error)
696 			break;
697 		dkwl->dkwl_ncopied++;
698 	}
699 	dkwl->dkwl_nwedges = pdk->dk_nwedges;
700 	mutex_exit(&pdk->dk_openlock);
701 
702 	return (error);
703 }
704 
705 device_t
706 dkwedge_find_by_wname(const char *wname)
707 {
708 	device_t dv = NULL;
709 	struct dkwedge_softc *sc;
710 	int i;
711 
712 	rw_enter(&dkwedges_lock, RW_WRITER);
713 	for (i = 0; i < ndkwedges; i++) {
714 		if ((sc = dkwedges[i]) == NULL)
715 			continue;
716 		if (strcmp(sc->sc_wname, wname) == 0) {
717 			if (dv != NULL) {
718 				printf(
719 				    "WARNING: double match for wedge name %s "
720 				    "(%s, %s)\n", wname, device_xname(dv),
721 				    device_xname(sc->sc_dev));
722 				continue;
723 			}
724 			dv = sc->sc_dev;
725 		}
726 	}
727 	rw_exit(&dkwedges_lock);
728 	return dv;
729 }
730 
731 void
732 dkwedge_print_wnames(void)
733 {
734 	struct dkwedge_softc *sc;
735 	int i;
736 
737 	rw_enter(&dkwedges_lock, RW_WRITER);
738 	for (i = 0; i < ndkwedges; i++) {
739 		if ((sc = dkwedges[i]) == NULL)
740 			continue;
741 		printf(" wedge:%s", sc->sc_wname);
742 	}
743 	rw_exit(&dkwedges_lock);
744 }
745 
746 /*
747  * dkwedge_set_bootwedge
748  *
749  *	Set the booted_wedge global based on the specified parent name
750  *	and offset/length.
751  */
752 void
753 dkwedge_set_bootwedge(device_t parent, daddr_t startblk, uint64_t nblks)
754 {
755 	struct dkwedge_softc *sc;
756 	int i;
757 
758 	rw_enter(&dkwedges_lock, RW_WRITER);
759 	for (i = 0; i < ndkwedges; i++) {
760 		if ((sc = dkwedges[i]) == NULL)
761 			continue;
762 		if (strcmp(sc->sc_parent->dk_name, device_xname(parent)) == 0 &&
763 		    sc->sc_offset == startblk &&
764 		    sc->sc_size == nblks) {
765 			if (booted_wedge) {
766 				printf("WARNING: double match for boot wedge "
767 				    "(%s, %s)\n",
768 				    device_xname(booted_wedge),
769 				    device_xname(sc->sc_dev));
770 				continue;
771 			}
772 			booted_device = parent;
773 			booted_wedge = sc->sc_dev;
774 			booted_partition = 0;
775 		}
776 	}
777 	/*
778 	 * XXX What if we don't find one?  Should we create a special
779 	 * XXX root wedge?
780 	 */
781 	rw_exit(&dkwedges_lock);
782 }
783 
784 /*
785  * We need a dummy object to stuff into the dkwedge discovery method link
786  * set to ensure that there is always at least one object in the set.
787  */
788 static struct dkwedge_discovery_method dummy_discovery_method;
789 __link_set_add_bss(dkwedge_methods, dummy_discovery_method);
790 
791 /*
792  * dkwedge_init:
793  *
794  *	Initialize the disk wedge subsystem.
795  */
796 void
797 dkwedge_init(void)
798 {
799 	__link_set_decl(dkwedge_methods, struct dkwedge_discovery_method);
800 	struct dkwedge_discovery_method * const *ddmp;
801 	struct dkwedge_discovery_method *lddm, *ddm;
802 
803 	rw_init(&dkwedges_lock);
804 	rw_init(&dkwedge_discovery_methods_lock);
805 
806 	if (config_cfdriver_attach(&dk_cd) != 0)
807 		panic("dkwedge: unable to attach cfdriver");
808 	if (config_cfattach_attach(dk_cd.cd_name, &dk_ca) != 0)
809 		panic("dkwedge: unable to attach cfattach");
810 
811 	rw_enter(&dkwedge_discovery_methods_lock, RW_WRITER);
812 
813 	LIST_INIT(&dkwedge_discovery_methods);
814 
815 	__link_set_foreach(ddmp, dkwedge_methods) {
816 		ddm = *ddmp;
817 		if (ddm == &dummy_discovery_method)
818 			continue;
819 		if (LIST_EMPTY(&dkwedge_discovery_methods)) {
820 			LIST_INSERT_HEAD(&dkwedge_discovery_methods,
821 					 ddm, ddm_list);
822 			continue;
823 		}
824 		LIST_FOREACH(lddm, &dkwedge_discovery_methods, ddm_list) {
825 			if (ddm->ddm_priority == lddm->ddm_priority) {
826 				aprint_error("dk-method-%s: method \"%s\" "
827 				    "already exists at priority %d\n",
828 				    ddm->ddm_name, lddm->ddm_name,
829 				    lddm->ddm_priority);
830 				/* Not inserted. */
831 				break;
832 			}
833 			if (ddm->ddm_priority < lddm->ddm_priority) {
834 				/* Higher priority; insert before. */
835 				LIST_INSERT_BEFORE(lddm, ddm, ddm_list);
836 				break;
837 			}
838 			if (LIST_NEXT(lddm, ddm_list) == NULL) {
839 				/* Last one; insert after. */
840 				KASSERT(lddm->ddm_priority < ddm->ddm_priority);
841 				LIST_INSERT_AFTER(lddm, ddm, ddm_list);
842 				break;
843 			}
844 		}
845 	}
846 
847 	rw_exit(&dkwedge_discovery_methods_lock);
848 }
849 
850 #ifdef DKWEDGE_AUTODISCOVER
851 int	dkwedge_autodiscover = 1;
852 #else
853 int	dkwedge_autodiscover = 0;
854 #endif
855 
856 /*
857  * dkwedge_discover:	[exported function]
858  *
859  *	Discover the wedges on a newly attached disk.
860  */
861 void
862 dkwedge_discover(struct disk *pdk)
863 {
864 	struct dkwedge_discovery_method *ddm;
865 	struct vnode *vp;
866 	int error;
867 	dev_t pdev;
868 
869 	/*
870 	 * Require people playing with wedges to enable this explicitly.
871 	 */
872 	if (dkwedge_autodiscover == 0)
873 		return;
874 
875 	rw_enter(&dkwedge_discovery_methods_lock, RW_READER);
876 
877 	error = dkwedge_compute_pdev(pdk->dk_name, &pdev);
878 	if (error) {
879 		aprint_error("%s: unable to compute pdev, error = %d\n",
880 		    pdk->dk_name, error);
881 		goto out;
882 	}
883 
884 	error = bdevvp(pdev, &vp);
885 	if (error) {
886 		aprint_error("%s: unable to find vnode for pdev, error = %d\n",
887 		    pdk->dk_name, error);
888 		goto out;
889 	}
890 
891 	error = vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
892 	if (error) {
893 		aprint_error("%s: unable to lock vnode for pdev, error = %d\n",
894 		    pdk->dk_name, error);
895 		vrele(vp);
896 		goto out;
897 	}
898 
899 	error = VOP_OPEN(vp, FREAD, NOCRED);
900 	if (error) {
901 		aprint_error("%s: unable to open device, error = %d\n",
902 		    pdk->dk_name, error);
903 		vput(vp);
904 		goto out;
905 	}
906 	VOP_UNLOCK(vp, 0);
907 
908 	/*
909 	 * For each supported partition map type, look to see if
910 	 * this map type exists.  If so, parse it and add the
911 	 * corresponding wedges.
912 	 */
913 	LIST_FOREACH(ddm, &dkwedge_discovery_methods, ddm_list) {
914 		error = (*ddm->ddm_discover)(pdk, vp);
915 		if (error == 0) {
916 			/* Successfully created wedges; we're done. */
917 			break;
918 		}
919 	}
920 
921 	error = vn_close(vp, FREAD, NOCRED);
922 	if (error) {
923 		aprint_error("%s: unable to close device, error = %d\n",
924 		    pdk->dk_name, error);
925 		/* We'll just assume the vnode has been cleaned up. */
926 	}
927  out:
928 	rw_exit(&dkwedge_discovery_methods_lock);
929 }
930 
931 /*
932  * dkwedge_read:
933  *
934  *	Read some data from the specified disk, used for
935  *	partition discovery.
936  */
937 int
938 dkwedge_read(struct disk *pdk, struct vnode *vp, daddr_t blkno,
939     void *tbuf, size_t len)
940 {
941 	struct buf *bp;
942 	int result;
943 
944 	bp = getiobuf(vp, true);
945 
946 	bp->b_dev = vp->v_rdev;
947 	bp->b_blkno = blkno;
948 	bp->b_bcount = len;
949 	bp->b_resid = len;
950 	bp->b_flags = B_READ;
951 	bp->b_data = tbuf;
952 	SET(bp->b_cflags, BC_BUSY);	/* mark buffer busy */
953 
954 	VOP_STRATEGY(vp, bp);
955 	result = biowait(bp);
956 	putiobuf(bp);
957 
958 	return result;
959 }
960 
961 /*
962  * dkwedge_lookup:
963  *
964  *	Look up a dkwedge_softc based on the provided dev_t.
965  */
966 static struct dkwedge_softc *
967 dkwedge_lookup(dev_t dev)
968 {
969 	int unit = minor(dev);
970 
971 	if (unit >= ndkwedges)
972 		return (NULL);
973 
974 	KASSERT(dkwedges != NULL);
975 
976 	return (dkwedges[unit]);
977 }
978 
979 /*
980  * dkopen:		[devsw entry point]
981  *
982  *	Open a wedge.
983  */
984 static int
985 dkopen(dev_t dev, int flags, int fmt, struct lwp *l)
986 {
987 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
988 	struct vnode *vp;
989 	int error = 0;
990 
991 	if (sc == NULL)
992 		return (ENODEV);
993 
994 	if (sc->sc_state != DKW_STATE_RUNNING)
995 		return (ENXIO);
996 
997 	/*
998 	 * We go through a complicated little dance to only open the parent
999 	 * vnode once per wedge, no matter how many times the wedge is
1000 	 * opened.  The reason?  We see one dkopen() per open call, but
1001 	 * only dkclose() on the last close.
1002 	 */
1003 	mutex_enter(&sc->sc_dk.dk_openlock);
1004 	mutex_enter(&sc->sc_parent->dk_rawlock);
1005 	if (sc->sc_dk.dk_openmask == 0) {
1006 		if (sc->sc_parent->dk_rawopens == 0) {
1007 			KASSERT(sc->sc_parent->dk_rawvp == NULL);
1008 			error = bdevvp(sc->sc_pdev, &vp);
1009 			if (error)
1010 				goto popen_fail;
1011 			error = vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
1012 			if (error) {
1013 				vrele(vp);
1014 				goto popen_fail;
1015 			}
1016 			error = VOP_OPEN(vp, FREAD | FWRITE, NOCRED);
1017 			if (error) {
1018 				vput(vp);
1019 				goto popen_fail;
1020 			}
1021 			/* VOP_OPEN() doesn't do this for us. */
1022 			mutex_enter(&vp->v_interlock);
1023 			vp->v_writecount++;
1024 			mutex_exit(&vp->v_interlock);
1025 			VOP_UNLOCK(vp, 0);
1026 			sc->sc_parent->dk_rawvp = vp;
1027 		}
1028 		sc->sc_parent->dk_rawopens++;
1029 	}
1030 	if (fmt == S_IFCHR)
1031 		sc->sc_dk.dk_copenmask |= 1;
1032 	else
1033 		sc->sc_dk.dk_bopenmask |= 1;
1034 	sc->sc_dk.dk_openmask =
1035 	    sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
1036 
1037  popen_fail:
1038 	mutex_exit(&sc->sc_parent->dk_rawlock);
1039 	mutex_exit(&sc->sc_dk.dk_openlock);
1040 	return (error);
1041 }
1042 
1043 /*
1044  * Caller must hold sc->sc_dk.dk_openlock and sc->sc_parent->dk_rawlock.
1045  */
1046 static int
1047 dklastclose(struct dkwedge_softc *sc)
1048 {
1049 	int error = 0;
1050 
1051 	if (sc->sc_parent->dk_rawopens-- == 1) {
1052 		KASSERT(sc->sc_parent->dk_rawvp != NULL);
1053 		error = vn_close(sc->sc_parent->dk_rawvp,
1054 		    FREAD | FWRITE, NOCRED);
1055 		sc->sc_parent->dk_rawvp = NULL;
1056 	}
1057 	return error;
1058 }
1059 
1060 /*
1061  * dkclose:		[devsw entry point]
1062  *
1063  *	Close a wedge.
1064  */
1065 static int
1066 dkclose(dev_t dev, int flags, int fmt, struct lwp *l)
1067 {
1068 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1069 	int error = 0;
1070 
1071 	KASSERT(sc->sc_dk.dk_openmask != 0);
1072 
1073 	mutex_enter(&sc->sc_dk.dk_openlock);
1074 	mutex_enter(&sc->sc_parent->dk_rawlock);
1075 
1076 	if (fmt == S_IFCHR)
1077 		sc->sc_dk.dk_copenmask &= ~1;
1078 	else
1079 		sc->sc_dk.dk_bopenmask &= ~1;
1080 	sc->sc_dk.dk_openmask =
1081 	    sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
1082 
1083 	if (sc->sc_dk.dk_openmask == 0)
1084 		error = dklastclose(sc);
1085 
1086 	mutex_exit(&sc->sc_parent->dk_rawlock);
1087 	mutex_exit(&sc->sc_dk.dk_openlock);
1088 
1089 	return (error);
1090 }
1091 
1092 /*
1093  * dkstragegy:		[devsw entry point]
1094  *
1095  *	Perform I/O based on the wedge I/O strategy.
1096  */
1097 static void
1098 dkstrategy(struct buf *bp)
1099 {
1100 	struct dkwedge_softc *sc = dkwedge_lookup(bp->b_dev);
1101 	uint64_t p_size, p_offset;
1102 	int s;
1103 
1104 	if (sc->sc_state != DKW_STATE_RUNNING) {
1105 		bp->b_error = ENXIO;
1106 		goto done;
1107 	}
1108 
1109 	/* If it's an empty transfer, wake up the top half now. */
1110 	if (bp->b_bcount == 0)
1111 		goto done;
1112 
1113 	p_offset = sc->sc_offset << sc->sc_parent->dk_blkshift;
1114 	p_size   = sc->sc_size << sc->sc_parent->dk_blkshift;
1115 
1116 	/* Make sure it's in-range. */
1117 	if (bounds_check_with_mediasize(bp, DEV_BSIZE, p_size) <= 0)
1118 		goto done;
1119 
1120 	/* Translate it to the parent's raw LBA. */
1121 	bp->b_rawblkno = bp->b_blkno + p_offset;
1122 
1123 	/* Place it in the queue and start I/O on the unit. */
1124 	s = splbio();
1125 	sc->sc_iopend++;
1126 	bufq_put(sc->sc_bufq, bp);
1127 	dkstart(sc);
1128 	splx(s);
1129 	return;
1130 
1131  done:
1132 	bp->b_resid = bp->b_bcount;
1133 	biodone(bp);
1134 }
1135 
1136 /*
1137  * dkstart:
1138  *
1139  *	Start I/O that has been enqueued on the wedge.
1140  *	NOTE: Must be called at splbio()!
1141  */
1142 static void
1143 dkstart(struct dkwedge_softc *sc)
1144 {
1145 	struct vnode *vp;
1146 	struct buf *bp, *nbp;
1147 
1148 	/* Do as much work as has been enqueued. */
1149 	while ((bp = bufq_peek(sc->sc_bufq)) != NULL) {
1150 		if (sc->sc_state != DKW_STATE_RUNNING) {
1151 			(void) bufq_get(sc->sc_bufq);
1152 			if (sc->sc_iopend-- == 1 &&
1153 			    (sc->sc_flags & DK_F_WAIT_DRAIN) != 0) {
1154 				sc->sc_flags &= ~DK_F_WAIT_DRAIN;
1155 				wakeup(&sc->sc_iopend);
1156 			}
1157 			bp->b_error = ENXIO;
1158 			bp->b_resid = bp->b_bcount;
1159 			biodone(bp);
1160 		}
1161 
1162 		/* Instrumentation. */
1163 		disk_busy(&sc->sc_dk);
1164 
1165 		nbp = getiobuf(sc->sc_parent->dk_rawvp, false);
1166 		if (nbp == NULL) {
1167 			/*
1168 			 * No resources to run this request; leave the
1169 			 * buffer queued up, and schedule a timer to
1170 			 * restart the queue in 1/2 a second.
1171 			 */
1172 			disk_unbusy(&sc->sc_dk, 0, bp->b_flags & B_READ);
1173 			callout_schedule(&sc->sc_restart_ch, hz / 2);
1174 			return;
1175 		}
1176 
1177 		(void) bufq_get(sc->sc_bufq);
1178 
1179 		nbp->b_data = bp->b_data;
1180 		nbp->b_flags = bp->b_flags;
1181 		nbp->b_oflags = bp->b_oflags;
1182 		nbp->b_cflags = bp->b_cflags;
1183 		nbp->b_iodone = dkiodone;
1184 		nbp->b_proc = bp->b_proc;
1185 		nbp->b_blkno = bp->b_rawblkno;
1186 		nbp->b_dev = sc->sc_parent->dk_rawvp->v_rdev;
1187 		nbp->b_bcount = bp->b_bcount;
1188 		nbp->b_private = bp;
1189 		BIO_COPYPRIO(nbp, bp);
1190 
1191 		vp = nbp->b_vp;
1192 		if ((nbp->b_flags & B_READ) == 0) {
1193 			mutex_enter(&vp->v_interlock);
1194 			vp->v_numoutput++;
1195 			mutex_exit(&vp->v_interlock);
1196 		}
1197 		VOP_STRATEGY(vp, nbp);
1198 	}
1199 }
1200 
1201 /*
1202  * dkiodone:
1203  *
1204  *	I/O to a wedge has completed; alert the top half.
1205  */
1206 static void
1207 dkiodone(struct buf *bp)
1208 {
1209 	struct buf *obp = bp->b_private;
1210 	struct dkwedge_softc *sc = dkwedge_lookup(obp->b_dev);
1211 
1212 	int s = splbio();
1213 
1214 	if (bp->b_error != 0)
1215 		obp->b_error = bp->b_error;
1216 	obp->b_resid = bp->b_resid;
1217 	putiobuf(bp);
1218 
1219 	if (sc->sc_iopend-- == 1 && (sc->sc_flags & DK_F_WAIT_DRAIN) != 0) {
1220 		sc->sc_flags &= ~DK_F_WAIT_DRAIN;
1221 		wakeup(&sc->sc_iopend);
1222 	}
1223 
1224 	disk_unbusy(&sc->sc_dk, obp->b_bcount - obp->b_resid,
1225 	    obp->b_flags & B_READ);
1226 
1227 	biodone(obp);
1228 
1229 	/* Kick the queue in case there is more work we can do. */
1230 	dkstart(sc);
1231 	splx(s);
1232 }
1233 
1234 /*
1235  * dkrestart:
1236  *
1237  *	Restart the work queue after it was stalled due to
1238  *	a resource shortage.  Invoked via a callout.
1239  */
1240 static void
1241 dkrestart(void *v)
1242 {
1243 	struct dkwedge_softc *sc = v;
1244 	int s;
1245 
1246 	s = splbio();
1247 	dkstart(sc);
1248 	splx(s);
1249 }
1250 
1251 /*
1252  * dkminphys:
1253  *
1254  *	Call parent's minphys function.
1255  */
1256 static void
1257 dkminphys(struct buf *bp)
1258 {
1259 	struct dkwedge_softc *sc = dkwedge_lookup(bp->b_dev);
1260 	dev_t dev;
1261 
1262 	dev = bp->b_dev;
1263 	bp->b_dev = sc->sc_pdev;
1264 	(*sc->sc_parent->dk_driver->d_minphys)(bp);
1265 	bp->b_dev = dev;
1266 }
1267 
1268 /*
1269  * dkread:		[devsw entry point]
1270  *
1271  *	Read from a wedge.
1272  */
1273 static int
1274 dkread(dev_t dev, struct uio *uio, int flags)
1275 {
1276 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1277 
1278 	if (sc->sc_state != DKW_STATE_RUNNING)
1279 		return (ENXIO);
1280 
1281 	return (physio(dkstrategy, NULL, dev, B_READ, dkminphys, uio));
1282 }
1283 
1284 /*
1285  * dkwrite:		[devsw entry point]
1286  *
1287  *	Write to a wedge.
1288  */
1289 static int
1290 dkwrite(dev_t dev, struct uio *uio, int flags)
1291 {
1292 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1293 
1294 	if (sc->sc_state != DKW_STATE_RUNNING)
1295 		return (ENXIO);
1296 
1297 	return (physio(dkstrategy, NULL, dev, B_WRITE, dkminphys, uio));
1298 }
1299 
1300 /*
1301  * dkioctl:		[devsw entry point]
1302  *
1303  *	Perform an ioctl request on a wedge.
1304  */
1305 static int
1306 dkioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1307 {
1308 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1309 	int error = 0;
1310 
1311 	if (sc->sc_state != DKW_STATE_RUNNING)
1312 		return (ENXIO);
1313 
1314 	error = disk_ioctl(&sc->sc_dk, cmd, data, flag, l);
1315 	if (error != EPASSTHROUGH)
1316 		return (error);
1317 
1318 	error = 0;
1319 
1320 	switch (cmd) {
1321 	case DIOCCACHESYNC:
1322 		/*
1323 		 * XXX Do we really need to care about having a writable
1324 		 * file descriptor here?
1325 		 */
1326 		if ((flag & FWRITE) == 0)
1327 			error = EBADF;
1328 		else
1329 			error = VOP_IOCTL(sc->sc_parent->dk_rawvp,
1330 					  cmd, data, flag,
1331 					  l != NULL ? l->l_cred : NOCRED);
1332 		break;
1333 	case DIOCGWEDGEINFO:
1334 	    {
1335 		struct dkwedge_info *dkw = (void *) data;
1336 
1337 		strlcpy(dkw->dkw_devname, device_xname(sc->sc_dev),
1338 			sizeof(dkw->dkw_devname));
1339 	    	memcpy(dkw->dkw_wname, sc->sc_wname, sizeof(dkw->dkw_wname));
1340 		dkw->dkw_wname[sizeof(dkw->dkw_wname) - 1] = '\0';
1341 		strcpy(dkw->dkw_parent, sc->sc_parent->dk_name);
1342 		dkw->dkw_offset = sc->sc_offset;
1343 		dkw->dkw_size = sc->sc_size;
1344 		strcpy(dkw->dkw_ptype, sc->sc_ptype);
1345 
1346 		break;
1347 	    }
1348 
1349 	default:
1350 		error = ENOTTY;
1351 	}
1352 
1353 	return (error);
1354 }
1355 
1356 /*
1357  * dksize:		[devsw entry point]
1358  *
1359  *	Query the size of a wedge for the purpose of performing a dump
1360  *	or for swapping to.
1361  */
1362 static int
1363 dksize(dev_t dev)
1364 {
1365 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1366 	int rv = -1;
1367 
1368 	if (sc == NULL)
1369 		return (-1);
1370 
1371 	if (sc->sc_state != DKW_STATE_RUNNING)
1372 		return (-1);
1373 
1374 	mutex_enter(&sc->sc_dk.dk_openlock);
1375 	mutex_enter(&sc->sc_parent->dk_rawlock);
1376 
1377 	/* Our content type is static, no need to open the device. */
1378 
1379 	if (strcmp(sc->sc_ptype, DKW_PTYPE_SWAP) == 0) {
1380 		/* Saturate if we are larger than INT_MAX. */
1381 		if (sc->sc_size > INT_MAX)
1382 			rv = INT_MAX;
1383 		else
1384 			rv = (int) sc->sc_size;
1385 	}
1386 
1387 	mutex_exit(&sc->sc_parent->dk_rawlock);
1388 	mutex_exit(&sc->sc_dk.dk_openlock);
1389 
1390 	return (rv);
1391 }
1392 
1393 /*
1394  * dkdump:		[devsw entry point]
1395  *
1396  *	Perform a crash dump to a wedge.
1397  */
1398 static int
1399 dkdump(dev_t dev, daddr_t blkno, void *va, size_t size)
1400 {
1401 	struct dkwedge_softc *sc = dkwedge_lookup(dev);
1402 	const struct bdevsw *bdev;
1403 	int rv = 0;
1404 
1405 	if (sc == NULL)
1406 		return (ENXIO);
1407 
1408 	if (sc->sc_state != DKW_STATE_RUNNING)
1409 		return (ENXIO);
1410 
1411 	mutex_enter(&sc->sc_dk.dk_openlock);
1412 	mutex_enter(&sc->sc_parent->dk_rawlock);
1413 
1414 	/* Our content type is static, no need to open the device. */
1415 
1416 	if (strcmp(sc->sc_ptype, DKW_PTYPE_SWAP) != 0) {
1417 		rv = ENXIO;
1418 		goto out;
1419 	}
1420 	if (size % DEV_BSIZE != 0) {
1421 		rv = EINVAL;
1422 		goto out;
1423 	}
1424 	if (blkno + size / DEV_BSIZE > sc->sc_size) {
1425 		printf("%s: blkno (%" PRIu64 ") + size / DEV_BSIZE (%zu) > "
1426 		    "sc->sc_size (%" PRIu64 ")\n", __func__, blkno,
1427 		    size / DEV_BSIZE, sc->sc_size);
1428 		rv = EINVAL;
1429 		goto out;
1430 	}
1431 
1432 	bdev = bdevsw_lookup(sc->sc_pdev);
1433 	rv = (*bdev->d_dump)(sc->sc_pdev, blkno + sc->sc_offset, va, size);
1434 
1435 out:
1436 	mutex_exit(&sc->sc_parent->dk_rawlock);
1437 	mutex_exit(&sc->sc_dk.dk_openlock);
1438 
1439 	return rv;
1440 }
1441 
1442 /*
1443  * config glue
1444  */
1445 
1446 int
1447 config_handle_wedges(struct device *dv, int par)
1448 {
1449 	struct dkwedge_list wl;
1450 	struct dkwedge_info *wi;
1451 	struct vnode *vn;
1452 	char diskname[16];
1453 	int i, error;
1454 
1455 	if ((vn = opendisk(dv)) == NULL)
1456 		return -1;
1457 
1458 	wl.dkwl_bufsize = sizeof(*wi) * 16;
1459 	wl.dkwl_buf = wi = malloc(wl.dkwl_bufsize, M_TEMP, M_WAITOK);
1460 
1461 	error = VOP_IOCTL(vn, DIOCLWEDGES, &wl, FREAD, NOCRED);
1462 	VOP_CLOSE(vn, FREAD, NOCRED);
1463 	vput(vn);
1464 	if (error) {
1465 #ifdef DEBUG_WEDGE
1466 		printf("%s: List wedges returned %d\n",
1467 		    device_xname(dv), error);
1468 #endif
1469 		free(wi, M_TEMP);
1470 		return -1;
1471 	}
1472 
1473 #ifdef DEBUG_WEDGE
1474 	printf("%s: Returned %u(%u) wedges\n", device_xname(dv),
1475 	    wl.dkwl_nwedges, wl.dkwl_ncopied);
1476 #endif
1477 	snprintf(diskname, sizeof(diskname), "%s%c", device_xname(dv),
1478 	    par + 'a');
1479 
1480 	for (i = 0; i < wl.dkwl_ncopied; i++) {
1481 #ifdef DEBUG_WEDGE
1482 		printf("%s: Looking for %s in %s\n",
1483 		    device_xname(dv), diskname, wi[i].dkw_wname);
1484 #endif
1485 		if (strcmp(wi[i].dkw_wname, diskname) == 0)
1486 			break;
1487 	}
1488 
1489 	if (i == wl.dkwl_ncopied) {
1490 #ifdef DEBUG_WEDGE
1491 		printf("%s: Cannot find wedge with parent %s\n",
1492 		    device_xname(dv), diskname);
1493 #endif
1494 		free(wi, M_TEMP);
1495 		return -1;
1496 	}
1497 
1498 #ifdef DEBUG_WEDGE
1499 	printf("%s: Setting boot wedge %s (%s) at %llu %llu\n",
1500 		device_xname(dv), wi[i].dkw_devname, wi[i].dkw_wname,
1501 		(unsigned long long)wi[i].dkw_offset,
1502 		(unsigned long long)wi[i].dkw_size);
1503 #endif
1504 	dkwedge_set_bootwedge(dv, wi[i].dkw_offset, wi[i].dkw_size);
1505 	free(wi, M_TEMP);
1506 	return 0;
1507 }
1508