xref: /dflybsd-src/sys/dev/disk/md/md.c (revision ae788f37fe53d5d1ca1e12a184a662192caad3c5)
1 /*
2  * ----------------------------------------------------------------------------
3  * "THE BEER-WARE LICENSE" (Revision 42):
4  * <phk@FreeBSD.ORG> wrote this file.  As long as you retain this notice you
5  * can do whatever you want with this stuff. If we meet some day, and you think
6  * this stuff is worth it, you can buy me a beer in return.   Poul-Henning Kamp
7  * ----------------------------------------------------------------------------
8  *
9  * $FreeBSD: src/sys/dev/md/md.c,v 1.8.2.2 2002/08/19 17:43:34 jdp Exp $
10  * $DragonFly: src/sys/dev/disk/md/md.c,v 1.20 2008/09/07 08:09:39 swildner Exp $
11  *
12  */
13 
14 #include "opt_md.h"		/* We have adopted some tasks from MFS */
15 
16 #include <sys/param.h>
17 #include <sys/systm.h>
18 #include <sys/buf.h>
19 #include <sys/conf.h>
20 #include <sys/devicestat.h>
21 #include <sys/disk.h>
22 #include <sys/kernel.h>
23 #include <sys/malloc.h>
24 #include <sys/sysctl.h>
25 #include <sys/linker.h>
26 #include <sys/proc.h>
27 #include <sys/buf2.h>
28 #include <sys/thread2.h>
29 
/*
 * Sector count assigned to a malloc-backed unit (see mdcreate_malloc()).
 * May be overridden before this point, e.g. from opt_md.h.
 */
#ifndef MD_NSECT
#define MD_NSECT (10000 * 2)
#endif

/* M_MD: softc and sector-pointer tables; M_MDSECT: per-sector data buffers. */
MALLOC_DEFINE(M_MD, "MD disk", "Memory Disk");
MALLOC_DEFINE(M_MDSECT, "MD sectors", "Memory Disk Sectors");

/*
 * debug.mddebug: non-zero traces open/ioctl, >1 also traces strategy calls,
 * >2 additionally traces every sector touched by the malloc backend.
 */
static int md_debug;
SYSCTL_INT(_debug, OID_AUTO, mddebug, CTLFLAG_RW, &md_debug, 0, "");

#if defined(MD_ROOT) && defined(MD_ROOT_SIZE)
/* Image gets put here: */
static u_char mfs_root[MD_ROOT_SIZE*1024] = "MFS Filesystem goes here";
static u_char end_mfs_root[] __unused = "MFS Filesystem had better STOP here";
#endif

/* Set by mdcreate_preload() once unit 0 has been created from an image. */
static int mdrootready;

static void mdcreate_malloc(void);

#define CDEV_MAJOR	95

/* Device entry points; mdstrategy dispatches to the two backends below it. */
static d_strategy_t mdstrategy;
static d_strategy_t mdstrategy_preload;
static d_strategy_t mdstrategy_malloc;
static d_open_t mdopen;
static d_ioctl_t mdioctl;
57 
58 static struct dev_ops md_ops = {
59 	{ "md", CDEV_MAJOR, D_DISK | D_CANFREE | D_MEMDISK },
60         .d_open =	mdopen,
61         .d_close =	nullclose,
62         .d_read =	physread,
63         .d_write =	physwrite,
64         .d_ioctl =	mdioctl,
65         .d_strategy =	mdstrategy,
66 };
67 
/*
 * Per-unit software state.  One instance is allocated by mdcreate() and
 * hung off the device's si_drv1 pointer.
 */
struct md_s {
	int unit;			/* unit number, taken from mdunits */
	struct devstat stats;		/* devstat accounting for this unit */
	struct bio_queue_head bio_queue; /* pending requests, sorted on insert */
	struct disk disk;		/* disk layer state passed to disk_create() */
	cdev_t dev;			/* device returned by disk_create() */
	int busy;			/* non-zero while a strategy call drains bio_queue */
	enum {MD_MALLOC, MD_PRELOAD} type; /* selects the backing store */
	unsigned nsect;			/* size of the unit in DEV_BSIZE sectors */

	/* MD_MALLOC related fields */
	unsigned nsecp;			/* number of entries in secp[] */
	u_char **secp;			/*
					 * per-sector slot: a value <= 255 is the
					 * byte the whole sector is filled with,
					 * anything else points to a DEV_BSIZE buffer
					 */

	/* MD_PRELOAD related fields */
	u_char *pl_ptr;			/* start of the preloaded image */
	unsigned pl_len;		/* length of the image in bytes */
};
86 
/* Number of units created so far; also the unit number the next mdcreate() hands out. */
static int mdunits;
88 
89 static int
90 mdopen(struct dev_open_args *ap)
91 {
92 	cdev_t dev = ap->a_head.a_dev;
93 	struct md_s *sc;
94 #if 0
95 	struct disk_info info;
96 #endif
97 
98 	if (md_debug)
99 		kprintf("mdopen(%s %x %x)\n",
100 			devtoname(dev), ap->a_oflags, ap->a_devtype);
101 
102 	sc = dev->si_drv1;
103 	if (sc->unit + 1 == mdunits)
104 		mdcreate_malloc();
105 #if 0
106 	bzero(&info, sizeof(info));
107 	info.d_media_blksize = DEV_BSIZE;	/* mandatory */
108 	info.d_media_blocks = sc->nsect;
109 
110 	info.d_secpertrack = 1024;		/* optional */
111 	info.d_nheads = 1;
112 	info.d_secpercyl = info.d_secpertrack * info.d_nheads;
113 	info.d_ncylinders = (u_int)(info.d_media_blocks / info.d_secpercyl);
114 	disk_setdiskinfo(&sc->disk, &info);
115 #endif
116 	return (0);
117 }
118 
119 static int
120 mdioctl(struct dev_ioctl_args *ap)
121 {
122 	cdev_t dev = ap->a_head.a_dev;
123 
124 	if (md_debug)
125 		kprintf("mdioctl(%s %lx %p %x)\n",
126 			devtoname(dev), ap->a_cmd, ap->a_data, ap->a_fflag);
127 
128 	return (ENOIOCTL);
129 }
130 
131 static int
132 mdstrategy(struct dev_strategy_args *ap)
133 {
134 	cdev_t dev = ap->a_head.a_dev;
135 	struct bio *bio = ap->a_bio;
136 	struct buf *bp = bio->bio_buf;
137 	struct md_s *sc;
138 
139 	if (md_debug > 1) {
140 		kprintf("mdstrategy(%p) %s %08x, %lld, %d, %p)\n",
141 		    bp, devtoname(dev), bp->b_flags,
142 		    (long long)bio->bio_offset,
143 		    bp->b_bcount, bp->b_data);
144 	}
145 	bio->bio_driver_info = dev;
146 	sc = dev->si_drv1;
147 	if (sc->type == MD_MALLOC) {
148 		mdstrategy_malloc(ap);
149 	} else {
150 		mdstrategy_preload(ap);
151 	}
152 	return(0);
153 }
154 
155 
156 static int
157 mdstrategy_malloc(struct dev_strategy_args *ap)
158 {
159 	cdev_t dev = ap->a_head.a_dev;
160 	struct bio *bio = ap->a_bio;
161 	struct buf *bp = bio->bio_buf;
162 	unsigned secno, nsec, secval, uc;
163 	u_char *secp, **secpp, *dst;
164 	struct md_s *sc;
165 	int i;
166 
167 	if (md_debug > 1)
168 		kprintf("mdstrategy_malloc(%p) %s %08xx, %lld, %d, %p)\n",
169 		    bp, devtoname(dev), bp->b_flags,
170 		    (long long)bio->bio_offset,
171 		    bp->b_bcount, bp->b_data);
172 
173 	sc = dev->si_drv1;
174 
175 	crit_enter();
176 
177 	bioqdisksort(&sc->bio_queue, bio);
178 
179 	if (sc->busy) {
180 		crit_exit();
181 		return(0);
182 	}
183 
184 	sc->busy++;
185 
186 	while (1) {
187 		bio = bioq_first(&sc->bio_queue);
188 		if (bio == NULL) {
189 			crit_exit();
190 			break;
191 		}
192 		crit_exit();
193 		bioq_remove(&sc->bio_queue, bio);
194 		bp = bio->bio_buf;
195 
196 		devstat_start_transaction(&sc->stats);
197 
198 		switch (bp->b_cmd) {
199 		case BUF_CMD_FREEBLKS:
200 		case BUF_CMD_READ:
201 		case BUF_CMD_WRITE:
202 			break;
203 		default:
204 			panic("md: bad b_cmd %d", bp->b_cmd);
205 		}
206 
207 		nsec = bp->b_bcount >> DEV_BSHIFT;
208 		secno = (unsigned)(bio->bio_offset >> DEV_BSHIFT);
209 		dst = bp->b_data;
210 		while (nsec--) {
211 			if (secno < sc->nsecp) {
212 				secpp = &sc->secp[secno];
213 				if ((u_int)(uintptr_t)*secpp > 255) {
214 					secp = *secpp;
215 					secval = 0;
216 				} else {
217 					secp = 0;
218 					secval = (u_int)(uintptr_t)*secpp;
219 				}
220 			} else {
221 				secpp = 0;
222 				secp = 0;
223 				secval = 0;
224 			}
225 			if (md_debug > 2)
226 				kprintf("%08x %p %p %d\n", bp->b_flags, secpp, secp, secval);
227 
228 			switch (bp->b_cmd) {
229 			case BUF_CMD_FREEBLKS:
230 				if (secpp) {
231 					if (secp)
232 						FREE(secp, M_MDSECT);
233 					*secpp = 0;
234 				}
235 				break;
236 			case BUF_CMD_READ:
237 				if (secp) {
238 					bcopy(secp, dst, DEV_BSIZE);
239 				} else if (secval) {
240 					for (i = 0; i < DEV_BSIZE; i++)
241 						dst[i] = secval;
242 				} else {
243 					bzero(dst, DEV_BSIZE);
244 				}
245 				break;
246 			case BUF_CMD_WRITE:
247 				uc = dst[0];
248 				for (i = 1; i < DEV_BSIZE; i++)
249 					if (dst[i] != uc)
250 						break;
251 				if (i == DEV_BSIZE && !uc) {
252 					if (secp)
253 						FREE(secp, M_MDSECT);
254 					if (secpp)
255 						*secpp = (u_char *)(uintptr_t)uc;
256 				} else {
257 					if (!secpp) {
258 						MALLOC(secpp, u_char **, (secno + nsec + 1) * sizeof(u_char *), M_MD, M_WAITOK | M_ZERO);
259 						bcopy(sc->secp, secpp, sc->nsecp * sizeof(u_char *));
260 						FREE(sc->secp, M_MD);
261 						sc->secp = secpp;
262 						sc->nsecp = secno + nsec + 1;
263 						secpp = &sc->secp[secno];
264 					}
265 					if (i == DEV_BSIZE) {
266 						if (secp)
267 							FREE(secp, M_MDSECT);
268 						*secpp = (u_char *)(uintptr_t)uc;
269 					} else {
270 						if (!secp)
271 							MALLOC(secp, u_char *, DEV_BSIZE, M_MDSECT, M_WAITOK);
272 						bcopy(dst, secp, DEV_BSIZE);
273 
274 						*secpp = secp;
275 					}
276 				}
277 				break;
278 			default:
279 				panic("md: bad b_cmd %d", bp->b_cmd);
280 
281 			}
282 			secno++;
283 			dst += DEV_BSIZE;
284 		}
285 		bp->b_resid = 0;
286 		devstat_end_transaction_buf(&sc->stats, bp);
287 		biodone(bio);
288 		crit_enter();
289 	}
290 	sc->busy = 0;
291 	return(0);
292 }
293 
294 
295 static int
296 mdstrategy_preload(struct dev_strategy_args *ap)
297 {
298 	cdev_t dev = ap->a_head.a_dev;
299 	struct bio *bio = ap->a_bio;
300 	struct buf *bp = bio->bio_buf;
301 	struct md_s *sc;
302 
303 	if (md_debug > 1)
304 		kprintf("mdstrategy_preload(%p) %s %08x, %lld, %d, %p)\n",
305 		    bp, devtoname(dev), bp->b_flags,
306 		    (long long)bio->bio_offset,
307 		    bp->b_bcount, bp->b_data);
308 
309 	sc = dev->si_drv1;
310 
311 	crit_enter();
312 
313 	bioqdisksort(&sc->bio_queue, bio);
314 
315 	if (sc->busy) {
316 		crit_exit();
317 		return(0);
318 	}
319 
320 	sc->busy++;
321 
322 	while (1) {
323 		bio = bioq_first(&sc->bio_queue);
324 		if (bio)
325 			bioq_remove(&sc->bio_queue, bio);
326 		crit_exit();
327 		if (bio == NULL)
328 			break;
329 
330 		devstat_start_transaction(&sc->stats);
331 
332 		switch (bp->b_cmd) {
333 		case BUF_CMD_FREEBLKS:
334 			break;
335 		case BUF_CMD_READ:
336 			bcopy(sc->pl_ptr + bio->bio_offset,
337 			       bp->b_data, bp->b_bcount);
338 			break;
339 		case BUF_CMD_WRITE:
340 			bcopy(bp->b_data, sc->pl_ptr + bio->bio_offset,
341 			      bp->b_bcount);
342 			break;
343 		default:
344 			panic("md: bad cmd %d\n", bp->b_cmd);
345 		}
346 		bp->b_resid = 0;
347 		devstat_end_transaction_buf(&sc->stats, bp);
348 		biodone(bio);
349 		crit_enter();
350 	}
351 	sc->busy = 0;
352 	return(0);
353 }
354 
355 static struct md_s *
356 mdcreate(unsigned length)
357 {
358 	struct md_s *sc;
359 	struct disk_info info;
360 
361 	MALLOC(sc, struct md_s *,sizeof(*sc), M_MD, M_WAITOK | M_ZERO);
362 	sc->unit = mdunits++;
363 	bioq_init(&sc->bio_queue);
364 	devstat_add_entry(&sc->stats, "md", sc->unit, DEV_BSIZE,
365 		DEVSTAT_NO_ORDERED_TAGS,
366 		DEVSTAT_TYPE_DIRECT | DEVSTAT_TYPE_IF_OTHER,
367 		DEVSTAT_PRIORITY_OTHER);
368 	sc->dev = disk_create(sc->unit, &sc->disk, &md_ops);
369 	sc->dev->si_drv1 = sc;
370 	sc->dev->si_iosize_max = DFLTPHYS;
371 
372 	bzero(&info, sizeof(info));
373 	info.d_media_blksize = DEV_BSIZE;	/* mandatory */
374 	info.d_media_blocks = length / DEV_BSIZE;
375 
376 	info.d_secpertrack = 1024;		/* optional */
377 	info.d_nheads = 1;
378 	info.d_secpercyl = info.d_secpertrack * info.d_nheads;
379 	info.d_ncylinders = (u_int)(info.d_media_blocks / info.d_secpercyl);
380 	disk_setdiskinfo(&sc->disk, &info);
381 
382 	return (sc);
383 }
384 
385 static void
386 mdcreate_preload(u_char *image, unsigned length)
387 {
388 	struct md_s *sc;
389 
390 	sc = mdcreate(length);
391 	sc->type = MD_PRELOAD;
392 	sc->nsect = length / DEV_BSIZE;
393 	sc->pl_ptr = image;
394 	sc->pl_len = length;
395 
396 	if (sc->unit == 0)
397 		mdrootready = 1;
398 }
399 
400 static void
401 mdcreate_malloc(void)
402 {
403 	struct md_s *sc;
404 
405 	sc = mdcreate(0);
406 	sc->type = MD_MALLOC;
407 
408 	sc->nsect = MD_NSECT;	/* for now */
409 	MALLOC(sc->secp, u_char **, sizeof(u_char *), M_MD, M_WAITOK | M_ZERO);
410 	sc->nsecp = 1;
411 	kprintf("md%d: Malloc disk\n", sc->unit);
412 }
413 
414 static void
415 md_drvinit(void *unused)
416 {
417 
418 	caddr_t mod;
419 	caddr_t c;
420 	u_char *ptr, *name, *type;
421 	unsigned len;
422 
423 #ifdef MD_ROOT_SIZE
424 	mdcreate_preload(mfs_root, MD_ROOT_SIZE*1024);
425 #endif
426 	mod = NULL;
427 	while ((mod = preload_search_next_name(mod)) != NULL) {
428 		name = (char *)preload_search_info(mod, MODINFO_NAME);
429 		type = (char *)preload_search_info(mod, MODINFO_TYPE);
430 		if (name == NULL)
431 			continue;
432 		if (type == NULL)
433 			continue;
434 		if (strcmp(type, "md_image") && strcmp(type, "mfs_root"))
435 			continue;
436 		c = preload_search_info(mod, MODINFO_ADDR);
437 		ptr = *(u_char **)c;
438 		c = preload_search_info(mod, MODINFO_SIZE);
439 		len = *(unsigned *)c;
440 		kprintf("md%d: Preloaded image <%s> %d bytes at %p\n",
441 		   mdunits, name, len, ptr);
442 		mdcreate_preload(ptr, len);
443 	}
444 	mdcreate_malloc();
445 }
446 
447 SYSINIT(mddev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE+CDEV_MAJOR, md_drvinit,NULL)
448 
#ifdef MD_ROOT
/*
 * Run from SYSINIT at SI_SUB_MOUNT_ROOT: if a preloaded image became
 * unit 0 (mdrootready), make it the first root device candidate.
 */
static void
md_takeroot(void *junk)
{
	if (!mdrootready)
		return;

	rootdevnames[0] = "ufs:/dev/md0s0";
}

SYSINIT(md_root, SI_SUB_MOUNT_ROOT, SI_ORDER_FIRST, md_takeroot, NULL);
#endif
459