xref: /spdk/test/unit/lib/bdev/mt/bdev.c/bdev_ut.c (revision 2e1dbc458758ba3d2709299913bc199fa3926bda)
1 /*-
2  *   BSD LICENSE
3  *
4  *   Copyright (c) Intel Corporation.
5  *   All rights reserved.
6  *
7  *   Redistribution and use in source and binary forms, with or without
8  *   modification, are permitted provided that the following conditions
9  *   are met:
10  *
11  *     * Redistributions of source code must retain the above copyright
12  *       notice, this list of conditions and the following disclaimer.
13  *     * Redistributions in binary form must reproduce the above copyright
14  *       notice, this list of conditions and the following disclaimer in
15  *       the documentation and/or other materials provided with the
16  *       distribution.
17  *     * Neither the name of Intel Corporation nor the names of its
18  *       contributors may be used to endorse or promote products derived
19  *       from this software without specific prior written permission.
20  *
21  *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22  *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23  *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24  *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25  *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26  *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27  *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28  *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29  *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30  *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31  *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32  */
33 
34 #include "spdk_cunit.h"
35 
36 #include "common/lib/test_env.c"
37 #include "common/lib/ut_multithread.c"
38 #include "unit/lib/json_mock.c"
39 
40 /* HACK: disable VTune integration so the unit test doesn't need VTune headers and libs to build */
41 #undef SPDK_CONFIG_VTUNE
42 
43 #include "bdev/bdev.c"
44 
45 #define BDEV_UT_NUM_THREADS 3
46 
47 DEFINE_STUB_V(spdk_scsi_nvme_translate, (const struct spdk_bdev_io *bdev_io,
48 		int *sc, int *sk, int *asc, int *ascq));
49 
/*
 * Test replacement for spdk_conf_find_section().
 *
 * Always reports "section not found" (NULL), regardless of the arguments, so
 * that the code under test falls back to its hardcoded defaults.
 */
struct spdk_conf_section *
spdk_conf_find_section(struct spdk_conf *cp, const char *name)
{
	(void)cp;
	(void)name;

	return NULL;
}
56 
/*
 * Test replacement for spdk_conf_section_get_nmval().
 *
 * Always reports "value not present" (NULL), regardless of the arguments, so
 * that the code under test falls back to its hardcoded defaults.
 */
char *
spdk_conf_section_get_nmval(struct spdk_conf_section *sp, const char *key, int idx1, int idx2)
{
	(void)sp;
	(void)key;
	(void)idx1;
	(void)idx2;

	return NULL;
}
63 
64 struct ut_bdev {
65 	struct spdk_bdev	bdev;
66 	void			*io_target;
67 };
68 
69 struct ut_bdev_channel {
70 	TAILQ_HEAD(, spdk_bdev_io)	outstanding_io;
71 	uint32_t			outstanding_cnt;
72 	uint32_t			avail_cnt;
73 };
74 
75 int g_io_device;
76 struct ut_bdev g_bdev;
77 struct spdk_bdev_desc *g_desc;
78 bool g_teardown_done = false;
79 bool g_get_io_channel = true;
80 bool g_create_ch = true;
81 bool g_init_complete_called = false;
82 
83 static int
84 stub_create_ch(void *io_device, void *ctx_buf)
85 {
86 	struct ut_bdev_channel *ch = ctx_buf;
87 
88 	if (g_create_ch == false) {
89 		return -1;
90 	}
91 
92 	TAILQ_INIT(&ch->outstanding_io);
93 	ch->outstanding_cnt = 0;
94 	/*
95 	 * When avail gets to 0, the submit_request function will return ENOMEM.
96 	 *  Most tests to not want ENOMEM to occur, so by default set this to a
97 	 *  big value that won't get hit.  The ENOMEM tests can then override this
98 	 *  value to something much smaller to induce ENOMEM conditions.
99 	 */
100 	ch->avail_cnt = 2048;
101 	return 0;
102 }
103 
/* Channel-destroy callback for the stub io_device; there is nothing to release. */
static void
stub_destroy_ch(void *io_device, void *ctx_buf)
{
	(void)io_device;
	(void)ctx_buf;
}
108 
109 static struct spdk_io_channel *
110 stub_get_io_channel(void *ctx)
111 {
112 	struct ut_bdev *ut_bdev = ctx;
113 
114 	if (g_get_io_channel == true) {
115 		return spdk_get_io_channel(ut_bdev->io_target);
116 	} else {
117 		return NULL;
118 	}
119 }
120 
/* destruct entry of the stub fn_table; nothing to tear down, always returns 0. */
static int
stub_destruct(void *ctx)
{
	(void)ctx;

	return 0;
}
126 
127 static void
128 stub_submit_request(struct spdk_io_channel *_ch, struct spdk_bdev_io *bdev_io)
129 {
130 	struct ut_bdev_channel *ch = spdk_io_channel_get_ctx(_ch);
131 
132 	if (bdev_io->type == SPDK_BDEV_IO_TYPE_RESET) {
133 		struct spdk_bdev_io *io;
134 
135 		while (!TAILQ_EMPTY(&ch->outstanding_io)) {
136 			io = TAILQ_FIRST(&ch->outstanding_io);
137 			TAILQ_REMOVE(&ch->outstanding_io, io, module_link);
138 			ch->outstanding_cnt--;
139 			spdk_bdev_io_complete(io, SPDK_BDEV_IO_STATUS_FAILED);
140 			ch->avail_cnt++;
141 		}
142 	}
143 
144 	if (ch->avail_cnt > 0) {
145 		TAILQ_INSERT_TAIL(&ch->outstanding_io, bdev_io, module_link);
146 		ch->outstanding_cnt++;
147 		ch->avail_cnt--;
148 	} else {
149 		spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_NOMEM);
150 	}
151 }
152 
153 static uint32_t
154 stub_complete_io(void *io_target, uint32_t num_to_complete)
155 {
156 	struct spdk_io_channel *_ch = spdk_get_io_channel(io_target);
157 	struct ut_bdev_channel *ch = spdk_io_channel_get_ctx(_ch);
158 	struct spdk_bdev_io *io;
159 	bool complete_all = (num_to_complete == 0);
160 	uint32_t num_completed = 0;
161 
162 	while (complete_all || num_completed < num_to_complete) {
163 		if (TAILQ_EMPTY(&ch->outstanding_io)) {
164 			break;
165 		}
166 		io = TAILQ_FIRST(&ch->outstanding_io);
167 		TAILQ_REMOVE(&ch->outstanding_io, io, module_link);
168 		ch->outstanding_cnt--;
169 		spdk_bdev_io_complete(io, SPDK_BDEV_IO_STATUS_SUCCESS);
170 		ch->avail_cnt++;
171 		num_completed++;
172 	}
173 
174 	spdk_put_io_channel(_ch);
175 	return num_completed;
176 }
177 
178 static struct spdk_bdev_fn_table fn_table = {
179 	.get_io_channel =	stub_get_io_channel,
180 	.destruct =		stub_destruct,
181 	.submit_request =	stub_submit_request,
182 };
183 
/* module_init callback of the test bdev module; nothing to set up, returns 0. */
static int
module_init(void)
{
	const int rc = 0;

	return rc;
}
189 
/* module_fini callback of the test bdev module; intentionally empty. */
static void
module_fini(void)
{
	/* Nothing to release. */
}
194 
195 static void
196 init_complete(void)
197 {
198 	g_init_complete_called = true;
199 }
200 
201 struct spdk_bdev_module bdev_ut_if = {
202 	.name = "bdev_ut",
203 	.module_init = module_init,
204 	.module_fini = module_fini,
205 	.init_complete = init_complete,
206 };
207 
208 SPDK_BDEV_MODULE_REGISTER(&bdev_ut_if)
209 
210 static void
211 register_bdev(struct ut_bdev *ut_bdev, char *name, void *io_target)
212 {
213 	memset(ut_bdev, 0, sizeof(*ut_bdev));
214 
215 	ut_bdev->io_target = io_target;
216 	ut_bdev->bdev.ctxt = ut_bdev;
217 	ut_bdev->bdev.name = name;
218 	ut_bdev->bdev.fn_table = &fn_table;
219 	ut_bdev->bdev.module = &bdev_ut_if;
220 	ut_bdev->bdev.blocklen = 4096;
221 	ut_bdev->bdev.blockcnt = 1024;
222 
223 	spdk_bdev_register(&ut_bdev->bdev);
224 }
225 
226 static void
227 unregister_bdev(struct ut_bdev *ut_bdev)
228 {
229 	/* Handle any deferred messages. */
230 	poll_threads();
231 	spdk_bdev_unregister(&ut_bdev->bdev, NULL, NULL);
232 }
233 
234 static void
235 bdev_init_cb(void *done, int rc)
236 {
237 	CU_ASSERT(rc == 0);
238 	*(bool *)done = true;
239 }
240 
241 static void
242 setup_test(void)
243 {
244 	bool done = false;
245 
246 	allocate_threads(BDEV_UT_NUM_THREADS);
247 	spdk_bdev_initialize(bdev_init_cb, &done);
248 	spdk_io_device_register(&g_io_device, stub_create_ch, stub_destroy_ch,
249 				sizeof(struct ut_bdev_channel));
250 	register_bdev(&g_bdev, "ut_bdev", &g_io_device);
251 	spdk_bdev_open(&g_bdev.bdev, true, NULL, NULL, &g_desc);
252 }
253 
254 static void
255 finish_cb(void *cb_arg)
256 {
257 	g_teardown_done = true;
258 }
259 
260 static void
261 teardown_test(void)
262 {
263 	g_teardown_done = false;
264 	spdk_bdev_close(g_desc);
265 	g_desc = NULL;
266 	unregister_bdev(&g_bdev);
267 	spdk_io_device_unregister(&g_io_device, NULL);
268 	spdk_bdev_finish(finish_cb, NULL);
269 	poll_threads();
270 	memset(&g_bdev, 0, sizeof(g_bdev));
271 	CU_ASSERT(g_teardown_done == true);
272 	g_teardown_done = false;
273 	free_threads();
274 }
275 
276 static uint32_t
277 bdev_io_tailq_cnt(bdev_io_tailq_t *tailq)
278 {
279 	struct spdk_bdev_io *io;
280 	uint32_t cnt = 0;
281 
282 	TAILQ_FOREACH(io, tailq, link) {
283 		cnt++;
284 	}
285 
286 	return cnt;
287 }
288 
289 static void
290 basic(void)
291 {
292 	g_init_complete_called = false;
293 	setup_test();
294 	CU_ASSERT(g_init_complete_called == true);
295 
296 	set_thread(0);
297 
298 	g_get_io_channel = false;
299 	g_ut_threads[0].ch = spdk_bdev_get_io_channel(g_desc);
300 	CU_ASSERT(g_ut_threads[0].ch == NULL);
301 
302 	g_get_io_channel = true;
303 	g_create_ch = false;
304 	g_ut_threads[0].ch = spdk_bdev_get_io_channel(g_desc);
305 	CU_ASSERT(g_ut_threads[0].ch == NULL);
306 
307 	g_get_io_channel = true;
308 	g_create_ch = true;
309 	g_ut_threads[0].ch = spdk_bdev_get_io_channel(g_desc);
310 	CU_ASSERT(g_ut_threads[0].ch != NULL);
311 	spdk_put_io_channel(g_ut_threads[0].ch);
312 
313 	teardown_test();
314 }
315 
/*
 * Poller callback: record that the poller ran by setting the bool that ctx
 * points to.  Always returns -1.
 */
static int
poller_run_done(void *ctx)
{
	bool *ran = ctx;

	*ran = true;
	return -1;
}
325 
/*
 * Poller callback: count invocations by incrementing the int that ctx points
 * to.  Always returns -1.
 */
static int
poller_run_times_done(void *ctx)
{
	int *counter = ctx;

	*counter += 1;
	return -1;
}
335 
336 static void
337 basic_poller(void)
338 {
339 	struct spdk_poller	*poller = NULL;
340 	bool			poller_run = false;
341 	int			poller_run_times = 0;
342 
343 	setup_test();
344 
345 	set_thread(0);
346 	reset_time();
347 	/* Register a poller with no-wait time and test execution */
348 	poller = spdk_poller_register(poller_run_done, &poller_run, 0);
349 	CU_ASSERT(poller != NULL);
350 
351 	poll_threads();
352 	CU_ASSERT(poller_run == true);
353 
354 	spdk_poller_unregister(&poller);
355 	CU_ASSERT(poller == NULL);
356 
357 	/* Register a poller with 1000us wait time and test single execution */
358 	poller_run = false;
359 	poller = spdk_poller_register(poller_run_done, &poller_run, 1000);
360 	CU_ASSERT(poller != NULL);
361 
362 	poll_threads();
363 	CU_ASSERT(poller_run == false);
364 
365 	increment_time(1000);
366 	poll_threads();
367 	CU_ASSERT(poller_run == true);
368 
369 	reset_time();
370 	poller_run = false;
371 	poll_threads();
372 	CU_ASSERT(poller_run == false);
373 
374 	increment_time(1000);
375 	poll_threads();
376 	CU_ASSERT(poller_run == true);
377 
378 	spdk_poller_unregister(&poller);
379 	CU_ASSERT(poller == NULL);
380 
381 	reset_time();
382 	/* Register a poller with 1000us wait time and test multiple execution */
383 	poller = spdk_poller_register(poller_run_times_done, &poller_run_times, 1000);
384 	CU_ASSERT(poller != NULL);
385 
386 	poll_threads();
387 	CU_ASSERT(poller_run_times == 0);
388 
389 	increment_time(1000);
390 	poll_threads();
391 	CU_ASSERT(poller_run_times == 1);
392 
393 	poller_run_times = 0;
394 	increment_time(2000);
395 	poll_threads();
396 	CU_ASSERT(poller_run_times == 2);
397 
398 	spdk_poller_unregister(&poller);
399 	CU_ASSERT(poller == NULL);
400 
401 	teardown_test();
402 }
403 
404 static void
405 reset_done(struct spdk_bdev_io *bdev_io, bool success, void *cb_arg)
406 {
407 	bool *done = cb_arg;
408 
409 	CU_ASSERT(success == true);
410 	*done = true;
411 	spdk_bdev_free_io(bdev_io);
412 }
413 
414 static void
415 put_channel_during_reset(void)
416 {
417 	struct spdk_io_channel *io_ch;
418 	bool done = false;
419 
420 	setup_test();
421 
422 	set_thread(0);
423 	io_ch = spdk_bdev_get_io_channel(g_desc);
424 	CU_ASSERT(io_ch != NULL);
425 
426 	/*
427 	 * Start a reset, but then put the I/O channel before
428 	 *  the deferred messages for the reset get a chance to
429 	 *  execute.
430 	 */
431 	spdk_bdev_reset(g_desc, io_ch, reset_done, &done);
432 	spdk_put_io_channel(io_ch);
433 	poll_threads();
434 	stub_complete_io(g_bdev.io_target, 0);
435 
436 	teardown_test();
437 }
438 
439 static void
440 aborted_reset_done(struct spdk_bdev_io *bdev_io, bool success, void *cb_arg)
441 {
442 	enum spdk_bdev_io_status *status = cb_arg;
443 
444 	*status = success ? SPDK_BDEV_IO_STATUS_SUCCESS : SPDK_BDEV_IO_STATUS_FAILED;
445 	spdk_bdev_free_io(bdev_io);
446 }
447 
448 static void
449 aborted_reset(void)
450 {
451 	struct spdk_io_channel *io_ch[2];
452 	enum spdk_bdev_io_status status1, status2;
453 
454 	setup_test();
455 
456 	set_thread(0);
457 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
458 	CU_ASSERT(io_ch[0] != NULL);
459 	spdk_bdev_reset(g_desc, io_ch[0], aborted_reset_done, &status1);
460 	poll_threads();
461 	CU_ASSERT(g_bdev.bdev.reset_in_progress != NULL);
462 
463 	/*
464 	 * First reset has been submitted on ch0.  Now submit a second
465 	 *  reset on ch1 which will get queued since there is already a
466 	 *  reset in progress.
467 	 */
468 	set_thread(1);
469 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
470 	CU_ASSERT(io_ch[1] != NULL);
471 	spdk_bdev_reset(g_desc, io_ch[1], aborted_reset_done, &status2);
472 	poll_threads();
473 	CU_ASSERT(g_bdev.bdev.reset_in_progress != NULL);
474 
475 	/*
476 	 * Now destroy ch1.  This will abort the queued reset.  Check that
477 	 *  the second reset was completed with failed status.  Also check
478 	 *  that bdev->reset_in_progress != NULL, since the original reset
479 	 *  has not been completed yet.  This ensures that the bdev code is
480 	 *  correctly noticing that the failed reset is *not* the one that
481 	 *  had been submitted to the bdev module.
482 	 */
483 	set_thread(1);
484 	spdk_put_io_channel(io_ch[1]);
485 	poll_threads();
486 	CU_ASSERT(status2 == SPDK_BDEV_IO_STATUS_FAILED);
487 	CU_ASSERT(g_bdev.bdev.reset_in_progress != NULL);
488 
489 	/*
490 	 * Now complete the first reset, verify that it completed with SUCCESS
491 	 *  status and that bdev->reset_in_progress is also set back to NULL.
492 	 */
493 	set_thread(0);
494 	spdk_put_io_channel(io_ch[0]);
495 	stub_complete_io(g_bdev.io_target, 0);
496 	poll_threads();
497 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_SUCCESS);
498 	CU_ASSERT(g_bdev.bdev.reset_in_progress == NULL);
499 
500 	teardown_test();
501 }
502 
503 static void
504 io_during_io_done(struct spdk_bdev_io *bdev_io, bool success, void *cb_arg)
505 {
506 	enum spdk_bdev_io_status *status = cb_arg;
507 
508 	*status = success ? SPDK_BDEV_IO_STATUS_SUCCESS : SPDK_BDEV_IO_STATUS_FAILED;
509 	spdk_bdev_free_io(bdev_io);
510 }
511 
512 static void
513 io_during_reset(void)
514 {
515 	struct spdk_io_channel *io_ch[2];
516 	struct spdk_bdev_channel *bdev_ch[2];
517 	enum spdk_bdev_io_status status0, status1, status_reset;
518 	int rc;
519 
520 	setup_test();
521 
522 	/*
523 	 * First test normal case - submit an I/O on each of two channels (with no resets)
524 	 *  and verify they complete successfully.
525 	 */
526 	set_thread(0);
527 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
528 	bdev_ch[0] = spdk_io_channel_get_ctx(io_ch[0]);
529 	CU_ASSERT(bdev_ch[0]->flags == 0);
530 	status0 = SPDK_BDEV_IO_STATUS_PENDING;
531 	rc = spdk_bdev_read_blocks(g_desc, io_ch[0], NULL, 0, 1, io_during_io_done, &status0);
532 	CU_ASSERT(rc == 0);
533 
534 	set_thread(1);
535 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
536 	bdev_ch[1] = spdk_io_channel_get_ctx(io_ch[1]);
537 	CU_ASSERT(bdev_ch[1]->flags == 0);
538 	status1 = SPDK_BDEV_IO_STATUS_PENDING;
539 	rc = spdk_bdev_read_blocks(g_desc, io_ch[1], NULL, 0, 1, io_during_io_done, &status1);
540 	CU_ASSERT(rc == 0);
541 
542 	poll_threads();
543 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_PENDING);
544 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_PENDING);
545 
546 	set_thread(0);
547 	stub_complete_io(g_bdev.io_target, 0);
548 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_SUCCESS);
549 
550 	set_thread(1);
551 	stub_complete_io(g_bdev.io_target, 0);
552 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_SUCCESS);
553 
554 	/*
555 	 * Now submit a reset, and leave it pending while we submit I/O on two different
556 	 *  channels.  These I/O should be failed by the bdev layer since the reset is in
557 	 *  progress.
558 	 */
559 	set_thread(0);
560 	status_reset = SPDK_BDEV_IO_STATUS_PENDING;
561 	rc = spdk_bdev_reset(g_desc, io_ch[0], io_during_io_done, &status_reset);
562 	CU_ASSERT(rc == 0);
563 
564 	CU_ASSERT(bdev_ch[0]->flags == 0);
565 	CU_ASSERT(bdev_ch[1]->flags == 0);
566 	poll_threads();
567 	CU_ASSERT(bdev_ch[0]->flags == BDEV_CH_RESET_IN_PROGRESS);
568 	CU_ASSERT(bdev_ch[1]->flags == BDEV_CH_RESET_IN_PROGRESS);
569 
570 	set_thread(0);
571 	status0 = SPDK_BDEV_IO_STATUS_PENDING;
572 	rc = spdk_bdev_read_blocks(g_desc, io_ch[0], NULL, 0, 1, io_during_io_done, &status0);
573 	CU_ASSERT(rc == 0);
574 
575 	set_thread(1);
576 	status1 = SPDK_BDEV_IO_STATUS_PENDING;
577 	rc = spdk_bdev_read_blocks(g_desc, io_ch[1], NULL, 0, 1, io_during_io_done, &status1);
578 	CU_ASSERT(rc == 0);
579 
580 	/*
581 	 * A reset is in progress so these read I/O should complete with failure.  Note that we
582 	 *  need to poll_threads() since I/O completed inline have their completion deferred.
583 	 */
584 	poll_threads();
585 	CU_ASSERT(status_reset == SPDK_BDEV_IO_STATUS_PENDING);
586 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_FAILED);
587 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_FAILED);
588 
589 	/*
590 	 * Complete the reset
591 	 */
592 	set_thread(0);
593 	stub_complete_io(g_bdev.io_target, 0);
594 
595 	/*
596 	 * Only poll thread 0. We should not get a completion.
597 	 */
598 	poll_thread(0);
599 	CU_ASSERT(status_reset == SPDK_BDEV_IO_STATUS_PENDING);
600 
601 	/*
602 	 * Poll both thread 0 and 1 so the messages can propagate and we
603 	 * get a completion.
604 	 */
605 	poll_threads();
606 	CU_ASSERT(status_reset == SPDK_BDEV_IO_STATUS_SUCCESS);
607 
608 	spdk_put_io_channel(io_ch[0]);
609 	set_thread(1);
610 	spdk_put_io_channel(io_ch[1]);
611 	poll_threads();
612 
613 	teardown_test();
614 }
615 
616 static void
617 basic_qos(void)
618 {
619 	struct spdk_io_channel *io_ch[2];
620 	struct spdk_bdev_channel *bdev_ch[2];
621 	struct spdk_bdev *bdev;
622 	enum spdk_bdev_io_status status;
623 	int rc;
624 
625 	setup_test();
626 
627 	/* Enable QoS */
628 	bdev = &g_bdev.bdev;
629 	bdev->ios_per_sec = 2000; /* 2 I/O per millisecond */
630 
631 	g_get_io_channel = true;
632 
633 	set_thread(0);
634 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
635 	bdev_ch[0] = spdk_io_channel_get_ctx(io_ch[0]);
636 	CU_ASSERT(bdev_ch[0]->flags == BDEV_CH_QOS_ENABLED);
637 
638 	set_thread(1);
639 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
640 	bdev_ch[1] = spdk_io_channel_get_ctx(io_ch[1]);
641 	CU_ASSERT(bdev_ch[1]->flags == BDEV_CH_QOS_ENABLED);
642 
643 	/*
644 	 * Send an I/O on thread 0, which is where the QoS thread is running.
645 	 */
646 	set_thread(0);
647 	status = SPDK_BDEV_IO_STATUS_PENDING;
648 	rc = spdk_bdev_read_blocks(g_desc, io_ch[0], NULL, 0, 1, io_during_io_done, &status);
649 	CU_ASSERT(rc == 0);
650 	CU_ASSERT(status == SPDK_BDEV_IO_STATUS_PENDING);
651 	poll_threads();
652 	stub_complete_io(g_bdev.io_target, 0);
653 	poll_threads();
654 	CU_ASSERT(status == SPDK_BDEV_IO_STATUS_SUCCESS);
655 
656 	/* Send an I/O on thread 1. The QoS thread is not running here. */
657 	status = SPDK_BDEV_IO_STATUS_PENDING;
658 	set_thread(1);
659 	rc = spdk_bdev_read_blocks(g_desc, io_ch[1], NULL, 0, 1, io_during_io_done, &status);
660 	CU_ASSERT(rc == 0);
661 	CU_ASSERT(status == SPDK_BDEV_IO_STATUS_PENDING);
662 	poll_threads();
663 	/* Complete I/O on thread 1. This should not complete the I/O we submitted */
664 	stub_complete_io(g_bdev.io_target, 0);
665 	poll_threads();
666 	CU_ASSERT(status == SPDK_BDEV_IO_STATUS_PENDING);
667 	/* Now complete I/O on thread 0 */
668 	set_thread(0);
669 	poll_threads();
670 	stub_complete_io(g_bdev.io_target, 0);
671 	poll_threads();
672 	CU_ASSERT(status == SPDK_BDEV_IO_STATUS_SUCCESS);
673 
674 	/* Tear down the channels */
675 	set_thread(0);
676 	spdk_put_io_channel(io_ch[0]);
677 	set_thread(1);
678 	spdk_put_io_channel(io_ch[1]);
679 	poll_threads();
680 	set_thread(0);
681 
682 	/* Close the descriptor, which should stop the qos channel */
683 	spdk_bdev_close(g_desc);
684 	CU_ASSERT(bdev->qos_channel == NULL);
685 
686 	spdk_bdev_open(bdev, true, NULL, NULL, &g_desc);
687 
688 	/* Create the channels in reverse order. */
689 	set_thread(1);
690 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
691 	bdev_ch[1] = spdk_io_channel_get_ctx(io_ch[1]);
692 	CU_ASSERT(bdev_ch[1]->flags == BDEV_CH_QOS_ENABLED);
693 
694 	set_thread(0);
695 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
696 	bdev_ch[0] = spdk_io_channel_get_ctx(io_ch[0]);
697 	CU_ASSERT(bdev_ch[0]->flags == BDEV_CH_QOS_ENABLED);
698 
699 	/* Confirm that the qos tracking was re-enabled */
700 	CU_ASSERT(bdev->qos_channel != NULL);
701 
702 	/* Tear down the channels */
703 	set_thread(0);
704 	spdk_put_io_channel(io_ch[0]);
705 	set_thread(1);
706 	spdk_put_io_channel(io_ch[1]);
707 	poll_threads();
708 
709 	set_thread(0);
710 
711 	teardown_test();
712 }
713 
714 static void
715 io_during_qos_queue(void)
716 {
717 	struct spdk_io_channel *io_ch[2];
718 	struct spdk_bdev_channel *bdev_ch[2];
719 	struct spdk_bdev *bdev;
720 	enum spdk_bdev_io_status status0, status1;
721 	int rc;
722 
723 	setup_test();
724 	reset_time();
725 
726 	/* Enable QoS */
727 	bdev = &g_bdev.bdev;
728 	bdev->ios_per_sec = 1000; /* 1000 I/O per second, or 1 per millisecond */
729 
730 	g_get_io_channel = true;
731 
732 	/* Create channels */
733 	set_thread(0);
734 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
735 	bdev_ch[0] = spdk_io_channel_get_ctx(io_ch[0]);
736 	CU_ASSERT(bdev_ch[0]->flags == BDEV_CH_QOS_ENABLED);
737 
738 	set_thread(1);
739 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
740 	bdev_ch[1] = spdk_io_channel_get_ctx(io_ch[1]);
741 	CU_ASSERT(bdev_ch[1]->flags == BDEV_CH_QOS_ENABLED);
742 
743 	/* Send two I/O */
744 	status1 = SPDK_BDEV_IO_STATUS_PENDING;
745 	rc = spdk_bdev_read_blocks(g_desc, io_ch[1], NULL, 0, 1, io_during_io_done, &status1);
746 	CU_ASSERT(rc == 0);
747 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_PENDING);
748 	set_thread(0);
749 	status0 = SPDK_BDEV_IO_STATUS_PENDING;
750 	rc = spdk_bdev_read_blocks(g_desc, io_ch[0], NULL, 0, 1, io_during_io_done, &status0);
751 	CU_ASSERT(rc == 0);
752 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_PENDING);
753 
754 	/* Complete any I/O that arrived at the disk */
755 	poll_threads();
756 	set_thread(1);
757 	stub_complete_io(g_bdev.io_target, 0);
758 	set_thread(0);
759 	stub_complete_io(g_bdev.io_target, 0);
760 	poll_threads();
761 
762 	/* Only one of the I/O should complete. (logical XOR) */
763 	if (status0 == SPDK_BDEV_IO_STATUS_SUCCESS) {
764 		CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_PENDING);
765 	} else {
766 		CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_SUCCESS);
767 	}
768 
769 	/* Advance in time by a millisecond */
770 	increment_time(1000);
771 
772 	/* Complete more I/O */
773 	poll_threads();
774 	set_thread(1);
775 	stub_complete_io(g_bdev.io_target, 0);
776 	set_thread(0);
777 	stub_complete_io(g_bdev.io_target, 0);
778 	poll_threads();
779 
780 	/* Now the second I/O should be done */
781 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_SUCCESS);
782 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_SUCCESS);
783 
784 	/* Tear down the channels */
785 	set_thread(1);
786 	spdk_put_io_channel(io_ch[1]);
787 	set_thread(0);
788 	spdk_put_io_channel(io_ch[0]);
789 	poll_threads();
790 
791 	teardown_test();
792 }
793 
794 static void
795 io_during_qos_reset(void)
796 {
797 	struct spdk_io_channel *io_ch[2];
798 	struct spdk_bdev_channel *bdev_ch[2];
799 	struct spdk_bdev *bdev;
800 	enum spdk_bdev_io_status status0, status1, reset_status;
801 	int rc;
802 
803 	setup_test();
804 	reset_time();
805 
806 	/* Enable QoS */
807 	bdev = &g_bdev.bdev;
808 	bdev->ios_per_sec = 1000; /* 1000 I/O per second, or 1 per millisecond */
809 
810 	g_get_io_channel = true;
811 
812 	/* Create channels */
813 	set_thread(0);
814 	io_ch[0] = spdk_bdev_get_io_channel(g_desc);
815 	bdev_ch[0] = spdk_io_channel_get_ctx(io_ch[0]);
816 	CU_ASSERT(bdev_ch[0]->flags == BDEV_CH_QOS_ENABLED);
817 
818 	set_thread(1);
819 	io_ch[1] = spdk_bdev_get_io_channel(g_desc);
820 	bdev_ch[1] = spdk_io_channel_get_ctx(io_ch[1]);
821 	CU_ASSERT(bdev_ch[1]->flags == BDEV_CH_QOS_ENABLED);
822 
823 	/* Send two I/O. One of these gets queued by QoS. The other is sitting at the disk. */
824 	status1 = SPDK_BDEV_IO_STATUS_PENDING;
825 	rc = spdk_bdev_read_blocks(g_desc, io_ch[1], NULL, 0, 1, io_during_io_done, &status1);
826 	CU_ASSERT(rc == 0);
827 	set_thread(0);
828 	status0 = SPDK_BDEV_IO_STATUS_PENDING;
829 	rc = spdk_bdev_read_blocks(g_desc, io_ch[0], NULL, 0, 1, io_during_io_done, &status0);
830 	CU_ASSERT(rc == 0);
831 
832 	poll_threads();
833 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_PENDING);
834 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_PENDING);
835 
836 	/* Reset the bdev. */
837 	reset_status = SPDK_BDEV_IO_STATUS_PENDING;
838 	rc = spdk_bdev_reset(g_desc, io_ch[0], io_during_io_done, &reset_status);
839 	CU_ASSERT(rc == 0);
840 
841 	/* Complete any I/O that arrived at the disk */
842 	poll_threads();
843 	set_thread(1);
844 	stub_complete_io(g_bdev.io_target, 0);
845 	set_thread(0);
846 	stub_complete_io(g_bdev.io_target, 0);
847 	poll_threads();
848 
849 	CU_ASSERT(reset_status == SPDK_BDEV_IO_STATUS_SUCCESS);
850 	CU_ASSERT(status0 == SPDK_BDEV_IO_STATUS_FAILED);
851 	CU_ASSERT(status1 == SPDK_BDEV_IO_STATUS_FAILED);
852 
853 	/* Tear down the channels */
854 	set_thread(1);
855 	spdk_put_io_channel(io_ch[1]);
856 	set_thread(0);
857 	spdk_put_io_channel(io_ch[0]);
858 	poll_threads();
859 
860 	teardown_test();
861 }
862 
863 static void
864 enomem_done(struct spdk_bdev_io *bdev_io, bool success, void *cb_arg)
865 {
866 	enum spdk_bdev_io_status *status = cb_arg;
867 
868 	*status = success ? SPDK_BDEV_IO_STATUS_SUCCESS : SPDK_BDEV_IO_STATUS_FAILED;
869 	spdk_bdev_free_io(bdev_io);
870 }
871 
872 static void
873 enomem(void)
874 {
875 	struct spdk_io_channel *io_ch;
876 	struct spdk_bdev_channel *bdev_ch;
877 	struct spdk_bdev_module_channel *module_ch;
878 	struct ut_bdev_channel *ut_ch;
879 	const uint32_t IO_ARRAY_SIZE = 64;
880 	const uint32_t AVAIL = 20;
881 	enum spdk_bdev_io_status status[IO_ARRAY_SIZE], status_reset;
882 	uint32_t nomem_cnt, i;
883 	struct spdk_bdev_io *first_io;
884 	int rc;
885 
886 	setup_test();
887 
888 	set_thread(0);
889 	io_ch = spdk_bdev_get_io_channel(g_desc);
890 	bdev_ch = spdk_io_channel_get_ctx(io_ch);
891 	module_ch = bdev_ch->module_ch;
892 	ut_ch = spdk_io_channel_get_ctx(bdev_ch->channel);
893 	ut_ch->avail_cnt = AVAIL;
894 
895 	/* First submit a number of IOs equal to what the channel can support. */
896 	for (i = 0; i < AVAIL; i++) {
897 		status[i] = SPDK_BDEV_IO_STATUS_PENDING;
898 		rc = spdk_bdev_read_blocks(g_desc, io_ch, NULL, 0, 1, enomem_done, &status[i]);
899 		CU_ASSERT(rc == 0);
900 	}
901 	CU_ASSERT(TAILQ_EMPTY(&module_ch->nomem_io));
902 
903 	/*
904 	 * Next, submit one additional I/O.  This one should fail with ENOMEM and then go onto
905 	 *  the enomem_io list.
906 	 */
907 	status[AVAIL] = SPDK_BDEV_IO_STATUS_PENDING;
908 	rc = spdk_bdev_read_blocks(g_desc, io_ch, NULL, 0, 1, enomem_done, &status[AVAIL]);
909 	CU_ASSERT(rc == 0);
910 	SPDK_CU_ASSERT_FATAL(!TAILQ_EMPTY(&module_ch->nomem_io));
911 	first_io = TAILQ_FIRST(&module_ch->nomem_io);
912 
913 	/*
914 	 * Now submit a bunch more I/O.  These should all fail with ENOMEM and get queued behind
915 	 *  the first_io above.
916 	 */
917 	for (i = AVAIL + 1; i < IO_ARRAY_SIZE; i++) {
918 		status[i] = SPDK_BDEV_IO_STATUS_PENDING;
919 		rc = spdk_bdev_read_blocks(g_desc, io_ch, NULL, 0, 1, enomem_done, &status[i]);
920 		CU_ASSERT(rc == 0);
921 	}
922 
923 	/* Assert that first_io is still at the head of the list. */
924 	CU_ASSERT(TAILQ_FIRST(&module_ch->nomem_io) == first_io);
925 	CU_ASSERT(bdev_io_tailq_cnt(&module_ch->nomem_io) == (IO_ARRAY_SIZE - AVAIL));
926 	nomem_cnt = bdev_io_tailq_cnt(&module_ch->nomem_io);
927 	CU_ASSERT(module_ch->nomem_threshold == (AVAIL - NOMEM_THRESHOLD_COUNT));
928 
929 	/*
930 	 * Complete 1 I/O only.  The key check here is bdev_io_tailq_cnt - this should not have
931 	 *  changed since completing just 1 I/O should not trigger retrying the queued nomem_io
932 	 *  list.
933 	 */
934 	stub_complete_io(g_bdev.io_target, 1);
935 	CU_ASSERT(bdev_io_tailq_cnt(&module_ch->nomem_io) == nomem_cnt);
936 
937 	/*
938 	 * Complete enough I/O to hit the nomem_theshold.  This should trigger retrying nomem_io,
939 	 *  and we should see I/O get resubmitted to the test bdev module.
940 	 */
941 	stub_complete_io(g_bdev.io_target, NOMEM_THRESHOLD_COUNT - 1);
942 	CU_ASSERT(bdev_io_tailq_cnt(&module_ch->nomem_io) < nomem_cnt);
943 	nomem_cnt = bdev_io_tailq_cnt(&module_ch->nomem_io);
944 
945 	/* Complete 1 I/O only.  This should not trigger retrying the queued nomem_io. */
946 	stub_complete_io(g_bdev.io_target, 1);
947 	CU_ASSERT(bdev_io_tailq_cnt(&module_ch->nomem_io) == nomem_cnt);
948 
949 	/*
950 	 * Send a reset and confirm that all I/O are completed, including the ones that
951 	 *  were queued on the nomem_io list.
952 	 */
953 	status_reset = SPDK_BDEV_IO_STATUS_PENDING;
954 	rc = spdk_bdev_reset(g_desc, io_ch, enomem_done, &status_reset);
955 	poll_threads();
956 	CU_ASSERT(rc == 0);
957 	/* This will complete the reset. */
958 	stub_complete_io(g_bdev.io_target, 0);
959 
960 	CU_ASSERT(bdev_io_tailq_cnt(&module_ch->nomem_io) == 0);
961 	CU_ASSERT(module_ch->io_outstanding == 0);
962 
963 	spdk_put_io_channel(io_ch);
964 	poll_threads();
965 	teardown_test();
966 }
967 
968 static void
969 enomem_multi_bdev(void)
970 {
971 	struct spdk_io_channel *io_ch;
972 	struct spdk_bdev_channel *bdev_ch;
973 	struct spdk_bdev_module_channel *module_ch;
974 	struct ut_bdev_channel *ut_ch;
975 	const uint32_t IO_ARRAY_SIZE = 64;
976 	const uint32_t AVAIL = 20;
977 	enum spdk_bdev_io_status status[IO_ARRAY_SIZE];
978 	uint32_t i;
979 	struct ut_bdev *second_bdev;
980 	struct spdk_bdev_desc *second_desc;
981 	struct spdk_bdev_channel *second_bdev_ch;
982 	struct spdk_io_channel *second_ch;
983 	int rc;
984 
985 	setup_test();
986 
987 	/* Register second bdev with the same io_target  */
988 	second_bdev = calloc(1, sizeof(*second_bdev));
989 	SPDK_CU_ASSERT_FATAL(second_bdev != NULL);
990 	register_bdev(second_bdev, "ut_bdev2", g_bdev.io_target);
991 	spdk_bdev_open(&second_bdev->bdev, true, NULL, NULL, &second_desc);
992 
993 	set_thread(0);
994 	io_ch = spdk_bdev_get_io_channel(g_desc);
995 	bdev_ch = spdk_io_channel_get_ctx(io_ch);
996 	module_ch = bdev_ch->module_ch;
997 	ut_ch = spdk_io_channel_get_ctx(bdev_ch->channel);
998 	ut_ch->avail_cnt = AVAIL;
999 
1000 	second_ch = spdk_bdev_get_io_channel(second_desc);
1001 	second_bdev_ch = spdk_io_channel_get_ctx(second_ch);
1002 	SPDK_CU_ASSERT_FATAL(module_ch == second_bdev_ch->module_ch);
1003 
1004 	/* Saturate io_target through bdev A. */
1005 	for (i = 0; i < AVAIL; i++) {
1006 		status[i] = SPDK_BDEV_IO_STATUS_PENDING;
1007 		rc = spdk_bdev_read_blocks(g_desc, io_ch, NULL, 0, 1, enomem_done, &status[i]);
1008 		CU_ASSERT(rc == 0);
1009 	}
1010 	CU_ASSERT(TAILQ_EMPTY(&module_ch->nomem_io));
1011 
1012 	/*
1013 	 * Now submit I/O through the second bdev. This should fail with ENOMEM
1014 	 * and then go onto the nomem_io list.
1015 	 */
1016 	status[AVAIL] = SPDK_BDEV_IO_STATUS_PENDING;
1017 	rc = spdk_bdev_read_blocks(second_desc, second_ch, NULL, 0, 1, enomem_done, &status[AVAIL]);
1018 	CU_ASSERT(rc == 0);
1019 	SPDK_CU_ASSERT_FATAL(!TAILQ_EMPTY(&module_ch->nomem_io));
1020 
1021 	/* Complete first bdev's I/O. This should retry sending second bdev's nomem_io */
1022 	stub_complete_io(g_bdev.io_target, AVAIL);
1023 
1024 	SPDK_CU_ASSERT_FATAL(TAILQ_EMPTY(&module_ch->nomem_io));
1025 	CU_ASSERT(module_ch->io_outstanding == 1);
1026 
1027 	/* Now complete our retried I/O  */
1028 	stub_complete_io(g_bdev.io_target, 1);
1029 	SPDK_CU_ASSERT_FATAL(module_ch->io_outstanding == 0);
1030 
1031 	spdk_put_io_channel(io_ch);
1032 	spdk_put_io_channel(second_ch);
1033 	spdk_bdev_close(second_desc);
1034 	unregister_bdev(second_bdev);
1035 	poll_threads();
1036 	free(second_bdev);
1037 	teardown_test();
1038 }
1039 
1040 int
1041 main(int argc, char **argv)
1042 {
1043 	CU_pSuite	suite = NULL;
1044 	unsigned int	num_failures;
1045 
1046 	if (CU_initialize_registry() != CUE_SUCCESS) {
1047 		return CU_get_error();
1048 	}
1049 
1050 	suite = CU_add_suite("bdev", NULL, NULL);
1051 	if (suite == NULL) {
1052 		CU_cleanup_registry();
1053 		return CU_get_error();
1054 	}
1055 
1056 	if (
1057 		CU_add_test(suite, "basic", basic) == NULL ||
1058 		CU_add_test(suite, "basic_poller", basic_poller) == NULL ||
1059 		CU_add_test(suite, "basic_qos", basic_qos) == NULL ||
1060 		CU_add_test(suite, "put_channel_during_reset", put_channel_during_reset) == NULL ||
1061 		CU_add_test(suite, "aborted_reset", aborted_reset) == NULL ||
1062 		CU_add_test(suite, "io_during_reset", io_during_reset) == NULL ||
1063 		CU_add_test(suite, "io_during_qos_queue", io_during_qos_queue) == NULL ||
1064 		CU_add_test(suite, "io_during_qos_reset", io_during_qos_reset) == NULL ||
1065 		CU_add_test(suite, "enomem", enomem) == NULL ||
1066 		CU_add_test(suite, "enomem_multi_bdev", enomem_multi_bdev) == NULL
1067 	) {
1068 		CU_cleanup_registry();
1069 		return CU_get_error();
1070 	}
1071 
1072 	CU_basic_set_mode(CU_BRM_VERBOSE);
1073 	CU_basic_run_tests();
1074 	num_failures = CU_get_number_of_failures();
1075 	CU_cleanup_registry();
1076 	return num_failures;
1077 }
1078