xref: /spdk/lib/nvmf/nvmf.c (revision 6e5d6032a09ca918509e7c6f28d6d2e20b8dc832)
1 /*-
2  *   BSD LICENSE
3  *
4  *   Copyright (c) Intel Corporation. All rights reserved.
5  *   Copyright (c) 2018-2019, 2021 Mellanox Technologies LTD. All rights reserved.
6  *
7  *   Redistribution and use in source and binary forms, with or without
8  *   modification, are permitted provided that the following conditions
9  *   are met:
10  *
11  *     * Redistributions of source code must retain the above copyright
12  *       notice, this list of conditions and the following disclaimer.
13  *     * Redistributions in binary form must reproduce the above copyright
14  *       notice, this list of conditions and the following disclaimer in
15  *       the documentation and/or other materials provided with the
16  *       distribution.
17  *     * Neither the name of Intel Corporation nor the names of its
18  *       contributors may be used to endorse or promote products derived
19  *       from this software without specific prior written permission.
20  *
21  *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22  *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23  *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24  *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25  *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26  *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27  *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28  *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29  *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30  *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31  *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32  */
33 
34 #include "spdk/stdinc.h"
35 
36 #include "spdk/bdev.h"
37 #include "spdk/bit_array.h"
38 #include "spdk/thread.h"
39 #include "spdk/nvmf.h"
40 #include "spdk/endian.h"
41 #include "spdk/string.h"
42 #include "spdk/log.h"
43 #include "spdk_internal/usdt.h"
44 
45 #include "nvmf_internal.h"
46 #include "transport.h"
47 
/* Registers a log component named "nvmf" for this file. */
SPDK_LOG_REGISTER_COMPONENT(nvmf)

/* Subsystem slot count used by spdk_nvmf_tgt_create() when opts->max_subsystems is 0. */
#define SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS 1024
/* Accept poller period used by spdk_nvmf_tgt_create() when opts->acceptor_poll_rate is 0. */
#define SPDK_NVMF_DEFAULT_ACCEPT_POLL_RATE_US 10000

/* Every target created by spdk_nvmf_tgt_create(); new targets are inserted at the head. */
static TAILQ_HEAD(, spdk_nvmf_tgt) g_nvmf_tgts = TAILQ_HEAD_INITIALIZER(g_nvmf_tgts);

/* Completion callback type taking a context pointer and a status code. */
typedef void (*nvmf_qpair_disconnect_cpl)(void *ctx, int status);
/* Forward declaration; the definition appears further down in this file. */
static void nvmf_tgt_destroy_poll_group(void *io_device, void *ctx_buf);
57 
/* supplied to a single call to nvmf_qpair_disconnect */
struct nvmf_qpair_disconnect_ctx {
	/* qpair being disconnected */
	struct spdk_nvmf_qpair *qpair;
	/* controller of the qpair; filled in by _nvmf_qpair_destroy() before hopping to the controller thread */
	struct spdk_nvmf_ctrlr *ctrlr;
	/* optional completion callback supplied by the caller (may be NULL) */
	nvmf_qpair_disconnect_cb cb_fn;
	/* thread that follow-up messages (qpair fini, cb_fn) are sent to */
	struct spdk_thread *thread;
	/* argument handed to cb_fn */
	void *ctx;
	/* copy of qpair->qid taken by _nvmf_qpair_destroy(); used to clear the controller's qpair_mask bit */
	uint16_t qid;
};
67 
/*
 * There are several times when we need to iterate through the list of all qpairs and selectively delete them.
 * In order to do this sequentially without overlap, we must provide a context to recover the next qpair from
 * to enable calling nvmf_qpair_disconnect on the next desired qpair.
 */
struct nvmf_qpair_disconnect_many_ctx {
	/* not referenced in the visible part of this file; presumably limits the walk to one subsystem - TODO confirm */
	struct spdk_nvmf_subsystem *subsystem;
	/* poll group whose qpair list is being drained */
	struct spdk_nvmf_poll_group *group;
	/* not referenced in the visible part of this file; presumably a completion callback - TODO confirm */
	spdk_nvmf_poll_group_mod_done cpl_fn;
	/* not referenced in the visible part of this file; presumably the argument for cpl_fn - TODO confirm */
	void *cpl_ctx;
	/* not referenced in the visible part of this file */
	uint32_t count;
};
80 
81 static void
82 nvmf_qpair_set_state(struct spdk_nvmf_qpair *qpair,
83 		     enum spdk_nvmf_qpair_state state)
84 {
85 	assert(qpair != NULL);
86 	assert(qpair->group->thread == spdk_get_thread());
87 
88 	qpair->state = state;
89 }
90 
91 static int
92 nvmf_poll_group_poll(void *ctx)
93 {
94 	struct spdk_nvmf_poll_group *group = ctx;
95 	int rc;
96 	int count = 0;
97 	struct spdk_nvmf_transport_poll_group *tgroup;
98 
99 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
100 		rc = nvmf_transport_poll_group_poll(tgroup);
101 		if (rc < 0) {
102 			return SPDK_POLLER_BUSY;
103 		}
104 		count += rc;
105 	}
106 
107 	return count > 0 ? SPDK_POLLER_BUSY : SPDK_POLLER_IDLE;
108 }
109 
110 static int
111 nvmf_tgt_create_poll_group(void *io_device, void *ctx_buf)
112 {
113 	struct spdk_nvmf_tgt *tgt = io_device;
114 	struct spdk_nvmf_poll_group *group = ctx_buf;
115 	struct spdk_nvmf_transport *transport;
116 	struct spdk_thread *thread = spdk_get_thread();
117 	uint32_t sid;
118 
119 	SPDK_DTRACE_PROBE1(nvmf_create_poll_group, spdk_thread_get_id(thread));
120 
121 	TAILQ_INIT(&group->tgroups);
122 	TAILQ_INIT(&group->qpairs);
123 
124 	TAILQ_FOREACH(transport, &tgt->transports, link) {
125 		nvmf_poll_group_add_transport(group, transport);
126 	}
127 
128 	group->num_sgroups = tgt->max_subsystems;
129 	group->sgroups = calloc(tgt->max_subsystems, sizeof(struct spdk_nvmf_subsystem_poll_group));
130 	if (!group->sgroups) {
131 		return -ENOMEM;
132 	}
133 
134 	for (sid = 0; sid < tgt->max_subsystems; sid++) {
135 		struct spdk_nvmf_subsystem *subsystem;
136 
137 		subsystem = tgt->subsystems[sid];
138 		if (!subsystem) {
139 			continue;
140 		}
141 
142 		if (nvmf_poll_group_add_subsystem(group, subsystem, NULL, NULL) != 0) {
143 			nvmf_tgt_destroy_poll_group(io_device, ctx_buf);
144 			return -1;
145 		}
146 	}
147 
148 	pthread_mutex_lock(&tgt->mutex);
149 	TAILQ_INSERT_TAIL(&tgt->poll_groups, group, link);
150 	pthread_mutex_unlock(&tgt->mutex);
151 
152 	group->poller = SPDK_POLLER_REGISTER(nvmf_poll_group_poll, group, 0);
153 	group->thread = thread;
154 
155 	return 0;
156 }
157 
158 static void
159 nvmf_tgt_destroy_poll_group(void *io_device, void *ctx_buf)
160 {
161 	struct spdk_nvmf_tgt *tgt = io_device;
162 	struct spdk_nvmf_poll_group *group = ctx_buf;
163 	struct spdk_nvmf_transport_poll_group *tgroup, *tmp;
164 	struct spdk_nvmf_subsystem_poll_group *sgroup;
165 	uint32_t sid, nsid;
166 
167 	SPDK_DTRACE_PROBE1(nvmf_destroy_poll_group, spdk_thread_get_id(group->thread));
168 
169 	pthread_mutex_lock(&tgt->mutex);
170 	TAILQ_REMOVE(&tgt->poll_groups, group, link);
171 	pthread_mutex_unlock(&tgt->mutex);
172 
173 	TAILQ_FOREACH_SAFE(tgroup, &group->tgroups, link, tmp) {
174 		TAILQ_REMOVE(&group->tgroups, tgroup, link);
175 		nvmf_transport_poll_group_destroy(tgroup);
176 	}
177 
178 	for (sid = 0; sid < group->num_sgroups; sid++) {
179 		sgroup = &group->sgroups[sid];
180 
181 		for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
182 			if (sgroup->ns_info[nsid].channel) {
183 				spdk_put_io_channel(sgroup->ns_info[nsid].channel);
184 				sgroup->ns_info[nsid].channel = NULL;
185 			}
186 		}
187 
188 		free(sgroup->ns_info);
189 	}
190 
191 	free(group->sgroups);
192 
193 	spdk_poller_unregister(&group->poller);
194 
195 	if (group->destroy_cb_fn) {
196 		group->destroy_cb_fn(group->destroy_cb_arg, 0);
197 	}
198 }
199 
200 static void
201 _nvmf_tgt_disconnect_next_qpair(void *ctx)
202 {
203 	struct spdk_nvmf_qpair *qpair;
204 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
205 	struct spdk_nvmf_poll_group *group = qpair_ctx->group;
206 	struct spdk_io_channel *ch;
207 	int rc = 0;
208 
209 	qpair = TAILQ_FIRST(&group->qpairs);
210 
211 	if (qpair) {
212 		rc = spdk_nvmf_qpair_disconnect(qpair, _nvmf_tgt_disconnect_next_qpair, ctx);
213 	}
214 
215 	if (!qpair || rc != 0) {
216 		/* When the refcount from the channels reaches 0, nvmf_tgt_destroy_poll_group will be called. */
217 		ch = spdk_io_channel_from_ctx(group);
218 		spdk_put_io_channel(ch);
219 		free(qpair_ctx);
220 	}
221 }
222 
223 static void
224 nvmf_tgt_destroy_poll_group_qpairs(struct spdk_nvmf_poll_group *group)
225 {
226 	struct nvmf_qpair_disconnect_many_ctx *ctx;
227 
228 	SPDK_DTRACE_PROBE1(nvmf_destroy_poll_group_qpairs, spdk_thread_get_id(group->thread));
229 
230 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
231 	if (!ctx) {
232 		SPDK_ERRLOG("Failed to allocate memory for destroy poll group ctx\n");
233 		return;
234 	}
235 
236 	ctx->group = group;
237 	_nvmf_tgt_disconnect_next_qpair(ctx);
238 }
239 
240 static int
241 nvmf_tgt_accept(void *ctx)
242 {
243 	struct spdk_nvmf_tgt *tgt = ctx;
244 	struct spdk_nvmf_transport *transport, *tmp;
245 	int count = 0;
246 
247 	TAILQ_FOREACH_SAFE(transport, &tgt->transports, link, tmp) {
248 		count += nvmf_transport_accept(transport);
249 	}
250 
251 	return count > 0 ? SPDK_POLLER_BUSY : SPDK_POLLER_IDLE;
252 }
253 
254 struct spdk_nvmf_tgt *
255 spdk_nvmf_tgt_create(struct spdk_nvmf_target_opts *opts)
256 {
257 	struct spdk_nvmf_tgt *tgt, *tmp_tgt;
258 	uint32_t acceptor_poll_rate;
259 
260 	if (strnlen(opts->name, NVMF_TGT_NAME_MAX_LENGTH) == NVMF_TGT_NAME_MAX_LENGTH) {
261 		SPDK_ERRLOG("Provided target name exceeds the max length of %u.\n", NVMF_TGT_NAME_MAX_LENGTH);
262 		return NULL;
263 	}
264 
265 	TAILQ_FOREACH(tmp_tgt, &g_nvmf_tgts, link) {
266 		if (!strncmp(opts->name, tmp_tgt->name, NVMF_TGT_NAME_MAX_LENGTH)) {
267 			SPDK_ERRLOG("Provided target name must be unique.\n");
268 			return NULL;
269 		}
270 	}
271 
272 	tgt = calloc(1, sizeof(*tgt));
273 	if (!tgt) {
274 		return NULL;
275 	}
276 
277 	snprintf(tgt->name, NVMF_TGT_NAME_MAX_LENGTH, "%s", opts->name);
278 
279 	if (!opts || !opts->max_subsystems) {
280 		tgt->max_subsystems = SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS;
281 	} else {
282 		tgt->max_subsystems = opts->max_subsystems;
283 	}
284 
285 	if (!opts || !opts->acceptor_poll_rate) {
286 		acceptor_poll_rate = SPDK_NVMF_DEFAULT_ACCEPT_POLL_RATE_US;
287 	} else {
288 		acceptor_poll_rate = opts->acceptor_poll_rate;
289 	}
290 
291 	if (!opts) {
292 		tgt->crdt[0] = 0;
293 		tgt->crdt[1] = 0;
294 		tgt->crdt[2] = 0;
295 	} else {
296 		tgt->crdt[0] = opts->crdt[0];
297 		tgt->crdt[1] = opts->crdt[1];
298 		tgt->crdt[2] = opts->crdt[2];
299 	}
300 
301 	tgt->discovery_genctr = 0;
302 	TAILQ_INIT(&tgt->transports);
303 	TAILQ_INIT(&tgt->poll_groups);
304 
305 	tgt->subsystems = calloc(tgt->max_subsystems, sizeof(struct spdk_nvmf_subsystem *));
306 	if (!tgt->subsystems) {
307 		free(tgt);
308 		return NULL;
309 	}
310 
311 	pthread_mutex_init(&tgt->mutex, NULL);
312 
313 	tgt->accept_poller = SPDK_POLLER_REGISTER(nvmf_tgt_accept, tgt, acceptor_poll_rate);
314 	if (!tgt->accept_poller) {
315 		pthread_mutex_destroy(&tgt->mutex);
316 		free(tgt->subsystems);
317 		free(tgt);
318 		return NULL;
319 	}
320 
321 	spdk_io_device_register(tgt,
322 				nvmf_tgt_create_poll_group,
323 				nvmf_tgt_destroy_poll_group,
324 				sizeof(struct spdk_nvmf_poll_group),
325 				tgt->name);
326 
327 	TAILQ_INSERT_HEAD(&g_nvmf_tgts, tgt, link);
328 
329 	return tgt;
330 }
331 
332 static void
333 _nvmf_tgt_destroy_next_transport(void *ctx)
334 {
335 	struct spdk_nvmf_tgt *tgt = ctx;
336 	struct spdk_nvmf_transport *transport;
337 
338 	if (!TAILQ_EMPTY(&tgt->transports)) {
339 		transport = TAILQ_FIRST(&tgt->transports);
340 		TAILQ_REMOVE(&tgt->transports, transport, link);
341 		spdk_nvmf_transport_destroy(transport, _nvmf_tgt_destroy_next_transport, tgt);
342 	} else {
343 		spdk_nvmf_tgt_destroy_done_fn *destroy_cb_fn = tgt->destroy_cb_fn;
344 		void *destroy_cb_arg = tgt->destroy_cb_arg;
345 
346 		pthread_mutex_destroy(&tgt->mutex);
347 		free(tgt);
348 
349 		if (destroy_cb_fn) {
350 			destroy_cb_fn(destroy_cb_arg, 0);
351 		}
352 	}
353 }
354 
355 static void
356 nvmf_tgt_destroy_cb(void *io_device)
357 {
358 	struct spdk_nvmf_tgt *tgt = io_device;
359 	uint32_t i;
360 
361 	if (tgt->subsystems) {
362 		for (i = 0; i < tgt->max_subsystems; i++) {
363 			if (tgt->subsystems[i]) {
364 				nvmf_subsystem_remove_all_listeners(tgt->subsystems[i], true);
365 				spdk_nvmf_subsystem_destroy(tgt->subsystems[i]);
366 			}
367 		}
368 		free(tgt->subsystems);
369 	}
370 
371 	_nvmf_tgt_destroy_next_transport(tgt);
372 }
373 
374 void
375 spdk_nvmf_tgt_destroy(struct spdk_nvmf_tgt *tgt,
376 		      spdk_nvmf_tgt_destroy_done_fn cb_fn,
377 		      void *cb_arg)
378 {
379 	tgt->destroy_cb_fn = cb_fn;
380 	tgt->destroy_cb_arg = cb_arg;
381 
382 	spdk_poller_unregister(&tgt->accept_poller);
383 
384 	TAILQ_REMOVE(&g_nvmf_tgts, tgt, link);
385 
386 	spdk_io_device_unregister(tgt, nvmf_tgt_destroy_cb);
387 }
388 
389 const char *
390 spdk_nvmf_tgt_get_name(struct spdk_nvmf_tgt *tgt)
391 {
392 	return tgt->name;
393 }
394 
395 struct spdk_nvmf_tgt *
396 spdk_nvmf_get_tgt(const char *name)
397 {
398 	struct spdk_nvmf_tgt *tgt;
399 	uint32_t num_targets = 0;
400 
401 	TAILQ_FOREACH(tgt, &g_nvmf_tgts, link) {
402 		if (name) {
403 			if (!strncmp(tgt->name, name, NVMF_TGT_NAME_MAX_LENGTH)) {
404 				return tgt;
405 			}
406 		}
407 		num_targets++;
408 	}
409 
410 	/*
411 	 * special case. If there is only one target and
412 	 * no name was specified, return the only available
413 	 * target. If there is more than one target, name must
414 	 * be specified.
415 	 */
416 	if (!name && num_targets == 1) {
417 		return TAILQ_FIRST(&g_nvmf_tgts);
418 	}
419 
420 	return NULL;
421 }
422 
423 struct spdk_nvmf_tgt *
424 spdk_nvmf_get_first_tgt(void)
425 {
426 	return TAILQ_FIRST(&g_nvmf_tgts);
427 }
428 
429 struct spdk_nvmf_tgt *
430 spdk_nvmf_get_next_tgt(struct spdk_nvmf_tgt *prev)
431 {
432 	return TAILQ_NEXT(prev, link);
433 }
434 
435 static void
436 nvmf_write_subsystem_config_json(struct spdk_json_write_ctx *w,
437 				 struct spdk_nvmf_subsystem *subsystem)
438 {
439 	struct spdk_nvmf_host *host;
440 	struct spdk_nvmf_subsystem_listener *listener;
441 	const struct spdk_nvme_transport_id *trid;
442 	struct spdk_nvmf_ns *ns;
443 	struct spdk_nvmf_ns_opts ns_opts;
444 	uint32_t max_namespaces;
445 	char uuid_str[SPDK_UUID_STRING_LEN];
446 
447 	if (spdk_nvmf_subsystem_get_type(subsystem) != SPDK_NVMF_SUBTYPE_NVME) {
448 		return;
449 	}
450 
451 	/* { */
452 	spdk_json_write_object_begin(w);
453 	spdk_json_write_named_string(w, "method", "nvmf_create_subsystem");
454 
455 	/*     "params" : { */
456 	spdk_json_write_named_object_begin(w, "params");
457 	spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
458 	spdk_json_write_named_bool(w, "allow_any_host", spdk_nvmf_subsystem_get_allow_any_host(subsystem));
459 	spdk_json_write_named_string(w, "serial_number", spdk_nvmf_subsystem_get_sn(subsystem));
460 	spdk_json_write_named_string(w, "model_number", spdk_nvmf_subsystem_get_mn(subsystem));
461 
462 	max_namespaces = spdk_nvmf_subsystem_get_max_namespaces(subsystem);
463 	if (max_namespaces != 0) {
464 		spdk_json_write_named_uint32(w, "max_namespaces", max_namespaces);
465 	}
466 
467 	spdk_json_write_named_uint32(w, "min_cntlid", spdk_nvmf_subsystem_get_min_cntlid(subsystem));
468 	spdk_json_write_named_uint32(w, "max_cntlid", spdk_nvmf_subsystem_get_max_cntlid(subsystem));
469 	spdk_json_write_named_bool(w, "ana_reporting", nvmf_subsystem_get_ana_reporting(subsystem));
470 
471 	/*     } "params" */
472 	spdk_json_write_object_end(w);
473 
474 	/* } */
475 	spdk_json_write_object_end(w);
476 
477 	for (listener = spdk_nvmf_subsystem_get_first_listener(subsystem); listener != NULL;
478 	     listener = spdk_nvmf_subsystem_get_next_listener(subsystem, listener)) {
479 		trid = spdk_nvmf_subsystem_listener_get_trid(listener);
480 
481 		spdk_json_write_object_begin(w);
482 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_listener");
483 
484 		/*     "params" : { */
485 		spdk_json_write_named_object_begin(w, "params");
486 
487 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
488 		nvmf_transport_listen_dump_opts(listener->transport, trid, w);
489 
490 		/*     } "params" */
491 		spdk_json_write_object_end(w);
492 
493 		/* } */
494 		spdk_json_write_object_end(w);
495 	}
496 
497 	for (host = spdk_nvmf_subsystem_get_first_host(subsystem); host != NULL;
498 	     host = spdk_nvmf_subsystem_get_next_host(subsystem, host)) {
499 
500 		spdk_json_write_object_begin(w);
501 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_host");
502 
503 		/*     "params" : { */
504 		spdk_json_write_named_object_begin(w, "params");
505 
506 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
507 		spdk_json_write_named_string(w, "host", spdk_nvmf_host_get_nqn(host));
508 
509 		/*     } "params" */
510 		spdk_json_write_object_end(w);
511 
512 		/* } */
513 		spdk_json_write_object_end(w);
514 	}
515 
516 	for (ns = spdk_nvmf_subsystem_get_first_ns(subsystem); ns != NULL;
517 	     ns = spdk_nvmf_subsystem_get_next_ns(subsystem, ns)) {
518 		spdk_nvmf_ns_get_opts(ns, &ns_opts, sizeof(ns_opts));
519 
520 		spdk_json_write_object_begin(w);
521 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_ns");
522 
523 		/*     "params" : { */
524 		spdk_json_write_named_object_begin(w, "params");
525 
526 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
527 
528 		/*     "namespace" : { */
529 		spdk_json_write_named_object_begin(w, "namespace");
530 
531 		spdk_json_write_named_uint32(w, "nsid", spdk_nvmf_ns_get_id(ns));
532 		spdk_json_write_named_string(w, "bdev_name", spdk_bdev_get_name(spdk_nvmf_ns_get_bdev(ns)));
533 
534 		if (!spdk_mem_all_zero(ns_opts.nguid, sizeof(ns_opts.nguid))) {
535 			SPDK_STATIC_ASSERT(sizeof(ns_opts.nguid) == sizeof(uint64_t) * 2, "size mismatch");
536 			spdk_json_write_named_string_fmt(w, "nguid", "%016"PRIX64"%016"PRIX64, from_be64(&ns_opts.nguid[0]),
537 							 from_be64(&ns_opts.nguid[8]));
538 		}
539 
540 		if (!spdk_mem_all_zero(ns_opts.eui64, sizeof(ns_opts.eui64))) {
541 			SPDK_STATIC_ASSERT(sizeof(ns_opts.eui64) == sizeof(uint64_t), "size mismatch");
542 			spdk_json_write_named_string_fmt(w, "eui64", "%016"PRIX64, from_be64(&ns_opts.eui64));
543 		}
544 
545 		if (!spdk_mem_all_zero(&ns_opts.uuid, sizeof(ns_opts.uuid))) {
546 			spdk_uuid_fmt_lower(uuid_str, sizeof(uuid_str), &ns_opts.uuid);
547 			spdk_json_write_named_string(w, "uuid",  uuid_str);
548 		}
549 
550 		if (nvmf_subsystem_get_ana_reporting(subsystem)) {
551 			spdk_json_write_named_uint32(w, "anagrpid", ns_opts.anagrpid);
552 		}
553 
554 		/*     "namespace" */
555 		spdk_json_write_object_end(w);
556 
557 		/*     } "params" */
558 		spdk_json_write_object_end(w);
559 
560 		/* } */
561 		spdk_json_write_object_end(w);
562 	}
563 }
564 
565 void
566 spdk_nvmf_tgt_write_config_json(struct spdk_json_write_ctx *w, struct spdk_nvmf_tgt *tgt)
567 {
568 	struct spdk_nvmf_subsystem *subsystem;
569 	struct spdk_nvmf_transport *transport;
570 
571 	spdk_json_write_object_begin(w);
572 	spdk_json_write_named_string(w, "method", "nvmf_set_max_subsystems");
573 
574 	spdk_json_write_named_object_begin(w, "params");
575 	spdk_json_write_named_uint32(w, "max_subsystems", tgt->max_subsystems);
576 	spdk_json_write_object_end(w);
577 
578 	spdk_json_write_object_end(w);
579 
580 	spdk_json_write_object_begin(w);
581 	spdk_json_write_named_string(w, "method", "nvmf_set_crdt");
582 	spdk_json_write_named_object_begin(w, "params");
583 	spdk_json_write_named_uint32(w, "crdt1", tgt->crdt[0]);
584 	spdk_json_write_named_uint32(w, "crdt2", tgt->crdt[1]);
585 	spdk_json_write_named_uint32(w, "crdt3", tgt->crdt[2]);
586 	spdk_json_write_object_end(w);
587 	spdk_json_write_object_end(w);
588 
589 	/* write transports */
590 	TAILQ_FOREACH(transport, &tgt->transports, link) {
591 		spdk_json_write_object_begin(w);
592 		spdk_json_write_named_string(w, "method", "nvmf_create_transport");
593 		nvmf_transport_dump_opts(transport, w, true);
594 		spdk_json_write_object_end(w);
595 	}
596 
597 	subsystem = spdk_nvmf_subsystem_get_first(tgt);
598 	while (subsystem) {
599 		nvmf_write_subsystem_config_json(w, subsystem);
600 		subsystem = spdk_nvmf_subsystem_get_next(subsystem);
601 	}
602 }
603 
604 static void
605 nvmf_listen_opts_copy(struct spdk_nvmf_listen_opts *opts,
606 		      const struct spdk_nvmf_listen_opts *opts_src, size_t opts_size)
607 {
608 	assert(opts);
609 	assert(opts_src);
610 
611 	opts->opts_size = opts_size;
612 
613 #define SET_FIELD(field) \
614     if (offsetof(struct spdk_nvmf_listen_opts, field) + sizeof(opts->field) <= opts_size) { \
615                  opts->field = opts_src->field; \
616     } \
617 
618 	SET_FIELD(transport_specific);
619 #undef SET_FIELD
620 
621 	/* Do not remove this statement, you should always update this statement when you adding a new field,
622 	 * and do not forget to add the SET_FIELD statement for your added field. */
623 	SPDK_STATIC_ASSERT(sizeof(struct spdk_nvmf_listen_opts) == 16, "Incorrect size");
624 }
625 
626 void
627 spdk_nvmf_listen_opts_init(struct spdk_nvmf_listen_opts *opts, size_t opts_size)
628 {
629 	struct spdk_nvmf_listen_opts opts_local = {};
630 
631 	/* local version of opts should have defaults set here */
632 
633 	nvmf_listen_opts_copy(opts, &opts_local, opts_size);
634 }
635 
636 int
637 spdk_nvmf_tgt_listen_ext(struct spdk_nvmf_tgt *tgt, const struct spdk_nvme_transport_id *trid,
638 			 struct spdk_nvmf_listen_opts *opts)
639 {
640 	struct spdk_nvmf_transport *transport;
641 	int rc;
642 	struct spdk_nvmf_listen_opts opts_local = {};
643 
644 	if (!opts) {
645 		SPDK_ERRLOG("opts should not be NULL\n");
646 		return -EINVAL;
647 	}
648 
649 	if (!opts->opts_size) {
650 		SPDK_ERRLOG("The opts_size in opts structure should not be zero\n");
651 		return -EINVAL;
652 	}
653 
654 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
655 	if (!transport) {
656 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
657 			    trid->trstring);
658 		return -EINVAL;
659 	}
660 
661 	nvmf_listen_opts_copy(&opts_local, opts, opts->opts_size);
662 	rc = spdk_nvmf_transport_listen(transport, trid, &opts_local);
663 	if (rc < 0) {
664 		SPDK_ERRLOG("Unable to listen on address '%s'\n", trid->traddr);
665 	}
666 
667 	return rc;
668 }
669 
670 int
671 spdk_nvmf_tgt_stop_listen(struct spdk_nvmf_tgt *tgt,
672 			  struct spdk_nvme_transport_id *trid)
673 {
674 	struct spdk_nvmf_transport *transport;
675 	int rc;
676 
677 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
678 	if (!transport) {
679 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
680 			    trid->trstring);
681 		return -EINVAL;
682 	}
683 
684 	rc = spdk_nvmf_transport_stop_listen(transport, trid);
685 	if (rc < 0) {
686 		SPDK_ERRLOG("Failed to stop listening on address '%s'\n", trid->traddr);
687 		return rc;
688 	}
689 	return 0;
690 }
691 
/* Context carried through the per-channel iteration started by spdk_nvmf_tgt_add_transport(). */
struct spdk_nvmf_tgt_add_transport_ctx {
	/* target the transport is being added to */
	struct spdk_nvmf_tgt *tgt;
	/* transport to add to every poll group of the target */
	struct spdk_nvmf_transport *transport;
	/* completion callback, invoked with the final iteration status */
	spdk_nvmf_tgt_add_transport_done_fn cb_fn;
	/* argument passed to cb_fn */
	void *cb_arg;
};
698 
699 static void
700 _nvmf_tgt_add_transport_done(struct spdk_io_channel_iter *i, int status)
701 {
702 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
703 
704 	ctx->cb_fn(ctx->cb_arg, status);
705 
706 	free(ctx);
707 }
708 
709 static void
710 _nvmf_tgt_add_transport(struct spdk_io_channel_iter *i)
711 {
712 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
713 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
714 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
715 	int rc;
716 
717 	rc = nvmf_poll_group_add_transport(group, ctx->transport);
718 	spdk_for_each_channel_continue(i, rc);
719 }
720 
721 void spdk_nvmf_tgt_add_transport(struct spdk_nvmf_tgt *tgt,
722 				 struct spdk_nvmf_transport *transport,
723 				 spdk_nvmf_tgt_add_transport_done_fn cb_fn,
724 				 void *cb_arg)
725 {
726 	struct spdk_nvmf_tgt_add_transport_ctx *ctx;
727 
728 	if (spdk_nvmf_tgt_get_transport(tgt, transport->ops->name)) {
729 		cb_fn(cb_arg, -EEXIST);
730 		return; /* transport already created */
731 	}
732 
733 	transport->tgt = tgt;
734 	TAILQ_INSERT_TAIL(&tgt->transports, transport, link);
735 
736 	ctx = calloc(1, sizeof(*ctx));
737 	if (!ctx) {
738 		cb_fn(cb_arg, -ENOMEM);
739 		return;
740 	}
741 
742 	ctx->tgt = tgt;
743 	ctx->transport = transport;
744 	ctx->cb_fn = cb_fn;
745 	ctx->cb_arg = cb_arg;
746 
747 	spdk_for_each_channel(tgt,
748 			      _nvmf_tgt_add_transport,
749 			      ctx,
750 			      _nvmf_tgt_add_transport_done);
751 }
752 
753 struct spdk_nvmf_subsystem *
754 spdk_nvmf_tgt_find_subsystem(struct spdk_nvmf_tgt *tgt, const char *subnqn)
755 {
756 	struct spdk_nvmf_subsystem	*subsystem;
757 	uint32_t sid;
758 
759 	if (!subnqn) {
760 		return NULL;
761 	}
762 
763 	/* Ensure that subnqn is null terminated */
764 	if (!memchr(subnqn, '\0', SPDK_NVMF_NQN_MAX_LEN + 1)) {
765 		SPDK_ERRLOG("Connect SUBNQN is not null terminated\n");
766 		return NULL;
767 	}
768 
769 	for (sid = 0; sid < tgt->max_subsystems; sid++) {
770 		subsystem = tgt->subsystems[sid];
771 		if (subsystem == NULL) {
772 			continue;
773 		}
774 
775 		if (strcmp(subnqn, subsystem->subnqn) == 0) {
776 			return subsystem;
777 		}
778 	}
779 
780 	return NULL;
781 }
782 
783 struct spdk_nvmf_transport *
784 spdk_nvmf_tgt_get_transport(struct spdk_nvmf_tgt *tgt, const char *transport_name)
785 {
786 	struct spdk_nvmf_transport *transport;
787 
788 	TAILQ_FOREACH(transport, &tgt->transports, link) {
789 		if (!strncasecmp(transport->ops->name, transport_name, SPDK_NVMF_TRSTRING_MAX_LEN)) {
790 			return transport;
791 		}
792 	}
793 	return NULL;
794 }
795 
/* Message context sent by spdk_nvmf_tgt_new_qpair() to the chosen poll group's thread. */
struct nvmf_new_qpair_ctx {
	/* newly created qpair to be added */
	struct spdk_nvmf_qpair *qpair;
	/* poll group the qpair should be added to */
	struct spdk_nvmf_poll_group *group;
};
800 
801 static void
802 _nvmf_poll_group_add(void *_ctx)
803 {
804 	struct nvmf_new_qpair_ctx *ctx = _ctx;
805 	struct spdk_nvmf_qpair *qpair = ctx->qpair;
806 	struct spdk_nvmf_poll_group *group = ctx->group;
807 
808 	free(_ctx);
809 
810 	if (spdk_nvmf_poll_group_add(group, qpair) != 0) {
811 		SPDK_ERRLOG("Unable to add the qpair to a poll group.\n");
812 		spdk_nvmf_qpair_disconnect(qpair, NULL, NULL);
813 	}
814 }
815 
816 void
817 spdk_nvmf_tgt_new_qpair(struct spdk_nvmf_tgt *tgt, struct spdk_nvmf_qpair *qpair)
818 {
819 	struct spdk_nvmf_poll_group *group;
820 	struct nvmf_new_qpair_ctx *ctx;
821 
822 	group = spdk_nvmf_get_optimal_poll_group(qpair);
823 	if (group == NULL) {
824 		if (tgt->next_poll_group == NULL) {
825 			tgt->next_poll_group = TAILQ_FIRST(&tgt->poll_groups);
826 			if (tgt->next_poll_group == NULL) {
827 				SPDK_ERRLOG("No poll groups exist.\n");
828 				spdk_nvmf_qpair_disconnect(qpair, NULL, NULL);
829 				return;
830 			}
831 		}
832 		group = tgt->next_poll_group;
833 		tgt->next_poll_group = TAILQ_NEXT(group, link);
834 	}
835 
836 	ctx = calloc(1, sizeof(*ctx));
837 	if (!ctx) {
838 		SPDK_ERRLOG("Unable to send message to poll group.\n");
839 		spdk_nvmf_qpair_disconnect(qpair, NULL, NULL);
840 		return;
841 	}
842 
843 	ctx->qpair = qpair;
844 	ctx->group = group;
845 
846 	spdk_thread_send_msg(group->thread, _nvmf_poll_group_add, ctx);
847 }
848 
/*
 * Obtain the target's poll group for the calling thread by getting an I/O
 * channel for the target. Returns NULL if the channel cannot be obtained.
 */
struct spdk_nvmf_poll_group *
spdk_nvmf_poll_group_create(struct spdk_nvmf_tgt *tgt)
{
	struct spdk_io_channel *ch = spdk_get_io_channel(tgt);

	if (ch == NULL) {
		SPDK_ERRLOG("Unable to get I/O channel for target\n");
		return NULL;
	}

	return spdk_io_channel_get_ctx(ch);
}
862 
863 void
864 spdk_nvmf_poll_group_destroy(struct spdk_nvmf_poll_group *group,
865 			     spdk_nvmf_poll_group_destroy_done_fn cb_fn,
866 			     void *cb_arg)
867 {
868 	assert(group->destroy_cb_fn == NULL);
869 	group->destroy_cb_fn = cb_fn;
870 	group->destroy_cb_arg = cb_arg;
871 
872 	/* This function will put the io_channel associated with this poll group */
873 	nvmf_tgt_destroy_poll_group_qpairs(group);
874 }
875 
876 int
877 spdk_nvmf_poll_group_add(struct spdk_nvmf_poll_group *group,
878 			 struct spdk_nvmf_qpair *qpair)
879 {
880 	int rc = -1;
881 	struct spdk_nvmf_transport_poll_group *tgroup;
882 
883 	TAILQ_INIT(&qpair->outstanding);
884 	qpair->group = group;
885 	qpair->ctrlr = NULL;
886 	qpair->disconnect_started = false;
887 
888 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
889 		if (tgroup->transport == qpair->transport) {
890 			rc = nvmf_transport_poll_group_add(tgroup, qpair);
891 			break;
892 		}
893 	}
894 
895 	/* We add the qpair to the group only it is succesfully added into the tgroup */
896 	if (rc == 0) {
897 		SPDK_DTRACE_PROBE2(nvmf_poll_group_add_qpair, qpair, spdk_thread_get_id(group->thread));
898 		TAILQ_INSERT_TAIL(&group->qpairs, qpair, link);
899 		nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_ACTIVE);
900 	}
901 
902 	return rc;
903 }
904 
/* Message-handler adapter: forwards the context pointer to nvmf_ctrlr_destruct(). */
static void
_nvmf_ctrlr_destruct(void *ctx)
{
	nvmf_ctrlr_destruct((struct spdk_nvmf_ctrlr *)ctx);
}
912 
913 static void
914 _nvmf_transport_qpair_fini_complete(void *cb_ctx)
915 {
916 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = cb_ctx;
917 
918 	if (qpair_ctx->cb_fn) {
919 		spdk_thread_send_msg(qpair_ctx->thread, qpair_ctx->cb_fn, qpair_ctx->ctx);
920 	}
921 	free(qpair_ctx);
922 }
923 
924 static void
925 _nvmf_transport_qpair_fini(void *ctx)
926 {
927 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
928 
929 	spdk_nvmf_poll_group_remove(qpair_ctx->qpair);
930 	nvmf_transport_qpair_fini(qpair_ctx->qpair, _nvmf_transport_qpair_fini_complete, qpair_ctx);
931 }
932 
933 static void
934 _nvmf_ctrlr_free_from_qpair(void *ctx)
935 {
936 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
937 	struct spdk_nvmf_ctrlr *ctrlr = qpair_ctx->ctrlr;
938 	uint32_t count;
939 
940 	spdk_bit_array_clear(ctrlr->qpair_mask, qpair_ctx->qid);
941 	count = spdk_bit_array_count_set(ctrlr->qpair_mask);
942 	if (count == 0) {
943 		ctrlr->in_destruct = true;
944 		spdk_thread_send_msg(ctrlr->subsys->thread, _nvmf_ctrlr_destruct, ctrlr);
945 	}
946 
947 	spdk_thread_send_msg(qpair_ctx->thread, _nvmf_transport_qpair_fini, qpair_ctx);
948 }
949 
950 void
951 spdk_nvmf_poll_group_remove(struct spdk_nvmf_qpair *qpair)
952 {
953 	struct spdk_nvmf_transport_poll_group *tgroup;
954 	int rc;
955 
956 	SPDK_DTRACE_PROBE2(nvmf_poll_group_remove_qpair, qpair,
957 			   spdk_thread_get_id(qpair->group->thread));
958 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_ERROR);
959 
960 	/* Find the tgroup and remove the qpair from the tgroup */
961 	TAILQ_FOREACH(tgroup, &qpair->group->tgroups, link) {
962 		if (tgroup->transport == qpair->transport) {
963 			rc = nvmf_transport_poll_group_remove(tgroup, qpair);
964 			if (rc && (rc != ENOTSUP)) {
965 				SPDK_ERRLOG("Cannot remove qpair=%p from transport group=%p\n",
966 					    qpair, tgroup);
967 			}
968 			break;
969 		}
970 	}
971 
972 	TAILQ_REMOVE(&qpair->group->qpairs, qpair, link);
973 	qpair->group = NULL;
974 }
975 
976 static void
977 _nvmf_qpair_destroy(void *ctx, int status)
978 {
979 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
980 	struct spdk_nvmf_qpair *qpair = qpair_ctx->qpair;
981 	struct spdk_nvmf_ctrlr *ctrlr = qpair->ctrlr;
982 	struct spdk_nvmf_request *req, *tmp;
983 	struct spdk_nvmf_subsystem_poll_group *sgroup;
984 
985 	assert(qpair->state == SPDK_NVMF_QPAIR_DEACTIVATING);
986 	qpair_ctx->qid = qpair->qid;
987 
988 	if (ctrlr) {
989 		if (0 == qpair->qid) {
990 			assert(qpair->group->stat.current_admin_qpairs > 0);
991 			qpair->group->stat.current_admin_qpairs--;
992 		} else {
993 			assert(qpair->group->stat.current_io_qpairs > 0);
994 			qpair->group->stat.current_io_qpairs--;
995 		}
996 
997 		sgroup = &qpair->group->sgroups[ctrlr->subsys->id];
998 		TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
999 			if (req->qpair == qpair) {
1000 				TAILQ_REMOVE(&sgroup->queued, req, link);
1001 				if (nvmf_transport_req_free(req)) {
1002 					SPDK_ERRLOG("Transport request free error!/n");
1003 				}
1004 			}
1005 		}
1006 	}
1007 
1008 	if (!ctrlr || !ctrlr->thread) {
1009 		spdk_nvmf_poll_group_remove(qpair);
1010 		nvmf_transport_qpair_fini(qpair, _nvmf_transport_qpair_fini_complete, qpair_ctx);
1011 		return;
1012 	}
1013 
1014 	qpair_ctx->ctrlr = ctrlr;
1015 	spdk_thread_send_msg(ctrlr->thread, _nvmf_ctrlr_free_from_qpair, qpair_ctx);
1016 }
1017 
1018 static void
1019 _nvmf_qpair_disconnect_msg(void *ctx)
1020 {
1021 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1022 
1023 	spdk_nvmf_qpair_disconnect(qpair_ctx->qpair, qpair_ctx->cb_fn, qpair_ctx->ctx);
1024 	free(ctx);
1025 }
1026 
1027 int
1028 spdk_nvmf_qpair_disconnect(struct spdk_nvmf_qpair *qpair, nvmf_qpair_disconnect_cb cb_fn, void *ctx)
1029 {
1030 	struct spdk_nvmf_poll_group *group = qpair->group;
1031 	struct nvmf_qpair_disconnect_ctx *qpair_ctx;
1032 
1033 	if (__atomic_test_and_set(&qpair->disconnect_started, __ATOMIC_RELAXED)) {
1034 		if (cb_fn) {
1035 			cb_fn(ctx);
1036 		}
1037 		return 0;
1038 	}
1039 
1040 	/* If we get a qpair in the uninitialized state, we can just destroy it immediately */
1041 	if (qpair->state == SPDK_NVMF_QPAIR_UNINITIALIZED) {
1042 		nvmf_transport_qpair_fini(qpair, NULL, NULL);
1043 		if (cb_fn) {
1044 			cb_fn(ctx);
1045 		}
1046 		return 0;
1047 	}
1048 
1049 	assert(group != NULL);
1050 	if (spdk_get_thread() != group->thread) {
1051 		/* clear the atomic so we can set it on the next call on the proper thread. */
1052 		__atomic_clear(&qpair->disconnect_started, __ATOMIC_RELAXED);
1053 		qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1054 		if (!qpair_ctx) {
1055 			SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1056 			return -ENOMEM;
1057 		}
1058 		qpair_ctx->qpair = qpair;
1059 		qpair_ctx->cb_fn = cb_fn;
1060 		qpair_ctx->thread = group->thread;
1061 		qpair_ctx->ctx = ctx;
1062 		spdk_thread_send_msg(group->thread, _nvmf_qpair_disconnect_msg, qpair_ctx);
1063 		return 0;
1064 	}
1065 
1066 	SPDK_DTRACE_PROBE2(nvmf_qpair_disconnect, qpair, spdk_thread_get_id(group->thread));
1067 	assert(qpair->state == SPDK_NVMF_QPAIR_ACTIVE);
1068 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_DEACTIVATING);
1069 
1070 	qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1071 	if (!qpair_ctx) {
1072 		SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1073 		return -ENOMEM;
1074 	}
1075 
1076 	qpair_ctx->qpair = qpair;
1077 	qpair_ctx->cb_fn = cb_fn;
1078 	qpair_ctx->thread = group->thread;
1079 	qpair_ctx->ctx = ctx;
1080 
1081 	/* Check for outstanding I/O */
1082 	if (!TAILQ_EMPTY(&qpair->outstanding)) {
1083 		SPDK_DTRACE_PROBE2(nvmf_poll_group_drain_qpair, qpair, spdk_thread_get_id(group->thread));
1084 		qpair->state_cb = _nvmf_qpair_destroy;
1085 		qpair->state_cb_arg = qpair_ctx;
1086 		nvmf_qpair_free_aer(qpair);
1087 		return 0;
1088 	}
1089 
1090 	_nvmf_qpair_destroy(qpair_ctx, 0);
1091 
1092 	return 0;
1093 }
1094 
/*
 * Public entry point that forwards to nvmf_transport_qpair_get_peer_trid()
 * and hands its return code back to the caller unchanged.
 */
int
spdk_nvmf_qpair_get_peer_trid(struct spdk_nvmf_qpair *qpair,
			      struct spdk_nvme_transport_id *trid)
{
	int rc;

	rc = nvmf_transport_qpair_get_peer_trid(qpair, trid);

	return rc;
}
1101 
/*
 * Public entry point that forwards to nvmf_transport_qpair_get_local_trid()
 * and hands its return code back to the caller unchanged.
 */
int
spdk_nvmf_qpair_get_local_trid(struct spdk_nvmf_qpair *qpair,
			       struct spdk_nvme_transport_id *trid)
{
	int rc;

	rc = nvmf_transport_qpair_get_local_trid(qpair, trid);

	return rc;
}
1108 
/*
 * Public entry point that forwards to nvmf_transport_qpair_get_listen_trid()
 * and hands its return code back to the caller unchanged.
 */
int
spdk_nvmf_qpair_get_listen_trid(struct spdk_nvmf_qpair *qpair,
				struct spdk_nvme_transport_id *trid)
{
	int rc;

	rc = nvmf_transport_qpair_get_listen_trid(qpair, trid);

	return rc;
}
1115 
1116 int
1117 nvmf_poll_group_add_transport(struct spdk_nvmf_poll_group *group,
1118 			      struct spdk_nvmf_transport *transport)
1119 {
1120 	struct spdk_nvmf_transport_poll_group *tgroup;
1121 
1122 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
1123 		if (tgroup->transport == transport) {
1124 			/* Transport already in the poll group */
1125 			return 0;
1126 		}
1127 	}
1128 
1129 	tgroup = nvmf_transport_poll_group_create(transport);
1130 	if (!tgroup) {
1131 		SPDK_ERRLOG("Unable to create poll group for transport\n");
1132 		return -1;
1133 	}
1134 
1135 	tgroup->group = group;
1136 	TAILQ_INSERT_TAIL(&group->tgroups, tgroup, link);
1137 
1138 	return 0;
1139 }
1140 
1141 static int
1142 poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
1143 			    struct spdk_nvmf_subsystem *subsystem)
1144 {
1145 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1146 	uint32_t new_num_ns, old_num_ns;
1147 	uint32_t i, j;
1148 	struct spdk_nvmf_ns *ns;
1149 	struct spdk_nvmf_registrant *reg, *tmp;
1150 	struct spdk_io_channel *ch;
1151 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info;
1152 	struct spdk_nvmf_ctrlr *ctrlr;
1153 	bool ns_changed;
1154 
1155 	/* Make sure our poll group has memory for this subsystem allocated */
1156 	if (subsystem->id >= group->num_sgroups) {
1157 		return -ENOMEM;
1158 	}
1159 
1160 	sgroup = &group->sgroups[subsystem->id];
1161 
1162 	/* Make sure the array of namespace information is the correct size */
1163 	new_num_ns = subsystem->max_nsid;
1164 	old_num_ns = sgroup->num_ns;
1165 
1166 	ns_changed = false;
1167 
1168 	if (old_num_ns == 0) {
1169 		if (new_num_ns > 0) {
1170 			/* First allocation */
1171 			sgroup->ns_info = calloc(new_num_ns, sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1172 			if (!sgroup->ns_info) {
1173 				return -ENOMEM;
1174 			}
1175 		}
1176 	} else if (new_num_ns > old_num_ns) {
1177 		void *buf;
1178 
1179 		/* Make the array larger */
1180 		buf = realloc(sgroup->ns_info, new_num_ns * sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1181 		if (!buf) {
1182 			return -ENOMEM;
1183 		}
1184 
1185 		sgroup->ns_info = buf;
1186 
1187 		/* Null out the new namespace information slots */
1188 		for (i = old_num_ns; i < new_num_ns; i++) {
1189 			memset(&sgroup->ns_info[i], 0, sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1190 		}
1191 	} else if (new_num_ns < old_num_ns) {
1192 		void *buf;
1193 
1194 		/* Free the extra I/O channels */
1195 		for (i = new_num_ns; i < old_num_ns; i++) {
1196 			ns_info = &sgroup->ns_info[i];
1197 
1198 			if (ns_info->channel) {
1199 				spdk_put_io_channel(ns_info->channel);
1200 				ns_info->channel = NULL;
1201 			}
1202 		}
1203 
1204 		/* Make the array smaller */
1205 		if (new_num_ns > 0) {
1206 			buf = realloc(sgroup->ns_info, new_num_ns * sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1207 			if (!buf) {
1208 				return -ENOMEM;
1209 			}
1210 			sgroup->ns_info = buf;
1211 		} else {
1212 			free(sgroup->ns_info);
1213 			sgroup->ns_info = NULL;
1214 		}
1215 	}
1216 
1217 	sgroup->num_ns = new_num_ns;
1218 
1219 	/* Detect bdevs that were added or removed */
1220 	for (i = 0; i < sgroup->num_ns; i++) {
1221 		ns = subsystem->ns[i];
1222 		ns_info = &sgroup->ns_info[i];
1223 		ch = ns_info->channel;
1224 
1225 		if (ns == NULL && ch == NULL) {
1226 			/* Both NULL. Leave empty */
1227 		} else if (ns == NULL && ch != NULL) {
1228 			/* There was a channel here, but the namespace is gone. */
1229 			ns_changed = true;
1230 			spdk_put_io_channel(ch);
1231 			ns_info->channel = NULL;
1232 		} else if (ns != NULL && ch == NULL) {
1233 			/* A namespace appeared but there is no channel yet */
1234 			ns_changed = true;
1235 			ch = spdk_bdev_get_io_channel(ns->desc);
1236 			if (ch == NULL) {
1237 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1238 				return -ENOMEM;
1239 			}
1240 			ns_info->channel = ch;
1241 		} else if (spdk_uuid_compare(&ns_info->uuid, spdk_bdev_get_uuid(ns->bdev)) != 0) {
1242 			/* A namespace was here before, but was replaced by a new one. */
1243 			ns_changed = true;
1244 			spdk_put_io_channel(ns_info->channel);
1245 			memset(ns_info, 0, sizeof(*ns_info));
1246 
1247 			ch = spdk_bdev_get_io_channel(ns->desc);
1248 			if (ch == NULL) {
1249 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1250 				return -ENOMEM;
1251 			}
1252 			ns_info->channel = ch;
1253 		} else if (ns_info->num_blocks != spdk_bdev_get_num_blocks(ns->bdev)) {
1254 			/* Namespace is still there but size has changed */
1255 			SPDK_DEBUGLOG(nvmf, "Namespace resized: subsystem_id %u,"
1256 				      " nsid %u, pg %p, old %" PRIu64 ", new %" PRIu64 "\n",
1257 				      subsystem->id,
1258 				      ns->nsid,
1259 				      group,
1260 				      ns_info->num_blocks,
1261 				      spdk_bdev_get_num_blocks(ns->bdev));
1262 			ns_changed = true;
1263 		}
1264 
1265 		if (ns == NULL) {
1266 			memset(ns_info, 0, sizeof(*ns_info));
1267 		} else {
1268 			ns_info->uuid = *spdk_bdev_get_uuid(ns->bdev);
1269 			ns_info->num_blocks = spdk_bdev_get_num_blocks(ns->bdev);
1270 			ns_info->crkey = ns->crkey;
1271 			ns_info->rtype = ns->rtype;
1272 			if (ns->holder) {
1273 				ns_info->holder_id = ns->holder->hostid;
1274 			}
1275 
1276 			memset(&ns_info->reg_hostid, 0, SPDK_NVMF_MAX_NUM_REGISTRANTS * sizeof(struct spdk_uuid));
1277 			j = 0;
1278 			TAILQ_FOREACH_SAFE(reg, &ns->registrants, link, tmp) {
1279 				if (j >= SPDK_NVMF_MAX_NUM_REGISTRANTS) {
1280 					SPDK_ERRLOG("Maximum %u registrants can support.\n", SPDK_NVMF_MAX_NUM_REGISTRANTS);
1281 					return -EINVAL;
1282 				}
1283 				ns_info->reg_hostid[j++] = reg->hostid;
1284 			}
1285 		}
1286 	}
1287 
1288 	if (ns_changed) {
1289 		TAILQ_FOREACH(ctrlr, &subsystem->ctrlrs, link) {
1290 			/* It is possible that a ctrlr was added but the admin_qpair hasn't been
1291 			 * assigned yet.
1292 			 */
1293 			if (!ctrlr->admin_qpair) {
1294 				continue;
1295 			}
1296 			if (ctrlr->admin_qpair->group == group) {
1297 				nvmf_ctrlr_async_event_ns_notice(ctrlr);
1298 				nvmf_ctrlr_async_event_ana_change_notice(ctrlr);
1299 			}
1300 		}
1301 	}
1302 
1303 	return 0;
1304 }
1305 
/*
 * Externally visible wrapper around the file-local
 * poll_group_update_subsystem(); returns that function's result unchanged.
 */
int
nvmf_poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
				 struct spdk_nvmf_subsystem *subsystem)
{
	int rc;

	rc = poll_group_update_subsystem(group, subsystem);

	return rc;
}
1312 
1313 int
1314 nvmf_poll_group_add_subsystem(struct spdk_nvmf_poll_group *group,
1315 			      struct spdk_nvmf_subsystem *subsystem,
1316 			      spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1317 {
1318 	int rc = 0;
1319 	struct spdk_nvmf_subsystem_poll_group *sgroup = &group->sgroups[subsystem->id];
1320 	uint32_t i;
1321 
1322 	TAILQ_INIT(&sgroup->queued);
1323 
1324 	rc = poll_group_update_subsystem(group, subsystem);
1325 	if (rc) {
1326 		nvmf_poll_group_remove_subsystem(group, subsystem, NULL, NULL);
1327 		goto fini;
1328 	}
1329 
1330 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1331 
1332 	for (i = 0; i < sgroup->num_ns; i++) {
1333 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1334 	}
1335 
1336 fini:
1337 	if (cb_fn) {
1338 		cb_fn(cb_arg, rc);
1339 	}
1340 
1341 	return rc;
1342 }
1343 
1344 static void
1345 _nvmf_poll_group_remove_subsystem_cb(void *ctx, int status)
1346 {
1347 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1348 	struct spdk_nvmf_subsystem *subsystem;
1349 	struct spdk_nvmf_poll_group *group;
1350 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1351 	spdk_nvmf_poll_group_mod_done cpl_fn = NULL;
1352 	void *cpl_ctx = NULL;
1353 	uint32_t nsid;
1354 
1355 	group = qpair_ctx->group;
1356 	subsystem = qpair_ctx->subsystem;
1357 	cpl_fn = qpair_ctx->cpl_fn;
1358 	cpl_ctx = qpair_ctx->cpl_ctx;
1359 	sgroup = &group->sgroups[subsystem->id];
1360 
1361 	if (status) {
1362 		goto fini;
1363 	}
1364 
1365 	for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
1366 		if (sgroup->ns_info[nsid].channel) {
1367 			spdk_put_io_channel(sgroup->ns_info[nsid].channel);
1368 			sgroup->ns_info[nsid].channel = NULL;
1369 		}
1370 	}
1371 
1372 	sgroup->num_ns = 0;
1373 	free(sgroup->ns_info);
1374 	sgroup->ns_info = NULL;
1375 fini:
1376 	free(qpair_ctx);
1377 	if (cpl_fn) {
1378 		cpl_fn(cpl_ctx, status);
1379 	}
1380 }
1381 
1382 static void nvmf_poll_group_remove_subsystem_msg(void *ctx);
1383 
1384 static void
1385 remove_subsystem_qpair_cb(void *ctx)
1386 {
1387 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1388 
1389 	assert(qpair_ctx->count > 0);
1390 	qpair_ctx->count--;
1391 	if (qpair_ctx->count == 0) {
1392 		/* All of the asynchronous callbacks for this context have been
1393 		 * completed.  Call nvmf_poll_group_remove_subsystem_msg() again
1394 		 * to check if all associated qpairs for this subsystem have
1395 		 * been removed from the poll group.
1396 		 */
1397 		nvmf_poll_group_remove_subsystem_msg(ctx);
1398 	}
1399 }
1400 
1401 static void
1402 nvmf_poll_group_remove_subsystem_msg(void *ctx)
1403 {
1404 	struct spdk_nvmf_qpair *qpair, *qpair_tmp;
1405 	struct spdk_nvmf_subsystem *subsystem;
1406 	struct spdk_nvmf_poll_group *group;
1407 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1408 	bool qpairs_found = false;
1409 	int rc = 0;
1410 
1411 	group = qpair_ctx->group;
1412 	subsystem = qpair_ctx->subsystem;
1413 
1414 	/* Initialize count to 1.  This acts like a ref count, to ensure that if spdk_nvmf_qpair_disconnect
1415 	 * immediately invokes the callback (i.e. the qpairs is already in process of being disconnected)
1416 	 * that we don't recursively call nvmf_poll_group_remove_subsystem_msg before we've iterated the
1417 	 * full list of qpairs.
1418 	 */
1419 	qpair_ctx->count = 1;
1420 	TAILQ_FOREACH_SAFE(qpair, &group->qpairs, link, qpair_tmp) {
1421 		if ((qpair->ctrlr != NULL) && (qpair->ctrlr->subsys == subsystem)) {
1422 			qpairs_found = true;
1423 			qpair_ctx->count++;
1424 			rc = spdk_nvmf_qpair_disconnect(qpair, remove_subsystem_qpair_cb, ctx);
1425 			if (rc) {
1426 				break;
1427 			}
1428 		}
1429 	}
1430 	qpair_ctx->count--;
1431 
1432 	if (!qpairs_found) {
1433 		_nvmf_poll_group_remove_subsystem_cb(ctx, 0);
1434 		return;
1435 	}
1436 
1437 	if (qpair_ctx->count == 0 || rc) {
1438 		/* If count == 0, it means there were some qpairs in the poll group but they
1439 		 * were already in process of being disconnected.  So we send a message to this
1440 		 * same thread so that this function executes again later.  We won't actually
1441 		 * invoke the remove_subsystem_cb until all of the qpairs are actually removed
1442 		 * from the poll group.
1443 		 */
1444 		spdk_thread_send_msg(spdk_get_thread(), nvmf_poll_group_remove_subsystem_msg, ctx);
1445 	}
1446 }
1447 
1448 void
1449 nvmf_poll_group_remove_subsystem(struct spdk_nvmf_poll_group *group,
1450 				 struct spdk_nvmf_subsystem *subsystem,
1451 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1452 {
1453 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1454 	struct nvmf_qpair_disconnect_many_ctx *ctx;
1455 	uint32_t i;
1456 
1457 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
1458 	if (!ctx) {
1459 		SPDK_ERRLOG("Unable to allocate memory for context to remove poll subsystem\n");
1460 		if (cb_fn) {
1461 			cb_fn(cb_arg, -1);
1462 		}
1463 		return;
1464 	}
1465 
1466 	ctx->group = group;
1467 	ctx->subsystem = subsystem;
1468 	ctx->cpl_fn = cb_fn;
1469 	ctx->cpl_ctx = cb_arg;
1470 
1471 	sgroup = &group->sgroups[subsystem->id];
1472 	sgroup->state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1473 
1474 	for (i = 0; i < sgroup->num_ns; i++) {
1475 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1476 	}
1477 
1478 	nvmf_poll_group_remove_subsystem_msg(ctx);
1479 }
1480 
1481 void
1482 nvmf_poll_group_pause_subsystem(struct spdk_nvmf_poll_group *group,
1483 				struct spdk_nvmf_subsystem *subsystem,
1484 				uint32_t nsid,
1485 				spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1486 {
1487 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1488 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info = NULL;
1489 	int rc = 0;
1490 
1491 	if (subsystem->id >= group->num_sgroups) {
1492 		rc = -1;
1493 		goto fini;
1494 	}
1495 
1496 	sgroup = &group->sgroups[subsystem->id];
1497 	if (sgroup == NULL) {
1498 		rc = -1;
1499 		goto fini;
1500 	}
1501 
1502 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_PAUSED) {
1503 		goto fini;
1504 	}
1505 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1506 
1507 	/* NOTE: This implicitly also checks for 0, since 0 - 1 wraps around to UINT32_MAX. */
1508 	if (nsid - 1 < sgroup->num_ns) {
1509 		ns_info  = &sgroup->ns_info[nsid - 1];
1510 		ns_info->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1511 	}
1512 
1513 	if (sgroup->mgmt_io_outstanding > 0) {
1514 		assert(sgroup->cb_fn == NULL);
1515 		sgroup->cb_fn = cb_fn;
1516 		assert(sgroup->cb_arg == NULL);
1517 		sgroup->cb_arg = cb_arg;
1518 		return;
1519 	}
1520 
1521 	if (ns_info != NULL && ns_info->io_outstanding > 0) {
1522 		assert(sgroup->cb_fn == NULL);
1523 		sgroup->cb_fn = cb_fn;
1524 		assert(sgroup->cb_arg == NULL);
1525 		sgroup->cb_arg = cb_arg;
1526 		return;
1527 	}
1528 
1529 	assert(sgroup->mgmt_io_outstanding == 0);
1530 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSED;
1531 fini:
1532 	if (cb_fn) {
1533 		cb_fn(cb_arg, rc);
1534 	}
1535 }
1536 
1537 void
1538 nvmf_poll_group_resume_subsystem(struct spdk_nvmf_poll_group *group,
1539 				 struct spdk_nvmf_subsystem *subsystem,
1540 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1541 {
1542 	struct spdk_nvmf_request *req, *tmp;
1543 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1544 	int rc = 0;
1545 	uint32_t i;
1546 
1547 	if (subsystem->id >= group->num_sgroups) {
1548 		rc = -1;
1549 		goto fini;
1550 	}
1551 
1552 	sgroup = &group->sgroups[subsystem->id];
1553 
1554 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_ACTIVE) {
1555 		goto fini;
1556 	}
1557 
1558 	rc = poll_group_update_subsystem(group, subsystem);
1559 	if (rc) {
1560 		goto fini;
1561 	}
1562 
1563 	for (i = 0; i < sgroup->num_ns; i++) {
1564 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1565 	}
1566 
1567 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1568 
1569 	/* Release all queued requests */
1570 	TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1571 		TAILQ_REMOVE(&sgroup->queued, req, link);
1572 		assert(req->zcopy_phase == NVMF_ZCOPY_PHASE_NONE);
1573 		spdk_nvmf_request_exec(req);
1574 	}
1575 fini:
1576 	if (cb_fn) {
1577 		cb_fn(cb_arg, rc);
1578 	}
1579 }
1580 
1581 
1582 struct spdk_nvmf_poll_group *
1583 spdk_nvmf_get_optimal_poll_group(struct spdk_nvmf_qpair *qpair)
1584 {
1585 	struct spdk_nvmf_transport_poll_group *tgroup;
1586 
1587 	tgroup = nvmf_transport_get_optimal_poll_group(qpair->transport, qpair);
1588 
1589 	if (tgroup == NULL) {
1590 		return NULL;
1591 	}
1592 
1593 	return tgroup->group;
1594 }
1595 
1596 void
1597 spdk_nvmf_poll_group_dump_stat(struct spdk_nvmf_poll_group *group, struct spdk_json_write_ctx *w)
1598 {
1599 	struct spdk_nvmf_transport_poll_group *tgroup;
1600 
1601 	spdk_json_write_object_begin(w);
1602 
1603 	spdk_json_write_named_string(w, "name", spdk_thread_get_name(spdk_get_thread()));
1604 	spdk_json_write_named_uint32(w, "admin_qpairs", group->stat.admin_qpairs);
1605 	spdk_json_write_named_uint32(w, "io_qpairs", group->stat.io_qpairs);
1606 	spdk_json_write_named_uint32(w, "current_admin_qpairs", group->stat.current_admin_qpairs);
1607 	spdk_json_write_named_uint32(w, "current_io_qpairs", group->stat.current_io_qpairs);
1608 	spdk_json_write_named_uint64(w, "pending_bdev_io", group->stat.pending_bdev_io);
1609 
1610 	spdk_json_write_named_array_begin(w, "transports");
1611 
1612 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
1613 		spdk_json_write_object_begin(w);
1614 		/*
1615 		 * The trtype field intentionally contains a transport name as this is more informative.
1616 		 * The field has not been renamed for backward compatibility.
1617 		 */
1618 		spdk_json_write_named_string(w, "trtype", spdk_nvmf_get_transport_name(tgroup->transport));
1619 
1620 		if (tgroup->transport->ops->poll_group_dump_stat) {
1621 			tgroup->transport->ops->poll_group_dump_stat(tgroup, w);
1622 		}
1623 
1624 		spdk_json_write_object_end(w);
1625 	}
1626 
1627 	spdk_json_write_array_end(w);
1628 	spdk_json_write_object_end(w);
1629 }
1630