xref: /spdk/lib/nvmf/nvmf.c (revision 7521dc6f4b7ea46945f4add1aabf3f320c81ad5a)
1 /*   SPDX-License-Identifier: BSD-3-Clause
2  *   Copyright (C) 2016 Intel Corporation. All rights reserved.
3  *   Copyright (c) 2018-2019, 2021 Mellanox Technologies LTD. All rights reserved.
4  *   Copyright (c) 2021, 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
5  */
6 
7 #include "spdk/stdinc.h"
8 
9 #include "spdk/bdev.h"
10 #include "spdk/bit_array.h"
11 #include "spdk/thread.h"
12 #include "spdk/nvmf.h"
13 #include "spdk/endian.h"
14 #include "spdk/string.h"
15 #include "spdk/log.h"
16 #include "spdk_internal/usdt.h"
17 
18 #include "nvmf_internal.h"
19 #include "transport.h"
20 
/* Register the "nvmf" log component used by the logging macros in this file. */
SPDK_LOG_REGISTER_COMPONENT(nvmf)

/* Subsystem limit applied by spdk_nvmf_tgt_create() when the caller leaves max_subsystems at 0. */
#define SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS 1024

/*
 * Every target that has been created by spdk_nvmf_tgt_create() and not yet
 * handed to spdk_nvmf_tgt_destroy().
 */
static TAILQ_HEAD(, spdk_nvmf_tgt) g_nvmf_tgts = TAILQ_HEAD_INITIALIZER(g_nvmf_tgts);

/* Signature of a qpair disconnect completion callback: caller context plus a status code. */
typedef void (*nvmf_qpair_disconnect_cpl)(void *ctx, int status);
28 
/*
 * Supplied to a single call to nvmf_qpair_disconnect.
 * NOTE(review): the code consuming this structure is outside the visible part
 * of the file; the field notes below are inferred from names only - confirm.
 */
struct nvmf_qpair_disconnect_ctx {
	/* Queue pair the disconnect applies to. */
	struct spdk_nvmf_qpair *qpair;
	/* Presumably the controller associated with qpair - verify against the user of this struct. */
	struct spdk_nvmf_ctrlr *ctrlr;
	/* Presumably the queue ID of qpair - verify against the user of this struct. */
	uint16_t qid;
};
35 
/*
 * There are several times when we need to iterate through the list of all qpairs and selectively delete them.
 * In order to do this sequentially without overlap, we must provide a context to recover the next qpair from
 * to enable calling nvmf_qpair_disconnect on the next desired qpair.
 */
struct nvmf_qpair_disconnect_many_ctx {
	/* NOTE(review): not used in the visible part of the file; presumably restricts the walk to one subsystem - confirm. */
	struct spdk_nvmf_subsystem *subsystem;
	/* Poll group whose qpair list is being drained (read by _nvmf_tgt_disconnect_qpairs). */
	struct spdk_nvmf_poll_group *group;
	/* NOTE(review): completion callback and its argument; their invocation is not visible in this part of the file. */
	spdk_nvmf_poll_group_mod_done cpl_fn;
	void *cpl_ctx;
};
47 
48 static struct spdk_nvmf_referral *
49 nvmf_tgt_find_referral(struct spdk_nvmf_tgt *tgt,
50 		       const struct spdk_nvme_transport_id *trid)
51 {
52 	struct spdk_nvmf_referral *referral;
53 
54 	TAILQ_FOREACH(referral, &tgt->referrals, link) {
55 		if (spdk_nvme_transport_id_compare(&referral->trid, trid) == 0) {
56 			return referral;
57 		}
58 	}
59 
60 	return NULL;
61 }
62 
63 int
64 spdk_nvmf_tgt_add_referral(struct spdk_nvmf_tgt *tgt,
65 			   const struct spdk_nvmf_referral_opts *uopts)
66 {
67 	struct spdk_nvmf_referral *referral;
68 	struct spdk_nvmf_referral_opts opts = {};
69 	struct spdk_nvme_transport_id *trid = &opts.trid;
70 
71 	memcpy(&opts, uopts, spdk_min(uopts->size, sizeof(opts)));
72 	if (trid->subnqn[0] == '\0') {
73 		snprintf(trid->subnqn, sizeof(trid->subnqn), "%s", SPDK_NVMF_DISCOVERY_NQN);
74 	}
75 
76 	if (!nvmf_nqn_is_valid(trid->subnqn)) {
77 		SPDK_ERRLOG("Invalid subsystem NQN\n");
78 		return -EINVAL;
79 	}
80 
81 	/* If the entry already exists, just ignore it. */
82 	if (nvmf_tgt_find_referral(tgt, trid)) {
83 		return 0;
84 	}
85 
86 	referral = calloc(1, sizeof(*referral));
87 	if (!referral) {
88 		SPDK_ERRLOG("Failed to allocate memory for a referral\n");
89 		return -ENOMEM;
90 	}
91 
92 	referral->entry.subtype = nvmf_nqn_is_discovery(trid->subnqn) ?
93 				  SPDK_NVMF_SUBTYPE_DISCOVERY :
94 				  SPDK_NVMF_SUBTYPE_NVME;
95 	referral->entry.treq.secure_channel = opts.secure_channel ?
96 					      SPDK_NVMF_TREQ_SECURE_CHANNEL_REQUIRED :
97 					      SPDK_NVMF_TREQ_SECURE_CHANNEL_NOT_REQUIRED;
98 	referral->entry.cntlid = 0xffff;
99 	referral->entry.trtype = trid->trtype;
100 	referral->entry.adrfam = trid->adrfam;
101 	memcpy(&referral->trid, trid, sizeof(struct spdk_nvme_transport_id));
102 	spdk_strcpy_pad(referral->entry.subnqn, trid->subnqn, sizeof(trid->subnqn), '\0');
103 	spdk_strcpy_pad(referral->entry.trsvcid, trid->trsvcid, sizeof(referral->entry.trsvcid), ' ');
104 	spdk_strcpy_pad(referral->entry.traddr, trid->traddr, sizeof(referral->entry.traddr), ' ');
105 
106 	TAILQ_INSERT_HEAD(&tgt->referrals, referral, link);
107 	nvmf_update_discovery_log(tgt, NULL);
108 
109 	return 0;
110 }
111 
112 int
113 spdk_nvmf_tgt_remove_referral(struct spdk_nvmf_tgt *tgt,
114 			      const struct spdk_nvmf_referral_opts *uopts)
115 {
116 	struct spdk_nvmf_referral *referral;
117 	struct spdk_nvmf_referral_opts opts = {};
118 	struct spdk_nvme_transport_id *trid = &opts.trid;
119 
120 	memcpy(&opts, uopts, spdk_min(uopts->size, sizeof(opts)));
121 	if (trid->subnqn[0] == '\0') {
122 		snprintf(trid->subnqn, sizeof(trid->subnqn), "%s", SPDK_NVMF_DISCOVERY_NQN);
123 	}
124 
125 	referral = nvmf_tgt_find_referral(tgt, &opts.trid);
126 	if (referral == NULL) {
127 		return -ENOENT;
128 	}
129 
130 	TAILQ_REMOVE(&tgt->referrals, referral, link);
131 	nvmf_update_discovery_log(tgt, NULL);
132 
133 	free(referral);
134 
135 	return 0;
136 }
137 
138 void
139 nvmf_qpair_set_state(struct spdk_nvmf_qpair *qpair,
140 		     enum spdk_nvmf_qpair_state state)
141 {
142 	assert(qpair != NULL);
143 	assert(qpair->group->thread == spdk_get_thread());
144 
145 	qpair->state = state;
146 }
147 
148 static int
149 nvmf_poll_group_poll(void *ctx)
150 {
151 	struct spdk_nvmf_poll_group *group = ctx;
152 	int rc;
153 	int count = 0;
154 	struct spdk_nvmf_transport_poll_group *tgroup;
155 
156 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
157 		rc = nvmf_transport_poll_group_poll(tgroup);
158 		if (rc < 0) {
159 			return SPDK_POLLER_BUSY;
160 		}
161 		count += rc;
162 	}
163 
164 	return count > 0 ? SPDK_POLLER_BUSY : SPDK_POLLER_IDLE;
165 }
166 
167 /*
168  * Reset and clean up the poll group (I/O channel code will actually free the
169  * group).
170  */
171 static void
172 nvmf_tgt_cleanup_poll_group(struct spdk_nvmf_poll_group *group)
173 {
174 	struct spdk_nvmf_transport_poll_group *tgroup, *tmp;
175 	struct spdk_nvmf_subsystem_poll_group *sgroup;
176 	uint32_t sid, nsid;
177 
178 	TAILQ_FOREACH_SAFE(tgroup, &group->tgroups, link, tmp) {
179 		TAILQ_REMOVE(&group->tgroups, tgroup, link);
180 		nvmf_transport_poll_group_destroy(tgroup);
181 	}
182 
183 	for (sid = 0; sid < group->num_sgroups; sid++) {
184 		sgroup = &group->sgroups[sid];
185 
186 		assert(sgroup != NULL);
187 
188 		for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
189 			if (sgroup->ns_info[nsid].channel) {
190 				spdk_put_io_channel(sgroup->ns_info[nsid].channel);
191 				sgroup->ns_info[nsid].channel = NULL;
192 			}
193 		}
194 
195 		free(sgroup->ns_info);
196 	}
197 
198 	free(group->sgroups);
199 
200 	spdk_poller_unregister(&group->poller);
201 
202 	if (group->destroy_cb_fn) {
203 		group->destroy_cb_fn(group->destroy_cb_arg, 0);
204 	}
205 }
206 
207 /*
208  * Callback to unregister a poll group from the target, and clean up its state.
209  */
210 static void
211 nvmf_tgt_destroy_poll_group(void *io_device, void *ctx_buf)
212 {
213 	struct spdk_nvmf_tgt *tgt = io_device;
214 	struct spdk_nvmf_poll_group *group = ctx_buf;
215 
216 	SPDK_DTRACE_PROBE1_TICKS(nvmf_destroy_poll_group, spdk_thread_get_id(group->thread));
217 
218 	pthread_mutex_lock(&tgt->mutex);
219 	TAILQ_REMOVE(&tgt->poll_groups, group, link);
220 	tgt->num_poll_groups--;
221 	pthread_mutex_unlock(&tgt->mutex);
222 
223 	assert(!(tgt->state == NVMF_TGT_PAUSING || tgt->state == NVMF_TGT_RESUMING));
224 	nvmf_tgt_cleanup_poll_group(group);
225 }
226 
227 static int
228 nvmf_poll_group_add_transport(struct spdk_nvmf_poll_group *group,
229 			      struct spdk_nvmf_transport *transport)
230 {
231 	struct spdk_nvmf_transport_poll_group *tgroup;
232 
233 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
234 		if (tgroup->transport == transport) {
235 			/* Transport already in the poll group */
236 			return 0;
237 		}
238 	}
239 
240 	tgroup = nvmf_transport_poll_group_create(transport, group);
241 	if (!tgroup) {
242 		SPDK_ERRLOG("Unable to create poll group for transport\n");
243 		return -1;
244 	}
245 	SPDK_DTRACE_PROBE2_TICKS(nvmf_transport_poll_group_create, transport,
246 				 spdk_thread_get_id(group->thread));
247 
248 	tgroup->group = group;
249 	TAILQ_INSERT_TAIL(&group->tgroups, tgroup, link);
250 
251 	return 0;
252 }
253 
254 static int
255 nvmf_tgt_create_poll_group(void *io_device, void *ctx_buf)
256 {
257 	struct spdk_nvmf_tgt *tgt = io_device;
258 	struct spdk_nvmf_poll_group *group = ctx_buf;
259 	struct spdk_nvmf_transport *transport;
260 	struct spdk_nvmf_subsystem *subsystem;
261 	struct spdk_thread *thread = spdk_get_thread();
262 	uint32_t i;
263 	int rc;
264 
265 	group->tgt = tgt;
266 	TAILQ_INIT(&group->tgroups);
267 	TAILQ_INIT(&group->qpairs);
268 	group->thread = thread;
269 	pthread_mutex_init(&group->mutex, NULL);
270 
271 	group->poller = SPDK_POLLER_REGISTER(nvmf_poll_group_poll, group, 0);
272 
273 	SPDK_DTRACE_PROBE1_TICKS(nvmf_create_poll_group, spdk_thread_get_id(thread));
274 
275 	TAILQ_FOREACH(transport, &tgt->transports, link) {
276 		rc = nvmf_poll_group_add_transport(group, transport);
277 		if (rc != 0) {
278 			nvmf_tgt_cleanup_poll_group(group);
279 			return rc;
280 		}
281 	}
282 
283 	group->num_sgroups = tgt->max_subsystems;
284 	group->sgroups = calloc(tgt->max_subsystems, sizeof(struct spdk_nvmf_subsystem_poll_group));
285 	if (!group->sgroups) {
286 		nvmf_tgt_cleanup_poll_group(group);
287 		return -ENOMEM;
288 	}
289 
290 	for (i = 0; i < tgt->max_subsystems; i++) {
291 		TAILQ_INIT(&group->sgroups[i].queued);
292 	}
293 
294 	for (subsystem = spdk_nvmf_subsystem_get_first(tgt);
295 	     subsystem != NULL;
296 	     subsystem = spdk_nvmf_subsystem_get_next(subsystem)) {
297 		if (nvmf_poll_group_add_subsystem(group, subsystem, NULL, NULL) != 0) {
298 			nvmf_tgt_cleanup_poll_group(group);
299 			return -1;
300 		}
301 	}
302 
303 	pthread_mutex_lock(&tgt->mutex);
304 	tgt->num_poll_groups++;
305 	TAILQ_INSERT_TAIL(&tgt->poll_groups, group, link);
306 	pthread_mutex_unlock(&tgt->mutex);
307 
308 	return 0;
309 }
310 
311 static void
312 _nvmf_tgt_disconnect_qpairs(void *ctx)
313 {
314 	struct spdk_nvmf_qpair *qpair, *qpair_tmp;
315 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
316 	struct spdk_nvmf_poll_group *group = qpair_ctx->group;
317 	struct spdk_io_channel *ch;
318 	int rc;
319 
320 	TAILQ_FOREACH_SAFE(qpair, &group->qpairs, link, qpair_tmp) {
321 		rc = spdk_nvmf_qpair_disconnect(qpair);
322 		if (rc && rc != -EINPROGRESS) {
323 			break;
324 		}
325 	}
326 
327 	if (TAILQ_EMPTY(&group->qpairs)) {
328 		/* When the refcount from the channels reaches 0, nvmf_tgt_destroy_poll_group will be called. */
329 		ch = spdk_io_channel_from_ctx(group);
330 		spdk_put_io_channel(ch);
331 		free(qpair_ctx);
332 		return;
333 	}
334 
335 	/* Some qpairs are in process of being disconnected. Send a message and try to remove them again */
336 	spdk_thread_send_msg(spdk_get_thread(), _nvmf_tgt_disconnect_qpairs, ctx);
337 }
338 
339 static void
340 nvmf_tgt_destroy_poll_group_qpairs(struct spdk_nvmf_poll_group *group)
341 {
342 	struct nvmf_qpair_disconnect_many_ctx *ctx;
343 
344 	SPDK_DTRACE_PROBE1_TICKS(nvmf_destroy_poll_group_qpairs, spdk_thread_get_id(group->thread));
345 
346 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
347 	if (!ctx) {
348 		SPDK_ERRLOG("Failed to allocate memory for destroy poll group ctx\n");
349 		return;
350 	}
351 
352 	ctx->group = group;
353 	_nvmf_tgt_disconnect_qpairs(ctx);
354 }
355 
356 struct spdk_nvmf_tgt *
357 spdk_nvmf_tgt_create(struct spdk_nvmf_target_opts *opts)
358 {
359 	struct spdk_nvmf_tgt *tgt, *tmp_tgt;
360 
361 	if (strnlen(opts->name, NVMF_TGT_NAME_MAX_LENGTH) == NVMF_TGT_NAME_MAX_LENGTH) {
362 		SPDK_ERRLOG("Provided target name exceeds the max length of %u.\n", NVMF_TGT_NAME_MAX_LENGTH);
363 		return NULL;
364 	}
365 
366 	TAILQ_FOREACH(tmp_tgt, &g_nvmf_tgts, link) {
367 		if (!strncmp(opts->name, tmp_tgt->name, NVMF_TGT_NAME_MAX_LENGTH)) {
368 			SPDK_ERRLOG("Provided target name must be unique.\n");
369 			return NULL;
370 		}
371 	}
372 
373 	tgt = calloc(1, sizeof(*tgt));
374 	if (!tgt) {
375 		return NULL;
376 	}
377 
378 	snprintf(tgt->name, NVMF_TGT_NAME_MAX_LENGTH, "%s", opts->name);
379 
380 	if (!opts || !opts->max_subsystems) {
381 		tgt->max_subsystems = SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS;
382 	} else {
383 		tgt->max_subsystems = opts->max_subsystems;
384 	}
385 
386 	if (!opts) {
387 		tgt->crdt[0] = 0;
388 		tgt->crdt[1] = 0;
389 		tgt->crdt[2] = 0;
390 	} else {
391 		tgt->crdt[0] = opts->crdt[0];
392 		tgt->crdt[1] = opts->crdt[1];
393 		tgt->crdt[2] = opts->crdt[2];
394 	}
395 
396 	if (!opts) {
397 		tgt->discovery_filter = SPDK_NVMF_TGT_DISCOVERY_MATCH_ANY;
398 	} else {
399 		tgt->discovery_filter = opts->discovery_filter;
400 	}
401 
402 	tgt->discovery_genctr = 0;
403 	TAILQ_INIT(&tgt->transports);
404 	TAILQ_INIT(&tgt->poll_groups);
405 	TAILQ_INIT(&tgt->referrals);
406 	tgt->num_poll_groups = 0;
407 
408 	tgt->subsystem_ids = spdk_bit_array_create(tgt->max_subsystems);
409 	if (tgt->subsystem_ids == NULL) {
410 		free(tgt);
411 		return NULL;
412 	}
413 
414 	RB_INIT(&tgt->subsystems);
415 
416 	pthread_mutex_init(&tgt->mutex, NULL);
417 
418 	spdk_io_device_register(tgt,
419 				nvmf_tgt_create_poll_group,
420 				nvmf_tgt_destroy_poll_group,
421 				sizeof(struct spdk_nvmf_poll_group),
422 				tgt->name);
423 
424 	tgt->state = NVMF_TGT_RUNNING;
425 
426 	TAILQ_INSERT_HEAD(&g_nvmf_tgts, tgt, link);
427 
428 	return tgt;
429 }
430 
431 static void
432 _nvmf_tgt_destroy_next_transport(void *ctx)
433 {
434 	struct spdk_nvmf_tgt *tgt = ctx;
435 	struct spdk_nvmf_transport *transport;
436 
437 	if (!TAILQ_EMPTY(&tgt->transports)) {
438 		transport = TAILQ_FIRST(&tgt->transports);
439 		TAILQ_REMOVE(&tgt->transports, transport, link);
440 		spdk_nvmf_transport_destroy(transport, _nvmf_tgt_destroy_next_transport, tgt);
441 	} else {
442 		spdk_nvmf_tgt_destroy_done_fn *destroy_cb_fn = tgt->destroy_cb_fn;
443 		void *destroy_cb_arg = tgt->destroy_cb_arg;
444 
445 		pthread_mutex_destroy(&tgt->mutex);
446 		free(tgt);
447 
448 		if (destroy_cb_fn) {
449 			destroy_cb_fn(destroy_cb_arg, 0);
450 		}
451 	}
452 }
453 
454 static void
455 nvmf_tgt_destroy_cb(void *io_device)
456 {
457 	struct spdk_nvmf_tgt *tgt = io_device;
458 	struct spdk_nvmf_subsystem *subsystem, *subsystem_next;
459 	int rc;
460 	struct spdk_nvmf_referral *referral;
461 
462 	while ((referral = TAILQ_FIRST(&tgt->referrals))) {
463 		TAILQ_REMOVE(&tgt->referrals, referral, link);
464 		free(referral);
465 	}
466 
467 	/* We will be freeing subsystems in this loop, so we always need to get the next one
468 	 * ahead of time, since we can't call get_next() on a subsystem that's been freed.
469 	 */
470 	for (subsystem = spdk_nvmf_subsystem_get_first(tgt),
471 	     subsystem_next = spdk_nvmf_subsystem_get_next(subsystem);
472 	     subsystem != NULL;
473 	     subsystem = subsystem_next,
474 	     subsystem_next = spdk_nvmf_subsystem_get_next(subsystem_next)) {
475 		nvmf_subsystem_remove_all_listeners(subsystem, true);
476 
477 		rc = spdk_nvmf_subsystem_destroy(subsystem, nvmf_tgt_destroy_cb, tgt);
478 		if (rc) {
479 			if (rc == -EINPROGRESS) {
480 				/* If rc is -EINPROGRESS, nvmf_tgt_destroy_cb will be called again when subsystem #i
481 				 * is destroyed, nvmf_tgt_destroy_cb will continue to destroy other subsystems if any */
482 				return;
483 			} else {
484 				SPDK_ERRLOG("Failed to destroy subsystem %s, rc %d\n", subsystem->subnqn, rc);
485 			}
486 		}
487 	}
488 	spdk_bit_array_free(&tgt->subsystem_ids);
489 	_nvmf_tgt_destroy_next_transport(tgt);
490 }
491 
492 void
493 spdk_nvmf_tgt_destroy(struct spdk_nvmf_tgt *tgt,
494 		      spdk_nvmf_tgt_destroy_done_fn cb_fn,
495 		      void *cb_arg)
496 {
497 	assert(!(tgt->state == NVMF_TGT_PAUSING || tgt->state == NVMF_TGT_RESUMING));
498 
499 	tgt->destroy_cb_fn = cb_fn;
500 	tgt->destroy_cb_arg = cb_arg;
501 
502 	TAILQ_REMOVE(&g_nvmf_tgts, tgt, link);
503 
504 	spdk_io_device_unregister(tgt, nvmf_tgt_destroy_cb);
505 }
506 
507 const char *
508 spdk_nvmf_tgt_get_name(struct spdk_nvmf_tgt *tgt)
509 {
510 	return tgt->name;
511 }
512 
513 struct spdk_nvmf_tgt *
514 spdk_nvmf_get_tgt(const char *name)
515 {
516 	struct spdk_nvmf_tgt *tgt;
517 	uint32_t num_targets = 0;
518 
519 	TAILQ_FOREACH(tgt, &g_nvmf_tgts, link) {
520 		if (name) {
521 			if (!strncmp(tgt->name, name, NVMF_TGT_NAME_MAX_LENGTH)) {
522 				return tgt;
523 			}
524 		}
525 		num_targets++;
526 	}
527 
528 	/*
529 	 * special case. If there is only one target and
530 	 * no name was specified, return the only available
531 	 * target. If there is more than one target, name must
532 	 * be specified.
533 	 */
534 	if (!name && num_targets == 1) {
535 		return TAILQ_FIRST(&g_nvmf_tgts);
536 	}
537 
538 	return NULL;
539 }
540 
541 struct spdk_nvmf_tgt *
542 spdk_nvmf_get_first_tgt(void)
543 {
544 	return TAILQ_FIRST(&g_nvmf_tgts);
545 }
546 
547 struct spdk_nvmf_tgt *
548 spdk_nvmf_get_next_tgt(struct spdk_nvmf_tgt *prev)
549 {
550 	return TAILQ_NEXT(prev, link);
551 }
552 
553 static void
554 nvmf_write_nvme_subsystem_config(struct spdk_json_write_ctx *w,
555 				 struct spdk_nvmf_subsystem *subsystem)
556 {
557 	struct spdk_nvmf_host *host;
558 	struct spdk_nvmf_ns *ns;
559 	struct spdk_nvmf_ns_opts ns_opts;
560 	uint32_t max_namespaces;
561 	struct spdk_nvmf_transport *transport;
562 
563 	assert(spdk_nvmf_subsystem_get_type(subsystem) == SPDK_NVMF_SUBTYPE_NVME);
564 
565 	/* { */
566 	spdk_json_write_object_begin(w);
567 	spdk_json_write_named_string(w, "method", "nvmf_create_subsystem");
568 
569 	/*     "params" : { */
570 	spdk_json_write_named_object_begin(w, "params");
571 	spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
572 	spdk_json_write_named_bool(w, "allow_any_host", spdk_nvmf_subsystem_get_allow_any_host(subsystem));
573 	spdk_json_write_named_string(w, "serial_number", spdk_nvmf_subsystem_get_sn(subsystem));
574 	spdk_json_write_named_string(w, "model_number", spdk_nvmf_subsystem_get_mn(subsystem));
575 
576 	max_namespaces = spdk_nvmf_subsystem_get_max_namespaces(subsystem);
577 	if (max_namespaces != 0) {
578 		spdk_json_write_named_uint32(w, "max_namespaces", max_namespaces);
579 	}
580 
581 	spdk_json_write_named_uint32(w, "min_cntlid", spdk_nvmf_subsystem_get_min_cntlid(subsystem));
582 	spdk_json_write_named_uint32(w, "max_cntlid", spdk_nvmf_subsystem_get_max_cntlid(subsystem));
583 	spdk_json_write_named_bool(w, "ana_reporting", spdk_nvmf_subsystem_get_ana_reporting(subsystem));
584 
585 	/*     } "params" */
586 	spdk_json_write_object_end(w);
587 
588 	/* } */
589 	spdk_json_write_object_end(w);
590 
591 	for (host = spdk_nvmf_subsystem_get_first_host(subsystem); host != NULL;
592 	     host = spdk_nvmf_subsystem_get_next_host(subsystem, host)) {
593 
594 		spdk_json_write_object_begin(w);
595 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_host");
596 
597 		/*     "params" : { */
598 		spdk_json_write_named_object_begin(w, "params");
599 
600 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
601 		spdk_json_write_named_string(w, "host", spdk_nvmf_host_get_nqn(host));
602 		if (host->dhchap_key != NULL) {
603 			spdk_json_write_named_string(w, "dhchap_key",
604 						     spdk_key_get_name(host->dhchap_key));
605 		}
606 		if (host->dhchap_ctrlr_key != NULL) {
607 			spdk_json_write_named_string(w, "dhchap_ctrlr_key",
608 						     spdk_key_get_name(host->dhchap_ctrlr_key));
609 		}
610 		TAILQ_FOREACH(transport, &subsystem->tgt->transports, link) {
611 			if (transport->ops->subsystem_dump_host != NULL) {
612 				transport->ops->subsystem_dump_host(transport, subsystem, host->nqn, w);
613 			}
614 		}
615 
616 		/*     } "params" */
617 		spdk_json_write_object_end(w);
618 
619 		/* } */
620 		spdk_json_write_object_end(w);
621 	}
622 
623 	for (ns = spdk_nvmf_subsystem_get_first_ns(subsystem); ns != NULL;
624 	     ns = spdk_nvmf_subsystem_get_next_ns(subsystem, ns)) {
625 		spdk_nvmf_ns_get_opts(ns, &ns_opts, sizeof(ns_opts));
626 
627 		spdk_json_write_object_begin(w);
628 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_ns");
629 
630 		/*     "params" : { */
631 		spdk_json_write_named_object_begin(w, "params");
632 
633 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
634 
635 		/*     "namespace" : { */
636 		spdk_json_write_named_object_begin(w, "namespace");
637 
638 		spdk_json_write_named_uint32(w, "nsid", spdk_nvmf_ns_get_id(ns));
639 		spdk_json_write_named_string(w, "bdev_name", spdk_bdev_get_name(spdk_nvmf_ns_get_bdev(ns)));
640 
641 		if (ns->ptpl_file != NULL) {
642 			spdk_json_write_named_string(w, "ptpl_file", ns->ptpl_file);
643 		}
644 
645 		if (!spdk_mem_all_zero(ns_opts.nguid, sizeof(ns_opts.nguid))) {
646 			SPDK_STATIC_ASSERT(sizeof(ns_opts.nguid) == sizeof(uint64_t) * 2, "size mismatch");
647 			spdk_json_write_named_string_fmt(w, "nguid", "%016"PRIX64"%016"PRIX64, from_be64(&ns_opts.nguid[0]),
648 							 from_be64(&ns_opts.nguid[8]));
649 		}
650 
651 		if (!spdk_mem_all_zero(ns_opts.eui64, sizeof(ns_opts.eui64))) {
652 			SPDK_STATIC_ASSERT(sizeof(ns_opts.eui64) == sizeof(uint64_t), "size mismatch");
653 			spdk_json_write_named_string_fmt(w, "eui64", "%016"PRIX64, from_be64(&ns_opts.eui64));
654 		}
655 
656 		if (!spdk_uuid_is_null(&ns_opts.uuid)) {
657 			spdk_json_write_named_uuid(w, "uuid",  &ns_opts.uuid);
658 		}
659 
660 		if (spdk_nvmf_subsystem_get_ana_reporting(subsystem)) {
661 			spdk_json_write_named_uint32(w, "anagrpid", ns_opts.anagrpid);
662 		}
663 
664 		spdk_json_write_named_bool(w, "no_auto_visible", !ns->always_visible);
665 
666 		/*     "namespace" */
667 		spdk_json_write_object_end(w);
668 
669 		/*     } "params" */
670 		spdk_json_write_object_end(w);
671 
672 		/* } */
673 		spdk_json_write_object_end(w);
674 	}
675 }
676 
677 static void
678 nvmf_write_subsystem_config_json(struct spdk_json_write_ctx *w,
679 				 struct spdk_nvmf_subsystem *subsystem)
680 {
681 	struct spdk_nvmf_subsystem_listener *listener;
682 	struct spdk_nvmf_transport *transport;
683 	const struct spdk_nvme_transport_id *trid;
684 
685 	if (spdk_nvmf_subsystem_get_type(subsystem) == SPDK_NVMF_SUBTYPE_NVME) {
686 		nvmf_write_nvme_subsystem_config(w, subsystem);
687 	}
688 
689 	for (listener = spdk_nvmf_subsystem_get_first_listener(subsystem); listener != NULL;
690 	     listener = spdk_nvmf_subsystem_get_next_listener(subsystem, listener)) {
691 		transport = listener->transport;
692 		trid = spdk_nvmf_subsystem_listener_get_trid(listener);
693 
694 		spdk_json_write_object_begin(w);
695 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_listener");
696 
697 		/*     "params" : { */
698 		spdk_json_write_named_object_begin(w, "params");
699 
700 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
701 
702 		spdk_json_write_named_object_begin(w, "listen_address");
703 		nvmf_transport_listen_dump_trid(trid, w);
704 		spdk_json_write_object_end(w);
705 		if (transport->ops->listen_dump_opts) {
706 			transport->ops->listen_dump_opts(transport, trid, w);
707 		}
708 
709 		spdk_json_write_named_bool(w, "secure_channel", listener->opts.secure_channel);
710 
711 		/*     } "params" */
712 		spdk_json_write_object_end(w);
713 
714 		/* } */
715 		spdk_json_write_object_end(w);
716 	}
717 }
718 
719 void
720 spdk_nvmf_tgt_write_config_json(struct spdk_json_write_ctx *w, struct spdk_nvmf_tgt *tgt)
721 {
722 	struct spdk_nvmf_subsystem *subsystem;
723 	struct spdk_nvmf_transport *transport;
724 	struct spdk_nvmf_referral *referral;
725 
726 	spdk_json_write_object_begin(w);
727 	spdk_json_write_named_string(w, "method", "nvmf_set_max_subsystems");
728 
729 	spdk_json_write_named_object_begin(w, "params");
730 	spdk_json_write_named_uint32(w, "max_subsystems", tgt->max_subsystems);
731 	spdk_json_write_object_end(w);
732 
733 	spdk_json_write_object_end(w);
734 
735 	spdk_json_write_object_begin(w);
736 	spdk_json_write_named_string(w, "method", "nvmf_set_crdt");
737 	spdk_json_write_named_object_begin(w, "params");
738 	spdk_json_write_named_uint32(w, "crdt1", tgt->crdt[0]);
739 	spdk_json_write_named_uint32(w, "crdt2", tgt->crdt[1]);
740 	spdk_json_write_named_uint32(w, "crdt3", tgt->crdt[2]);
741 	spdk_json_write_object_end(w);
742 	spdk_json_write_object_end(w);
743 
744 	/* write transports */
745 	TAILQ_FOREACH(transport, &tgt->transports, link) {
746 		spdk_json_write_object_begin(w);
747 		spdk_json_write_named_string(w, "method", "nvmf_create_transport");
748 		nvmf_transport_dump_opts(transport, w, true);
749 		spdk_json_write_object_end(w);
750 	}
751 
752 	TAILQ_FOREACH(referral, &tgt->referrals, link) {
753 		spdk_json_write_object_begin(w);
754 		spdk_json_write_named_string(w, "method", "nvmf_discovery_add_referral");
755 
756 		spdk_json_write_named_object_begin(w, "params");
757 		spdk_json_write_named_object_begin(w, "address");
758 		nvmf_transport_listen_dump_trid(&referral->trid, w);
759 		spdk_json_write_object_end(w);
760 		spdk_json_write_named_bool(w, "secure_channel",
761 					   referral->entry.treq.secure_channel ==
762 					   SPDK_NVMF_TREQ_SECURE_CHANNEL_REQUIRED);
763 		spdk_json_write_named_string(w, "subnqn", referral->trid.subnqn);
764 		spdk_json_write_object_end(w);
765 
766 		spdk_json_write_object_end(w);
767 	}
768 
769 	subsystem = spdk_nvmf_subsystem_get_first(tgt);
770 	while (subsystem) {
771 		nvmf_write_subsystem_config_json(w, subsystem);
772 		subsystem = spdk_nvmf_subsystem_get_next(subsystem);
773 	}
774 }
775 
776 static void
777 nvmf_listen_opts_copy(struct spdk_nvmf_listen_opts *opts,
778 		      const struct spdk_nvmf_listen_opts *opts_src, size_t opts_size)
779 {
780 	assert(opts);
781 	assert(opts_src);
782 
783 	opts->opts_size = opts_size;
784 
785 #define SET_FIELD(field) \
786     if (offsetof(struct spdk_nvmf_listen_opts, field) + sizeof(opts->field) <= opts_size) { \
787                  opts->field = opts_src->field; \
788     } \
789 
790 	SET_FIELD(transport_specific);
791 	SET_FIELD(secure_channel);
792 	SET_FIELD(ana_state);
793 #undef SET_FIELD
794 
795 	/* Do not remove this statement, you should always update this statement when you adding a new field,
796 	 * and do not forget to add the SET_FIELD statement for your added field. */
797 	SPDK_STATIC_ASSERT(sizeof(struct spdk_nvmf_listen_opts) == 24, "Incorrect size");
798 }
799 
800 void
801 spdk_nvmf_listen_opts_init(struct spdk_nvmf_listen_opts *opts, size_t opts_size)
802 {
803 	struct spdk_nvmf_listen_opts opts_local = {};
804 
805 	/* local version of opts should have defaults set here */
806 	opts_local.ana_state = SPDK_NVME_ANA_OPTIMIZED_STATE;
807 	nvmf_listen_opts_copy(opts, &opts_local, opts_size);
808 }
809 
810 int
811 spdk_nvmf_tgt_listen_ext(struct spdk_nvmf_tgt *tgt, const struct spdk_nvme_transport_id *trid,
812 			 struct spdk_nvmf_listen_opts *opts)
813 {
814 	struct spdk_nvmf_transport *transport;
815 	int rc;
816 	struct spdk_nvmf_listen_opts opts_local = {};
817 
818 	if (!opts) {
819 		SPDK_ERRLOG("opts should not be NULL\n");
820 		return -EINVAL;
821 	}
822 
823 	if (!opts->opts_size) {
824 		SPDK_ERRLOG("The opts_size in opts structure should not be zero\n");
825 		return -EINVAL;
826 	}
827 
828 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
829 	if (!transport) {
830 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
831 			    trid->trstring);
832 		return -EINVAL;
833 	}
834 
835 	nvmf_listen_opts_copy(&opts_local, opts, opts->opts_size);
836 	rc = spdk_nvmf_transport_listen(transport, trid, &opts_local);
837 	if (rc < 0) {
838 		SPDK_ERRLOG("Unable to listen on address '%s'\n", trid->traddr);
839 	}
840 
841 	return rc;
842 }
843 
844 int
845 spdk_nvmf_tgt_stop_listen(struct spdk_nvmf_tgt *tgt,
846 			  struct spdk_nvme_transport_id *trid)
847 {
848 	struct spdk_nvmf_transport *transport;
849 	int rc;
850 
851 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
852 	if (!transport) {
853 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
854 			    trid->trstring);
855 		return -EINVAL;
856 	}
857 
858 	rc = spdk_nvmf_transport_stop_listen(transport, trid);
859 	if (rc < 0) {
860 		SPDK_ERRLOG("Failed to stop listening on address '%s'\n", trid->traddr);
861 		return rc;
862 	}
863 	return 0;
864 }
865 
/* State carried through the per-channel iteration started by spdk_nvmf_tgt_add_transport(). */
struct spdk_nvmf_tgt_add_transport_ctx {
	/* Target the transport is being added to. */
	struct spdk_nvmf_tgt *tgt;
	/* Transport being added to (or, on failure, removed again from) every poll group. */
	struct spdk_nvmf_transport *transport;
	/* User completion callback and its argument. */
	spdk_nvmf_tgt_add_transport_done_fn cb_fn;
	void *cb_arg;
	/* Failure status of the add pass; reported to cb_fn once the rollback pass has finished. */
	int status;
};
873 
874 static void
875 _nvmf_tgt_remove_transport_done(struct spdk_io_channel_iter *i, int status)
876 {
877 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
878 
879 	ctx->cb_fn(ctx->cb_arg, ctx->status);
880 	free(ctx);
881 }
882 
883 static void
884 _nvmf_tgt_remove_transport(struct spdk_io_channel_iter *i)
885 {
886 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
887 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
888 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
889 	struct spdk_nvmf_transport_poll_group *tgroup, *tmp;
890 
891 	TAILQ_FOREACH_SAFE(tgroup, &group->tgroups, link, tmp) {
892 		if (tgroup->transport == ctx->transport) {
893 			TAILQ_REMOVE(&group->tgroups, tgroup, link);
894 			nvmf_transport_poll_group_destroy(tgroup);
895 		}
896 	}
897 
898 	spdk_for_each_channel_continue(i, 0);
899 }
900 
901 static void
902 _nvmf_tgt_add_transport_done(struct spdk_io_channel_iter *i, int status)
903 {
904 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
905 
906 	if (status) {
907 		ctx->status = status;
908 		spdk_for_each_channel(ctx->tgt,
909 				      _nvmf_tgt_remove_transport,
910 				      ctx,
911 				      _nvmf_tgt_remove_transport_done);
912 		return;
913 	}
914 
915 	ctx->transport->tgt = ctx->tgt;
916 	TAILQ_INSERT_TAIL(&ctx->tgt->transports, ctx->transport, link);
917 	ctx->cb_fn(ctx->cb_arg, status);
918 	free(ctx);
919 }
920 
921 static void
922 _nvmf_tgt_add_transport(struct spdk_io_channel_iter *i)
923 {
924 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
925 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
926 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
927 	int rc;
928 
929 	rc = nvmf_poll_group_add_transport(group, ctx->transport);
930 	spdk_for_each_channel_continue(i, rc);
931 }
932 
933 void
934 spdk_nvmf_tgt_add_transport(struct spdk_nvmf_tgt *tgt,
935 			    struct spdk_nvmf_transport *transport,
936 			    spdk_nvmf_tgt_add_transport_done_fn cb_fn,
937 			    void *cb_arg)
938 {
939 	struct spdk_nvmf_tgt_add_transport_ctx *ctx;
940 
941 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_add_transport, transport, tgt->name);
942 
943 	if (spdk_nvmf_tgt_get_transport(tgt, transport->ops->name)) {
944 		cb_fn(cb_arg, -EEXIST);
945 		return; /* transport already created */
946 	}
947 
948 	ctx = calloc(1, sizeof(*ctx));
949 	if (!ctx) {
950 		cb_fn(cb_arg, -ENOMEM);
951 		return;
952 	}
953 
954 	ctx->tgt = tgt;
955 	ctx->transport = transport;
956 	ctx->cb_fn = cb_fn;
957 	ctx->cb_arg = cb_arg;
958 
959 	spdk_for_each_channel(tgt,
960 			      _nvmf_tgt_add_transport,
961 			      ctx,
962 			      _nvmf_tgt_add_transport_done);
963 }
964 
/* State carried through the per-channel iteration of a pause or resume polling request. */
struct nvmf_tgt_pause_ctx {
	/* Target whose polling is being paused or resumed. */
	struct spdk_nvmf_tgt *tgt;
	/* User completion callback and its argument, invoked when the iteration is done. */
	spdk_nvmf_tgt_pause_polling_cb_fn cb_fn;
	void *cb_arg;
};
970 
971 static void
972 _nvmf_tgt_pause_polling_done(struct spdk_io_channel_iter *i, int status)
973 {
974 	struct nvmf_tgt_pause_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
975 
976 	ctx->tgt->state = NVMF_TGT_PAUSED;
977 
978 	ctx->cb_fn(ctx->cb_arg, status);
979 	free(ctx);
980 }
981 
982 static void
983 _nvmf_tgt_pause_polling(struct spdk_io_channel_iter *i)
984 {
985 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
986 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
987 
988 	spdk_poller_unregister(&group->poller);
989 
990 	spdk_for_each_channel_continue(i, 0);
991 }
992 
993 int
994 spdk_nvmf_tgt_pause_polling(struct spdk_nvmf_tgt *tgt, spdk_nvmf_tgt_pause_polling_cb_fn cb_fn,
995 			    void *cb_arg)
996 {
997 	struct nvmf_tgt_pause_ctx *ctx;
998 
999 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_pause_polling, tgt, tgt->name);
1000 
1001 	switch (tgt->state) {
1002 	case NVMF_TGT_PAUSING:
1003 	case NVMF_TGT_RESUMING:
1004 		return -EBUSY;
1005 	case NVMF_TGT_RUNNING:
1006 		break;
1007 	default:
1008 		return -EINVAL;
1009 	}
1010 
1011 	ctx = calloc(1, sizeof(*ctx));
1012 	if (!ctx) {
1013 		return -ENOMEM;
1014 	}
1015 
1016 
1017 	tgt->state = NVMF_TGT_PAUSING;
1018 
1019 	ctx->tgt = tgt;
1020 	ctx->cb_fn = cb_fn;
1021 	ctx->cb_arg = cb_arg;
1022 
1023 	spdk_for_each_channel(tgt,
1024 			      _nvmf_tgt_pause_polling,
1025 			      ctx,
1026 			      _nvmf_tgt_pause_polling_done);
1027 	return 0;
1028 }
1029 
1030 static void
1031 _nvmf_tgt_resume_polling_done(struct spdk_io_channel_iter *i, int status)
1032 {
1033 	struct nvmf_tgt_pause_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
1034 
1035 	ctx->tgt->state = NVMF_TGT_RUNNING;
1036 
1037 	ctx->cb_fn(ctx->cb_arg, status);
1038 	free(ctx);
1039 }
1040 
1041 static void
1042 _nvmf_tgt_resume_polling(struct spdk_io_channel_iter *i)
1043 {
1044 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
1045 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
1046 
1047 	assert(group->poller == NULL);
1048 	group->poller = SPDK_POLLER_REGISTER(nvmf_poll_group_poll, group, 0);
1049 
1050 	spdk_for_each_channel_continue(i, 0);
1051 }
1052 
1053 int
1054 spdk_nvmf_tgt_resume_polling(struct spdk_nvmf_tgt *tgt, spdk_nvmf_tgt_resume_polling_cb_fn cb_fn,
1055 			     void *cb_arg)
1056 {
1057 	struct nvmf_tgt_pause_ctx *ctx;
1058 
1059 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_resume_polling, tgt, tgt->name);
1060 
1061 	switch (tgt->state) {
1062 	case NVMF_TGT_PAUSING:
1063 	case NVMF_TGT_RESUMING:
1064 		return -EBUSY;
1065 	case NVMF_TGT_PAUSED:
1066 		break;
1067 	default:
1068 		return -EINVAL;
1069 	}
1070 
1071 	ctx = calloc(1, sizeof(*ctx));
1072 	if (!ctx) {
1073 		return -ENOMEM;
1074 	}
1075 
1076 	tgt->state = NVMF_TGT_RESUMING;
1077 
1078 	ctx->tgt = tgt;
1079 	ctx->cb_fn = cb_fn;
1080 	ctx->cb_arg = cb_arg;
1081 
1082 	spdk_for_each_channel(tgt,
1083 			      _nvmf_tgt_resume_polling,
1084 			      ctx,
1085 			      _nvmf_tgt_resume_polling_done);
1086 	return 0;
1087 }
1088 
1089 struct spdk_nvmf_subsystem *
1090 spdk_nvmf_tgt_find_subsystem(struct spdk_nvmf_tgt *tgt, const char *subnqn)
1091 {
1092 	struct spdk_nvmf_subsystem subsystem;
1093 
1094 	if (!subnqn) {
1095 		return NULL;
1096 	}
1097 
1098 	/* Ensure that subnqn is null terminated */
1099 	if (!memchr(subnqn, '\0', SPDK_NVMF_NQN_MAX_LEN + 1)) {
1100 		SPDK_ERRLOG("Connect SUBNQN is not null terminated\n");
1101 		return NULL;
1102 	}
1103 
1104 	snprintf(subsystem.subnqn, sizeof(subsystem.subnqn), "%s", subnqn);
1105 	return RB_FIND(subsystem_tree, &tgt->subsystems, &subsystem);
1106 }
1107 
1108 struct spdk_nvmf_transport *
1109 spdk_nvmf_tgt_get_transport(struct spdk_nvmf_tgt *tgt, const char *transport_name)
1110 {
1111 	struct spdk_nvmf_transport *transport;
1112 
1113 	TAILQ_FOREACH(transport, &tgt->transports, link) {
1114 		if (!strncasecmp(transport->ops->name, transport_name, SPDK_NVMF_TRSTRING_MAX_LEN)) {
1115 			return transport;
1116 		}
1117 	}
1118 	return NULL;
1119 }
1120 
/* Message payload sent to a poll group's thread to attach a new qpair to it. */
struct nvmf_new_qpair_ctx {
	/* The qpair to be added */
	struct spdk_nvmf_qpair *qpair;
	/* The poll group selected for the qpair */
	struct spdk_nvmf_poll_group *group;
};
1125 
1126 static void
1127 _nvmf_poll_group_add(void *_ctx)
1128 {
1129 	struct nvmf_new_qpair_ctx *ctx = _ctx;
1130 	struct spdk_nvmf_qpair *qpair = ctx->qpair;
1131 	struct spdk_nvmf_poll_group *group = ctx->group;
1132 
1133 	free(_ctx);
1134 
1135 	if (spdk_nvmf_poll_group_add(group, qpair) != 0) {
1136 		SPDK_ERRLOG("Unable to add the qpair to a poll group.\n");
1137 		spdk_nvmf_qpair_disconnect(qpair);
1138 	}
1139 }
1140 
1141 void
1142 spdk_nvmf_tgt_new_qpair(struct spdk_nvmf_tgt *tgt, struct spdk_nvmf_qpair *qpair)
1143 {
1144 	struct spdk_nvmf_poll_group *group;
1145 	struct nvmf_new_qpair_ctx *ctx;
1146 
1147 	group = spdk_nvmf_get_optimal_poll_group(qpair);
1148 	if (group == NULL) {
1149 		if (tgt->next_poll_group == NULL) {
1150 			tgt->next_poll_group = TAILQ_FIRST(&tgt->poll_groups);
1151 			if (tgt->next_poll_group == NULL) {
1152 				SPDK_ERRLOG("No poll groups exist.\n");
1153 				spdk_nvmf_qpair_disconnect(qpair);
1154 				return;
1155 			}
1156 		}
1157 		group = tgt->next_poll_group;
1158 		tgt->next_poll_group = TAILQ_NEXT(group, link);
1159 	}
1160 
1161 	ctx = calloc(1, sizeof(*ctx));
1162 	if (!ctx) {
1163 		SPDK_ERRLOG("Unable to send message to poll group.\n");
1164 		spdk_nvmf_qpair_disconnect(qpair);
1165 		return;
1166 	}
1167 
1168 	ctx->qpair = qpair;
1169 	ctx->group = group;
1170 
1171 	pthread_mutex_lock(&group->mutex);
1172 	group->current_unassociated_qpairs++;
1173 	pthread_mutex_unlock(&group->mutex);
1174 
1175 	spdk_thread_send_msg(group->thread, _nvmf_poll_group_add, ctx);
1176 }
1177 
1178 struct spdk_nvmf_poll_group *
1179 spdk_nvmf_poll_group_create(struct spdk_nvmf_tgt *tgt)
1180 {
1181 	struct spdk_io_channel *ch;
1182 
1183 	ch = spdk_get_io_channel(tgt);
1184 	if (!ch) {
1185 		SPDK_ERRLOG("Unable to get I/O channel for target\n");
1186 		return NULL;
1187 	}
1188 
1189 	return spdk_io_channel_get_ctx(ch);
1190 }
1191 
1192 void
1193 spdk_nvmf_poll_group_destroy(struct spdk_nvmf_poll_group *group,
1194 			     spdk_nvmf_poll_group_destroy_done_fn cb_fn,
1195 			     void *cb_arg)
1196 {
1197 	assert(group->destroy_cb_fn == NULL);
1198 	group->destroy_cb_fn = cb_fn;
1199 	group->destroy_cb_arg = cb_arg;
1200 
1201 	/* This function will put the io_channel associated with this poll group */
1202 	nvmf_tgt_destroy_poll_group_qpairs(group);
1203 }
1204 
1205 int
1206 spdk_nvmf_poll_group_add(struct spdk_nvmf_poll_group *group,
1207 			 struct spdk_nvmf_qpair *qpair)
1208 {
1209 	int rc = -1;
1210 	struct spdk_nvmf_transport_poll_group *tgroup;
1211 
1212 	TAILQ_INIT(&qpair->outstanding);
1213 	qpair->group = group;
1214 	qpair->ctrlr = NULL;
1215 	qpair->disconnect_started = false;
1216 
1217 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
1218 		if (tgroup->transport == qpair->transport) {
1219 			rc = nvmf_transport_poll_group_add(tgroup, qpair);
1220 			break;
1221 		}
1222 	}
1223 
1224 	/* We add the qpair to the group only it is successfully added into the tgroup */
1225 	if (rc == 0) {
1226 		SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_add_qpair, qpair, spdk_thread_get_id(group->thread));
1227 		TAILQ_INSERT_TAIL(&group->qpairs, qpair, link);
1228 		nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_CONNECTING);
1229 	}
1230 
1231 	return rc;
1232 }
1233 
/* Thread-message adapter: ctx is the controller to destruct. */
static void
_nvmf_ctrlr_destruct(void *ctx)
{
	struct spdk_nvmf_ctrlr *doomed = ctx;

	nvmf_ctrlr_destruct(doomed);
}
1241 
1242 static void
1243 _nvmf_ctrlr_free_from_qpair(void *ctx)
1244 {
1245 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1246 	struct spdk_nvmf_ctrlr *ctrlr = qpair_ctx->ctrlr;
1247 	uint32_t count;
1248 
1249 	spdk_bit_array_clear(ctrlr->qpair_mask, qpair_ctx->qid);
1250 	count = spdk_bit_array_count_set(ctrlr->qpair_mask);
1251 	if (count == 0) {
1252 		assert(!ctrlr->in_destruct);
1253 		SPDK_DEBUGLOG(nvmf, "Last qpair %u, destroy ctrlr 0x%hx\n", qpair_ctx->qid, ctrlr->cntlid);
1254 		ctrlr->in_destruct = true;
1255 		spdk_thread_send_msg(ctrlr->subsys->thread, _nvmf_ctrlr_destruct, ctrlr);
1256 	}
1257 	free(qpair_ctx);
1258 }
1259 
1260 static void
1261 _nvmf_transport_qpair_fini_complete(void *cb_ctx)
1262 {
1263 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = cb_ctx;
1264 	struct spdk_nvmf_ctrlr *ctrlr;
1265 
1266 	ctrlr = qpair_ctx->ctrlr;
1267 	SPDK_DEBUGLOG(nvmf, "Finish destroying qid %u\n", qpair_ctx->qid);
1268 
1269 	if (ctrlr) {
1270 		if (qpair_ctx->qid == 0) {
1271 			/* Admin qpair is removed, so set the pointer to NULL.
1272 			 * This operation is safe since we are on ctrlr thread now, admin qpair's thread is the same
1273 			 * as controller's thread */
1274 			assert(ctrlr->thread == spdk_get_thread());
1275 			ctrlr->admin_qpair = NULL;
1276 		}
1277 		/* Free qpair id from controller's bit mask and destroy the controller if it is the last qpair */
1278 		if (ctrlr->thread) {
1279 			spdk_thread_send_msg(ctrlr->thread, _nvmf_ctrlr_free_from_qpair, qpair_ctx);
1280 		} else {
1281 			_nvmf_ctrlr_free_from_qpair(qpair_ctx);
1282 		}
1283 	} else {
1284 		free(qpair_ctx);
1285 	}
1286 }
1287 
1288 void
1289 spdk_nvmf_poll_group_remove(struct spdk_nvmf_qpair *qpair)
1290 {
1291 	struct spdk_nvmf_transport_poll_group *tgroup;
1292 	int rc;
1293 
1294 	SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_remove_qpair, qpair,
1295 				 spdk_thread_get_id(qpair->group->thread));
1296 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_ERROR);
1297 
1298 	/* Find the tgroup and remove the qpair from the tgroup */
1299 	TAILQ_FOREACH(tgroup, &qpair->group->tgroups, link) {
1300 		if (tgroup->transport == qpair->transport) {
1301 			rc = nvmf_transport_poll_group_remove(tgroup, qpair);
1302 			if (rc && (rc != ENOTSUP)) {
1303 				SPDK_ERRLOG("Cannot remove qpair=%p from transport group=%p\n",
1304 					    qpair, tgroup);
1305 			}
1306 			break;
1307 		}
1308 	}
1309 
1310 	TAILQ_REMOVE(&qpair->group->qpairs, qpair, link);
1311 	qpair->group = NULL;
1312 }
1313 
1314 static void
1315 _nvmf_qpair_sgroup_req_clean(struct spdk_nvmf_subsystem_poll_group *sgroup,
1316 			     const struct spdk_nvmf_qpair *qpair)
1317 {
1318 	struct spdk_nvmf_request *req, *tmp;
1319 	TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1320 		if (req->qpair == qpair) {
1321 			TAILQ_REMOVE(&sgroup->queued, req, link);
1322 			if (nvmf_transport_req_free(req)) {
1323 				SPDK_ERRLOG("Transport request free error!\n");
1324 			}
1325 		}
1326 	}
1327 }
1328 
1329 static void
1330 _nvmf_qpair_destroy(void *ctx, int status)
1331 {
1332 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1333 	struct spdk_nvmf_qpair *qpair = qpair_ctx->qpair;
1334 	struct spdk_nvmf_ctrlr *ctrlr = qpair->ctrlr;
1335 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1336 	uint32_t sid;
1337 
1338 	assert(qpair->state == SPDK_NVMF_QPAIR_DEACTIVATING);
1339 	qpair_ctx->qid = qpair->qid;
1340 
1341 	if (qpair->connect_received) {
1342 		if (0 == qpair->qid) {
1343 			assert(qpair->group->stat.current_admin_qpairs > 0);
1344 			qpair->group->stat.current_admin_qpairs--;
1345 		} else {
1346 			assert(qpair->group->stat.current_io_qpairs > 0);
1347 			qpair->group->stat.current_io_qpairs--;
1348 		}
1349 	} else {
1350 		pthread_mutex_lock(&qpair->group->mutex);
1351 		qpair->group->current_unassociated_qpairs--;
1352 		pthread_mutex_unlock(&qpair->group->mutex);
1353 	}
1354 
1355 	if (ctrlr) {
1356 		sgroup = &qpair->group->sgroups[ctrlr->subsys->id];
1357 		_nvmf_qpair_sgroup_req_clean(sgroup, qpair);
1358 	} else {
1359 		for (sid = 0; sid < qpair->group->num_sgroups; sid++) {
1360 			sgroup = &qpair->group->sgroups[sid];
1361 			assert(sgroup != NULL);
1362 			_nvmf_qpair_sgroup_req_clean(sgroup, qpair);
1363 		}
1364 	}
1365 
1366 	nvmf_qpair_auth_destroy(qpair);
1367 	qpair_ctx->ctrlr = ctrlr;
1368 	spdk_nvmf_poll_group_remove(qpair);
1369 	nvmf_transport_qpair_fini(qpair, _nvmf_transport_qpair_fini_complete, qpair_ctx);
1370 }
1371 
1372 static void
1373 _nvmf_qpair_disconnect_msg(void *ctx)
1374 {
1375 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1376 
1377 	spdk_nvmf_qpair_disconnect(qpair_ctx->qpair);
1378 	free(ctx);
1379 }
1380 
1381 int
1382 spdk_nvmf_qpair_disconnect(struct spdk_nvmf_qpair *qpair)
1383 {
1384 	struct spdk_nvmf_poll_group *group = qpair->group;
1385 	struct nvmf_qpair_disconnect_ctx *qpair_ctx;
1386 
1387 	if (__atomic_test_and_set(&qpair->disconnect_started, __ATOMIC_RELAXED)) {
1388 		return -EINPROGRESS;
1389 	}
1390 
1391 	/* If we get a qpair in the uninitialized state, we can just destroy it immediately */
1392 	if (qpair->state == SPDK_NVMF_QPAIR_UNINITIALIZED) {
1393 		nvmf_transport_qpair_fini(qpair, NULL, NULL);
1394 		return 0;
1395 	}
1396 
1397 	assert(group != NULL);
1398 	if (spdk_get_thread() != group->thread) {
1399 		/* clear the atomic so we can set it on the next call on the proper thread. */
1400 		__atomic_clear(&qpair->disconnect_started, __ATOMIC_RELAXED);
1401 		qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1402 		if (!qpair_ctx) {
1403 			SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1404 			return -ENOMEM;
1405 		}
1406 		qpair_ctx->qpair = qpair;
1407 		spdk_thread_send_msg(group->thread, _nvmf_qpair_disconnect_msg, qpair_ctx);
1408 		return 0;
1409 	}
1410 
1411 	SPDK_DTRACE_PROBE2_TICKS(nvmf_qpair_disconnect, qpair, spdk_thread_get_id(group->thread));
1412 	assert(spdk_nvmf_qpair_is_active(qpair));
1413 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_DEACTIVATING);
1414 
1415 	qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1416 	if (!qpair_ctx) {
1417 		SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1418 		return -ENOMEM;
1419 	}
1420 
1421 	qpair_ctx->qpair = qpair;
1422 
1423 	/* Check for outstanding I/O */
1424 	if (!TAILQ_EMPTY(&qpair->outstanding)) {
1425 		SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_drain_qpair, qpair, spdk_thread_get_id(group->thread));
1426 		qpair->state_cb = _nvmf_qpair_destroy;
1427 		qpair->state_cb_arg = qpair_ctx;
1428 		nvmf_qpair_abort_pending_zcopy_reqs(qpair);
1429 		nvmf_qpair_free_aer(qpair);
1430 		return 0;
1431 	}
1432 
1433 	_nvmf_qpair_destroy(qpair_ctx, 0);
1434 
1435 	return 0;
1436 }
1437 
1438 int
1439 spdk_nvmf_qpair_get_peer_trid(struct spdk_nvmf_qpair *qpair,
1440 			      struct spdk_nvme_transport_id *trid)
1441 {
1442 	memset(trid, 0, sizeof(*trid));
1443 	return nvmf_transport_qpair_get_peer_trid(qpair, trid);
1444 }
1445 
1446 int
1447 spdk_nvmf_qpair_get_local_trid(struct spdk_nvmf_qpair *qpair,
1448 			       struct spdk_nvme_transport_id *trid)
1449 {
1450 	memset(trid, 0, sizeof(*trid));
1451 	return nvmf_transport_qpair_get_local_trid(qpair, trid);
1452 }
1453 
1454 int
1455 spdk_nvmf_qpair_get_listen_trid(struct spdk_nvmf_qpair *qpair,
1456 				struct spdk_nvme_transport_id *trid)
1457 {
1458 	memset(trid, 0, sizeof(*trid));
1459 	return nvmf_transport_qpair_get_listen_trid(qpair, trid);
1460 }
1461 
1462 static int
1463 poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
1464 			    struct spdk_nvmf_subsystem *subsystem)
1465 {
1466 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1467 	uint32_t new_num_ns, old_num_ns;
1468 	uint32_t i, j;
1469 	struct spdk_nvmf_ns *ns;
1470 	struct spdk_nvmf_registrant *reg, *tmp;
1471 	struct spdk_io_channel *ch;
1472 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info;
1473 	struct spdk_nvmf_ctrlr *ctrlr;
1474 	bool ns_changed;
1475 
1476 	/* Make sure our poll group has memory for this subsystem allocated */
1477 	if (subsystem->id >= group->num_sgroups) {
1478 		return -ENOMEM;
1479 	}
1480 
1481 	sgroup = &group->sgroups[subsystem->id];
1482 
1483 	/* Make sure the array of namespace information is the correct size */
1484 	new_num_ns = subsystem->max_nsid;
1485 	old_num_ns = sgroup->num_ns;
1486 
1487 	ns_changed = false;
1488 
1489 	if (old_num_ns == 0) {
1490 		if (new_num_ns > 0) {
1491 			/* First allocation */
1492 			sgroup->ns_info = calloc(new_num_ns, sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1493 			if (!sgroup->ns_info) {
1494 				return -ENOMEM;
1495 			}
1496 		}
1497 	} else if (new_num_ns > old_num_ns) {
1498 		void *buf;
1499 
1500 		/* Make the array larger */
1501 		buf = realloc(sgroup->ns_info, new_num_ns * sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1502 		if (!buf) {
1503 			return -ENOMEM;
1504 		}
1505 
1506 		sgroup->ns_info = buf;
1507 
1508 		/* Null out the new namespace information slots */
1509 		for (i = old_num_ns; i < new_num_ns; i++) {
1510 			memset(&sgroup->ns_info[i], 0, sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1511 		}
1512 	} else if (new_num_ns < old_num_ns) {
1513 		void *buf;
1514 
1515 		/* Free the extra I/O channels */
1516 		for (i = new_num_ns; i < old_num_ns; i++) {
1517 			ns_info = &sgroup->ns_info[i];
1518 
1519 			if (ns_info->channel) {
1520 				spdk_put_io_channel(ns_info->channel);
1521 				ns_info->channel = NULL;
1522 			}
1523 		}
1524 
1525 		/* Make the array smaller */
1526 		if (new_num_ns > 0) {
1527 			buf = realloc(sgroup->ns_info, new_num_ns * sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1528 			if (!buf) {
1529 				return -ENOMEM;
1530 			}
1531 			sgroup->ns_info = buf;
1532 		} else {
1533 			free(sgroup->ns_info);
1534 			sgroup->ns_info = NULL;
1535 		}
1536 	}
1537 
1538 	sgroup->num_ns = new_num_ns;
1539 
1540 	/* Detect bdevs that were added or removed */
1541 	for (i = 0; i < sgroup->num_ns; i++) {
1542 		ns = subsystem->ns[i];
1543 		ns_info = &sgroup->ns_info[i];
1544 		ch = ns_info->channel;
1545 
1546 		if (ns == NULL && ch == NULL) {
1547 			/* Both NULL. Leave empty */
1548 		} else if (ns == NULL && ch != NULL) {
1549 			/* There was a channel here, but the namespace is gone. */
1550 			ns_changed = true;
1551 			spdk_put_io_channel(ch);
1552 			ns_info->channel = NULL;
1553 		} else if (ns != NULL && ch == NULL) {
1554 			/* A namespace appeared but there is no channel yet */
1555 			ns_changed = true;
1556 			ch = spdk_bdev_get_io_channel(ns->desc);
1557 			if (ch == NULL) {
1558 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1559 				return -ENOMEM;
1560 			}
1561 			ns_info->channel = ch;
1562 		} else if (spdk_uuid_compare(&ns_info->uuid, spdk_bdev_get_uuid(ns->bdev)) != 0) {
1563 			/* A namespace was here before, but was replaced by a new one. */
1564 			ns_changed = true;
1565 			spdk_put_io_channel(ns_info->channel);
1566 			memset(ns_info, 0, sizeof(*ns_info));
1567 
1568 			ch = spdk_bdev_get_io_channel(ns->desc);
1569 			if (ch == NULL) {
1570 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1571 				return -ENOMEM;
1572 			}
1573 			ns_info->channel = ch;
1574 		} else if (ns_info->num_blocks != spdk_bdev_get_num_blocks(ns->bdev)) {
1575 			/* Namespace is still there but size has changed */
1576 			SPDK_DEBUGLOG(nvmf, "Namespace resized: subsystem_id %u,"
1577 				      " nsid %u, pg %p, old %" PRIu64 ", new %" PRIu64 "\n",
1578 				      subsystem->id,
1579 				      ns->nsid,
1580 				      group,
1581 				      ns_info->num_blocks,
1582 				      spdk_bdev_get_num_blocks(ns->bdev));
1583 			ns_changed = true;
1584 		}
1585 
1586 		if (ns == NULL) {
1587 			memset(ns_info, 0, sizeof(*ns_info));
1588 		} else {
1589 			ns_info->uuid = *spdk_bdev_get_uuid(ns->bdev);
1590 			ns_info->num_blocks = spdk_bdev_get_num_blocks(ns->bdev);
1591 			ns_info->crkey = ns->crkey;
1592 			ns_info->rtype = ns->rtype;
1593 			if (ns->holder) {
1594 				ns_info->holder_id = ns->holder->hostid;
1595 			}
1596 
1597 			memset(&ns_info->reg_hostid, 0, SPDK_NVMF_MAX_NUM_REGISTRANTS * sizeof(struct spdk_uuid));
1598 			j = 0;
1599 			TAILQ_FOREACH_SAFE(reg, &ns->registrants, link, tmp) {
1600 				if (j >= SPDK_NVMF_MAX_NUM_REGISTRANTS) {
1601 					SPDK_ERRLOG("Maximum %u registrants can support.\n", SPDK_NVMF_MAX_NUM_REGISTRANTS);
1602 					return -EINVAL;
1603 				}
1604 				ns_info->reg_hostid[j++] = reg->hostid;
1605 			}
1606 		}
1607 	}
1608 
1609 	if (ns_changed) {
1610 		TAILQ_FOREACH(ctrlr, &subsystem->ctrlrs, link) {
1611 			if (ctrlr->thread != spdk_get_thread()) {
1612 				continue;
1613 			}
1614 			/* It is possible that a ctrlr was added but the admin_qpair hasn't been
1615 			 * assigned yet.
1616 			 */
1617 			if (!ctrlr->admin_qpair) {
1618 				continue;
1619 			}
1620 			if (ctrlr->admin_qpair->group == group) {
1621 				nvmf_ctrlr_async_event_ns_notice(ctrlr);
1622 				nvmf_ctrlr_async_event_ana_change_notice(ctrlr);
1623 			}
1624 		}
1625 	}
1626 
1627 	return 0;
1628 }
1629 
/* Non-static entry point that forwards to poll_group_update_subsystem(). */
int
nvmf_poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
				 struct spdk_nvmf_subsystem *subsystem)
{
	int rc = poll_group_update_subsystem(group, subsystem);

	return rc;
}
1636 
1637 int
1638 nvmf_poll_group_add_subsystem(struct spdk_nvmf_poll_group *group,
1639 			      struct spdk_nvmf_subsystem *subsystem,
1640 			      spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1641 {
1642 	int rc = 0;
1643 	struct spdk_nvmf_subsystem_poll_group *sgroup = &group->sgroups[subsystem->id];
1644 	struct spdk_nvmf_request *req, *tmp;
1645 	uint32_t i;
1646 
1647 	if (!TAILQ_EMPTY(&sgroup->queued)) {
1648 		SPDK_ERRLOG("sgroup->queued not empty when adding subsystem\n");
1649 		TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1650 			TAILQ_REMOVE(&sgroup->queued, req, link);
1651 			if (nvmf_transport_req_free(req)) {
1652 				SPDK_ERRLOG("Transport request free error!\n");
1653 			}
1654 		}
1655 		assert(false);
1656 	}
1657 
1658 	rc = poll_group_update_subsystem(group, subsystem);
1659 	if (rc) {
1660 		nvmf_poll_group_remove_subsystem(group, subsystem, NULL, NULL);
1661 		goto fini;
1662 	}
1663 
1664 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1665 
1666 	for (i = 0; i < sgroup->num_ns; i++) {
1667 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1668 	}
1669 
1670 fini:
1671 	if (cb_fn) {
1672 		cb_fn(cb_arg, rc);
1673 	}
1674 
1675 	SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_add_subsystem, spdk_thread_get_id(group->thread),
1676 				 subsystem->subnqn);
1677 
1678 	return rc;
1679 }
1680 
1681 static void
1682 _nvmf_poll_group_remove_subsystem_cb(void *ctx, int status)
1683 {
1684 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1685 	struct spdk_nvmf_subsystem *subsystem;
1686 	struct spdk_nvmf_poll_group *group;
1687 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1688 	spdk_nvmf_poll_group_mod_done cpl_fn = NULL;
1689 	void *cpl_ctx = NULL;
1690 	uint32_t nsid;
1691 
1692 	group = qpair_ctx->group;
1693 	subsystem = qpair_ctx->subsystem;
1694 	cpl_fn = qpair_ctx->cpl_fn;
1695 	cpl_ctx = qpair_ctx->cpl_ctx;
1696 	sgroup = &group->sgroups[subsystem->id];
1697 
1698 	if (status) {
1699 		goto fini;
1700 	}
1701 
1702 	for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
1703 		if (sgroup->ns_info[nsid].channel) {
1704 			spdk_put_io_channel(sgroup->ns_info[nsid].channel);
1705 			sgroup->ns_info[nsid].channel = NULL;
1706 		}
1707 	}
1708 
1709 	sgroup->num_ns = 0;
1710 	free(sgroup->ns_info);
1711 	sgroup->ns_info = NULL;
1712 fini:
1713 	free(qpair_ctx);
1714 	if (cpl_fn) {
1715 		cpl_fn(cpl_ctx, status);
1716 	}
1717 }
1718 
1719 static void nvmf_poll_group_remove_subsystem_msg(void *ctx);
1720 
1721 static void
1722 nvmf_poll_group_remove_subsystem_msg(void *ctx)
1723 {
1724 	struct spdk_nvmf_qpair *qpair, *qpair_tmp;
1725 	struct spdk_nvmf_subsystem *subsystem;
1726 	struct spdk_nvmf_poll_group *group;
1727 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1728 	bool qpairs_found = false;
1729 	int rc = 0;
1730 
1731 	group = qpair_ctx->group;
1732 	subsystem = qpair_ctx->subsystem;
1733 
1734 	TAILQ_FOREACH_SAFE(qpair, &group->qpairs, link, qpair_tmp) {
1735 		if ((qpair->ctrlr != NULL) && (qpair->ctrlr->subsys == subsystem)) {
1736 			qpairs_found = true;
1737 			rc = spdk_nvmf_qpair_disconnect(qpair);
1738 			if (rc && rc != -EINPROGRESS) {
1739 				break;
1740 			}
1741 		}
1742 	}
1743 
1744 	if (!qpairs_found) {
1745 		_nvmf_poll_group_remove_subsystem_cb(ctx, 0);
1746 		return;
1747 	}
1748 
1749 	/* Some qpairs are in process of being disconnected. Send a message and try to remove them again */
1750 	spdk_thread_send_msg(spdk_get_thread(), nvmf_poll_group_remove_subsystem_msg, ctx);
1751 }
1752 
1753 void
1754 nvmf_poll_group_remove_subsystem(struct spdk_nvmf_poll_group *group,
1755 				 struct spdk_nvmf_subsystem *subsystem,
1756 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1757 {
1758 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1759 	struct nvmf_qpair_disconnect_many_ctx *ctx;
1760 	uint32_t i;
1761 
1762 	SPDK_DTRACE_PROBE3_TICKS(nvmf_poll_group_remove_subsystem, group, spdk_thread_get_id(group->thread),
1763 				 subsystem->subnqn);
1764 
1765 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
1766 	if (!ctx) {
1767 		SPDK_ERRLOG("Unable to allocate memory for context to remove poll subsystem\n");
1768 		if (cb_fn) {
1769 			cb_fn(cb_arg, -1);
1770 		}
1771 		return;
1772 	}
1773 
1774 	ctx->group = group;
1775 	ctx->subsystem = subsystem;
1776 	ctx->cpl_fn = cb_fn;
1777 	ctx->cpl_ctx = cb_arg;
1778 
1779 	sgroup = &group->sgroups[subsystem->id];
1780 	sgroup->state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1781 
1782 	for (i = 0; i < sgroup->num_ns; i++) {
1783 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1784 	}
1785 
1786 	nvmf_poll_group_remove_subsystem_msg(ctx);
1787 }
1788 
1789 void
1790 nvmf_poll_group_pause_subsystem(struct spdk_nvmf_poll_group *group,
1791 				struct spdk_nvmf_subsystem *subsystem,
1792 				uint32_t nsid,
1793 				spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1794 {
1795 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1796 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info = NULL;
1797 	int rc = 0;
1798 	uint32_t i;
1799 
1800 	if (subsystem->id >= group->num_sgroups) {
1801 		rc = -1;
1802 		goto fini;
1803 	}
1804 
1805 	sgroup = &group->sgroups[subsystem->id];
1806 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_PAUSED) {
1807 		goto fini;
1808 	}
1809 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1810 
1811 	if (nsid == SPDK_NVME_GLOBAL_NS_TAG) {
1812 		for (i = 0; i < sgroup->num_ns; i++) {
1813 			ns_info = &sgroup->ns_info[i];
1814 			ns_info->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1815 		}
1816 	} else {
1817 		/* NOTE: This implicitly also checks for 0, since 0 - 1 wraps around to UINT32_MAX. */
1818 		if (nsid - 1 < sgroup->num_ns) {
1819 			ns_info  = &sgroup->ns_info[nsid - 1];
1820 			ns_info->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1821 		}
1822 	}
1823 
1824 	if (sgroup->mgmt_io_outstanding > 0) {
1825 		assert(sgroup->cb_fn == NULL);
1826 		sgroup->cb_fn = cb_fn;
1827 		assert(sgroup->cb_arg == NULL);
1828 		sgroup->cb_arg = cb_arg;
1829 		return;
1830 	}
1831 
1832 	if (nsid == SPDK_NVME_GLOBAL_NS_TAG) {
1833 		for (i = 0; i < sgroup->num_ns; i++) {
1834 			ns_info = &sgroup->ns_info[i];
1835 
1836 			if (ns_info->io_outstanding > 0) {
1837 				assert(sgroup->cb_fn == NULL);
1838 				sgroup->cb_fn = cb_fn;
1839 				assert(sgroup->cb_arg == NULL);
1840 				sgroup->cb_arg = cb_arg;
1841 				return;
1842 			}
1843 		}
1844 	} else {
1845 		if (ns_info != NULL && ns_info->io_outstanding > 0) {
1846 			assert(sgroup->cb_fn == NULL);
1847 			sgroup->cb_fn = cb_fn;
1848 			assert(sgroup->cb_arg == NULL);
1849 			sgroup->cb_arg = cb_arg;
1850 			return;
1851 		}
1852 	}
1853 
1854 	assert(sgroup->mgmt_io_outstanding == 0);
1855 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSED;
1856 fini:
1857 	if (cb_fn) {
1858 		cb_fn(cb_arg, rc);
1859 	}
1860 }
1861 
1862 void
1863 nvmf_poll_group_resume_subsystem(struct spdk_nvmf_poll_group *group,
1864 				 struct spdk_nvmf_subsystem *subsystem,
1865 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1866 {
1867 	struct spdk_nvmf_request *req, *tmp;
1868 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1869 	int rc = 0;
1870 	uint32_t i;
1871 
1872 	if (subsystem->id >= group->num_sgroups) {
1873 		rc = -1;
1874 		goto fini;
1875 	}
1876 
1877 	sgroup = &group->sgroups[subsystem->id];
1878 
1879 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_ACTIVE) {
1880 		goto fini;
1881 	}
1882 
1883 	rc = poll_group_update_subsystem(group, subsystem);
1884 	if (rc) {
1885 		goto fini;
1886 	}
1887 
1888 	for (i = 0; i < sgroup->num_ns; i++) {
1889 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1890 	}
1891 
1892 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1893 
1894 	/* Release all queued requests */
1895 	TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1896 		TAILQ_REMOVE(&sgroup->queued, req, link);
1897 		if (spdk_nvmf_request_using_zcopy(req)) {
1898 			spdk_nvmf_request_zcopy_start(req);
1899 		} else {
1900 			spdk_nvmf_request_exec(req);
1901 		}
1902 
1903 	}
1904 fini:
1905 	if (cb_fn) {
1906 		cb_fn(cb_arg, rc);
1907 	}
1908 }
1909 
1910 
1911 struct spdk_nvmf_poll_group *
1912 spdk_nvmf_get_optimal_poll_group(struct spdk_nvmf_qpair *qpair)
1913 {
1914 	struct spdk_nvmf_transport_poll_group *tgroup;
1915 
1916 	tgroup = nvmf_transport_get_optimal_poll_group(qpair->transport, qpair);
1917 
1918 	if (tgroup == NULL) {
1919 		return NULL;
1920 	}
1921 
1922 	return tgroup->group;
1923 }
1924 
1925 void
1926 spdk_nvmf_poll_group_dump_stat(struct spdk_nvmf_poll_group *group, struct spdk_json_write_ctx *w)
1927 {
1928 	struct spdk_nvmf_transport_poll_group *tgroup;
1929 
1930 	spdk_json_write_object_begin(w);
1931 
1932 	spdk_json_write_named_string(w, "name", spdk_thread_get_name(spdk_get_thread()));
1933 	spdk_json_write_named_uint32(w, "admin_qpairs", group->stat.admin_qpairs);
1934 	spdk_json_write_named_uint32(w, "io_qpairs", group->stat.io_qpairs);
1935 	spdk_json_write_named_uint32(w, "current_admin_qpairs", group->stat.current_admin_qpairs);
1936 	spdk_json_write_named_uint32(w, "current_io_qpairs", group->stat.current_io_qpairs);
1937 	spdk_json_write_named_uint64(w, "pending_bdev_io", group->stat.pending_bdev_io);
1938 	spdk_json_write_named_uint64(w, "completed_nvme_io", group->stat.completed_nvme_io);
1939 
1940 	spdk_json_write_named_array_begin(w, "transports");
1941 
1942 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
1943 		spdk_json_write_object_begin(w);
1944 		/*
1945 		 * The trtype field intentionally contains a transport name as this is more informative.
1946 		 * The field has not been renamed for backward compatibility.
1947 		 */
1948 		spdk_json_write_named_string(w, "trtype", spdk_nvmf_get_transport_name(tgroup->transport));
1949 
1950 		if (tgroup->transport->ops->poll_group_dump_stat) {
1951 			tgroup->transport->ops->poll_group_dump_stat(tgroup, w);
1952 		}
1953 
1954 		spdk_json_write_object_end(w);
1955 	}
1956 
1957 	spdk_json_write_array_end(w);
1958 	spdk_json_write_object_end(w);
1959 }
1960