xref: /spdk/lib/nvmf/nvmf.c (revision 30afc27748e69257ca50f7e3a4b4ca6466ffc26b)
1 /*   SPDX-License-Identifier: BSD-3-Clause
2  *   Copyright (C) 2016 Intel Corporation. All rights reserved.
3  *   Copyright (c) 2018-2019, 2021 Mellanox Technologies LTD. All rights reserved.
4  *   Copyright (c) 2021, 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
5  */
6 
7 #include "spdk/stdinc.h"
8 
9 #include "spdk/bdev.h"
10 #include "spdk/bit_array.h"
11 #include "spdk/thread.h"
12 #include "spdk/nvmf.h"
13 #include "spdk/endian.h"
14 #include "spdk/string.h"
15 #include "spdk/log.h"
16 #include "spdk_internal/usdt.h"
17 
18 #include "nvmf_internal.h"
19 #include "transport.h"
20 
21 SPDK_LOG_REGISTER_COMPONENT(nvmf)
22 
23 #define SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS 1024
24 
25 static TAILQ_HEAD(, spdk_nvmf_tgt) g_nvmf_tgts = TAILQ_HEAD_INITIALIZER(g_nvmf_tgts);
26 
27 typedef void (*nvmf_qpair_disconnect_cpl)(void *ctx, int status);
28 
/* Context supplied to a single call to nvmf_qpair_disconnect. */
struct nvmf_qpair_disconnect_ctx {
	/* Queue pair the disconnect applies to. */
	struct spdk_nvmf_qpair *qpair;
	/* Controller pointer carried along with the request. */
	struct spdk_nvmf_ctrlr *ctrlr;
	/* Queue ID carried along with the request. */
	uint16_t qid;
};
35 
36 /*
37  * There are several times when we need to iterate through the list of all qpairs and selectively delete them.
38  * In order to do this sequentially without overlap, we must provide a context to recover the next qpair from
39  * to enable calling nvmf_qpair_disconnect on the next desired qpair.
40  */
41 struct nvmf_qpair_disconnect_many_ctx {
42 	struct spdk_nvmf_subsystem *subsystem;
43 	struct spdk_nvmf_poll_group *group;
44 	spdk_nvmf_poll_group_mod_done cpl_fn;
45 	void *cpl_ctx;
46 };
47 
48 static struct spdk_nvmf_referral *
49 nvmf_tgt_find_referral(struct spdk_nvmf_tgt *tgt,
50 		       const struct spdk_nvme_transport_id *trid)
51 {
52 	struct spdk_nvmf_referral *referral;
53 
54 	TAILQ_FOREACH(referral, &tgt->referrals, link) {
55 		if (spdk_nvme_transport_id_compare(&referral->trid, trid) == 0) {
56 			return referral;
57 		}
58 	}
59 
60 	return NULL;
61 }
62 
63 int
64 spdk_nvmf_tgt_add_referral(struct spdk_nvmf_tgt *tgt,
65 			   const struct spdk_nvmf_referral_opts *uopts)
66 {
67 	struct spdk_nvmf_referral *referral;
68 	struct spdk_nvmf_referral_opts opts = {};
69 	struct spdk_nvme_transport_id *trid = &opts.trid;
70 
71 	memcpy(&opts, uopts, spdk_min(uopts->size, sizeof(opts)));
72 	if (trid->subnqn[0] == '\0') {
73 		snprintf(trid->subnqn, sizeof(trid->subnqn), "%s", SPDK_NVMF_DISCOVERY_NQN);
74 	}
75 
76 	if (!nvmf_nqn_is_valid(trid->subnqn)) {
77 		SPDK_ERRLOG("Invalid subsystem NQN\n");
78 		return -EINVAL;
79 	}
80 
81 	/* If the entry already exists, just ignore it. */
82 	if (nvmf_tgt_find_referral(tgt, trid)) {
83 		return 0;
84 	}
85 
86 	referral = calloc(1, sizeof(*referral));
87 	if (!referral) {
88 		SPDK_ERRLOG("Failed to allocate memory for a referral\n");
89 		return -ENOMEM;
90 	}
91 
92 	referral->entry.subtype = nvmf_nqn_is_discovery(trid->subnqn) ?
93 				  SPDK_NVMF_SUBTYPE_DISCOVERY :
94 				  SPDK_NVMF_SUBTYPE_NVME;
95 	referral->entry.treq.secure_channel = opts.secure_channel ?
96 					      SPDK_NVMF_TREQ_SECURE_CHANNEL_REQUIRED :
97 					      SPDK_NVMF_TREQ_SECURE_CHANNEL_NOT_REQUIRED;
98 	referral->entry.cntlid = 0xffff;
99 	referral->entry.trtype = trid->trtype;
100 	referral->entry.adrfam = trid->adrfam;
101 	memcpy(&referral->trid, trid, sizeof(struct spdk_nvme_transport_id));
102 	spdk_strcpy_pad(referral->entry.subnqn, trid->subnqn, sizeof(trid->subnqn), '\0');
103 	spdk_strcpy_pad(referral->entry.trsvcid, trid->trsvcid, sizeof(referral->entry.trsvcid), ' ');
104 	spdk_strcpy_pad(referral->entry.traddr, trid->traddr, sizeof(referral->entry.traddr), ' ');
105 
106 	TAILQ_INSERT_HEAD(&tgt->referrals, referral, link);
107 	nvmf_update_discovery_log(tgt, NULL);
108 
109 	return 0;
110 }
111 
112 int
113 spdk_nvmf_tgt_remove_referral(struct spdk_nvmf_tgt *tgt,
114 			      const struct spdk_nvmf_referral_opts *uopts)
115 {
116 	struct spdk_nvmf_referral *referral;
117 	struct spdk_nvmf_referral_opts opts = {};
118 	struct spdk_nvme_transport_id *trid = &opts.trid;
119 
120 	memcpy(&opts, uopts, spdk_min(uopts->size, sizeof(opts)));
121 	if (trid->subnqn[0] == '\0') {
122 		snprintf(trid->subnqn, sizeof(trid->subnqn), "%s", SPDK_NVMF_DISCOVERY_NQN);
123 	}
124 
125 	referral = nvmf_tgt_find_referral(tgt, &opts.trid);
126 	if (referral == NULL) {
127 		return -ENOENT;
128 	}
129 
130 	TAILQ_REMOVE(&tgt->referrals, referral, link);
131 	nvmf_update_discovery_log(tgt, NULL);
132 
133 	free(referral);
134 
135 	return 0;
136 }
137 
138 void
139 nvmf_qpair_set_state(struct spdk_nvmf_qpair *qpair,
140 		     enum spdk_nvmf_qpair_state state)
141 {
142 	assert(qpair != NULL);
143 	assert(qpair->group->thread == spdk_get_thread());
144 
145 	qpair->state = state;
146 }
147 
148 static int
149 nvmf_poll_group_poll(void *ctx)
150 {
151 	struct spdk_nvmf_poll_group *group = ctx;
152 	int rc;
153 	int count = 0;
154 	struct spdk_nvmf_transport_poll_group *tgroup;
155 
156 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
157 		rc = nvmf_transport_poll_group_poll(tgroup);
158 		if (rc < 0) {
159 			return SPDK_POLLER_BUSY;
160 		}
161 		count += rc;
162 	}
163 
164 	return count > 0 ? SPDK_POLLER_BUSY : SPDK_POLLER_IDLE;
165 }
166 
167 /*
168  * Reset and clean up the poll group (I/O channel code will actually free the
169  * group).
170  */
171 static void
172 nvmf_tgt_cleanup_poll_group(struct spdk_nvmf_poll_group *group)
173 {
174 	struct spdk_nvmf_transport_poll_group *tgroup, *tmp;
175 	struct spdk_nvmf_subsystem_poll_group *sgroup;
176 	uint32_t sid, nsid;
177 
178 	TAILQ_FOREACH_SAFE(tgroup, &group->tgroups, link, tmp) {
179 		TAILQ_REMOVE(&group->tgroups, tgroup, link);
180 		nvmf_transport_poll_group_destroy(tgroup);
181 	}
182 
183 	for (sid = 0; sid < group->num_sgroups; sid++) {
184 		sgroup = &group->sgroups[sid];
185 
186 		assert(sgroup != NULL);
187 
188 		for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
189 			if (sgroup->ns_info[nsid].channel) {
190 				spdk_put_io_channel(sgroup->ns_info[nsid].channel);
191 				sgroup->ns_info[nsid].channel = NULL;
192 			}
193 		}
194 
195 		free(sgroup->ns_info);
196 	}
197 
198 	free(group->sgroups);
199 
200 	spdk_poller_unregister(&group->poller);
201 
202 	if (group->destroy_cb_fn) {
203 		group->destroy_cb_fn(group->destroy_cb_arg, 0);
204 	}
205 }
206 
207 /*
208  * Callback to unregister a poll group from the target, and clean up its state.
209  */
210 static void
211 nvmf_tgt_destroy_poll_group(void *io_device, void *ctx_buf)
212 {
213 	struct spdk_nvmf_tgt *tgt = io_device;
214 	struct spdk_nvmf_poll_group *group = ctx_buf;
215 
216 	SPDK_DTRACE_PROBE1_TICKS(nvmf_destroy_poll_group, spdk_thread_get_id(group->thread));
217 
218 	pthread_mutex_lock(&tgt->mutex);
219 	TAILQ_REMOVE(&tgt->poll_groups, group, link);
220 	tgt->num_poll_groups--;
221 	pthread_mutex_unlock(&tgt->mutex);
222 
223 	assert(!(tgt->state == NVMF_TGT_PAUSING || tgt->state == NVMF_TGT_RESUMING));
224 	nvmf_tgt_cleanup_poll_group(group);
225 }
226 
227 static int
228 nvmf_poll_group_add_transport(struct spdk_nvmf_poll_group *group,
229 			      struct spdk_nvmf_transport *transport)
230 {
231 	struct spdk_nvmf_transport_poll_group *tgroup = nvmf_get_transport_poll_group(group, transport);
232 
233 	if (tgroup != NULL) {
234 		/* Transport already in the poll group */
235 		return 0;
236 	}
237 
238 	tgroup = nvmf_transport_poll_group_create(transport, group);
239 	if (!tgroup) {
240 		SPDK_ERRLOG("Unable to create poll group for transport\n");
241 		return -1;
242 	}
243 	SPDK_DTRACE_PROBE2_TICKS(nvmf_transport_poll_group_create, transport,
244 				 spdk_thread_get_id(group->thread));
245 
246 	tgroup->group = group;
247 	TAILQ_INSERT_TAIL(&group->tgroups, tgroup, link);
248 
249 	return 0;
250 }
251 
/*
 * Interrupt-mode callback registered for the poll group poller.
 * Intentionally does nothing.
 */
static void
nvmf_tgt_poller_set_interrupt_mode(struct spdk_poller *poller, void *cb_arg, bool interrupt_mode)
{
	/* No action is taken on an interrupt-mode change. */
}
256 
257 static int
258 nvmf_tgt_create_poll_group(void *io_device, void *ctx_buf)
259 {
260 	struct spdk_nvmf_tgt *tgt = io_device;
261 	struct spdk_nvmf_poll_group *group = ctx_buf;
262 	struct spdk_nvmf_transport *transport;
263 	struct spdk_nvmf_subsystem *subsystem;
264 	struct spdk_thread *thread = spdk_get_thread();
265 	uint32_t i;
266 	int rc;
267 
268 	group->tgt = tgt;
269 	TAILQ_INIT(&group->tgroups);
270 	TAILQ_INIT(&group->qpairs);
271 	group->thread = thread;
272 	pthread_mutex_init(&group->mutex, NULL);
273 
274 	group->poller = SPDK_POLLER_REGISTER(nvmf_poll_group_poll, group, 0);
275 	spdk_poller_register_interrupt(group->poller, nvmf_tgt_poller_set_interrupt_mode, NULL);
276 
277 	SPDK_DTRACE_PROBE1_TICKS(nvmf_create_poll_group, spdk_thread_get_id(thread));
278 
279 	TAILQ_FOREACH(transport, &tgt->transports, link) {
280 		rc = nvmf_poll_group_add_transport(group, transport);
281 		if (rc != 0) {
282 			nvmf_tgt_cleanup_poll_group(group);
283 			return rc;
284 		}
285 	}
286 
287 	group->num_sgroups = tgt->max_subsystems;
288 	group->sgroups = calloc(tgt->max_subsystems, sizeof(struct spdk_nvmf_subsystem_poll_group));
289 	if (!group->sgroups) {
290 		nvmf_tgt_cleanup_poll_group(group);
291 		return -ENOMEM;
292 	}
293 
294 	for (i = 0; i < tgt->max_subsystems; i++) {
295 		TAILQ_INIT(&group->sgroups[i].queued);
296 	}
297 
298 	for (subsystem = spdk_nvmf_subsystem_get_first(tgt);
299 	     subsystem != NULL;
300 	     subsystem = spdk_nvmf_subsystem_get_next(subsystem)) {
301 		if (nvmf_poll_group_add_subsystem(group, subsystem, NULL, NULL) != 0) {
302 			nvmf_tgt_cleanup_poll_group(group);
303 			return -1;
304 		}
305 	}
306 
307 	pthread_mutex_lock(&tgt->mutex);
308 	tgt->num_poll_groups++;
309 	TAILQ_INSERT_TAIL(&tgt->poll_groups, group, link);
310 	pthread_mutex_unlock(&tgt->mutex);
311 
312 	return 0;
313 }
314 
315 static void
316 _nvmf_tgt_disconnect_qpairs(void *ctx)
317 {
318 	struct spdk_nvmf_qpair *qpair, *qpair_tmp;
319 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
320 	struct spdk_nvmf_poll_group *group = qpair_ctx->group;
321 	struct spdk_io_channel *ch;
322 	int rc;
323 
324 	TAILQ_FOREACH_SAFE(qpair, &group->qpairs, link, qpair_tmp) {
325 		rc = spdk_nvmf_qpair_disconnect(qpair);
326 		if (rc && rc != -EINPROGRESS) {
327 			break;
328 		}
329 	}
330 
331 	if (TAILQ_EMPTY(&group->qpairs)) {
332 		/* When the refcount from the channels reaches 0, nvmf_tgt_destroy_poll_group will be called. */
333 		ch = spdk_io_channel_from_ctx(group);
334 		spdk_put_io_channel(ch);
335 		free(qpair_ctx);
336 		return;
337 	}
338 
339 	/* Some qpairs are in process of being disconnected. Send a message and try to remove them again */
340 	spdk_thread_send_msg(spdk_get_thread(), _nvmf_tgt_disconnect_qpairs, ctx);
341 }
342 
343 static void
344 nvmf_tgt_destroy_poll_group_qpairs(struct spdk_nvmf_poll_group *group)
345 {
346 	struct nvmf_qpair_disconnect_many_ctx *ctx;
347 
348 	SPDK_DTRACE_PROBE1_TICKS(nvmf_destroy_poll_group_qpairs, spdk_thread_get_id(group->thread));
349 
350 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
351 	if (!ctx) {
352 		SPDK_ERRLOG("Failed to allocate memory for destroy poll group ctx\n");
353 		return;
354 	}
355 
356 	ctx->group = group;
357 	_nvmf_tgt_disconnect_qpairs(ctx);
358 }
359 
360 struct spdk_nvmf_tgt *
361 spdk_nvmf_tgt_create(struct spdk_nvmf_target_opts *_opts)
362 {
363 	struct spdk_nvmf_tgt *tgt, *tmp_tgt;
364 	struct spdk_nvmf_target_opts opts = {
365 		.max_subsystems = SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS,
366 		.discovery_filter = SPDK_NVMF_TGT_DISCOVERY_MATCH_ANY,
367 	};
368 
369 	memcpy(&opts, _opts, _opts->size);
370 	if (strnlen(opts.name, NVMF_TGT_NAME_MAX_LENGTH) == NVMF_TGT_NAME_MAX_LENGTH) {
371 		SPDK_ERRLOG("Provided target name exceeds the max length of %u.\n", NVMF_TGT_NAME_MAX_LENGTH);
372 		return NULL;
373 	}
374 
375 	TAILQ_FOREACH(tmp_tgt, &g_nvmf_tgts, link) {
376 		if (!strncmp(opts.name, tmp_tgt->name, NVMF_TGT_NAME_MAX_LENGTH)) {
377 			SPDK_ERRLOG("Provided target name must be unique.\n");
378 			return NULL;
379 		}
380 	}
381 
382 	tgt = calloc(1, sizeof(*tgt));
383 	if (!tgt) {
384 		return NULL;
385 	}
386 
387 	snprintf(tgt->name, NVMF_TGT_NAME_MAX_LENGTH, "%s", opts.name);
388 
389 	if (!opts.max_subsystems) {
390 		tgt->max_subsystems = SPDK_NVMF_DEFAULT_MAX_SUBSYSTEMS;
391 	} else {
392 		tgt->max_subsystems = opts.max_subsystems;
393 	}
394 
395 	tgt->crdt[0] = opts.crdt[0];
396 	tgt->crdt[1] = opts.crdt[1];
397 	tgt->crdt[2] = opts.crdt[2];
398 	tgt->discovery_filter = opts.discovery_filter;
399 	tgt->discovery_genctr = 0;
400 	tgt->dhchap_digests = opts.dhchap_digests;
401 	tgt->dhchap_dhgroups = opts.dhchap_dhgroups;
402 	TAILQ_INIT(&tgt->transports);
403 	TAILQ_INIT(&tgt->poll_groups);
404 	TAILQ_INIT(&tgt->referrals);
405 	tgt->num_poll_groups = 0;
406 
407 	tgt->subsystem_ids = spdk_bit_array_create(tgt->max_subsystems);
408 	if (tgt->subsystem_ids == NULL) {
409 		free(tgt);
410 		return NULL;
411 	}
412 
413 	RB_INIT(&tgt->subsystems);
414 
415 	pthread_mutex_init(&tgt->mutex, NULL);
416 
417 	spdk_io_device_register(tgt,
418 				nvmf_tgt_create_poll_group,
419 				nvmf_tgt_destroy_poll_group,
420 				sizeof(struct spdk_nvmf_poll_group),
421 				tgt->name);
422 
423 	tgt->state = NVMF_TGT_RUNNING;
424 
425 	TAILQ_INSERT_HEAD(&g_nvmf_tgts, tgt, link);
426 
427 	return tgt;
428 }
429 
430 static void
431 _nvmf_tgt_destroy_next_transport(void *ctx)
432 {
433 	struct spdk_nvmf_tgt *tgt = ctx;
434 	struct spdk_nvmf_transport *transport;
435 
436 	if (!TAILQ_EMPTY(&tgt->transports)) {
437 		transport = TAILQ_FIRST(&tgt->transports);
438 		TAILQ_REMOVE(&tgt->transports, transport, link);
439 		spdk_nvmf_transport_destroy(transport, _nvmf_tgt_destroy_next_transport, tgt);
440 	} else {
441 		spdk_nvmf_tgt_destroy_done_fn *destroy_cb_fn = tgt->destroy_cb_fn;
442 		void *destroy_cb_arg = tgt->destroy_cb_arg;
443 
444 		pthread_mutex_destroy(&tgt->mutex);
445 		free(tgt);
446 
447 		if (destroy_cb_fn) {
448 			destroy_cb_fn(destroy_cb_arg, 0);
449 		}
450 	}
451 }
452 
453 static void
454 nvmf_tgt_destroy_cb(void *io_device)
455 {
456 	struct spdk_nvmf_tgt *tgt = io_device;
457 	struct spdk_nvmf_subsystem *subsystem, *subsystem_next;
458 	int rc;
459 	struct spdk_nvmf_referral *referral;
460 
461 	while ((referral = TAILQ_FIRST(&tgt->referrals))) {
462 		TAILQ_REMOVE(&tgt->referrals, referral, link);
463 		free(referral);
464 	}
465 
466 	nvmf_tgt_stop_mdns_prr(tgt);
467 
468 	/* We will be freeing subsystems in this loop, so we always need to get the next one
469 	 * ahead of time, since we can't call get_next() on a subsystem that's been freed.
470 	 */
471 	for (subsystem = spdk_nvmf_subsystem_get_first(tgt),
472 	     subsystem_next = spdk_nvmf_subsystem_get_next(subsystem);
473 	     subsystem != NULL;
474 	     subsystem = subsystem_next,
475 	     subsystem_next = spdk_nvmf_subsystem_get_next(subsystem_next)) {
476 		nvmf_subsystem_remove_all_listeners(subsystem, true);
477 
478 		rc = spdk_nvmf_subsystem_destroy(subsystem, nvmf_tgt_destroy_cb, tgt);
479 		if (rc) {
480 			if (rc == -EINPROGRESS) {
481 				/* If rc is -EINPROGRESS, nvmf_tgt_destroy_cb will be called again when subsystem #i
482 				 * is destroyed, nvmf_tgt_destroy_cb will continue to destroy other subsystems if any */
483 				return;
484 			} else {
485 				SPDK_ERRLOG("Failed to destroy subsystem %s, rc %d\n", subsystem->subnqn, rc);
486 			}
487 		}
488 	}
489 	spdk_bit_array_free(&tgt->subsystem_ids);
490 	_nvmf_tgt_destroy_next_transport(tgt);
491 }
492 
493 void
494 spdk_nvmf_tgt_destroy(struct spdk_nvmf_tgt *tgt,
495 		      spdk_nvmf_tgt_destroy_done_fn cb_fn,
496 		      void *cb_arg)
497 {
498 	assert(!(tgt->state == NVMF_TGT_PAUSING || tgt->state == NVMF_TGT_RESUMING));
499 
500 	tgt->destroy_cb_fn = cb_fn;
501 	tgt->destroy_cb_arg = cb_arg;
502 
503 	TAILQ_REMOVE(&g_nvmf_tgts, tgt, link);
504 
505 	spdk_io_device_unregister(tgt, nvmf_tgt_destroy_cb);
506 }
507 
508 const char *
509 spdk_nvmf_tgt_get_name(struct spdk_nvmf_tgt *tgt)
510 {
511 	return tgt->name;
512 }
513 
514 struct spdk_nvmf_tgt *
515 spdk_nvmf_get_tgt(const char *name)
516 {
517 	struct spdk_nvmf_tgt *tgt;
518 	uint32_t num_targets = 0;
519 
520 	TAILQ_FOREACH(tgt, &g_nvmf_tgts, link) {
521 		if (name) {
522 			if (!strncmp(tgt->name, name, NVMF_TGT_NAME_MAX_LENGTH)) {
523 				return tgt;
524 			}
525 		}
526 		num_targets++;
527 	}
528 
529 	/*
530 	 * special case. If there is only one target and
531 	 * no name was specified, return the only available
532 	 * target. If there is more than one target, name must
533 	 * be specified.
534 	 */
535 	if (!name && num_targets == 1) {
536 		return TAILQ_FIRST(&g_nvmf_tgts);
537 	}
538 
539 	return NULL;
540 }
541 
542 struct spdk_nvmf_tgt *
543 spdk_nvmf_get_first_tgt(void)
544 {
545 	return TAILQ_FIRST(&g_nvmf_tgts);
546 }
547 
548 struct spdk_nvmf_tgt *
549 spdk_nvmf_get_next_tgt(struct spdk_nvmf_tgt *prev)
550 {
551 	return TAILQ_NEXT(prev, link);
552 }
553 
554 static void
555 nvmf_write_nvme_subsystem_config(struct spdk_json_write_ctx *w,
556 				 struct spdk_nvmf_subsystem *subsystem)
557 {
558 	struct spdk_nvmf_host *host;
559 	struct spdk_nvmf_ns *ns;
560 	struct spdk_nvmf_ns_opts ns_opts;
561 	uint32_t max_namespaces;
562 	struct spdk_nvmf_transport *transport;
563 
564 	assert(spdk_nvmf_subsystem_get_type(subsystem) == SPDK_NVMF_SUBTYPE_NVME);
565 
566 	/* { */
567 	spdk_json_write_object_begin(w);
568 	spdk_json_write_named_string(w, "method", "nvmf_create_subsystem");
569 
570 	/*     "params" : { */
571 	spdk_json_write_named_object_begin(w, "params");
572 	spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
573 	spdk_json_write_named_bool(w, "allow_any_host", spdk_nvmf_subsystem_get_allow_any_host(subsystem));
574 	spdk_json_write_named_string(w, "serial_number", spdk_nvmf_subsystem_get_sn(subsystem));
575 	spdk_json_write_named_string(w, "model_number", spdk_nvmf_subsystem_get_mn(subsystem));
576 
577 	max_namespaces = spdk_nvmf_subsystem_get_max_namespaces(subsystem);
578 	if (max_namespaces != 0) {
579 		spdk_json_write_named_uint32(w, "max_namespaces", max_namespaces);
580 	}
581 
582 	spdk_json_write_named_uint32(w, "min_cntlid", spdk_nvmf_subsystem_get_min_cntlid(subsystem));
583 	spdk_json_write_named_uint32(w, "max_cntlid", spdk_nvmf_subsystem_get_max_cntlid(subsystem));
584 	spdk_json_write_named_bool(w, "ana_reporting", spdk_nvmf_subsystem_get_ana_reporting(subsystem));
585 
586 	/*     } "params" */
587 	spdk_json_write_object_end(w);
588 
589 	/* } */
590 	spdk_json_write_object_end(w);
591 
592 	for (host = spdk_nvmf_subsystem_get_first_host(subsystem); host != NULL;
593 	     host = spdk_nvmf_subsystem_get_next_host(subsystem, host)) {
594 
595 		spdk_json_write_object_begin(w);
596 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_host");
597 
598 		/*     "params" : { */
599 		spdk_json_write_named_object_begin(w, "params");
600 
601 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
602 		spdk_json_write_named_string(w, "host", spdk_nvmf_host_get_nqn(host));
603 		if (host->dhchap_key != NULL) {
604 			spdk_json_write_named_string(w, "dhchap_key",
605 						     spdk_key_get_name(host->dhchap_key));
606 		}
607 		if (host->dhchap_ctrlr_key != NULL) {
608 			spdk_json_write_named_string(w, "dhchap_ctrlr_key",
609 						     spdk_key_get_name(host->dhchap_ctrlr_key));
610 		}
611 		TAILQ_FOREACH(transport, &subsystem->tgt->transports, link) {
612 			if (transport->ops->subsystem_dump_host != NULL) {
613 				transport->ops->subsystem_dump_host(transport, subsystem, host->nqn, w);
614 			}
615 		}
616 
617 		/*     } "params" */
618 		spdk_json_write_object_end(w);
619 
620 		/* } */
621 		spdk_json_write_object_end(w);
622 	}
623 
624 	for (ns = spdk_nvmf_subsystem_get_first_ns(subsystem); ns != NULL;
625 	     ns = spdk_nvmf_subsystem_get_next_ns(subsystem, ns)) {
626 		spdk_nvmf_ns_get_opts(ns, &ns_opts, sizeof(ns_opts));
627 
628 		spdk_json_write_object_begin(w);
629 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_ns");
630 
631 		/*     "params" : { */
632 		spdk_json_write_named_object_begin(w, "params");
633 
634 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
635 
636 		/*     "namespace" : { */
637 		spdk_json_write_named_object_begin(w, "namespace");
638 
639 		spdk_json_write_named_uint32(w, "nsid", spdk_nvmf_ns_get_id(ns));
640 		spdk_json_write_named_string(w, "bdev_name", spdk_bdev_get_name(spdk_nvmf_ns_get_bdev(ns)));
641 
642 		if (ns->ptpl_file != NULL) {
643 			spdk_json_write_named_string(w, "ptpl_file", ns->ptpl_file);
644 		}
645 
646 		if (!spdk_mem_all_zero(ns_opts.nguid, sizeof(ns_opts.nguid))) {
647 			SPDK_STATIC_ASSERT(sizeof(ns_opts.nguid) == sizeof(uint64_t) * 2, "size mismatch");
648 			spdk_json_write_named_string_fmt(w, "nguid", "%016"PRIX64"%016"PRIX64, from_be64(&ns_opts.nguid[0]),
649 							 from_be64(&ns_opts.nguid[8]));
650 		}
651 
652 		if (!spdk_mem_all_zero(ns_opts.eui64, sizeof(ns_opts.eui64))) {
653 			SPDK_STATIC_ASSERT(sizeof(ns_opts.eui64) == sizeof(uint64_t), "size mismatch");
654 			spdk_json_write_named_string_fmt(w, "eui64", "%016"PRIX64, from_be64(&ns_opts.eui64));
655 		}
656 
657 		if (!spdk_uuid_is_null(&ns_opts.uuid)) {
658 			spdk_json_write_named_uuid(w, "uuid",  &ns_opts.uuid);
659 		}
660 
661 		if (spdk_nvmf_subsystem_get_ana_reporting(subsystem)) {
662 			spdk_json_write_named_uint32(w, "anagrpid", ns_opts.anagrpid);
663 		}
664 
665 		spdk_json_write_named_bool(w, "no_auto_visible", !ns->always_visible);
666 
667 		/*     "namespace" */
668 		spdk_json_write_object_end(w);
669 
670 		/*     } "params" */
671 		spdk_json_write_object_end(w);
672 
673 		/* } */
674 		spdk_json_write_object_end(w);
675 
676 		TAILQ_FOREACH(host, &ns->hosts, link) {
677 			spdk_json_write_object_begin(w);
678 			spdk_json_write_named_string(w, "method", "nvmf_ns_add_host");
679 			spdk_json_write_named_object_begin(w, "params");
680 			spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
681 			spdk_json_write_named_uint32(w, "nsid", spdk_nvmf_ns_get_id(ns));
682 			spdk_json_write_named_string(w, "host", spdk_nvmf_host_get_nqn(host));
683 			spdk_json_write_object_end(w);
684 			spdk_json_write_object_end(w);
685 		}
686 	}
687 }
688 
689 static void
690 nvmf_write_subsystem_config_json(struct spdk_json_write_ctx *w,
691 				 struct spdk_nvmf_subsystem *subsystem)
692 {
693 	struct spdk_nvmf_subsystem_listener *listener;
694 	struct spdk_nvmf_transport *transport;
695 	const struct spdk_nvme_transport_id *trid;
696 
697 	if (spdk_nvmf_subsystem_get_type(subsystem) == SPDK_NVMF_SUBTYPE_NVME) {
698 		nvmf_write_nvme_subsystem_config(w, subsystem);
699 	}
700 
701 	for (listener = spdk_nvmf_subsystem_get_first_listener(subsystem); listener != NULL;
702 	     listener = spdk_nvmf_subsystem_get_next_listener(subsystem, listener)) {
703 		transport = listener->transport;
704 		trid = spdk_nvmf_subsystem_listener_get_trid(listener);
705 
706 		spdk_json_write_object_begin(w);
707 		spdk_json_write_named_string(w, "method", "nvmf_subsystem_add_listener");
708 
709 		/*     "params" : { */
710 		spdk_json_write_named_object_begin(w, "params");
711 
712 		spdk_json_write_named_string(w, "nqn", spdk_nvmf_subsystem_get_nqn(subsystem));
713 
714 		spdk_json_write_named_object_begin(w, "listen_address");
715 		nvmf_transport_listen_dump_trid(trid, w);
716 		spdk_json_write_object_end(w);
717 		if (transport->ops->listen_dump_opts) {
718 			transport->ops->listen_dump_opts(transport, trid, w);
719 		}
720 
721 		spdk_json_write_named_bool(w, "secure_channel", listener->opts.secure_channel);
722 
723 		if (listener->opts.sock_impl) {
724 			spdk_json_write_named_string(w, "sock_impl", listener->opts.sock_impl);
725 		}
726 
727 		/*     } "params" */
728 		spdk_json_write_object_end(w);
729 
730 		/* } */
731 		spdk_json_write_object_end(w);
732 	}
733 }
734 
735 void
736 spdk_nvmf_tgt_write_config_json(struct spdk_json_write_ctx *w, struct spdk_nvmf_tgt *tgt)
737 {
738 	struct spdk_nvmf_subsystem *subsystem;
739 	struct spdk_nvmf_transport *transport;
740 	struct spdk_nvmf_referral *referral;
741 
742 	spdk_json_write_object_begin(w);
743 	spdk_json_write_named_string(w, "method", "nvmf_set_max_subsystems");
744 
745 	spdk_json_write_named_object_begin(w, "params");
746 	spdk_json_write_named_uint32(w, "max_subsystems", tgt->max_subsystems);
747 	spdk_json_write_object_end(w);
748 
749 	spdk_json_write_object_end(w);
750 
751 	spdk_json_write_object_begin(w);
752 	spdk_json_write_named_string(w, "method", "nvmf_set_crdt");
753 	spdk_json_write_named_object_begin(w, "params");
754 	spdk_json_write_named_uint32(w, "crdt1", tgt->crdt[0]);
755 	spdk_json_write_named_uint32(w, "crdt2", tgt->crdt[1]);
756 	spdk_json_write_named_uint32(w, "crdt3", tgt->crdt[2]);
757 	spdk_json_write_object_end(w);
758 	spdk_json_write_object_end(w);
759 
760 	/* write transports */
761 	TAILQ_FOREACH(transport, &tgt->transports, link) {
762 		spdk_json_write_object_begin(w);
763 		spdk_json_write_named_string(w, "method", "nvmf_create_transport");
764 		nvmf_transport_dump_opts(transport, w, true);
765 		spdk_json_write_object_end(w);
766 	}
767 
768 	TAILQ_FOREACH(referral, &tgt->referrals, link) {
769 		spdk_json_write_object_begin(w);
770 		spdk_json_write_named_string(w, "method", "nvmf_discovery_add_referral");
771 
772 		spdk_json_write_named_object_begin(w, "params");
773 		spdk_json_write_named_object_begin(w, "address");
774 		nvmf_transport_listen_dump_trid(&referral->trid, w);
775 		spdk_json_write_object_end(w);
776 		spdk_json_write_named_bool(w, "secure_channel",
777 					   referral->entry.treq.secure_channel ==
778 					   SPDK_NVMF_TREQ_SECURE_CHANNEL_REQUIRED);
779 		spdk_json_write_named_string(w, "subnqn", referral->trid.subnqn);
780 		spdk_json_write_object_end(w);
781 
782 		spdk_json_write_object_end(w);
783 	}
784 
785 	subsystem = spdk_nvmf_subsystem_get_first(tgt);
786 	while (subsystem) {
787 		nvmf_write_subsystem_config_json(w, subsystem);
788 		subsystem = spdk_nvmf_subsystem_get_next(subsystem);
789 	}
790 }
791 
792 static void
793 nvmf_listen_opts_copy(struct spdk_nvmf_listen_opts *opts,
794 		      const struct spdk_nvmf_listen_opts *opts_src, size_t opts_size)
795 {
796 	assert(opts);
797 	assert(opts_src);
798 
799 	opts->opts_size = opts_size;
800 
801 #define SET_FIELD(field) \
802     if (offsetof(struct spdk_nvmf_listen_opts, field) + sizeof(opts->field) <= opts_size) { \
803                  opts->field = opts_src->field; \
804     } \
805 
806 	SET_FIELD(transport_specific);
807 	SET_FIELD(secure_channel);
808 	SET_FIELD(ana_state);
809 	SET_FIELD(sock_impl);
810 #undef SET_FIELD
811 
812 	/* Do not remove this statement, you should always update this statement when you adding a new field,
813 	 * and do not forget to add the SET_FIELD statement for your added field. */
814 	SPDK_STATIC_ASSERT(sizeof(struct spdk_nvmf_listen_opts) == 32, "Incorrect size");
815 }
816 
817 void
818 spdk_nvmf_listen_opts_init(struct spdk_nvmf_listen_opts *opts, size_t opts_size)
819 {
820 	struct spdk_nvmf_listen_opts opts_local = {};
821 
822 	/* local version of opts should have defaults set here */
823 	opts_local.ana_state = SPDK_NVME_ANA_OPTIMIZED_STATE;
824 	nvmf_listen_opts_copy(opts, &opts_local, opts_size);
825 }
826 
827 int
828 spdk_nvmf_tgt_listen_ext(struct spdk_nvmf_tgt *tgt, const struct spdk_nvme_transport_id *trid,
829 			 struct spdk_nvmf_listen_opts *opts)
830 {
831 	struct spdk_nvmf_transport *transport;
832 	int rc;
833 	struct spdk_nvmf_listen_opts opts_local = {};
834 
835 	if (!opts) {
836 		SPDK_ERRLOG("opts should not be NULL\n");
837 		return -EINVAL;
838 	}
839 
840 	if (!opts->opts_size) {
841 		SPDK_ERRLOG("The opts_size in opts structure should not be zero\n");
842 		return -EINVAL;
843 	}
844 
845 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
846 	if (!transport) {
847 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
848 			    trid->trstring);
849 		return -EINVAL;
850 	}
851 
852 	nvmf_listen_opts_copy(&opts_local, opts, opts->opts_size);
853 	rc = spdk_nvmf_transport_listen(transport, trid, &opts_local);
854 	if (rc < 0) {
855 		SPDK_ERRLOG("Unable to listen on address '%s'\n", trid->traddr);
856 	}
857 
858 	return rc;
859 }
860 
861 int
862 spdk_nvmf_tgt_stop_listen(struct spdk_nvmf_tgt *tgt,
863 			  struct spdk_nvme_transport_id *trid)
864 {
865 	struct spdk_nvmf_transport *transport;
866 	int rc;
867 
868 	transport = spdk_nvmf_tgt_get_transport(tgt, trid->trstring);
869 	if (!transport) {
870 		SPDK_ERRLOG("Unable to find %s transport. The transport must be created first also make sure it is properly registered.\n",
871 			    trid->trstring);
872 		return -EINVAL;
873 	}
874 
875 	rc = spdk_nvmf_transport_stop_listen(transport, trid);
876 	if (rc < 0) {
877 		SPDK_ERRLOG("Failed to stop listening on address '%s'\n", trid->traddr);
878 		return rc;
879 	}
880 	return 0;
881 }
882 
883 struct spdk_nvmf_tgt_add_transport_ctx {
884 	struct spdk_nvmf_tgt *tgt;
885 	struct spdk_nvmf_transport *transport;
886 	spdk_nvmf_tgt_add_transport_done_fn cb_fn;
887 	void *cb_arg;
888 	int status;
889 };
890 
891 static void
892 _nvmf_tgt_remove_transport_done(struct spdk_io_channel_iter *i, int status)
893 {
894 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
895 
896 	ctx->cb_fn(ctx->cb_arg, ctx->status);
897 	free(ctx);
898 }
899 
900 static void
901 _nvmf_tgt_remove_transport(struct spdk_io_channel_iter *i)
902 {
903 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
904 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
905 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
906 	struct spdk_nvmf_transport_poll_group *tgroup, *tmp;
907 
908 	TAILQ_FOREACH_SAFE(tgroup, &group->tgroups, link, tmp) {
909 		if (tgroup->transport == ctx->transport) {
910 			TAILQ_REMOVE(&group->tgroups, tgroup, link);
911 			nvmf_transport_poll_group_destroy(tgroup);
912 		}
913 	}
914 
915 	spdk_for_each_channel_continue(i, 0);
916 }
917 
918 static void
919 _nvmf_tgt_add_transport_done(struct spdk_io_channel_iter *i, int status)
920 {
921 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
922 
923 	if (status) {
924 		ctx->status = status;
925 		spdk_for_each_channel(ctx->tgt,
926 				      _nvmf_tgt_remove_transport,
927 				      ctx,
928 				      _nvmf_tgt_remove_transport_done);
929 		return;
930 	}
931 
932 	ctx->transport->tgt = ctx->tgt;
933 	TAILQ_INSERT_TAIL(&ctx->tgt->transports, ctx->transport, link);
934 	ctx->cb_fn(ctx->cb_arg, status);
935 	free(ctx);
936 }
937 
938 static void
939 _nvmf_tgt_add_transport(struct spdk_io_channel_iter *i)
940 {
941 	struct spdk_nvmf_tgt_add_transport_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
942 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
943 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
944 	int rc;
945 
946 	rc = nvmf_poll_group_add_transport(group, ctx->transport);
947 	spdk_for_each_channel_continue(i, rc);
948 }
949 
950 void
951 spdk_nvmf_tgt_add_transport(struct spdk_nvmf_tgt *tgt,
952 			    struct spdk_nvmf_transport *transport,
953 			    spdk_nvmf_tgt_add_transport_done_fn cb_fn,
954 			    void *cb_arg)
955 {
956 	struct spdk_nvmf_tgt_add_transport_ctx *ctx;
957 
958 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_add_transport, transport, tgt->name);
959 
960 	if (spdk_nvmf_tgt_get_transport(tgt, transport->ops->name)) {
961 		cb_fn(cb_arg, -EEXIST);
962 		return; /* transport already created */
963 	}
964 
965 	ctx = calloc(1, sizeof(*ctx));
966 	if (!ctx) {
967 		cb_fn(cb_arg, -ENOMEM);
968 		return;
969 	}
970 
971 	ctx->tgt = tgt;
972 	ctx->transport = transport;
973 	ctx->cb_fn = cb_fn;
974 	ctx->cb_arg = cb_arg;
975 
976 	spdk_for_each_channel(tgt,
977 			      _nvmf_tgt_add_transport,
978 			      ctx,
979 			      _nvmf_tgt_add_transport_done);
980 }
981 
/*
 * Context carried through the channel iteration that pauses or resumes polling.
 * It is allocated by spdk_nvmf_tgt_pause_polling()/spdk_nvmf_tgt_resume_polling()
 * and freed by the matching *_done callback.
 */
struct nvmf_tgt_pause_ctx {
	/* Target whose state is updated once the iteration has finished. */
	struct spdk_nvmf_tgt *tgt;
	/* Caller's completion callback, invoked with cb_arg and the iteration status. */
	spdk_nvmf_tgt_pause_polling_cb_fn cb_fn;
	/* Opaque argument handed back to cb_fn. */
	void *cb_arg;
};
987 
988 static void
989 _nvmf_tgt_pause_polling_done(struct spdk_io_channel_iter *i, int status)
990 {
991 	struct nvmf_tgt_pause_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
992 
993 	ctx->tgt->state = NVMF_TGT_PAUSED;
994 
995 	ctx->cb_fn(ctx->cb_arg, status);
996 	free(ctx);
997 }
998 
999 static void
1000 _nvmf_tgt_pause_polling(struct spdk_io_channel_iter *i)
1001 {
1002 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
1003 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
1004 
1005 	spdk_poller_unregister(&group->poller);
1006 
1007 	spdk_for_each_channel_continue(i, 0);
1008 }
1009 
1010 int
1011 spdk_nvmf_tgt_pause_polling(struct spdk_nvmf_tgt *tgt, spdk_nvmf_tgt_pause_polling_cb_fn cb_fn,
1012 			    void *cb_arg)
1013 {
1014 	struct nvmf_tgt_pause_ctx *ctx;
1015 
1016 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_pause_polling, tgt, tgt->name);
1017 
1018 	switch (tgt->state) {
1019 	case NVMF_TGT_PAUSING:
1020 	case NVMF_TGT_RESUMING:
1021 		return -EBUSY;
1022 	case NVMF_TGT_RUNNING:
1023 		break;
1024 	default:
1025 		return -EINVAL;
1026 	}
1027 
1028 	ctx = calloc(1, sizeof(*ctx));
1029 	if (!ctx) {
1030 		return -ENOMEM;
1031 	}
1032 
1033 
1034 	tgt->state = NVMF_TGT_PAUSING;
1035 
1036 	ctx->tgt = tgt;
1037 	ctx->cb_fn = cb_fn;
1038 	ctx->cb_arg = cb_arg;
1039 
1040 	spdk_for_each_channel(tgt,
1041 			      _nvmf_tgt_pause_polling,
1042 			      ctx,
1043 			      _nvmf_tgt_pause_polling_done);
1044 	return 0;
1045 }
1046 
1047 static void
1048 _nvmf_tgt_resume_polling_done(struct spdk_io_channel_iter *i, int status)
1049 {
1050 	struct nvmf_tgt_pause_ctx *ctx = spdk_io_channel_iter_get_ctx(i);
1051 
1052 	ctx->tgt->state = NVMF_TGT_RUNNING;
1053 
1054 	ctx->cb_fn(ctx->cb_arg, status);
1055 	free(ctx);
1056 }
1057 
1058 static void
1059 _nvmf_tgt_resume_polling(struct spdk_io_channel_iter *i)
1060 {
1061 	struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
1062 	struct spdk_nvmf_poll_group *group = spdk_io_channel_get_ctx(ch);
1063 
1064 	assert(group->poller == NULL);
1065 	group->poller = SPDK_POLLER_REGISTER(nvmf_poll_group_poll, group, 0);
1066 
1067 	spdk_for_each_channel_continue(i, 0);
1068 }
1069 
1070 int
1071 spdk_nvmf_tgt_resume_polling(struct spdk_nvmf_tgt *tgt, spdk_nvmf_tgt_resume_polling_cb_fn cb_fn,
1072 			     void *cb_arg)
1073 {
1074 	struct nvmf_tgt_pause_ctx *ctx;
1075 
1076 	SPDK_DTRACE_PROBE2_TICKS(nvmf_tgt_resume_polling, tgt, tgt->name);
1077 
1078 	switch (tgt->state) {
1079 	case NVMF_TGT_PAUSING:
1080 	case NVMF_TGT_RESUMING:
1081 		return -EBUSY;
1082 	case NVMF_TGT_PAUSED:
1083 		break;
1084 	default:
1085 		return -EINVAL;
1086 	}
1087 
1088 	ctx = calloc(1, sizeof(*ctx));
1089 	if (!ctx) {
1090 		return -ENOMEM;
1091 	}
1092 
1093 	tgt->state = NVMF_TGT_RESUMING;
1094 
1095 	ctx->tgt = tgt;
1096 	ctx->cb_fn = cb_fn;
1097 	ctx->cb_arg = cb_arg;
1098 
1099 	spdk_for_each_channel(tgt,
1100 			      _nvmf_tgt_resume_polling,
1101 			      ctx,
1102 			      _nvmf_tgt_resume_polling_done);
1103 	return 0;
1104 }
1105 
1106 struct spdk_nvmf_subsystem *
1107 spdk_nvmf_tgt_find_subsystem(struct spdk_nvmf_tgt *tgt, const char *subnqn)
1108 {
1109 	struct spdk_nvmf_subsystem subsystem;
1110 
1111 	if (!subnqn) {
1112 		return NULL;
1113 	}
1114 
1115 	/* Ensure that subnqn is null terminated */
1116 	if (!memchr(subnqn, '\0', SPDK_NVMF_NQN_MAX_LEN + 1)) {
1117 		SPDK_ERRLOG("Connect SUBNQN is not null terminated\n");
1118 		return NULL;
1119 	}
1120 
1121 	snprintf(subsystem.subnqn, sizeof(subsystem.subnqn), "%s", subnqn);
1122 	return RB_FIND(subsystem_tree, &tgt->subsystems, &subsystem);
1123 }
1124 
1125 struct spdk_nvmf_transport *
1126 spdk_nvmf_tgt_get_transport(struct spdk_nvmf_tgt *tgt, const char *transport_name)
1127 {
1128 	struct spdk_nvmf_transport *transport;
1129 
1130 	TAILQ_FOREACH(transport, &tgt->transports, link) {
1131 		if (!strncasecmp(transport->ops->name, transport_name, SPDK_NVMF_TRSTRING_MAX_LEN)) {
1132 			return transport;
1133 		}
1134 	}
1135 	return NULL;
1136 }
1137 
/*
 * Message payload sent by spdk_nvmf_tgt_new_qpair() to the chosen poll group's
 * thread; it is freed by the receiver, _nvmf_poll_group_add().
 */
struct nvmf_new_qpair_ctx {
	/* Queue pair that should be added to the poll group. */
	struct spdk_nvmf_qpair *qpair;
	/* Poll group selected for the queue pair. */
	struct spdk_nvmf_poll_group *group;
};
1142 
1143 static void
1144 _nvmf_poll_group_add(void *_ctx)
1145 {
1146 	struct nvmf_new_qpair_ctx *ctx = _ctx;
1147 	struct spdk_nvmf_qpair *qpair = ctx->qpair;
1148 	struct spdk_nvmf_poll_group *group = ctx->group;
1149 
1150 	free(_ctx);
1151 
1152 	if (spdk_nvmf_poll_group_add(group, qpair) != 0) {
1153 		SPDK_ERRLOG("Unable to add the qpair to a poll group.\n");
1154 		spdk_nvmf_qpair_disconnect(qpair);
1155 	}
1156 }
1157 
1158 void
1159 spdk_nvmf_tgt_new_qpair(struct spdk_nvmf_tgt *tgt, struct spdk_nvmf_qpair *qpair)
1160 {
1161 	struct spdk_nvmf_poll_group *group;
1162 	struct nvmf_new_qpair_ctx *ctx;
1163 
1164 	group = spdk_nvmf_get_optimal_poll_group(qpair);
1165 	if (group == NULL) {
1166 		if (tgt->next_poll_group == NULL) {
1167 			tgt->next_poll_group = TAILQ_FIRST(&tgt->poll_groups);
1168 			if (tgt->next_poll_group == NULL) {
1169 				SPDK_ERRLOG("No poll groups exist.\n");
1170 				spdk_nvmf_qpair_disconnect(qpair);
1171 				return;
1172 			}
1173 		}
1174 		group = tgt->next_poll_group;
1175 		tgt->next_poll_group = TAILQ_NEXT(group, link);
1176 	}
1177 
1178 	ctx = calloc(1, sizeof(*ctx));
1179 	if (!ctx) {
1180 		SPDK_ERRLOG("Unable to send message to poll group.\n");
1181 		spdk_nvmf_qpair_disconnect(qpair);
1182 		return;
1183 	}
1184 
1185 	ctx->qpair = qpair;
1186 	ctx->group = group;
1187 
1188 	pthread_mutex_lock(&group->mutex);
1189 	group->current_unassociated_qpairs++;
1190 	pthread_mutex_unlock(&group->mutex);
1191 
1192 	spdk_thread_send_msg(group->thread, _nvmf_poll_group_add, ctx);
1193 }
1194 
/*
 * Obtain the poll group for the target by getting an I/O channel for it; the poll
 * group is the channel's context. Returns NULL if no channel could be obtained.
 */
struct spdk_nvmf_poll_group *
spdk_nvmf_poll_group_create(struct spdk_nvmf_tgt *tgt)
{
	struct spdk_io_channel *channel = spdk_get_io_channel(tgt);

	if (channel == NULL) {
		SPDK_ERRLOG("Unable to get I/O channel for target\n");
		return NULL;
	}

	return spdk_io_channel_get_ctx(channel);
}
1208 
1209 void
1210 spdk_nvmf_poll_group_destroy(struct spdk_nvmf_poll_group *group,
1211 			     spdk_nvmf_poll_group_destroy_done_fn cb_fn,
1212 			     void *cb_arg)
1213 {
1214 	assert(group->destroy_cb_fn == NULL);
1215 	group->destroy_cb_fn = cb_fn;
1216 	group->destroy_cb_arg = cb_arg;
1217 
1218 	/* This function will put the io_channel associated with this poll group */
1219 	nvmf_tgt_destroy_poll_group_qpairs(group);
1220 }
1221 
1222 int
1223 spdk_nvmf_poll_group_add(struct spdk_nvmf_poll_group *group,
1224 			 struct spdk_nvmf_qpair *qpair)
1225 {
1226 	int rc;
1227 	struct spdk_nvmf_transport_poll_group *tgroup;
1228 
1229 	TAILQ_INIT(&qpair->outstanding);
1230 	qpair->group = group;
1231 	qpair->ctrlr = NULL;
1232 	qpair->disconnect_started = false;
1233 
1234 	tgroup = nvmf_get_transport_poll_group(group, qpair->transport);
1235 	if (tgroup == NULL) {
1236 		return -1;
1237 	}
1238 
1239 	rc = nvmf_transport_poll_group_add(tgroup, qpair);
1240 
1241 	/* We add the qpair to the group only it is successfully added into the tgroup */
1242 	if (rc == 0) {
1243 		SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_add_qpair, qpair, spdk_thread_get_id(group->thread));
1244 		TAILQ_INSERT_TAIL(&group->qpairs, qpair, link);
1245 		nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_CONNECTING);
1246 	}
1247 
1248 	return rc;
1249 }
1250 
/* Message-handler adapter: ctx is the controller to pass to nvmf_ctrlr_destruct(). */
static void
_nvmf_ctrlr_destruct(void *ctx)
{
	nvmf_ctrlr_destruct((struct spdk_nvmf_ctrlr *)ctx);
}
1258 
1259 static void
1260 _nvmf_ctrlr_free_from_qpair(void *ctx)
1261 {
1262 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1263 	struct spdk_nvmf_ctrlr *ctrlr = qpair_ctx->ctrlr;
1264 	uint32_t count;
1265 
1266 	spdk_bit_array_clear(ctrlr->qpair_mask, qpair_ctx->qid);
1267 	SPDK_DEBUGLOG(nvmf, "qpair_mask cleared, qid %u\n", qpair_ctx->qid);
1268 	count = spdk_bit_array_count_set(ctrlr->qpair_mask);
1269 	if (count == 0) {
1270 		assert(!ctrlr->in_destruct);
1271 		SPDK_DEBUGLOG(nvmf, "Last qpair %u, destroy ctrlr 0x%hx\n", qpair_ctx->qid, ctrlr->cntlid);
1272 		ctrlr->in_destruct = true;
1273 		spdk_thread_send_msg(ctrlr->subsys->thread, _nvmf_ctrlr_destruct, ctrlr);
1274 	}
1275 	free(qpair_ctx);
1276 }
1277 
1278 static void
1279 _nvmf_transport_qpair_fini_complete(void *cb_ctx)
1280 {
1281 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = cb_ctx;
1282 	struct spdk_nvmf_ctrlr *ctrlr;
1283 
1284 	ctrlr = qpair_ctx->ctrlr;
1285 	SPDK_DEBUGLOG(nvmf, "Finish destroying qid %u\n", qpair_ctx->qid);
1286 
1287 	if (ctrlr) {
1288 		if (qpair_ctx->qid == 0) {
1289 			/* Admin qpair is removed, so set the pointer to NULL.
1290 			 * This operation is safe since we are on ctrlr thread now, admin qpair's thread is the same
1291 			 * as controller's thread */
1292 			assert(ctrlr->thread == spdk_get_thread());
1293 			ctrlr->admin_qpair = NULL;
1294 		}
1295 		/* Free qpair id from controller's bit mask and destroy the controller if it is the last qpair */
1296 		if (ctrlr->thread) {
1297 			spdk_thread_send_msg(ctrlr->thread, _nvmf_ctrlr_free_from_qpair, qpair_ctx);
1298 		} else {
1299 			_nvmf_ctrlr_free_from_qpair(qpair_ctx);
1300 		}
1301 	} else {
1302 		free(qpair_ctx);
1303 	}
1304 }
1305 
1306 void
1307 spdk_nvmf_poll_group_remove(struct spdk_nvmf_qpair *qpair)
1308 {
1309 	struct spdk_nvmf_transport_poll_group *tgroup;
1310 	int rc;
1311 
1312 	SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_remove_qpair, qpair,
1313 				 spdk_thread_get_id(qpair->group->thread));
1314 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_ERROR);
1315 
1316 	/* Find the tgroup and remove the qpair from the tgroup */
1317 	tgroup = nvmf_get_transport_poll_group(qpair->group, qpair->transport);
1318 	if (tgroup != NULL) {
1319 		rc = nvmf_transport_poll_group_remove(tgroup, qpair);
1320 		if (rc && (rc != ENOTSUP)) {
1321 			SPDK_ERRLOG("Cannot remove qpair=%p from transport group=%p\n",
1322 				    qpair, tgroup);
1323 		}
1324 	}
1325 
1326 	TAILQ_REMOVE(&qpair->group->qpairs, qpair, link);
1327 	qpair->group = NULL;
1328 }
1329 
1330 static void
1331 _nvmf_qpair_sgroup_req_clean(struct spdk_nvmf_subsystem_poll_group *sgroup,
1332 			     const struct spdk_nvmf_qpair *qpair)
1333 {
1334 	struct spdk_nvmf_request *req, *tmp;
1335 	TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1336 		if (req->qpair == qpair) {
1337 			TAILQ_REMOVE(&sgroup->queued, req, link);
1338 			if (nvmf_transport_req_free(req)) {
1339 				SPDK_ERRLOG("Transport request free error!\n");
1340 			}
1341 		}
1342 	}
1343 }
1344 
1345 static void
1346 _nvmf_qpair_destroy(void *ctx, int status)
1347 {
1348 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1349 	struct spdk_nvmf_qpair *qpair = qpair_ctx->qpair;
1350 	struct spdk_nvmf_ctrlr *ctrlr = qpair->ctrlr;
1351 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1352 	uint32_t sid;
1353 
1354 	assert(qpair->state == SPDK_NVMF_QPAIR_DEACTIVATING);
1355 	qpair_ctx->qid = qpair->qid;
1356 
1357 	if (qpair->connect_received) {
1358 		if (0 == qpair->qid) {
1359 			assert(qpair->group->stat.current_admin_qpairs > 0);
1360 			qpair->group->stat.current_admin_qpairs--;
1361 		} else {
1362 			assert(qpair->group->stat.current_io_qpairs > 0);
1363 			qpair->group->stat.current_io_qpairs--;
1364 		}
1365 	} else {
1366 		pthread_mutex_lock(&qpair->group->mutex);
1367 		qpair->group->current_unassociated_qpairs--;
1368 		pthread_mutex_unlock(&qpair->group->mutex);
1369 	}
1370 
1371 	if (ctrlr) {
1372 		sgroup = &qpair->group->sgroups[ctrlr->subsys->id];
1373 		_nvmf_qpair_sgroup_req_clean(sgroup, qpair);
1374 	} else {
1375 		for (sid = 0; sid < qpair->group->num_sgroups; sid++) {
1376 			sgroup = &qpair->group->sgroups[sid];
1377 			assert(sgroup != NULL);
1378 			_nvmf_qpair_sgroup_req_clean(sgroup, qpair);
1379 		}
1380 	}
1381 
1382 	nvmf_qpair_auth_destroy(qpair);
1383 	qpair_ctx->ctrlr = ctrlr;
1384 	spdk_nvmf_poll_group_remove(qpair);
1385 	nvmf_transport_qpair_fini(qpair, _nvmf_transport_qpair_fini_complete, qpair_ctx);
1386 }
1387 
1388 static void
1389 _nvmf_qpair_disconnect_msg(void *ctx)
1390 {
1391 	struct nvmf_qpair_disconnect_ctx *qpair_ctx = ctx;
1392 
1393 	spdk_nvmf_qpair_disconnect(qpair_ctx->qpair);
1394 	free(ctx);
1395 }
1396 
1397 int
1398 spdk_nvmf_qpair_disconnect(struct spdk_nvmf_qpair *qpair)
1399 {
1400 	struct spdk_nvmf_poll_group *group = qpair->group;
1401 	struct nvmf_qpair_disconnect_ctx *qpair_ctx;
1402 
1403 	if (__atomic_test_and_set(&qpair->disconnect_started, __ATOMIC_RELAXED)) {
1404 		return -EINPROGRESS;
1405 	}
1406 
1407 	/* If we get a qpair in the uninitialized state, we can just destroy it immediately */
1408 	if (qpair->state == SPDK_NVMF_QPAIR_UNINITIALIZED) {
1409 		nvmf_transport_qpair_fini(qpair, NULL, NULL);
1410 		return 0;
1411 	}
1412 
1413 	assert(group != NULL);
1414 	if (spdk_get_thread() != group->thread) {
1415 		/* clear the atomic so we can set it on the next call on the proper thread. */
1416 		__atomic_clear(&qpair->disconnect_started, __ATOMIC_RELAXED);
1417 		qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1418 		if (!qpair_ctx) {
1419 			SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1420 			return -ENOMEM;
1421 		}
1422 		qpair_ctx->qpair = qpair;
1423 		spdk_thread_send_msg(group->thread, _nvmf_qpair_disconnect_msg, qpair_ctx);
1424 		return 0;
1425 	}
1426 
1427 	SPDK_DTRACE_PROBE2_TICKS(nvmf_qpair_disconnect, qpair, spdk_thread_get_id(group->thread));
1428 	assert(spdk_nvmf_qpair_is_active(qpair));
1429 	nvmf_qpair_set_state(qpair, SPDK_NVMF_QPAIR_DEACTIVATING);
1430 
1431 	qpair_ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_ctx));
1432 	if (!qpair_ctx) {
1433 		SPDK_ERRLOG("Unable to allocate context for nvmf_qpair_disconnect\n");
1434 		return -ENOMEM;
1435 	}
1436 
1437 	qpair_ctx->qpair = qpair;
1438 
1439 	/* Check for outstanding I/O */
1440 	if (!TAILQ_EMPTY(&qpair->outstanding)) {
1441 		SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_drain_qpair, qpair, spdk_thread_get_id(group->thread));
1442 		qpair->state_cb = _nvmf_qpair_destroy;
1443 		qpair->state_cb_arg = qpair_ctx;
1444 		nvmf_qpair_abort_pending_zcopy_reqs(qpair);
1445 		nvmf_qpair_free_aer(qpair);
1446 		return 0;
1447 	}
1448 
1449 	_nvmf_qpair_destroy(qpair_ctx, 0);
1450 
1451 	return 0;
1452 }
1453 
1454 int
1455 spdk_nvmf_qpair_get_peer_trid(struct spdk_nvmf_qpair *qpair,
1456 			      struct spdk_nvme_transport_id *trid)
1457 {
1458 	memset(trid, 0, sizeof(*trid));
1459 	return nvmf_transport_qpair_get_peer_trid(qpair, trid);
1460 }
1461 
1462 int
1463 spdk_nvmf_qpair_get_local_trid(struct spdk_nvmf_qpair *qpair,
1464 			       struct spdk_nvme_transport_id *trid)
1465 {
1466 	memset(trid, 0, sizeof(*trid));
1467 	return nvmf_transport_qpair_get_local_trid(qpair, trid);
1468 }
1469 
1470 int
1471 spdk_nvmf_qpair_get_listen_trid(struct spdk_nvmf_qpair *qpair,
1472 				struct spdk_nvme_transport_id *trid)
1473 {
1474 	memset(trid, 0, sizeof(*trid));
1475 	return nvmf_transport_qpair_get_listen_trid(qpair, trid);
1476 }
1477 
1478 static int
1479 poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
1480 			    struct spdk_nvmf_subsystem *subsystem)
1481 {
1482 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1483 	uint32_t i, j;
1484 	struct spdk_nvmf_ns *ns;
1485 	struct spdk_nvmf_registrant *reg, *tmp;
1486 	struct spdk_io_channel *ch;
1487 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info;
1488 	struct spdk_nvmf_ctrlr *ctrlr;
1489 	bool ns_changed;
1490 
1491 	/* Make sure our poll group has memory for this subsystem allocated */
1492 	if (subsystem->id >= group->num_sgroups) {
1493 		return -ENOMEM;
1494 	}
1495 
1496 	sgroup = &group->sgroups[subsystem->id];
1497 
1498 	/* Make sure the array of namespace information is the correct size */
1499 	if (sgroup->num_ns == 0 && subsystem->max_nsid > 0) {
1500 		/* First allocation */
1501 		sgroup->ns_info = calloc(subsystem->max_nsid, sizeof(struct spdk_nvmf_subsystem_pg_ns_info));
1502 		if (!sgroup->ns_info) {
1503 			return -ENOMEM;
1504 		}
1505 		sgroup->num_ns = subsystem->max_nsid;
1506 	}
1507 
1508 	ns_changed = false;
1509 
1510 	/* Detect bdevs that were added or removed */
1511 	for (i = 0; i < sgroup->num_ns; i++) {
1512 		ns = subsystem->ns[i];
1513 		ns_info = &sgroup->ns_info[i];
1514 		ch = ns_info->channel;
1515 
1516 		if (ns == NULL && ch == NULL) {
1517 			/* Both NULL. Leave empty */
1518 		} else if (ns == NULL && ch != NULL) {
1519 			/* There was a channel here, but the namespace is gone. */
1520 			ns_changed = true;
1521 			spdk_put_io_channel(ch);
1522 			ns_info->channel = NULL;
1523 		} else if (ns != NULL && ch == NULL) {
1524 			/* A namespace appeared but there is no channel yet */
1525 			ns_changed = true;
1526 			ch = spdk_bdev_get_io_channel(ns->desc);
1527 			if (ch == NULL) {
1528 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1529 				return -ENOMEM;
1530 			}
1531 			ns_info->channel = ch;
1532 		} else if (spdk_uuid_compare(&ns_info->uuid, spdk_bdev_get_uuid(ns->bdev)) != 0) {
1533 			/* A namespace was here before, but was replaced by a new one. */
1534 			ns_changed = true;
1535 			spdk_put_io_channel(ns_info->channel);
1536 			memset(ns_info, 0, sizeof(*ns_info));
1537 
1538 			ch = spdk_bdev_get_io_channel(ns->desc);
1539 			if (ch == NULL) {
1540 				SPDK_ERRLOG("Could not allocate I/O channel.\n");
1541 				return -ENOMEM;
1542 			}
1543 			ns_info->channel = ch;
1544 		} else if (ns_info->num_blocks != spdk_bdev_get_num_blocks(ns->bdev)) {
1545 			/* Namespace is still there but size has changed */
1546 			SPDK_DEBUGLOG(nvmf, "Namespace resized: subsystem_id %u,"
1547 				      " nsid %u, pg %p, old %" PRIu64 ", new %" PRIu64 "\n",
1548 				      subsystem->id,
1549 				      ns->nsid,
1550 				      group,
1551 				      ns_info->num_blocks,
1552 				      spdk_bdev_get_num_blocks(ns->bdev));
1553 			ns_changed = true;
1554 		}
1555 
1556 		if (ns == NULL) {
1557 			memset(ns_info, 0, sizeof(*ns_info));
1558 		} else {
1559 			ns_info->uuid = *spdk_bdev_get_uuid(ns->bdev);
1560 			ns_info->num_blocks = spdk_bdev_get_num_blocks(ns->bdev);
1561 			ns_info->crkey = ns->crkey;
1562 			ns_info->rtype = ns->rtype;
1563 			if (ns->holder) {
1564 				ns_info->holder_id = ns->holder->hostid;
1565 			}
1566 
1567 			memset(&ns_info->reg_hostid, 0, SPDK_NVMF_MAX_NUM_REGISTRANTS * sizeof(struct spdk_uuid));
1568 			j = 0;
1569 			TAILQ_FOREACH_SAFE(reg, &ns->registrants, link, tmp) {
1570 				if (j >= SPDK_NVMF_MAX_NUM_REGISTRANTS) {
1571 					SPDK_ERRLOG("Maximum %u registrants can support.\n", SPDK_NVMF_MAX_NUM_REGISTRANTS);
1572 					return -EINVAL;
1573 				}
1574 				ns_info->reg_hostid[j++] = reg->hostid;
1575 			}
1576 		}
1577 	}
1578 
1579 	if (ns_changed) {
1580 		TAILQ_FOREACH(ctrlr, &subsystem->ctrlrs, link) {
1581 			if (ctrlr->thread != spdk_get_thread()) {
1582 				continue;
1583 			}
1584 			/* It is possible that a ctrlr was added but the admin_qpair hasn't been
1585 			 * assigned yet.
1586 			 */
1587 			if (!ctrlr->admin_qpair) {
1588 				continue;
1589 			}
1590 			if (ctrlr->admin_qpair->group == group) {
1591 				nvmf_ctrlr_async_event_ns_notice(ctrlr);
1592 				nvmf_ctrlr_async_event_ana_change_notice(ctrlr);
1593 			}
1594 		}
1595 	}
1596 
1597 	return 0;
1598 }
1599 
/*
 * Non-static entry point for poll_group_update_subsystem(); forwards both
 * arguments and returns its result unchanged.
 */
int
nvmf_poll_group_update_subsystem(struct spdk_nvmf_poll_group *group,
				 struct spdk_nvmf_subsystem *subsystem)
{
	int rc = poll_group_update_subsystem(group, subsystem);

	return rc;
}
1606 
1607 int
1608 nvmf_poll_group_add_subsystem(struct spdk_nvmf_poll_group *group,
1609 			      struct spdk_nvmf_subsystem *subsystem,
1610 			      spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1611 {
1612 	int rc = 0;
1613 	struct spdk_nvmf_subsystem_poll_group *sgroup = &group->sgroups[subsystem->id];
1614 	struct spdk_nvmf_request *req, *tmp;
1615 	uint32_t i;
1616 
1617 	if (!TAILQ_EMPTY(&sgroup->queued)) {
1618 		SPDK_ERRLOG("sgroup->queued not empty when adding subsystem\n");
1619 		TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1620 			TAILQ_REMOVE(&sgroup->queued, req, link);
1621 			if (nvmf_transport_req_free(req)) {
1622 				SPDK_ERRLOG("Transport request free error!\n");
1623 			}
1624 		}
1625 	}
1626 
1627 	rc = poll_group_update_subsystem(group, subsystem);
1628 	if (rc) {
1629 		nvmf_poll_group_remove_subsystem(group, subsystem, NULL, NULL);
1630 		goto fini;
1631 	}
1632 
1633 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1634 
1635 	for (i = 0; i < sgroup->num_ns; i++) {
1636 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1637 	}
1638 
1639 fini:
1640 	if (cb_fn) {
1641 		cb_fn(cb_arg, rc);
1642 	}
1643 
1644 	SPDK_DTRACE_PROBE2_TICKS(nvmf_poll_group_add_subsystem, spdk_thread_get_id(group->thread),
1645 				 subsystem->subnqn);
1646 
1647 	return rc;
1648 }
1649 
1650 static void
1651 _nvmf_poll_group_remove_subsystem_cb(void *ctx, int status)
1652 {
1653 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1654 	struct spdk_nvmf_subsystem *subsystem;
1655 	struct spdk_nvmf_poll_group *group;
1656 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1657 	spdk_nvmf_poll_group_mod_done cpl_fn = NULL;
1658 	void *cpl_ctx = NULL;
1659 	uint32_t nsid;
1660 
1661 	group = qpair_ctx->group;
1662 	subsystem = qpair_ctx->subsystem;
1663 	cpl_fn = qpair_ctx->cpl_fn;
1664 	cpl_ctx = qpair_ctx->cpl_ctx;
1665 	sgroup = &group->sgroups[subsystem->id];
1666 
1667 	if (status) {
1668 		goto fini;
1669 	}
1670 
1671 	for (nsid = 0; nsid < sgroup->num_ns; nsid++) {
1672 		if (sgroup->ns_info[nsid].channel) {
1673 			spdk_put_io_channel(sgroup->ns_info[nsid].channel);
1674 			sgroup->ns_info[nsid].channel = NULL;
1675 		}
1676 	}
1677 
1678 	sgroup->num_ns = 0;
1679 	free(sgroup->ns_info);
1680 	sgroup->ns_info = NULL;
1681 fini:
1682 	free(qpair_ctx);
1683 	if (cpl_fn) {
1684 		cpl_fn(cpl_ctx, status);
1685 	}
1686 }
1687 
1688 static void nvmf_poll_group_remove_subsystem_msg(void *ctx);
1689 
1690 static void
1691 nvmf_poll_group_remove_subsystem_msg(void *ctx)
1692 {
1693 	struct spdk_nvmf_qpair *qpair, *qpair_tmp;
1694 	struct spdk_nvmf_subsystem *subsystem;
1695 	struct spdk_nvmf_poll_group *group;
1696 	struct nvmf_qpair_disconnect_many_ctx *qpair_ctx = ctx;
1697 	bool qpairs_found = false;
1698 	int rc = 0;
1699 
1700 	group = qpair_ctx->group;
1701 	subsystem = qpair_ctx->subsystem;
1702 
1703 	TAILQ_FOREACH_SAFE(qpair, &group->qpairs, link, qpair_tmp) {
1704 		if ((qpair->ctrlr != NULL) && (qpair->ctrlr->subsys == subsystem)) {
1705 			qpairs_found = true;
1706 			rc = spdk_nvmf_qpair_disconnect(qpair);
1707 			if (rc && rc != -EINPROGRESS) {
1708 				break;
1709 			}
1710 		}
1711 	}
1712 
1713 	if (!qpairs_found) {
1714 		_nvmf_poll_group_remove_subsystem_cb(ctx, 0);
1715 		return;
1716 	}
1717 
1718 	/* Some qpairs are in process of being disconnected. Send a message and try to remove them again */
1719 	spdk_thread_send_msg(spdk_get_thread(), nvmf_poll_group_remove_subsystem_msg, ctx);
1720 }
1721 
1722 void
1723 nvmf_poll_group_remove_subsystem(struct spdk_nvmf_poll_group *group,
1724 				 struct spdk_nvmf_subsystem *subsystem,
1725 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1726 {
1727 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1728 	struct nvmf_qpair_disconnect_many_ctx *ctx;
1729 	uint32_t i;
1730 
1731 	SPDK_DTRACE_PROBE3_TICKS(nvmf_poll_group_remove_subsystem, group, spdk_thread_get_id(group->thread),
1732 				 subsystem->subnqn);
1733 
1734 	ctx = calloc(1, sizeof(struct nvmf_qpair_disconnect_many_ctx));
1735 	if (!ctx) {
1736 		SPDK_ERRLOG("Unable to allocate memory for context to remove poll subsystem\n");
1737 		if (cb_fn) {
1738 			cb_fn(cb_arg, -1);
1739 		}
1740 		return;
1741 	}
1742 
1743 	ctx->group = group;
1744 	ctx->subsystem = subsystem;
1745 	ctx->cpl_fn = cb_fn;
1746 	ctx->cpl_ctx = cb_arg;
1747 
1748 	sgroup = &group->sgroups[subsystem->id];
1749 	sgroup->state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1750 
1751 	for (i = 0; i < sgroup->num_ns; i++) {
1752 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_INACTIVE;
1753 	}
1754 
1755 	nvmf_poll_group_remove_subsystem_msg(ctx);
1756 }
1757 
1758 void
1759 nvmf_poll_group_pause_subsystem(struct spdk_nvmf_poll_group *group,
1760 				struct spdk_nvmf_subsystem *subsystem,
1761 				uint32_t nsid,
1762 				spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1763 {
1764 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1765 	struct spdk_nvmf_subsystem_pg_ns_info *ns_info = NULL;
1766 	int rc = 0;
1767 	uint32_t i;
1768 
1769 	if (subsystem->id >= group->num_sgroups) {
1770 		rc = -1;
1771 		goto fini;
1772 	}
1773 
1774 	sgroup = &group->sgroups[subsystem->id];
1775 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_PAUSED) {
1776 		goto fini;
1777 	}
1778 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1779 
1780 	if (nsid == SPDK_NVME_GLOBAL_NS_TAG) {
1781 		for (i = 0; i < sgroup->num_ns; i++) {
1782 			ns_info = &sgroup->ns_info[i];
1783 			ns_info->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1784 		}
1785 	} else {
1786 		/* NOTE: This implicitly also checks for 0, since 0 - 1 wraps around to UINT32_MAX. */
1787 		if (nsid - 1 < sgroup->num_ns) {
1788 			ns_info  = &sgroup->ns_info[nsid - 1];
1789 			ns_info->state = SPDK_NVMF_SUBSYSTEM_PAUSING;
1790 		}
1791 	}
1792 
1793 	if (sgroup->mgmt_io_outstanding > 0) {
1794 		assert(sgroup->cb_fn == NULL);
1795 		sgroup->cb_fn = cb_fn;
1796 		assert(sgroup->cb_arg == NULL);
1797 		sgroup->cb_arg = cb_arg;
1798 		return;
1799 	}
1800 
1801 	if (nsid == SPDK_NVME_GLOBAL_NS_TAG) {
1802 		for (i = 0; i < sgroup->num_ns; i++) {
1803 			ns_info = &sgroup->ns_info[i];
1804 
1805 			if (ns_info->io_outstanding > 0) {
1806 				assert(sgroup->cb_fn == NULL);
1807 				sgroup->cb_fn = cb_fn;
1808 				assert(sgroup->cb_arg == NULL);
1809 				sgroup->cb_arg = cb_arg;
1810 				return;
1811 			}
1812 		}
1813 	} else {
1814 		if (ns_info != NULL && ns_info->io_outstanding > 0) {
1815 			assert(sgroup->cb_fn == NULL);
1816 			sgroup->cb_fn = cb_fn;
1817 			assert(sgroup->cb_arg == NULL);
1818 			sgroup->cb_arg = cb_arg;
1819 			return;
1820 		}
1821 	}
1822 
1823 	assert(sgroup->mgmt_io_outstanding == 0);
1824 	sgroup->state = SPDK_NVMF_SUBSYSTEM_PAUSED;
1825 fini:
1826 	if (cb_fn) {
1827 		cb_fn(cb_arg, rc);
1828 	}
1829 }
1830 
1831 void
1832 nvmf_poll_group_resume_subsystem(struct spdk_nvmf_poll_group *group,
1833 				 struct spdk_nvmf_subsystem *subsystem,
1834 				 spdk_nvmf_poll_group_mod_done cb_fn, void *cb_arg)
1835 {
1836 	struct spdk_nvmf_request *req, *tmp;
1837 	struct spdk_nvmf_subsystem_poll_group *sgroup;
1838 	int rc = 0;
1839 	uint32_t i;
1840 
1841 	if (subsystem->id >= group->num_sgroups) {
1842 		rc = -1;
1843 		goto fini;
1844 	}
1845 
1846 	sgroup = &group->sgroups[subsystem->id];
1847 
1848 	if (sgroup->state == SPDK_NVMF_SUBSYSTEM_ACTIVE) {
1849 		goto fini;
1850 	}
1851 
1852 	rc = poll_group_update_subsystem(group, subsystem);
1853 	if (rc) {
1854 		goto fini;
1855 	}
1856 
1857 	for (i = 0; i < sgroup->num_ns; i++) {
1858 		sgroup->ns_info[i].state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1859 	}
1860 
1861 	sgroup->state = SPDK_NVMF_SUBSYSTEM_ACTIVE;
1862 
1863 	/* Release all queued requests */
1864 	TAILQ_FOREACH_SAFE(req, &sgroup->queued, link, tmp) {
1865 		TAILQ_REMOVE(&sgroup->queued, req, link);
1866 		if (spdk_nvmf_request_using_zcopy(req)) {
1867 			spdk_nvmf_request_zcopy_start(req);
1868 		} else {
1869 			spdk_nvmf_request_exec(req);
1870 		}
1871 
1872 	}
1873 fini:
1874 	if (cb_fn) {
1875 		cb_fn(cb_arg, rc);
1876 	}
1877 }
1878 
1879 
1880 struct spdk_nvmf_poll_group *
1881 spdk_nvmf_get_optimal_poll_group(struct spdk_nvmf_qpair *qpair)
1882 {
1883 	struct spdk_nvmf_transport_poll_group *tgroup;
1884 
1885 	tgroup = nvmf_transport_get_optimal_poll_group(qpair->transport, qpair);
1886 
1887 	if (tgroup == NULL) {
1888 		return NULL;
1889 	}
1890 
1891 	return tgroup->group;
1892 }
1893 
1894 void
1895 spdk_nvmf_poll_group_dump_stat(struct spdk_nvmf_poll_group *group, struct spdk_json_write_ctx *w)
1896 {
1897 	struct spdk_nvmf_transport_poll_group *tgroup;
1898 
1899 	spdk_json_write_object_begin(w);
1900 
1901 	spdk_json_write_named_string(w, "name", spdk_thread_get_name(spdk_get_thread()));
1902 	spdk_json_write_named_uint32(w, "admin_qpairs", group->stat.admin_qpairs);
1903 	spdk_json_write_named_uint32(w, "io_qpairs", group->stat.io_qpairs);
1904 	spdk_json_write_named_uint32(w, "current_admin_qpairs", group->stat.current_admin_qpairs);
1905 	spdk_json_write_named_uint32(w, "current_io_qpairs", group->stat.current_io_qpairs);
1906 	spdk_json_write_named_uint64(w, "pending_bdev_io", group->stat.pending_bdev_io);
1907 	spdk_json_write_named_uint64(w, "completed_nvme_io", group->stat.completed_nvme_io);
1908 
1909 	spdk_json_write_named_array_begin(w, "transports");
1910 
1911 	TAILQ_FOREACH(tgroup, &group->tgroups, link) {
1912 		spdk_json_write_object_begin(w);
1913 		/*
1914 		 * The trtype field intentionally contains a transport name as this is more informative.
1915 		 * The field has not been renamed for backward compatibility.
1916 		 */
1917 		spdk_json_write_named_string(w, "trtype", spdk_nvmf_get_transport_name(tgroup->transport));
1918 
1919 		if (tgroup->transport->ops->poll_group_dump_stat) {
1920 			tgroup->transport->ops->poll_group_dump_stat(tgroup, w);
1921 		}
1922 
1923 		spdk_json_write_object_end(w);
1924 	}
1925 
1926 	spdk_json_write_array_end(w);
1927 	spdk_json_write_object_end(w);
1928 }
1929