1 /* Fork a Unix child process, and set up to debug it, for GDB and GDBserver. 2 3 Copyright (C) 1990-2023 Free Software Foundation, Inc. 4 5 This file is part of GDB. 6 7 This program is free software; you can redistribute it and/or modify 8 it under the terms of the GNU General Public License as published by 9 the Free Software Foundation; either version 3 of the License, or 10 (at your option) any later version. 11 12 This program is distributed in the hope that it will be useful, 13 but WITHOUT ANY WARRANTY; without even the implied warranty of 14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15 GNU General Public License for more details. 16 17 You should have received a copy of the GNU General Public License 18 along with this program. If not, see <http://www.gnu.org/licenses/>. */ 19 20 #include "gdbsupport/common-defs.h" 21 #include "fork-inferior.h" 22 #include "target/waitstatus.h" 23 #include "gdbsupport/filestuff.h" 24 #include "target/target.h" 25 #include "gdbsupport/common-inferior.h" 26 #include "gdbsupport/common-gdbthread.h" 27 #include "gdbsupport/pathstuff.h" 28 #include "gdbsupport/signals-state-save-restore.h" 29 #include "gdbsupport/gdb_tilde_expand.h" 30 #include <vector> 31 32 extern char **environ; 33 34 /* Build the argument vector for execv(3). */ 35 36 class execv_argv 37 { 38 public: 39 /* EXEC_FILE is the file to run. ALLARGS is a string containing the 40 arguments to the program. If starting with a shell, SHELL_FILE 41 is the shell to run. Otherwise, SHELL_FILE is NULL. */ 42 execv_argv (const char *exec_file, const std::string &allargs, 43 const char *shell_file); 44 45 /* Return a pointer to the built argv, in the type expected by 46 execv. The result is (only) valid for as long as this execv_argv 47 object is live. We return a "char **" because that's the type 48 that the execv functions expect. Note that it is guaranteed that 49 the execv functions do not modify the argv[] array nor the 50 strings to which the array point. */ 51 char **argv () 52 { 53 return const_cast<char **> (&m_argv[0]); 54 } 55 56 private: 57 DISABLE_COPY_AND_ASSIGN (execv_argv); 58 59 /* Helper methods for constructing the argument vector. */ 60 61 /* Used when building an argv for a straight execv call, without 62 going via the shell. */ 63 void init_for_no_shell (const char *exec_file, 64 const std::string &allargs); 65 66 /* Used when building an argv for execing a shell that execs the 67 child program. */ 68 void init_for_shell (const char *exec_file, 69 const std::string &allargs, 70 const char *shell_file); 71 72 /* The argument vector built. Holds non-owning pointers. Elements 73 either point to the strings passed to the execv_argv ctor, or 74 inside M_STORAGE. */ 75 std::vector<const char *> m_argv; 76 77 /* Storage. In the no-shell case, this contains a copy of the 78 arguments passed to the ctor, split by '\0'. In the shell case, 79 this contains the quoted shell command. I.e., SHELL_COMMAND in 80 {"$SHELL" "-c", SHELL_COMMAND, NULL}. */ 81 std::string m_storage; 82 }; 83 84 /* Create argument vector for straight call to execvp. Breaks up 85 ALLARGS into an argument vector suitable for passing to execvp and 86 stores it in M_ARGV. E.g., on "run a b c d" this routine would get 87 as input the string "a b c d", and as output it would fill in 88 M_ARGV with the four arguments "a", "b", "c", "d". Each argument 89 in M_ARGV points to a substring of a copy of ALLARGS stored in 90 M_STORAGE. */ 91 92 void 93 execv_argv::init_for_no_shell (const char *exec_file, 94 const std::string &allargs) 95 { 96 97 /* Save/work with a copy stored in our storage. The pointers pushed 98 to M_ARGV point directly into M_STORAGE, which is modified in 99 place with the necessary NULL terminators. This avoids N heap 100 allocations and string dups when 1 is sufficient. */ 101 std::string &args_copy = m_storage = allargs; 102 103 m_argv.push_back (exec_file); 104 105 for (size_t cur_pos = 0; cur_pos < args_copy.size ();) 106 { 107 /* Skip whitespace-like chars. */ 108 std::size_t pos = args_copy.find_first_not_of (" \t\n", cur_pos); 109 110 if (pos != std::string::npos) 111 cur_pos = pos; 112 113 /* Find the position of the next separator. */ 114 std::size_t next_sep = args_copy.find_first_of (" \t\n", cur_pos); 115 116 if (next_sep == std::string::npos) 117 { 118 /* No separator found, which means this is the last 119 argument. */ 120 next_sep = args_copy.size (); 121 } 122 else 123 { 124 /* Replace the separator with a terminator. */ 125 args_copy[next_sep++] = '\0'; 126 } 127 128 m_argv.push_back (&args_copy[cur_pos]); 129 130 cur_pos = next_sep; 131 } 132 133 /* NULL-terminate the vector. */ 134 m_argv.push_back (NULL); 135 } 136 137 /* When executing a command under the given shell, return true if the 138 '!' character should be escaped when embedded in a quoted 139 command-line argument. */ 140 141 static bool 142 escape_bang_in_quoted_argument (const char *shell_file) 143 { 144 size_t shell_file_len = strlen (shell_file); 145 146 /* Bang should be escaped only in C Shells. For now, simply check 147 that the shell name ends with 'csh', which covers at least csh 148 and tcsh. This should be good enough for now. */ 149 150 if (shell_file_len < 3) 151 return false; 152 153 if (shell_file[shell_file_len - 3] == 'c' 154 && shell_file[shell_file_len - 2] == 's' 155 && shell_file[shell_file_len - 1] == 'h') 156 return true; 157 158 return false; 159 } 160 161 /* See declaration. */ 162 163 execv_argv::execv_argv (const char *exec_file, 164 const std::string &allargs, 165 const char *shell_file) 166 { 167 if (shell_file == NULL) 168 init_for_no_shell (exec_file, allargs); 169 else 170 init_for_shell (exec_file, allargs, shell_file); 171 } 172 173 /* See declaration. */ 174 175 void 176 execv_argv::init_for_shell (const char *exec_file, 177 const std::string &allargs, 178 const char *shell_file) 179 { 180 const char *exec_wrapper = get_exec_wrapper (); 181 182 /* We're going to call a shell. */ 183 bool escape_bang = escape_bang_in_quoted_argument (shell_file); 184 185 /* We need to build a new shell command string, and make argv point 186 to it. So build it in the storage. */ 187 std::string &shell_command = m_storage; 188 189 shell_command = "exec "; 190 191 /* Add any exec wrapper. That may be a program name with arguments, 192 so the user must handle quoting. */ 193 if (exec_wrapper != NULL) 194 { 195 shell_command += exec_wrapper; 196 shell_command += ' '; 197 } 198 199 /* Now add exec_file, quoting as necessary. */ 200 201 /* Quoting in this style is said to work with all shells. But csh 202 on IRIX 4.0.1 can't deal with it. So we only quote it if we need 203 to. */ 204 bool need_to_quote; 205 const char *p = exec_file; 206 while (1) 207 { 208 switch (*p) 209 { 210 case '\'': 211 case '!': 212 case '"': 213 case '(': 214 case ')': 215 case '$': 216 case '&': 217 case ';': 218 case '<': 219 case '>': 220 case ' ': 221 case '\n': 222 case '\t': 223 need_to_quote = true; 224 goto end_scan; 225 226 case '\0': 227 need_to_quote = false; 228 goto end_scan; 229 230 default: 231 break; 232 } 233 ++p; 234 } 235 end_scan: 236 if (need_to_quote) 237 { 238 shell_command += '\''; 239 for (p = exec_file; *p != '\0'; ++p) 240 { 241 if (*p == '\'') 242 shell_command += "'\\''"; 243 else if (*p == '!' && escape_bang) 244 shell_command += "\\!"; 245 else 246 shell_command += *p; 247 } 248 shell_command += '\''; 249 } 250 else 251 shell_command += exec_file; 252 253 shell_command += ' ' + allargs; 254 255 /* If we decided above to start up with a shell, we exec the shell. 256 "-c" says to interpret the next arg as a shell command to 257 execute, and this command is "exec <target-program> <args>". */ 258 m_argv.reserve (4); 259 m_argv.push_back (shell_file); 260 m_argv.push_back ("-c"); 261 m_argv.push_back (shell_command.c_str ()); 262 m_argv.push_back (NULL); 263 } 264 265 /* See nat/fork-inferior.h. */ 266 267 pid_t 268 fork_inferior (const char *exec_file_arg, const std::string &allargs, 269 char **env, void (*traceme_fun) (), 270 gdb::function_view<void (int)> init_trace_fun, 271 void (*pre_trace_fun) (), 272 const char *shell_file_arg, 273 void (*exec_fun)(const char *file, char * const *argv, 274 char * const *env)) 275 { 276 pid_t pid; 277 /* Set debug_fork then attach to the child while it sleeps, to debug. */ 278 int debug_fork = 0; 279 const char *shell_file; 280 const char *exec_file; 281 char **save_our_env; 282 int i; 283 int save_errno; 284 285 /* If no exec file handed to us, get it from the exec-file command 286 -- with a good, common error message if none is specified. */ 287 if (exec_file_arg == NULL) 288 exec_file = get_exec_file (1); 289 else 290 exec_file = exec_file_arg; 291 292 /* 'startup_with_shell' is declared in inferior.h and bound to the 293 "set startup-with-shell" option. If 0, we'll just do a 294 fork/exec, no shell, so don't bother figuring out what shell. */ 295 if (startup_with_shell) 296 { 297 shell_file = shell_file_arg; 298 299 /* Figure out what shell to start up the user program under. */ 300 if (shell_file == NULL) 301 shell_file = get_shell (); 302 303 gdb_assert (shell_file != NULL); 304 } 305 else 306 shell_file = NULL; 307 308 /* Build the argument vector. */ 309 execv_argv child_argv (exec_file, allargs, shell_file); 310 311 /* Retain a copy of our environment variables, since the child will 312 replace the value of environ and if we're vforked, we have to 313 restore it. */ 314 save_our_env = environ; 315 316 /* Perform any necessary actions regarding to TTY before the 317 fork/vfork call. */ 318 prefork_hook (allargs.c_str ()); 319 320 /* It is generally good practice to flush any possible pending stdio 321 output prior to doing a fork, to avoid the possibility of both 322 the parent and child flushing the same data after the fork. */ 323 gdb_flush_out_err (); 324 325 /* Check if the user wants to set a different working directory for 326 the inferior. */ 327 std::string inferior_cwd = get_inferior_cwd (); 328 329 if (!inferior_cwd.empty ()) 330 { 331 /* Expand before forking because between fork and exec, the child 332 process may only execute async-signal-safe operations. */ 333 inferior_cwd = gdb_tilde_expand (inferior_cwd.c_str ()); 334 } 335 336 /* If there's any initialization of the target layers that must 337 happen to prepare to handle the child we're about fork, do it 338 now... */ 339 if (pre_trace_fun != NULL) 340 (*pre_trace_fun) (); 341 342 /* Create the child process. Since the child process is going to 343 exec(3) shortly afterwards, try to reduce the overhead by 344 calling vfork(2). However, if PRE_TRACE_FUN is non-null, it's 345 likely that this optimization won't work since there's too much 346 work to do between the vfork(2) and the exec(3). This is known 347 to be the case on ttrace(2)-based HP-UX, where some handshaking 348 between parent and child needs to happen between fork(2) and 349 exec(2). However, since the parent is suspended in the vforked 350 state, this doesn't work. Also note that the vfork(2) call might 351 actually be a call to fork(2) due to the fact that autoconf will 352 ``#define vfork fork'' on certain platforms. */ 353 #if !(defined(__UCLIBC__) && defined(HAS_NOMMU)) 354 if (pre_trace_fun || debug_fork) 355 pid = fork (); 356 else 357 #endif 358 pid = vfork (); 359 360 if (pid < 0) 361 perror_with_name (("vfork")); 362 363 if (pid == 0) 364 { 365 /* Close all file descriptors except those that gdb inherited 366 (usually 0/1/2), so they don't leak to the inferior. Note 367 that this closes the file descriptors of all secondary 368 UIs. */ 369 close_most_fds (); 370 371 /* Change to the requested working directory if the user 372 requested it. */ 373 if (!inferior_cwd.empty ()) 374 { 375 if (chdir (inferior_cwd.c_str ()) < 0) 376 trace_start_error_with_name (inferior_cwd.c_str ()); 377 } 378 379 if (debug_fork) 380 sleep (debug_fork); 381 382 /* Execute any necessary post-fork actions before we exec. */ 383 postfork_child_hook (); 384 385 /* Changing the signal handlers for the inferior after 386 a vfork can also change them for the superior, so we don't mess 387 with signals here. See comments in 388 initialize_signals for how we get the right signal handlers 389 for the inferior. */ 390 391 /* "Trace me, Dr. Memory!" */ 392 (*traceme_fun) (); 393 394 /* The call above set this process (the "child") as debuggable 395 by the original gdb process (the "parent"). Since processes 396 (unlike people) can have only one parent, if you are debugging 397 gdb itself (and your debugger is thus _already_ the 398 controller/parent for this child), code from here on out is 399 undebuggable. Indeed, you probably got an error message 400 saying "not parent". Sorry; you'll have to use print 401 statements! */ 402 403 restore_original_signals_state (); 404 405 /* There is no execlpe call, so we have to set the environment 406 for our child in the global variable. If we've vforked, this 407 clobbers the parent, but environ is restored a few lines down 408 in the parent. By the way, yes we do need to look down the 409 path to find $SHELL. Rich Pixley says so, and I agree. */ 410 environ = env; 411 412 char **argv = child_argv.argv (); 413 414 if (exec_fun != NULL) 415 (*exec_fun) (argv[0], &argv[0], env); 416 else 417 execvp (argv[0], &argv[0]); 418 419 /* If we get here, it's an error. */ 420 save_errno = errno; 421 warning ("Cannot exec %s", argv[0]); 422 423 for (i = 1; argv[i] != NULL; i++) 424 warning (" %s", argv[i]); 425 426 warning ("Error: %s", safe_strerror (save_errno)); 427 428 _exit (0177); 429 } 430 431 /* Restore our environment in case a vforked child clob'd it. */ 432 environ = save_our_env; 433 434 postfork_hook (pid); 435 436 /* Now that we have a child process, make it our target, and 437 initialize anything target-vector-specific that needs 438 initializing. */ 439 if (init_trace_fun) 440 init_trace_fun (pid); 441 442 /* We are now in the child process of interest, having exec'd the 443 correct program, and are poised at the first instruction of the 444 new program. */ 445 return pid; 446 } 447 448 /* See nat/fork-inferior.h. */ 449 450 ptid_t 451 startup_inferior (process_stratum_target *proc_target, pid_t pid, int ntraps, 452 struct target_waitstatus *last_waitstatus, 453 ptid_t *last_ptid) 454 { 455 int pending_execs = ntraps; 456 int terminal_initted = 0; 457 ptid_t resume_ptid; 458 459 if (startup_with_shell) 460 { 461 /* One trap extra for exec'ing the shell. */ 462 pending_execs++; 463 } 464 465 if (target_supports_multi_process ()) 466 resume_ptid = ptid_t (pid); 467 else 468 resume_ptid = minus_one_ptid; 469 470 /* The process was started by the fork that created it, but it will 471 have stopped one instruction after execing the shell. Here we 472 must get it up to actual execution of the real program. */ 473 if (get_exec_wrapper () != NULL) 474 pending_execs++; 475 476 while (1) 477 { 478 enum gdb_signal resume_signal = GDB_SIGNAL_0; 479 ptid_t event_ptid; 480 481 struct target_waitstatus ws; 482 event_ptid = target_wait (resume_ptid, &ws, 0); 483 484 if (last_waitstatus != NULL) 485 *last_waitstatus = ws; 486 if (last_ptid != NULL) 487 *last_ptid = event_ptid; 488 489 if (ws.kind () == TARGET_WAITKIND_IGNORE) 490 /* The inferior didn't really stop, keep waiting. */ 491 continue; 492 493 switch (ws.kind ()) 494 { 495 case TARGET_WAITKIND_SPURIOUS: 496 case TARGET_WAITKIND_LOADED: 497 case TARGET_WAITKIND_FORKED: 498 case TARGET_WAITKIND_VFORKED: 499 case TARGET_WAITKIND_SYSCALL_ENTRY: 500 case TARGET_WAITKIND_SYSCALL_RETURN: 501 /* Ignore gracefully during startup of the inferior. */ 502 break; 503 504 case TARGET_WAITKIND_SIGNALLED: 505 target_terminal::ours (); 506 target_mourn_inferior (event_ptid); 507 error (_("During startup program terminated with signal %s, %s."), 508 gdb_signal_to_name (ws.sig ()), 509 gdb_signal_to_string (ws.sig ())); 510 return resume_ptid; 511 512 case TARGET_WAITKIND_EXITED: 513 target_terminal::ours (); 514 target_mourn_inferior (event_ptid); 515 if (ws.exit_status ()) 516 error (_("During startup program exited with code %d."), 517 ws.exit_status ()); 518 else 519 error (_("During startup program exited normally.")); 520 return resume_ptid; 521 522 case TARGET_WAITKIND_EXECD: 523 /* Handle EXEC signals as if they were SIGTRAP signals. */ 524 resume_signal = GDB_SIGNAL_TRAP; 525 switch_to_thread (proc_target, event_ptid); 526 break; 527 528 case TARGET_WAITKIND_STOPPED: 529 resume_signal = ws.sig (); 530 /* Ignore gracefully the !TRAP signals intercepted from the shell. */ 531 if (resume_signal == GDB_SIGNAL_TRAP) 532 switch_to_thread (proc_target, event_ptid); 533 break; 534 } 535 536 if (resume_signal != GDB_SIGNAL_TRAP) 537 { 538 /* Let shell child handle its own signals in its own way. */ 539 target_continue (resume_ptid, resume_signal); 540 } 541 else 542 { 543 /* We handle SIGTRAP, however; it means child did an exec. */ 544 if (!terminal_initted) 545 { 546 /* Now that the child has exec'd we know it has already 547 set its process group. On POSIX systems, tcsetpgrp 548 will fail with EPERM if we try it before the child's 549 setpgid. */ 550 551 /* Set up the "saved terminal modes" of the inferior 552 based on what modes we are starting it with. */ 553 target_terminal::init (); 554 555 /* Install inferior's terminal modes. */ 556 target_terminal::inferior (); 557 558 terminal_initted = 1; 559 } 560 561 if (--pending_execs == 0) 562 break; 563 564 /* Just make it go on. */ 565 target_continue_no_signal (resume_ptid); 566 } 567 } 568 569 return resume_ptid; 570 } 571 572 /* See nat/fork-inferior.h. */ 573 574 void 575 trace_start_error (const char *fmt, ...) 576 { 577 va_list ap; 578 579 va_start (ap, fmt); 580 warning ("Could not trace the inferior process."); 581 vwarning (fmt, ap); 582 va_end (ap); 583 584 gdb_flush_out_err (); 585 _exit (0177); 586 } 587 588 /* See nat/fork-inferior.h. */ 589 590 void 591 trace_start_error_with_name (const char *string) 592 { 593 trace_start_error ("%s: %s", string, safe_strerror (errno)); 594 } 595