1 /* $NetBSD: fetch.c,v 1.198 2012/07/04 06:09:37 is Exp $ */ 2 3 /*- 4 * Copyright (c) 1997-2009 The NetBSD Foundation, Inc. 5 * All rights reserved. 6 * 7 * This code is derived from software contributed to The NetBSD Foundation 8 * by Luke Mewburn. 9 * 10 * This code is derived from software contributed to The NetBSD Foundation 11 * by Scott Aaron Bamford. 12 * 13 * Redistribution and use in source and binary forms, with or without 14 * modification, are permitted provided that the following conditions 15 * are met: 16 * 1. Redistributions of source code must retain the above copyright 17 * notice, this list of conditions and the following disclaimer. 18 * 2. Redistributions in binary form must reproduce the above copyright 19 * notice, this list of conditions and the following disclaimer in the 20 * documentation and/or other materials provided with the distribution. 21 * 22 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 23 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 24 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 25 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 26 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 27 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 28 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 29 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 30 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 31 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 32 * POSSIBILITY OF SUCH DAMAGE. 
 */

#include <sys/cdefs.h>
#ifndef lint
__RCSID("$NetBSD: fetch.c,v 1.198 2012/07/04 06:09:37 is Exp $");
#endif /* not lint */

/*
 * FTP User Program -- Command line file retrieval
 */

#include <sys/types.h>
#include <sys/param.h>
#include <sys/socket.h>
#include <sys/stat.h>
#include <sys/time.h>

#include <netinet/in.h>

#include <arpa/ftp.h>
#include <arpa/inet.h>

#include <assert.h>
#include <ctype.h>
#include <err.h>
#include <errno.h>
#include <netdb.h>
#include <fcntl.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <time.h>

#include "ftp_var.h"
#include "version.h"

/*
 * Kind of URL recognised by parse_url(), which reports UNKNOWN_URL_T
 * until one of the http://, ftp:// or file:// prefixes has matched.
 * NOTE(review): CLASSIC_URL_T is not referenced in this part of the
 * file; presumably it marks classic `host:path' arguments -- confirm.
 */
typedef enum {
	UNKNOWN_URL_T=-1,
	HTTP_URL_T,
	FTP_URL_T,
	FILE_URL_T,
	CLASSIC_URL_T
} url_t;

__dead static void	aborthttp(int);
#ifndef NO_AUTH
static int	auth_url(const char *, char **, const char *, const char *);
static void	base64_encode(const unsigned char *, size_t, unsigned char *);
#endif
static int	go_fetch(const char *);
static int	fetch_ftp(const char *);
static int	fetch_url(const char *, const char *, char *, char *);
static const char *match_token(const char **, const char *);
static int	parse_url(const char *, const char *, url_t *, char **,
			    char **, char **, char **, in_port_t *, char **);
static void	url_decode(char *);

/*
 * Number of HTTP redirections followed so far; fetch_url() increments
 * it for every redirect and gives up once it has exceeded 5.
 */
static int	redirect_loop;


/*
 * STRNEQUAL: case-insensitive test that string a starts with b.
 *	b must be a string literal (or char array), because its length
 *	is taken with sizeof.
 * ISLWS: true if x is CR, LF, space or tab.
 * SKIPLWS: advance the pointer x past any such characters; x must be
 *	a modifiable lvalue.
 */
#define	STRNEQUAL(a,b)	(strncasecmp((a), (b), sizeof((b))-1) == 0)
#define	ISLWS(x)	((x)=='\r' || (x)=='\n' || (x)==' ' || (x)=='\t')
#define	SKIPLWS(x)	do { while (ISLWS((*x))) x++; } while (0)


#define	ABOUT_URL	"about:"	/* propaganda */
#define	FILE_URL	"file://"	/* file URL prefix */
#define	FTP_URL		"ftp://"	/* ftp URL prefix */
#define	HTTP_URL	"http://"	/* http URL prefix */


/*
 * Determine if token is the next word in buf (case insensitive).
107 * If so, advance buf past the token and any trailing LWS, and 108 * return a pointer to the token (in buf). Otherwise, return NULL. 109 * token may be preceded by LWS. 110 * token must be followed by LWS or NUL. (I.e, don't partial match). 111 */ 112 static const char * 113 match_token(const char **buf, const char *token) 114 { 115 const char *p, *orig; 116 size_t tlen; 117 118 tlen = strlen(token); 119 p = *buf; 120 SKIPLWS(p); 121 orig = p; 122 if (strncasecmp(p, token, tlen) != 0) 123 return NULL; 124 p += tlen; 125 if (*p != '\0' && !ISLWS(*p)) 126 return NULL; 127 SKIPLWS(p); 128 orig = *buf; 129 *buf = p; 130 return orig; 131 } 132 133 #ifndef NO_AUTH 134 /* 135 * Generate authorization response based on given authentication challenge. 136 * Returns -1 if an error occurred, otherwise 0. 137 * Sets response to a malloc(3)ed string; caller should free. 138 */ 139 static int 140 auth_url(const char *challenge, char **response, const char *guser, 141 const char *gpass) 142 { 143 const char *cp, *scheme, *errormsg; 144 char *ep, *clear, *realm; 145 char uuser[BUFSIZ], *gotpass; 146 const char *upass; 147 int rval; 148 size_t len, clen, rlen; 149 150 *response = NULL; 151 clear = realm = NULL; 152 rval = -1; 153 cp = challenge; 154 scheme = "Basic"; /* only support Basic authentication */ 155 gotpass = NULL; 156 157 DPRINTF("auth_url: challenge `%s'\n", challenge); 158 159 if (! match_token(&cp, scheme)) { 160 warnx("Unsupported authentication challenge `%s'", 161 challenge); 162 goto cleanup_auth_url; 163 } 164 165 #define REALM "realm=\"" 166 if (STRNEQUAL(cp, REALM)) 167 cp += sizeof(REALM) - 1; 168 else { 169 warnx("Unsupported authentication challenge `%s'", 170 challenge); 171 goto cleanup_auth_url; 172 } 173 /* XXX: need to improve quoted-string parsing to support \ quoting, etc. 
*/ 174 if ((ep = strchr(cp, '\"')) != NULL) { 175 len = ep - cp; 176 realm = (char *)ftp_malloc(len + 1); 177 (void)strlcpy(realm, cp, len + 1); 178 } else { 179 warnx("Unsupported authentication challenge `%s'", 180 challenge); 181 goto cleanup_auth_url; 182 } 183 184 fprintf(ttyout, "Username for `%s': ", realm); 185 if (guser != NULL) { 186 (void)strlcpy(uuser, guser, sizeof(uuser)); 187 fprintf(ttyout, "%s\n", uuser); 188 } else { 189 (void)fflush(ttyout); 190 if (get_line(stdin, uuser, sizeof(uuser), &errormsg) < 0) { 191 warnx("%s; can't authenticate", errormsg); 192 goto cleanup_auth_url; 193 } 194 } 195 if (gpass != NULL) 196 upass = gpass; 197 else { 198 gotpass = getpass("Password: "); 199 if (gotpass == NULL) { 200 warnx("Can't read password"); 201 goto cleanup_auth_url; 202 } 203 upass = gotpass; 204 } 205 206 clen = strlen(uuser) + strlen(upass) + 2; /* user + ":" + pass + "\0" */ 207 clear = (char *)ftp_malloc(clen); 208 (void)strlcpy(clear, uuser, clen); 209 (void)strlcat(clear, ":", clen); 210 (void)strlcat(clear, upass, clen); 211 if (gotpass) 212 memset(gotpass, 0, strlen(gotpass)); 213 214 /* scheme + " " + enc + "\0" */ 215 rlen = strlen(scheme) + 1 + (clen + 2) * 4 / 3 + 1; 216 *response = (char *)ftp_malloc(rlen); 217 (void)strlcpy(*response, scheme, rlen); 218 len = strlcat(*response, " ", rlen); 219 /* use `clen - 1' to not encode the trailing NUL */ 220 base64_encode((unsigned char *)clear, clen - 1, 221 (unsigned char *)*response + len); 222 memset(clear, 0, clen); 223 rval = 0; 224 225 cleanup_auth_url: 226 FREEPTR(clear); 227 FREEPTR(realm); 228 return (rval); 229 } 230 231 /* 232 * Encode len bytes starting at clear using base64 encoding into encoded, 233 * which should be at least ((len + 2) * 4 / 3 + 1) in size. 
234 */ 235 static void 236 base64_encode(const unsigned char *clear, size_t len, unsigned char *encoded) 237 { 238 static const unsigned char enc[] = 239 "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"; 240 unsigned char *cp; 241 size_t i; 242 243 cp = encoded; 244 for (i = 0; i < len; i += 3) { 245 *(cp++) = enc[((clear[i + 0] >> 2))]; 246 *(cp++) = enc[((clear[i + 0] << 4) & 0x30) 247 | ((clear[i + 1] >> 4) & 0x0f)]; 248 *(cp++) = enc[((clear[i + 1] << 2) & 0x3c) 249 | ((clear[i + 2] >> 6) & 0x03)]; 250 *(cp++) = enc[((clear[i + 2] ) & 0x3f)]; 251 } 252 *cp = '\0'; 253 while (i-- > len) 254 *(--cp) = '='; 255 } 256 #endif 257 258 /* 259 * Decode %xx escapes in given string, `in-place'. 260 */ 261 static void 262 url_decode(char *url) 263 { 264 unsigned char *p, *q; 265 266 if (EMPTYSTRING(url)) 267 return; 268 p = q = (unsigned char *)url; 269 270 #define HEXTOINT(x) (x - (isdigit(x) ? '0' : (islower(x) ? 'a' : 'A') - 10)) 271 while (*p) { 272 if (p[0] == '%' 273 && p[1] && isxdigit((unsigned char)p[1]) 274 && p[2] && isxdigit((unsigned char)p[2])) { 275 *q++ = HEXTOINT(p[1]) * 16 + HEXTOINT(p[2]); 276 p+=3; 277 } else 278 *q++ = *p++; 279 } 280 *q = '\0'; 281 } 282 283 284 /* 285 * Parse URL of form (per RFC 3986): 286 * <type>://[<user>[:<password>]@]<host>[:<port>][/<path>] 287 * Returns -1 if a parse error occurred, otherwise 0. 288 * It's the caller's responsibility to url_decode() the returned 289 * user, pass and path. 290 * 291 * Sets type to url_t, each of the given char ** pointers to a 292 * malloc(3)ed strings of the relevant section, and port to 293 * the number given, or ftpport if ftp://, or httpport if http://. 294 * 295 * XXX: this is not totally RFC 3986 compliant; <path> will have the 296 * leading `/' unless it's an ftp:// URL, as this makes things easier 297 * for file:// and http:// URLs. 
ftp:// URLs have the `/' between the 298 * host and the URL-path removed, but any additional leading slashes 299 * in the URL-path are retained (because they imply that we should 300 * later do "CWD" with a null argument). 301 * 302 * Examples: 303 * input URL output path 304 * --------- ----------- 305 * "http://host" "/" 306 * "http://host/" "/" 307 * "http://host/path" "/path" 308 * "file://host/dir/file" "dir/file" 309 * "ftp://host" "" 310 * "ftp://host/" "" 311 * "ftp://host//" "/" 312 * "ftp://host/dir/file" "dir/file" 313 * "ftp://host//dir/file" "/dir/file" 314 */ 315 static int 316 parse_url(const char *url, const char *desc, url_t *utype, 317 char **uuser, char **pass, char **host, char **port, 318 in_port_t *portnum, char **path) 319 { 320 const char *origurl, *tport; 321 char *cp, *ep, *thost; 322 size_t len; 323 324 if (url == NULL || desc == NULL || utype == NULL || uuser == NULL 325 || pass == NULL || host == NULL || port == NULL || portnum == NULL 326 || path == NULL) 327 errx(1, "parse_url: invoked with NULL argument!"); 328 DPRINTF("parse_url: %s `%s'\n", desc, url); 329 330 origurl = url; 331 *utype = UNKNOWN_URL_T; 332 *uuser = *pass = *host = *port = *path = NULL; 333 *portnum = 0; 334 tport = NULL; 335 336 if (STRNEQUAL(url, HTTP_URL)) { 337 url += sizeof(HTTP_URL) - 1; 338 *utype = HTTP_URL_T; 339 *portnum = HTTP_PORT; 340 tport = httpport; 341 } else if (STRNEQUAL(url, FTP_URL)) { 342 url += sizeof(FTP_URL) - 1; 343 *utype = FTP_URL_T; 344 *portnum = FTP_PORT; 345 tport = ftpport; 346 } else if (STRNEQUAL(url, FILE_URL)) { 347 url += sizeof(FILE_URL) - 1; 348 *utype = FILE_URL_T; 349 } else { 350 warnx("Invalid %s `%s'", desc, url); 351 cleanup_parse_url: 352 FREEPTR(*uuser); 353 if (*pass != NULL) 354 memset(*pass, 0, strlen(*pass)); 355 FREEPTR(*pass); 356 FREEPTR(*host); 357 FREEPTR(*port); 358 FREEPTR(*path); 359 return (-1); 360 } 361 362 if (*url == '\0') 363 return (0); 364 365 /* find [user[:pass]@]host[:port] */ 366 ep = 
strchr(url, '/'); 367 if (ep == NULL) 368 thost = ftp_strdup(url); 369 else { 370 len = ep - url; 371 thost = (char *)ftp_malloc(len + 1); 372 (void)strlcpy(thost, url, len + 1); 373 if (*utype == FTP_URL_T) /* skip first / for ftp URLs */ 374 ep++; 375 *path = ftp_strdup(ep); 376 } 377 378 cp = strchr(thost, '@'); /* look for user[:pass]@ in URLs */ 379 if (cp != NULL) { 380 if (*utype == FTP_URL_T) 381 anonftp = 0; /* disable anonftp */ 382 *uuser = thost; 383 *cp = '\0'; 384 thost = ftp_strdup(cp + 1); 385 cp = strchr(*uuser, ':'); 386 if (cp != NULL) { 387 *cp = '\0'; 388 *pass = ftp_strdup(cp + 1); 389 } 390 url_decode(*uuser); 391 if (*pass) 392 url_decode(*pass); 393 } 394 395 #ifdef INET6 396 /* 397 * Check if thost is an encoded IPv6 address, as per 398 * RFC 3986: 399 * `[' ipv6-address ']' 400 */ 401 if (*thost == '[') { 402 cp = thost + 1; 403 if ((ep = strchr(cp, ']')) == NULL || 404 (ep[1] != '\0' && ep[1] != ':')) { 405 warnx("Invalid address `%s' in %s `%s'", 406 thost, desc, origurl); 407 goto cleanup_parse_url; 408 } 409 len = ep - cp; /* change `[xyz]' -> `xyz' */ 410 memmove(thost, thost + 1, len); 411 thost[len] = '\0'; 412 if (! 
isipv6addr(thost)) { 413 warnx("Invalid IPv6 address `%s' in %s `%s'", 414 thost, desc, origurl); 415 goto cleanup_parse_url; 416 } 417 cp = ep + 1; 418 if (*cp == ':') 419 cp++; 420 else 421 cp = NULL; 422 } else 423 #endif /* INET6 */ 424 if ((cp = strchr(thost, ':')) != NULL) 425 *cp++ = '\0'; 426 *host = thost; 427 428 /* look for [:port] */ 429 if (cp != NULL) { 430 unsigned long nport; 431 432 nport = strtoul(cp, &ep, 10); 433 if (*cp == '\0' || *ep != '\0' || 434 nport < 1 || nport > MAX_IN_PORT_T) { 435 warnx("Unknown port `%s' in %s `%s'", 436 cp, desc, origurl); 437 goto cleanup_parse_url; 438 } 439 *portnum = nport; 440 tport = cp; 441 } 442 443 if (tport != NULL) 444 *port = ftp_strdup(tport); 445 if (*path == NULL) { 446 const char *emptypath = "/"; 447 if (*utype == FTP_URL_T) /* skip first / for ftp URLs */ 448 emptypath++; 449 *path = ftp_strdup(emptypath); 450 } 451 452 DPRINTF("parse_url: user `%s' pass `%s' host %s port %s(%d) " 453 "path `%s'\n", 454 STRorNULL(*uuser), STRorNULL(*pass), 455 STRorNULL(*host), STRorNULL(*port), 456 *portnum ? *portnum : -1, STRorNULL(*path)); 457 458 return (0); 459 } 460 461 sigjmp_buf httpabort; 462 463 /* 464 * Retrieve URL, via a proxy if necessary, using HTTP. 465 * If proxyenv is set, use that for the proxy, otherwise try ftp_proxy or 466 * http_proxy as appropriate. 467 * Supports HTTP redirects. 
468 * Returns 1 on failure, 0 on completed xfer, -1 if ftp connection 469 * is still open (e.g, ftp xfer with trailing /) 470 */ 471 static int 472 fetch_url(const char *url, const char *proxyenv, char *proxyauth, char *wwwauth) 473 { 474 struct addrinfo hints, *res, *res0 = NULL; 475 int error; 476 sigfunc volatile oldintr; 477 sigfunc volatile oldintp; 478 int volatile s; 479 struct stat sb; 480 int volatile ischunked; 481 int volatile isproxy; 482 int volatile rval; 483 int volatile hcode; 484 int len; 485 size_t flen; 486 static size_t bufsize; 487 static char *xferbuf; 488 const char *cp, *token; 489 char *ep; 490 char buf[FTPBUFLEN]; 491 const char *errormsg; 492 char *volatile savefile; 493 char *volatile auth; 494 char *volatile location; 495 char *volatile message; 496 char *uuser, *pass, *host, *port, *path; 497 char *volatile decodedpath; 498 char *puser, *ppass, *useragent; 499 off_t hashbytes, rangestart, rangeend, entitylen; 500 int (*volatile closefunc)(FILE *); 501 FILE *volatile fin; 502 FILE *volatile fout; 503 time_t mtime; 504 url_t urltype; 505 in_port_t portnum; 506 507 DPRINTF("fetch_url: `%s' proxyenv `%s'\n", url, STRorNULL(proxyenv)); 508 509 oldintr = oldintp = NULL; 510 closefunc = NULL; 511 fin = fout = NULL; 512 s = -1; 513 savefile = NULL; 514 auth = location = message = NULL; 515 ischunked = isproxy = hcode = 0; 516 rval = 1; 517 uuser = pass = host = path = decodedpath = puser = ppass = NULL; 518 519 if (parse_url(url, "URL", &urltype, &uuser, &pass, &host, &port, 520 &portnum, &path) == -1) 521 goto cleanup_fetch_url; 522 523 if (urltype == FILE_URL_T && ! 
EMPTYSTRING(host) 524 && strcasecmp(host, "localhost") != 0) { 525 warnx("No support for non local file URL `%s'", url); 526 goto cleanup_fetch_url; 527 } 528 529 if (EMPTYSTRING(path)) { 530 if (urltype == FTP_URL_T) { 531 rval = fetch_ftp(url); 532 goto cleanup_fetch_url; 533 } 534 if (urltype != HTTP_URL_T || outfile == NULL) { 535 warnx("Invalid URL (no file after host) `%s'", url); 536 goto cleanup_fetch_url; 537 } 538 } 539 540 decodedpath = ftp_strdup(path); 541 url_decode(decodedpath); 542 543 if (outfile) 544 savefile = ftp_strdup(outfile); 545 else { 546 cp = strrchr(decodedpath, '/'); /* find savefile */ 547 if (cp != NULL) 548 savefile = ftp_strdup(cp + 1); 549 else 550 savefile = ftp_strdup(decodedpath); 551 } 552 DPRINTF("fetch_url: savefile `%s'\n", savefile); 553 if (EMPTYSTRING(savefile)) { 554 if (urltype == FTP_URL_T) { 555 rval = fetch_ftp(url); 556 goto cleanup_fetch_url; 557 } 558 warnx("No file after directory (you must specify an " 559 "output file) `%s'", url); 560 goto cleanup_fetch_url; 561 } 562 563 restart_point = 0; 564 filesize = -1; 565 rangestart = rangeend = entitylen = -1; 566 mtime = -1; 567 if (restartautofetch) { 568 if (strcmp(savefile, "-") != 0 && *savefile != '|' && 569 stat(savefile, &sb) == 0) 570 restart_point = sb.st_size; 571 } 572 if (urltype == FILE_URL_T) { /* file:// URLs */ 573 direction = "copied"; 574 fin = fopen(decodedpath, "r"); 575 if (fin == NULL) { 576 warn("Can't open `%s'", decodedpath); 577 goto cleanup_fetch_url; 578 } 579 if (fstat(fileno(fin), &sb) == 0) { 580 mtime = sb.st_mtime; 581 filesize = sb.st_size; 582 } 583 if (restart_point) { 584 if (lseek(fileno(fin), restart_point, SEEK_SET) < 0) { 585 warn("Can't seek to restart `%s'", 586 decodedpath); 587 goto cleanup_fetch_url; 588 } 589 } 590 if (verbose) { 591 fprintf(ttyout, "Copying %s", decodedpath); 592 if (restart_point) 593 fprintf(ttyout, " (restarting at " LLF ")", 594 (LLT)restart_point); 595 fputs("\n", ttyout); 596 } 597 } else { /* 
ftp:// or http:// URLs */ 598 const char *leading; 599 int hasleading; 600 601 if (proxyenv == NULL) { 602 if (urltype == HTTP_URL_T) 603 proxyenv = getoptionvalue("http_proxy"); 604 else if (urltype == FTP_URL_T) 605 proxyenv = getoptionvalue("ftp_proxy"); 606 } 607 direction = "retrieved"; 608 if (! EMPTYSTRING(proxyenv)) { /* use proxy */ 609 url_t purltype; 610 char *phost, *ppath; 611 char *pport, *no_proxy; 612 in_port_t pportnum; 613 614 isproxy = 1; 615 616 /* check URL against list of no_proxied sites */ 617 no_proxy = getoptionvalue("no_proxy"); 618 if (! EMPTYSTRING(no_proxy)) { 619 char *np, *np_copy, *np_iter; 620 unsigned long np_port; 621 size_t hlen, plen; 622 623 np_iter = np_copy = ftp_strdup(no_proxy); 624 hlen = strlen(host); 625 while ((cp = strsep(&np_iter, " ,")) != NULL) { 626 if (*cp == '\0') 627 continue; 628 if ((np = strrchr(cp, ':')) != NULL) { 629 *np++ = '\0'; 630 np_port = strtoul(np, &ep, 10); 631 if (*np == '\0' || *ep != '\0') 632 continue; 633 if (np_port != portnum) 634 continue; 635 } 636 plen = strlen(cp); 637 if (hlen < plen) 638 continue; 639 if (strncasecmp(host + hlen - plen, 640 cp, plen) == 0) { 641 isproxy = 0; 642 break; 643 } 644 } 645 FREEPTR(np_copy); 646 if (isproxy == 0 && urltype == FTP_URL_T) { 647 rval = fetch_ftp(url); 648 goto cleanup_fetch_url; 649 } 650 } 651 652 if (isproxy) { 653 if (restart_point) { 654 warnx("Can't restart via proxy URL `%s'", 655 proxyenv); 656 goto cleanup_fetch_url; 657 } 658 if (parse_url(proxyenv, "proxy URL", &purltype, 659 &puser, &ppass, &phost, &pport, &pportnum, 660 &ppath) == -1) 661 goto cleanup_fetch_url; 662 663 if ((purltype != HTTP_URL_T 664 && purltype != FTP_URL_T) || 665 EMPTYSTRING(phost) || 666 (! 
EMPTYSTRING(ppath) 667 && strcmp(ppath, "/") != 0)) { 668 warnx("Malformed proxy URL `%s'", 669 proxyenv); 670 FREEPTR(phost); 671 FREEPTR(pport); 672 FREEPTR(ppath); 673 goto cleanup_fetch_url; 674 } 675 if (isipv6addr(host) && 676 strchr(host, '%') != NULL) { 677 warnx( 678 "Scoped address notation `%s' disallowed via web proxy", 679 host); 680 FREEPTR(phost); 681 FREEPTR(pport); 682 FREEPTR(ppath); 683 goto cleanup_fetch_url; 684 } 685 686 FREEPTR(host); 687 host = phost; 688 FREEPTR(port); 689 port = pport; 690 FREEPTR(path); 691 path = ftp_strdup(url); 692 FREEPTR(ppath); 693 } 694 } /* ! EMPTYSTRING(proxyenv) */ 695 696 memset(&hints, 0, sizeof(hints)); 697 hints.ai_flags = 0; 698 hints.ai_family = family; 699 hints.ai_socktype = SOCK_STREAM; 700 hints.ai_protocol = 0; 701 error = getaddrinfo(host, port, &hints, &res0); 702 if (error) { 703 warnx("Can't LOOKUP `%s:%s': %s", host, port, 704 (error == EAI_SYSTEM) ? strerror(errno) 705 : gai_strerror(error)); 706 goto cleanup_fetch_url; 707 } 708 if (res0->ai_canonname) 709 host = res0->ai_canonname; 710 711 s = -1; 712 for (res = res0; res; res = res->ai_next) { 713 char hname[NI_MAXHOST], sname[NI_MAXSERV]; 714 715 ai_unmapped(res); 716 if (getnameinfo(res->ai_addr, res->ai_addrlen, 717 hname, sizeof(hname), sname, sizeof(sname), 718 NI_NUMERICHOST | NI_NUMERICSERV) != 0) { 719 strlcpy(hname, "?", sizeof(hname)); 720 strlcpy(sname, "?", sizeof(sname)); 721 } 722 723 if (verbose && res0->ai_next) { 724 fprintf(ttyout, "Trying %s:%s ...\n", 725 hname, sname); 726 } 727 728 s = socket(res->ai_family, SOCK_STREAM, 729 res->ai_protocol); 730 if (s < 0) { 731 warn( 732 "Can't create socket for connection to " 733 "`%s:%s'", hname, sname); 734 continue; 735 } 736 737 if (ftp_connect(s, res->ai_addr, res->ai_addrlen, 738 verbose || !res->ai_next) < 0) { 739 close(s); 740 s = -1; 741 continue; 742 } 743 744 /* success */ 745 break; 746 } 747 748 if (s < 0) { 749 warnx("Can't connect to `%s:%s'", host, port); 750 goto 
cleanup_fetch_url; 751 } 752 753 fin = fdopen(s, "r+"); 754 /* 755 * Construct and send the request. 756 */ 757 if (verbose) 758 fprintf(ttyout, "Requesting %s\n", url); 759 leading = " ("; 760 hasleading = 0; 761 if (isproxy) { 762 if (verbose) { 763 fprintf(ttyout, "%svia %s:%s", leading, 764 host, port); 765 leading = ", "; 766 hasleading++; 767 } 768 fprintf(fin, "GET %s HTTP/1.0\r\n", path); 769 if (flushcache) 770 fprintf(fin, "Pragma: no-cache\r\n"); 771 } else { 772 fprintf(fin, "GET %s HTTP/1.1\r\n", path); 773 if (strchr(host, ':')) { 774 char *h, *p; 775 776 /* 777 * strip off IPv6 scope identifier, since it is 778 * local to the node 779 */ 780 h = ftp_strdup(host); 781 if (isipv6addr(h) && 782 (p = strchr(h, '%')) != NULL) { 783 *p = '\0'; 784 } 785 fprintf(fin, "Host: [%s]", h); 786 free(h); 787 } else 788 fprintf(fin, "Host: %s", host); 789 if (portnum != HTTP_PORT) 790 fprintf(fin, ":%u", portnum); 791 fprintf(fin, "\r\n"); 792 fprintf(fin, "Accept: */*\r\n"); 793 fprintf(fin, "Connection: close\r\n"); 794 if (restart_point) { 795 fputs(leading, ttyout); 796 fprintf(fin, "Range: bytes=" LLF "-\r\n", 797 (LLT)restart_point); 798 fprintf(ttyout, "restarting at " LLF, 799 (LLT)restart_point); 800 leading = ", "; 801 hasleading++; 802 } 803 if (flushcache) 804 fprintf(fin, "Cache-Control: no-cache\r\n"); 805 } 806 if ((useragent=getenv("FTPUSERAGENT")) != NULL) { 807 fprintf(fin, "User-Agent: %s\r\n", useragent); 808 } else { 809 fprintf(fin, "User-Agent: %s/%s\r\n", 810 FTP_PRODUCT, FTP_VERSION); 811 } 812 if (wwwauth) { 813 if (verbose) { 814 fprintf(ttyout, "%swith authorization", 815 leading); 816 leading = ", "; 817 hasleading++; 818 } 819 fprintf(fin, "Authorization: %s\r\n", wwwauth); 820 } 821 if (proxyauth) { 822 if (verbose) { 823 fprintf(ttyout, 824 "%swith proxy authorization", leading); 825 leading = ", "; 826 hasleading++; 827 } 828 fprintf(fin, "Proxy-Authorization: %s\r\n", proxyauth); 829 } 830 if (verbose && hasleading) 831 
fputs(")\n", ttyout); 832 fprintf(fin, "\r\n"); 833 if (fflush(fin) == EOF) { 834 warn("Writing HTTP request"); 835 goto cleanup_fetch_url; 836 } 837 838 /* Read the response */ 839 len = get_line(fin, buf, sizeof(buf), &errormsg); 840 if (len < 0) { 841 if (*errormsg == '\n') 842 errormsg++; 843 warnx("Receiving HTTP reply: %s", errormsg); 844 goto cleanup_fetch_url; 845 } 846 while (len > 0 && (ISLWS(buf[len-1]))) 847 buf[--len] = '\0'; 848 DPRINTF("fetch_url: received `%s'\n", buf); 849 850 /* Determine HTTP response code */ 851 cp = strchr(buf, ' '); 852 if (cp == NULL) 853 goto improper; 854 else 855 cp++; 856 hcode = strtol(cp, &ep, 10); 857 if (*ep != '\0' && !isspace((unsigned char)*ep)) 858 goto improper; 859 message = ftp_strdup(cp); 860 861 /* Read the rest of the header. */ 862 while (1) { 863 len = get_line(fin, buf, sizeof(buf), &errormsg); 864 if (len < 0) { 865 if (*errormsg == '\n') 866 errormsg++; 867 warnx("Receiving HTTP reply: %s", errormsg); 868 goto cleanup_fetch_url; 869 } 870 while (len > 0 && (ISLWS(buf[len-1]))) 871 buf[--len] = '\0'; 872 if (len == 0) 873 break; 874 DPRINTF("fetch_url: received `%s'\n", buf); 875 876 /* 877 * Look for some headers 878 */ 879 880 cp = buf; 881 882 if (match_token(&cp, "Content-Length:")) { 883 filesize = STRTOLL(cp, &ep, 10); 884 if (filesize < 0 || *ep != '\0') 885 goto improper; 886 DPRINTF("fetch_url: parsed len as: " LLF "\n", 887 (LLT)filesize); 888 889 } else if (match_token(&cp, "Content-Range:")) { 890 if (! 
match_token(&cp, "bytes")) 891 goto improper; 892 893 if (*cp == '*') 894 cp++; 895 else { 896 rangestart = STRTOLL(cp, &ep, 10); 897 if (rangestart < 0 || *ep != '-') 898 goto improper; 899 cp = ep + 1; 900 rangeend = STRTOLL(cp, &ep, 10); 901 if (rangeend < 0 || rangeend < rangestart) 902 goto improper; 903 cp = ep; 904 } 905 if (*cp != '/') 906 goto improper; 907 cp++; 908 if (*cp == '*') 909 cp++; 910 else { 911 entitylen = STRTOLL(cp, &ep, 10); 912 if (entitylen < 0) 913 goto improper; 914 cp = ep; 915 } 916 if (*cp != '\0') 917 goto improper; 918 919 #ifndef NO_DEBUG 920 if (ftp_debug) { 921 fprintf(ttyout, "parsed range as: "); 922 if (rangestart == -1) 923 fprintf(ttyout, "*"); 924 else 925 fprintf(ttyout, LLF "-" LLF, 926 (LLT)rangestart, 927 (LLT)rangeend); 928 fprintf(ttyout, "/" LLF "\n", (LLT)entitylen); 929 } 930 #endif 931 if (! restart_point) { 932 warnx( 933 "Received unexpected Content-Range header"); 934 goto cleanup_fetch_url; 935 } 936 937 } else if (match_token(&cp, "Last-Modified:")) { 938 struct tm parsed; 939 const char *t; 940 941 memset(&parsed, 0, sizeof(parsed)); 942 t = parse_rfc2616time(&parsed, cp); 943 if (t != NULL) { 944 parsed.tm_isdst = -1; 945 if (*t == '\0') 946 mtime = timegm(&parsed); 947 #ifndef NO_DEBUG 948 if (ftp_debug && mtime != -1) { 949 fprintf(ttyout, 950 "parsed time as: %s", 951 rfc2822time(localtime(&mtime))); 952 } 953 #endif 954 } 955 956 } else if (match_token(&cp, "Location:")) { 957 location = ftp_strdup(cp); 958 DPRINTF("fetch_url: parsed location as `%s'\n", 959 cp); 960 961 } else if (match_token(&cp, "Transfer-Encoding:")) { 962 if (match_token(&cp, "binary")) { 963 warnx( 964 "Bogus transfer encoding `binary' (fetching anyway)"); 965 continue; 966 } 967 if (! 
(token = match_token(&cp, "chunked"))) { 968 warnx( 969 "Unsupported transfer encoding `%s'", 970 token); 971 goto cleanup_fetch_url; 972 } 973 ischunked++; 974 DPRINTF("fetch_url: using chunked encoding\n"); 975 976 } else if (match_token(&cp, "Proxy-Authenticate:") 977 || match_token(&cp, "WWW-Authenticate:")) { 978 if (! (token = match_token(&cp, "Basic"))) { 979 DPRINTF( 980 "fetch_url: skipping unknown auth scheme `%s'\n", 981 token); 982 continue; 983 } 984 FREEPTR(auth); 985 auth = ftp_strdup(token); 986 DPRINTF("fetch_url: parsed auth as `%s'\n", cp); 987 } 988 989 } 990 /* finished parsing header */ 991 992 switch (hcode) { 993 case 200: 994 break; 995 case 206: 996 if (! restart_point) { 997 warnx("Not expecting partial content header"); 998 goto cleanup_fetch_url; 999 } 1000 break; 1001 case 300: 1002 case 301: 1003 case 302: 1004 case 303: 1005 case 305: 1006 case 307: 1007 if (EMPTYSTRING(location)) { 1008 warnx( 1009 "No redirection Location provided by server"); 1010 goto cleanup_fetch_url; 1011 } 1012 if (redirect_loop++ > 5) { 1013 warnx("Too many redirections requested"); 1014 goto cleanup_fetch_url; 1015 } 1016 if (hcode == 305) { 1017 if (verbose) 1018 fprintf(ttyout, "Redirected via %s\n", 1019 location); 1020 rval = fetch_url(url, location, 1021 proxyauth, wwwauth); 1022 } else { 1023 if (verbose) 1024 fprintf(ttyout, "Redirected to %s\n", 1025 location); 1026 rval = go_fetch(location); 1027 } 1028 goto cleanup_fetch_url; 1029 #ifndef NO_AUTH 1030 case 401: 1031 case 407: 1032 { 1033 char **authp; 1034 char *auser, *apass; 1035 1036 if (hcode == 401) { 1037 authp = &wwwauth; 1038 auser = uuser; 1039 apass = pass; 1040 } else { 1041 authp = &proxyauth; 1042 auser = puser; 1043 apass = ppass; 1044 } 1045 if (verbose || *authp == NULL || 1046 auser == NULL || apass == NULL) 1047 fprintf(ttyout, "%s\n", message); 1048 if (EMPTYSTRING(auth)) { 1049 warnx( 1050 "No authentication challenge provided by server"); 1051 goto cleanup_fetch_url; 1052 } 
1053 if (*authp != NULL) { 1054 char reply[10]; 1055 1056 fprintf(ttyout, 1057 "Authorization failed. Retry (y/n)? "); 1058 if (get_line(stdin, reply, sizeof(reply), NULL) 1059 < 0) { 1060 goto cleanup_fetch_url; 1061 } 1062 if (tolower((unsigned char)reply[0]) != 'y') 1063 goto cleanup_fetch_url; 1064 auser = NULL; 1065 apass = NULL; 1066 } 1067 if (auth_url(auth, authp, auser, apass) == 0) { 1068 rval = fetch_url(url, proxyenv, 1069 proxyauth, wwwauth); 1070 memset(*authp, 0, strlen(*authp)); 1071 FREEPTR(*authp); 1072 } 1073 goto cleanup_fetch_url; 1074 } 1075 #endif 1076 default: 1077 if (message) 1078 warnx("Error retrieving file `%s'", message); 1079 else 1080 warnx("Unknown error retrieving file"); 1081 goto cleanup_fetch_url; 1082 } 1083 } /* end of ftp:// or http:// specific setup */ 1084 1085 /* Open the output file. */ 1086 if (strcmp(savefile, "-") == 0) { 1087 fout = stdout; 1088 } else if (*savefile == '|') { 1089 oldintp = xsignal(SIGPIPE, SIG_IGN); 1090 fout = popen(savefile + 1, "w"); 1091 if (fout == NULL) { 1092 warn("Can't execute `%s'", savefile + 1); 1093 goto cleanup_fetch_url; 1094 } 1095 closefunc = pclose; 1096 } else { 1097 if ((rangeend != -1 && rangeend <= restart_point) || 1098 (rangestart == -1 && filesize != -1 && filesize <= restart_point)) { 1099 /* already done */ 1100 if (verbose) 1101 fprintf(ttyout, "already done\n"); 1102 rval = 0; 1103 goto cleanup_fetch_url; 1104 } 1105 if (restart_point && rangestart != -1) { 1106 if (entitylen != -1) 1107 filesize = entitylen; 1108 if (rangestart != restart_point) { 1109 warnx( 1110 "Size of `%s' differs from save file `%s'", 1111 url, savefile); 1112 goto cleanup_fetch_url; 1113 } 1114 fout = fopen(savefile, "a"); 1115 } else 1116 fout = fopen(savefile, "w"); 1117 if (fout == NULL) { 1118 warn("Can't open `%s'", savefile); 1119 goto cleanup_fetch_url; 1120 } 1121 closefunc = fclose; 1122 } 1123 1124 /* Trap signals */ 1125 if (sigsetjmp(httpabort, 1)) 1126 goto cleanup_fetch_url; 1127 
(void)xsignal(SIGQUIT, psummary); 1128 oldintr = xsignal(SIGINT, aborthttp); 1129 1130 assert(rcvbuf_size > 0); 1131 if ((size_t)rcvbuf_size > bufsize) { 1132 if (xferbuf) 1133 (void)free(xferbuf); 1134 bufsize = rcvbuf_size; 1135 xferbuf = ftp_malloc(bufsize); 1136 } 1137 1138 bytes = 0; 1139 hashbytes = mark; 1140 progressmeter(-1); 1141 1142 /* Finally, suck down the file. */ 1143 do { 1144 long chunksize; 1145 short lastchunk; 1146 1147 chunksize = 0; 1148 lastchunk = 0; 1149 /* read chunk-size */ 1150 if (ischunked) { 1151 if (fgets(xferbuf, bufsize, fin) == NULL) { 1152 warnx("Unexpected EOF reading chunk-size"); 1153 goto cleanup_fetch_url; 1154 } 1155 errno = 0; 1156 chunksize = strtol(xferbuf, &ep, 16); 1157 if (ep == xferbuf) { 1158 warnx("Invalid chunk-size"); 1159 goto cleanup_fetch_url; 1160 } 1161 if (errno == ERANGE || chunksize < 0) { 1162 errno = ERANGE; 1163 warn("Chunk-size `%.*s'", 1164 (int)(ep-xferbuf), xferbuf); 1165 goto cleanup_fetch_url; 1166 } 1167 1168 /* 1169 * XXX: Work around bug in Apache 1.3.9 and 1170 * 1.3.11, which incorrectly put trailing 1171 * space after the chunk-size. 1172 */ 1173 while (*ep == ' ') 1174 ep++; 1175 1176 /* skip [ chunk-ext ] */ 1177 if (*ep == ';') { 1178 while (*ep && *ep != '\r') 1179 ep++; 1180 } 1181 1182 if (strcmp(ep, "\r\n") != 0) { 1183 warnx("Unexpected data following chunk-size"); 1184 goto cleanup_fetch_url; 1185 } 1186 DPRINTF("fetch_url: got chunk-size of " LLF "\n", 1187 (LLT)chunksize); 1188 if (chunksize == 0) { 1189 lastchunk = 1; 1190 goto chunkdone; 1191 } 1192 } 1193 /* transfer file or chunk */ 1194 while (1) { 1195 struct timeval then, now, td; 1196 off_t bufrem; 1197 1198 if (rate_get) 1199 (void)gettimeofday(&then, NULL); 1200 bufrem = rate_get ? 
rate_get : (off_t)bufsize; 1201 if (ischunked) 1202 bufrem = MIN(chunksize, bufrem); 1203 while (bufrem > 0) { 1204 flen = fread(xferbuf, sizeof(char), 1205 MIN((off_t)bufsize, bufrem), fin); 1206 if (flen <= 0) 1207 goto chunkdone; 1208 bytes += flen; 1209 bufrem -= flen; 1210 if (fwrite(xferbuf, sizeof(char), flen, fout) 1211 != flen) { 1212 warn("Writing `%s'", savefile); 1213 goto cleanup_fetch_url; 1214 } 1215 if (hash && !progress) { 1216 while (bytes >= hashbytes) { 1217 (void)putc('#', ttyout); 1218 hashbytes += mark; 1219 } 1220 (void)fflush(ttyout); 1221 } 1222 if (ischunked) { 1223 chunksize -= flen; 1224 if (chunksize <= 0) 1225 break; 1226 } 1227 } 1228 if (rate_get) { 1229 while (1) { 1230 (void)gettimeofday(&now, NULL); 1231 timersub(&now, &then, &td); 1232 if (td.tv_sec > 0) 1233 break; 1234 usleep(1000000 - td.tv_usec); 1235 } 1236 } 1237 if (ischunked && chunksize <= 0) 1238 break; 1239 } 1240 /* read CRLF after chunk*/ 1241 chunkdone: 1242 if (ischunked) { 1243 if (fgets(xferbuf, bufsize, fin) == NULL) { 1244 warnx("Unexpected EOF reading chunk CRLF"); 1245 goto cleanup_fetch_url; 1246 } 1247 if (strcmp(xferbuf, "\r\n") != 0) { 1248 warnx("Unexpected data following chunk"); 1249 goto cleanup_fetch_url; 1250 } 1251 if (lastchunk) 1252 break; 1253 } 1254 } while (ischunked); 1255 1256 /* XXX: deal with optional trailer & CRLF here? 
*/ 1257 1258 if (hash && !progress && bytes > 0) { 1259 if (bytes < mark) 1260 (void)putc('#', ttyout); 1261 (void)putc('\n', ttyout); 1262 } 1263 if (ferror(fin)) { 1264 warn("Reading file"); 1265 goto cleanup_fetch_url; 1266 } 1267 progressmeter(1); 1268 (void)fflush(fout); 1269 if (closefunc == fclose && mtime != -1) { 1270 struct timeval tval[2]; 1271 1272 (void)gettimeofday(&tval[0], NULL); 1273 tval[1].tv_sec = mtime; 1274 tval[1].tv_usec = 0; 1275 (*closefunc)(fout); 1276 fout = NULL; 1277 1278 if (utimes(savefile, tval) == -1) { 1279 fprintf(ttyout, 1280 "Can't change modification time to %s", 1281 rfc2822time(localtime(&mtime))); 1282 } 1283 } 1284 if (bytes > 0) 1285 ptransfer(0); 1286 bytes = 0; 1287 1288 rval = 0; 1289 goto cleanup_fetch_url; 1290 1291 improper: 1292 warnx("Improper response from `%s:%s'", host, port); 1293 1294 cleanup_fetch_url: 1295 if (oldintr) 1296 (void)xsignal(SIGINT, oldintr); 1297 if (oldintp) 1298 (void)xsignal(SIGPIPE, oldintp); 1299 if (fin != NULL) 1300 fclose(fin); 1301 else if (s != -1) 1302 close(s); 1303 if (closefunc != NULL && fout != NULL) 1304 (*closefunc)(fout); 1305 if (res0) 1306 freeaddrinfo(res0); 1307 FREEPTR(savefile); 1308 FREEPTR(uuser); 1309 if (pass != NULL) 1310 memset(pass, 0, strlen(pass)); 1311 FREEPTR(pass); 1312 FREEPTR(host); 1313 FREEPTR(port); 1314 FREEPTR(path); 1315 FREEPTR(decodedpath); 1316 FREEPTR(puser); 1317 if (ppass != NULL) 1318 memset(ppass, 0, strlen(ppass)); 1319 FREEPTR(ppass); 1320 FREEPTR(auth); 1321 FREEPTR(location); 1322 FREEPTR(message); 1323 return (rval); 1324 } 1325 1326 /* 1327 * Abort a HTTP retrieval 1328 */ 1329 static void 1330 aborthttp(int notused) 1331 { 1332 char msgbuf[100]; 1333 size_t len; 1334 1335 sigint_raised = 1; 1336 alarmtimer(0); 1337 len = strlcpy(msgbuf, "\nHTTP fetch aborted.\n", sizeof(msgbuf)); 1338 write(fileno(ttyout), msgbuf, len); 1339 siglongjmp(httpabort, 1); 1340 } 1341 1342 /* 1343 * Retrieve ftp URL or classic ftp argument using FTP. 
1344 * Returns 1 on failure, 0 on completed xfer, -1 if ftp connection 1345 * is still open (e.g, ftp xfer with trailing /) 1346 */ 1347 static int 1348 fetch_ftp(const char *url) 1349 { 1350 char *cp, *xargv[5], rempath[MAXPATHLEN]; 1351 char *host, *path, *dir, *file, *uuser, *pass; 1352 char *port; 1353 char cmdbuf[MAXPATHLEN]; 1354 char dirbuf[4]; 1355 int dirhasglob, filehasglob, rval, transtype, xargc; 1356 int oanonftp, oautologin; 1357 in_port_t portnum; 1358 url_t urltype; 1359 1360 DPRINTF("fetch_ftp: `%s'\n", url); 1361 host = path = dir = file = uuser = pass = NULL; 1362 port = NULL; 1363 rval = 1; 1364 transtype = TYPE_I; 1365 1366 if (STRNEQUAL(url, FTP_URL)) { 1367 if ((parse_url(url, "URL", &urltype, &uuser, &pass, 1368 &host, &port, &portnum, &path) == -1) || 1369 (uuser != NULL && *uuser == '\0') || 1370 EMPTYSTRING(host)) { 1371 warnx("Invalid URL `%s'", url); 1372 goto cleanup_fetch_ftp; 1373 } 1374 /* 1375 * Note: Don't url_decode(path) here. We need to keep the 1376 * distinction between "/" and "%2F" until later. 1377 */ 1378 1379 /* check for trailing ';type=[aid]' */ 1380 if (! 
EMPTYSTRING(path) && (cp = strrchr(path, ';')) != NULL) { 1381 if (strcasecmp(cp, ";type=a") == 0) 1382 transtype = TYPE_A; 1383 else if (strcasecmp(cp, ";type=i") == 0) 1384 transtype = TYPE_I; 1385 else if (strcasecmp(cp, ";type=d") == 0) { 1386 warnx( 1387 "Directory listing via a URL is not supported"); 1388 goto cleanup_fetch_ftp; 1389 } else { 1390 warnx("Invalid suffix `%s' in URL `%s'", cp, 1391 url); 1392 goto cleanup_fetch_ftp; 1393 } 1394 *cp = 0; 1395 } 1396 } else { /* classic style `[user@]host:[file]' */ 1397 urltype = CLASSIC_URL_T; 1398 host = ftp_strdup(url); 1399 cp = strchr(host, '@'); 1400 if (cp != NULL) { 1401 *cp = '\0'; 1402 uuser = host; 1403 anonftp = 0; /* disable anonftp */ 1404 host = ftp_strdup(cp + 1); 1405 } 1406 cp = strchr(host, ':'); 1407 if (cp != NULL) { 1408 *cp = '\0'; 1409 path = ftp_strdup(cp + 1); 1410 } 1411 } 1412 if (EMPTYSTRING(host)) 1413 goto cleanup_fetch_ftp; 1414 1415 /* Extract the file and (if present) directory name. */ 1416 dir = path; 1417 if (! EMPTYSTRING(dir)) { 1418 /* 1419 * If we are dealing with classic `[user@]host:[path]' syntax, 1420 * then a path of the form `/file' (resulting from input of the 1421 * form `host:/file') means that we should do "CWD /" before 1422 * retrieving the file. So we set dir="/" and file="file". 1423 * 1424 * But if we are dealing with URLs like `ftp://host/path' then 1425 * a path of the form `/file' (resulting from a URL of the form 1426 * `ftp://host//file') means that we should do `CWD ' (with an 1427 * empty argument) before retrieving the file. So we set 1428 * dir="" and file="file". 1429 * 1430 * If the path does not contain / at all, we set dir=NULL. 1431 * (We get a path without any slashes if we are dealing with 1432 * classic `[user@]host:[file]' or URL `ftp://host/file'.) 1433 * 1434 * In all other cases, we set dir to a string that does not 1435 * include the final '/' that separates the dir part from the 1436 * file part of the path. 
(This will be the empty string if 1437 * and only if we are dealing with a path of the form `/file' 1438 * resulting from an URL of the form `ftp://host//file'.) 1439 */ 1440 cp = strrchr(dir, '/'); 1441 if (cp == dir && urltype == CLASSIC_URL_T) { 1442 file = cp + 1; 1443 (void)strlcpy(dirbuf, "/", sizeof(dirbuf)); 1444 dir = dirbuf; 1445 } else if (cp != NULL) { 1446 *cp++ = '\0'; 1447 file = cp; 1448 } else { 1449 file = dir; 1450 dir = NULL; 1451 } 1452 } else 1453 dir = NULL; 1454 if (urltype == FTP_URL_T && file != NULL) { 1455 url_decode(file); 1456 /* but still don't url_decode(dir) */ 1457 } 1458 DPRINTF("fetch_ftp: user `%s' pass `%s' host %s port %s " 1459 "path `%s' dir `%s' file `%s'\n", 1460 STRorNULL(uuser), STRorNULL(pass), 1461 STRorNULL(host), STRorNULL(port), 1462 STRorNULL(path), STRorNULL(dir), STRorNULL(file)); 1463 1464 dirhasglob = filehasglob = 0; 1465 if (doglob && urltype == CLASSIC_URL_T) { 1466 if (! EMPTYSTRING(dir) && strpbrk(dir, "*?[]{}") != NULL) 1467 dirhasglob = 1; 1468 if (! EMPTYSTRING(file) && strpbrk(file, "*?[]{}") != NULL) 1469 filehasglob = 1; 1470 } 1471 1472 /* Set up the connection */ 1473 oanonftp = anonftp; 1474 if (connected) 1475 disconnect(0, NULL); 1476 anonftp = oanonftp; 1477 (void)strlcpy(cmdbuf, getprogname(), sizeof(cmdbuf)); 1478 xargv[0] = cmdbuf; 1479 xargv[1] = host; 1480 xargv[2] = NULL; 1481 xargc = 2; 1482 if (port) { 1483 xargv[2] = port; 1484 xargv[3] = NULL; 1485 xargc = 3; 1486 } 1487 oautologin = autologin; 1488 /* don't autologin in setpeer(), use ftp_login() below */ 1489 autologin = 0; 1490 setpeer(xargc, xargv); 1491 autologin = oautologin; 1492 if ((connected == 0) || 1493 (connected == 1 && !ftp_login(host, uuser, pass))) { 1494 warnx("Can't connect or login to host `%s:%s'", 1495 host, port ? 
port : "?"); 1496 goto cleanup_fetch_ftp; 1497 } 1498 1499 switch (transtype) { 1500 case TYPE_A: 1501 setascii(1, xargv); 1502 break; 1503 case TYPE_I: 1504 setbinary(1, xargv); 1505 break; 1506 default: 1507 errx(1, "fetch_ftp: unknown transfer type %d", transtype); 1508 } 1509 1510 /* 1511 * Change directories, if necessary. 1512 * 1513 * Note: don't use EMPTYSTRING(dir) below, because 1514 * dir=="" means something different from dir==NULL. 1515 */ 1516 if (dir != NULL && !dirhasglob) { 1517 char *nextpart; 1518 1519 /* 1520 * If we are dealing with a classic `[user@]host:[path]' 1521 * (urltype is CLASSIC_URL_T) then we have a raw directory 1522 * name (not encoded in any way) and we can change 1523 * directories in one step. 1524 * 1525 * If we are dealing with an `ftp://host/path' URL 1526 * (urltype is FTP_URL_T), then RFC 3986 says we need to 1527 * send a separate CWD command for each unescaped "/" 1528 * in the path, and we have to interpret %hex escaping 1529 * *after* we find the slashes. It's possible to get 1530 * empty components here, (from multiple adjacent 1531 * slashes in the path) and RFC 3986 says that we should 1532 * still do `CWD ' (with a null argument) in such cases. 1533 * 1534 * Many ftp servers don't support `CWD ', so if there's an 1535 * error performing that command, bail out with a descriptive 1536 * message. 
1537 * 1538 * Examples: 1539 * 1540 * host: dir="", urltype=CLASSIC_URL_T 1541 * logged in (to default directory) 1542 * host:file dir=NULL, urltype=CLASSIC_URL_T 1543 * "RETR file" 1544 * host:dir/ dir="dir", urltype=CLASSIC_URL_T 1545 * "CWD dir", logged in 1546 * ftp://host/ dir="", urltype=FTP_URL_T 1547 * logged in (to default directory) 1548 * ftp://host/dir/ dir="dir", urltype=FTP_URL_T 1549 * "CWD dir", logged in 1550 * ftp://host/file dir=NULL, urltype=FTP_URL_T 1551 * "RETR file" 1552 * ftp://host//file dir="", urltype=FTP_URL_T 1553 * "CWD ", "RETR file" 1554 * host:/file dir="/", urltype=CLASSIC_URL_T 1555 * "CWD /", "RETR file" 1556 * ftp://host///file dir="/", urltype=FTP_URL_T 1557 * "CWD ", "CWD ", "RETR file" 1558 * ftp://host/%2F/file dir="%2F", urltype=FTP_URL_T 1559 * "CWD /", "RETR file" 1560 * ftp://host/foo/file dir="foo", urltype=FTP_URL_T 1561 * "CWD foo", "RETR file" 1562 * ftp://host/foo/bar/file dir="foo/bar" 1563 * "CWD foo", "CWD bar", "RETR file" 1564 * ftp://host//foo/bar/file dir="/foo/bar" 1565 * "CWD ", "CWD foo", "CWD bar", "RETR file" 1566 * ftp://host/foo//bar/file dir="foo//bar" 1567 * "CWD foo", "CWD ", "CWD bar", "RETR file" 1568 * ftp://host/%2F/foo/bar/file dir="%2F/foo/bar" 1569 * "CWD /", "CWD foo", "CWD bar", "RETR file" 1570 * ftp://host/%2Ffoo/bar/file dir="%2Ffoo/bar" 1571 * "CWD /foo", "CWD bar", "RETR file" 1572 * ftp://host/%2Ffoo%2Fbar/file dir="%2Ffoo%2Fbar" 1573 * "CWD /foo/bar", "RETR file" 1574 * ftp://host/%2Ffoo%2Fbar%2Ffile dir=NULL 1575 * "RETR /foo/bar/file" 1576 * 1577 * Note that we don't need `dir' after this point. 
1578 */ 1579 do { 1580 if (urltype == FTP_URL_T) { 1581 nextpart = strchr(dir, '/'); 1582 if (nextpart) { 1583 *nextpart = '\0'; 1584 nextpart++; 1585 } 1586 url_decode(dir); 1587 } else 1588 nextpart = NULL; 1589 DPRINTF("fetch_ftp: dir `%s', nextpart `%s'\n", 1590 STRorNULL(dir), STRorNULL(nextpart)); 1591 if (urltype == FTP_URL_T || *dir != '\0') { 1592 (void)strlcpy(cmdbuf, "cd", sizeof(cmdbuf)); 1593 xargv[0] = cmdbuf; 1594 xargv[1] = dir; 1595 xargv[2] = NULL; 1596 dirchange = 0; 1597 cd(2, xargv); 1598 if (! dirchange) { 1599 if (*dir == '\0' && code == 500) 1600 fprintf(stderr, 1601 "\n" 1602 "ftp: The `CWD ' command (without a directory), which is required by\n" 1603 " RFC 3986 to support the empty directory in the URL pathname (`//'),\n" 1604 " conflicts with the server's conformance to RFC 959.\n" 1605 " Try the same URL without the `//' in the URL pathname.\n" 1606 "\n"); 1607 goto cleanup_fetch_ftp; 1608 } 1609 } 1610 dir = nextpart; 1611 } while (dir != NULL); 1612 } 1613 1614 if (EMPTYSTRING(file)) { 1615 rval = -1; 1616 goto cleanup_fetch_ftp; 1617 } 1618 1619 if (dirhasglob) { 1620 (void)strlcpy(rempath, dir, sizeof(rempath)); 1621 (void)strlcat(rempath, "/", sizeof(rempath)); 1622 (void)strlcat(rempath, file, sizeof(rempath)); 1623 file = rempath; 1624 } 1625 1626 /* Fetch the file(s). 
*/ 1627 xargc = 2; 1628 (void)strlcpy(cmdbuf, "get", sizeof(cmdbuf)); 1629 xargv[0] = cmdbuf; 1630 xargv[1] = file; 1631 xargv[2] = NULL; 1632 if (dirhasglob || filehasglob) { 1633 int ointeractive; 1634 1635 ointeractive = interactive; 1636 interactive = 0; 1637 if (restartautofetch) 1638 (void)strlcpy(cmdbuf, "mreget", sizeof(cmdbuf)); 1639 else 1640 (void)strlcpy(cmdbuf, "mget", sizeof(cmdbuf)); 1641 xargv[0] = cmdbuf; 1642 mget(xargc, xargv); 1643 interactive = ointeractive; 1644 } else { 1645 if (outfile == NULL) { 1646 cp = strrchr(file, '/'); /* find savefile */ 1647 if (cp != NULL) 1648 outfile = cp + 1; 1649 else 1650 outfile = file; 1651 } 1652 xargv[2] = (char *)outfile; 1653 xargv[3] = NULL; 1654 xargc++; 1655 if (restartautofetch) 1656 reget(xargc, xargv); 1657 else 1658 get(xargc, xargv); 1659 } 1660 1661 if ((code / 100) == COMPLETE) 1662 rval = 0; 1663 1664 cleanup_fetch_ftp: 1665 FREEPTR(port); 1666 FREEPTR(host); 1667 FREEPTR(path); 1668 FREEPTR(uuser); 1669 if (pass) 1670 memset(pass, 0, strlen(pass)); 1671 FREEPTR(pass); 1672 return (rval); 1673 } 1674 1675 /* 1676 * Retrieve the given file to outfile. 1677 * Supports arguments of the form: 1678 * "host:path", "ftp://host/path" if $ftpproxy, call fetch_url() else 1679 * call fetch_ftp() 1680 * "http://host/path" call fetch_url() to use HTTP 1681 * "file:///path" call fetch_url() to copy 1682 * "about:..." print a message 1683 * 1684 * Returns 1 on failure, 0 on completed xfer, -1 if ftp connection 1685 * is still open (e.g, ftp xfer with trailing /) 1686 */ 1687 static int 1688 go_fetch(const char *url) 1689 { 1690 char *proxyenv; 1691 char *p; 1692 1693 #ifndef NO_ABOUT 1694 /* 1695 * Check for about:* 1696 */ 1697 if (STRNEQUAL(url, ABOUT_URL)) { 1698 url += sizeof(ABOUT_URL) -1; 1699 if (strcasecmp(url, "ftp") == 0 || 1700 strcasecmp(url, "tnftp") == 0) { 1701 fputs( 1702 "This version of ftp has been enhanced by Luke Mewburn <lukem@NetBSD.org>\n" 1703 "for the NetBSD project. 
Execute `man ftp' for more details.\n", ttyout); 1704 } else if (strcasecmp(url, "lukem") == 0) { 1705 fputs( 1706 "Luke Mewburn is the author of most of the enhancements in this ftp client.\n" 1707 "Please email feedback to <lukem@NetBSD.org>.\n", ttyout); 1708 } else if (strcasecmp(url, "netbsd") == 0) { 1709 fputs( 1710 "NetBSD is a freely available and redistributable UNIX-like operating system.\n" 1711 "For more information, see http://www.NetBSD.org/\n", ttyout); 1712 } else if (strcasecmp(url, "version") == 0) { 1713 fprintf(ttyout, "Version: %s %s%s\n", 1714 FTP_PRODUCT, FTP_VERSION, 1715 #ifdef INET6 1716 "" 1717 #else 1718 " (-IPv6)" 1719 #endif 1720 ); 1721 } else { 1722 fprintf(ttyout, "`%s' is an interesting topic.\n", url); 1723 } 1724 fputs("\n", ttyout); 1725 return (0); 1726 } 1727 #endif 1728 1729 /* 1730 * Check for file:// and http:// URLs. 1731 */ 1732 if (STRNEQUAL(url, HTTP_URL) || STRNEQUAL(url, FILE_URL)) 1733 return (fetch_url(url, NULL, NULL, NULL)); 1734 1735 /* 1736 * If it contains "://" but does not begin with ftp:// 1737 * or something that was already handled, then it's 1738 * unsupported. 1739 * 1740 * If it contains ":" but not "://" then we assume the 1741 * part before the colon is a host name, not an URL scheme, 1742 * so we don't try to match that here. 1743 */ 1744 if ((p = strstr(url, "://")) != NULL && ! STRNEQUAL(url, FTP_URL)) 1745 errx(1, "Unsupported URL scheme `%.*s'", (int)(p - url), url); 1746 1747 /* 1748 * Try FTP URL-style and host:file arguments next. 1749 * If ftpproxy is set with an FTP URL, use fetch_url() 1750 * Othewise, use fetch_ftp(). 1751 */ 1752 proxyenv = getoptionvalue("ftp_proxy"); 1753 if (!EMPTYSTRING(proxyenv) && STRNEQUAL(url, FTP_URL)) 1754 return (fetch_url(url, NULL, NULL, NULL)); 1755 1756 return (fetch_ftp(url)); 1757 } 1758 1759 /* 1760 * Retrieve multiple files from the command line, 1761 * calling go_fetch() for each file. 
1762 * 1763 * If an ftp path has a trailing "/", the path will be cd-ed into and 1764 * the connection remains open, and the function will return -1 1765 * (to indicate the connection is alive). 1766 * If an error occurs the return value will be the offset+1 in 1767 * argv[] of the file that caused a problem (i.e, argv[x] 1768 * returns x+1) 1769 * Otherwise, 0 is returned if all files retrieved successfully. 1770 */ 1771 int 1772 auto_fetch(int argc, char *argv[]) 1773 { 1774 volatile int argpos, rval; 1775 1776 argpos = rval = 0; 1777 1778 if (sigsetjmp(toplevel, 1)) { 1779 if (connected) 1780 disconnect(0, NULL); 1781 if (rval > 0) 1782 rval = argpos + 1; 1783 return (rval); 1784 } 1785 (void)xsignal(SIGINT, intr); 1786 (void)xsignal(SIGPIPE, lostpeer); 1787 1788 /* 1789 * Loop through as long as there's files to fetch. 1790 */ 1791 for (; (rval == 0) && (argpos < argc); argpos++) { 1792 if (strchr(argv[argpos], ':') == NULL) 1793 break; 1794 redirect_loop = 0; 1795 if (!anonftp) 1796 anonftp = 2; /* Handle "automatic" transfers. */ 1797 rval = go_fetch(argv[argpos]); 1798 if (outfile != NULL && strcmp(outfile, "-") != 0 1799 && outfile[0] != '|') 1800 outfile = NULL; 1801 if (rval > 0) 1802 rval = argpos + 1; 1803 } 1804 1805 if (connected && rval != -1) 1806 disconnect(0, NULL); 1807 return (rval); 1808 } 1809 1810 1811 /* 1812 * Upload multiple files from the command line. 1813 * 1814 * If an error occurs the return value will be the offset+1 in 1815 * argv[] of the file that caused a problem (i.e, argv[x] 1816 * returns x+1) 1817 * Otherwise, 0 is returned if all files uploaded successfully. 
1818 */ 1819 int 1820 auto_put(int argc, char **argv, const char *uploadserver) 1821 { 1822 char *uargv[4], *path, *pathsep; 1823 int uargc, rval, argpos; 1824 size_t len; 1825 char cmdbuf[MAX_C_NAME]; 1826 1827 (void)strlcpy(cmdbuf, "mput", sizeof(cmdbuf)); 1828 uargv[0] = cmdbuf; 1829 uargv[1] = argv[0]; 1830 uargc = 2; 1831 uargv[2] = uargv[3] = NULL; 1832 pathsep = NULL; 1833 rval = 1; 1834 1835 DPRINTF("auto_put: target `%s'\n", uploadserver); 1836 1837 path = ftp_strdup(uploadserver); 1838 len = strlen(path); 1839 if (path[len - 1] != '/' && path[len - 1] != ':') { 1840 /* 1841 * make sure we always pass a directory to auto_fetch 1842 */ 1843 if (argc > 1) { /* more than one file to upload */ 1844 len = strlen(uploadserver) + 2; /* path + "/" + "\0" */ 1845 free(path); 1846 path = (char *)ftp_malloc(len); 1847 (void)strlcpy(path, uploadserver, len); 1848 (void)strlcat(path, "/", len); 1849 } else { /* single file to upload */ 1850 (void)strlcpy(cmdbuf, "put", sizeof(cmdbuf)); 1851 uargv[0] = cmdbuf; 1852 pathsep = strrchr(path, '/'); 1853 if (pathsep == NULL) { 1854 pathsep = strrchr(path, ':'); 1855 if (pathsep == NULL) { 1856 warnx("Invalid URL `%s'", path); 1857 goto cleanup_auto_put; 1858 } 1859 pathsep++; 1860 uargv[2] = ftp_strdup(pathsep); 1861 pathsep[0] = '/'; 1862 } else 1863 uargv[2] = ftp_strdup(pathsep + 1); 1864 pathsep[1] = '\0'; 1865 uargc++; 1866 } 1867 } 1868 DPRINTF("auto_put: URL `%s' argv[2] `%s'\n", 1869 path, STRorNULL(uargv[2])); 1870 1871 /* connect and cwd */ 1872 rval = auto_fetch(1, &path); 1873 if(rval >= 0) 1874 goto cleanup_auto_put; 1875 1876 rval = 0; 1877 1878 /* target filename provided; upload 1 file */ 1879 /* XXX : is this the best way? 
*/ 1880 if (uargc == 3) { 1881 uargv[1] = argv[0]; 1882 put(uargc, uargv); 1883 if ((code / 100) != COMPLETE) 1884 rval = 1; 1885 } else { /* otherwise a target dir: upload all files to it */ 1886 for(argpos = 0; argv[argpos] != NULL; argpos++) { 1887 uargv[1] = argv[argpos]; 1888 mput(uargc, uargv); 1889 if ((code / 100) != COMPLETE) { 1890 rval = argpos + 1; 1891 break; 1892 } 1893 } 1894 } 1895 1896 cleanup_auto_put: 1897 free(path); 1898 FREEPTR(uargv[2]); 1899 return (rval); 1900 } 1901