X-Git-Url: https://git.librecmc.org/?a=blobdiff_plain;f=networking%2Fwget.c;h=ad1770b5803acb7a9b9a812b0fb3770936b7a5a0;hb=695fa51c80047eb25cc82e6e1630b4545a6bc0b6;hp=6c1c385b7ec4a62853666579efe457e3c5ff7f07;hpb=8c69afd992d7cc6c2fc7dea59c3c2bd3f3c21f15;p=oweals%2Fbusybox.git diff --git a/networking/wget.c b/networking/wget.c index 6c1c385b7..ad1770b58 100644 --- a/networking/wget.c +++ b/networking/wget.c @@ -4,9 +4,8 @@ * * Chip Rosenthal Covad Communications * + * Licensed under GPLv2, see file LICENSE in this tarball for details. */ - -#include /* for struct option */ #include "libbb.h" struct host_info { @@ -25,180 +24,92 @@ struct globals { off_t content_len; /* Content-length of the file */ off_t beg_range; /* Range at which continue begins */ #if ENABLE_FEATURE_WGET_STATUSBAR - off_t lastsize; - off_t totalsize; off_t transferred; /* Number of bytes transferred so far */ const char *curfile; /* Name of current file being transferred */ - unsigned lastupdate_sec; - unsigned start_sec; + bb_progress_t pmt; #endif - smallint chunked; /* chunked transfer encoding */ + smallint chunked; /* chunked transfer encoding */ + smallint got_clen; /* got content-length: from server */ }; #define G (*(struct globals*)&bb_common_bufsiz1) struct BUG_G_too_big { char BUG_G_too_big[sizeof(G) <= COMMON_BUFSIZE ? 1 : -1]; }; -#define content_len (G.content_len ) -#define beg_range (G.beg_range ) -#define lastsize (G.lastsize ) -#define totalsize (G.totalsize ) -#define transferred (G.transferred ) -#define curfile (G.curfile ) -#define lastupdate_sec (G.lastupdate_sec ) -#define start_sec (G.start_sec ) -#define chunked (G.chunked ) #define INIT_G() do { } while (0) #if ENABLE_FEATURE_WGET_STATUSBAR -enum { - STALLTIME = 5 /* Seconds when xfer considered "stalled" */ -}; -static int getttywidth(void) -{ - int width; - get_terminal_width_height(0, &width, NULL); - return width; -} - -static void progressmeter(int flag) +static void progress_meter(int flag) { /* We can be called from signal handler */ int save_errno = errno; - off_t abbrevsize; - unsigned since_last_update, elapsed; - unsigned ratio; - int barlength, i; - - if (flag == -1) { /* first call to progressmeter */ - start_sec = monotonic_sec(); - lastupdate_sec = start_sec; - lastsize = 0; - totalsize = content_len + beg_range; /* as content_len changes.. */ - } - ratio = 100; - if (totalsize != 0 && !chunked) { - /* long long helps to have it working even if !LFS */ - ratio = (unsigned) (100ULL * (transferred+beg_range) / totalsize); - if (ratio > 100) ratio = 100; + if (flag == -1) { /* first call to progress_meter */ + bb_progress_init(&G.pmt); } - fprintf(stderr, "\r%-20.20s%4d%% ", curfile, ratio); - - barlength = getttywidth() - 49; - if (barlength > 0) { - /* god bless gcc for variable arrays :) */ - i = barlength * ratio / 100; - { - char buf[i+1]; - memset(buf, '*', i); - buf[i] = '\0'; - fprintf(stderr, "|%s%*s|", buf, barlength - i, ""); - } - } - i = 0; - abbrevsize = transferred + beg_range; - while (abbrevsize >= 100000) { - i++; - abbrevsize >>= 10; - } - /* see http://en.wikipedia.org/wiki/Tera */ - fprintf(stderr, "%6d%c ", (int)abbrevsize, " kMGTPEZY"[i]); - -// Nuts! Ain't it easier to update progress meter ONLY when we transferred++? - - elapsed = monotonic_sec(); - since_last_update = elapsed - lastupdate_sec; - if (transferred > lastsize) { - lastupdate_sec = elapsed; - lastsize = transferred; - if (since_last_update >= STALLTIME) { - /* We "cut off" these seconds from elapsed time - * by adjusting start time */ - start_sec += since_last_update; - } - since_last_update = 0; /* we are un-stalled now */ - } - elapsed -= start_sec; /* now it's "elapsed since start" */ - - if (since_last_update >= STALLTIME) { - fprintf(stderr, " - stalled -"); - } else { - off_t to_download = totalsize - beg_range; - if (transferred <= 0 || (int)elapsed <= 0 || transferred > to_download || chunked) { - fprintf(stderr, "--:--:-- ETA"); - } else { - /* to_download / (transferred/elapsed) - elapsed: */ - int eta = (int) ((unsigned long long)to_download*elapsed/transferred - elapsed); - /* (long long helps to have working ETA even if !LFS) */ - i = eta % 3600; - fprintf(stderr, "%02d:%02d:%02d ETA", eta / 3600, i / 60, i % 60); - } - } + bb_progress_update(&G.pmt, G.curfile, G.beg_range, G.transferred, + G.chunked ? 0 : G.content_len + G.beg_range); if (flag == 0) { - /* last call to progressmeter */ + /* last call to progress_meter */ alarm(0); - transferred = 0; fputc('\n', stderr); + G.transferred = 0; } else { - if (flag == -1) { - /* first call to progressmeter */ - struct sigaction sa; - sa.sa_handler = progressmeter; - sigemptyset(&sa.sa_mask); - sa.sa_flags = SA_RESTART; - sigaction(SIGALRM, &sa, NULL); + if (flag == -1) { /* first call to progress_meter */ + signal_SA_RESTART_empty_mask(SIGALRM, progress_meter); } alarm(1); } errno = save_errno; } -/* Original copyright notice which applies to the CONFIG_FEATURE_WGET_STATUSBAR stuff, - * much of which was blatantly stolen from openssh. */ -/*- - * Copyright (c) 1992, 1993 - * The Regents of the University of California. All rights reserved. - * - * Redistribution and use in source and binary forms, with or without - * modification, are permitted provided that the following conditions - * are met: - * 1. Redistributions of source code must retain the above copyright - * notice, this list of conditions and the following disclaimer. - * 2. Redistributions in binary form must reproduce the above copyright - * notice, this list of conditions and the following disclaimer in the - * documentation and/or other materials provided with the distribution. - * - * 3. - * - * 4. Neither the name of the University nor the names of its contributors - * may be used to endorse or promote products derived from this software - * without specific prior written permission. - * - * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND - * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE - * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE - * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE - * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL - * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS - * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) - * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT - * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY - * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF - * SUCH DAMAGE. - * - */ + #else /* FEATURE_WGET_STATUSBAR */ -static ALWAYS_INLINE void progressmeter(int flag) { } +static ALWAYS_INLINE void progress_meter(int flag UNUSED_PARAM) { } #endif +/* IPv6 knows scoped address types i.e. link and site local addresses. Link + * local addresses can have a scope identifier to specify the + * interface/link an address is valid on (e.g. fe80::1%eth0). This scope + * identifier is only valid on a single node. + * + * RFC 4007 says that the scope identifier MUST NOT be sent across the wire, + * unless all nodes agree on the semantic. Apache e.g. regards zone identifiers + * in the Host header as invalid requests, see + * https://issues.apache.org/bugzilla/show_bug.cgi?id=35122 + */ +static void strip_ipv6_scope_id(char *host) +{ + char *scope, *cp; + + /* bbox wget actually handles IPv6 addresses without [], like + * wget "http://::1/xxx", but this is not standard. + * To save code, _here_ we do not support it. */ + + if (host[0] != '[') + return; /* not IPv6 */ + + scope = strchr(host, '%'); + if (!scope) + return; + + /* Remove the IPv6 zone identifier from the host address */ + cp = strchr(host, ']'); + if (!cp || (cp[1] != ':' && cp[1] != '\0')) { + /* malformed address (not "[xx]:nn" or "[xx]") */ + return; + } + + /* cp points to "]...", scope points to "%eth0]..." */ + overlapping_strcpy(scope, cp); +} + /* Read NMEMB bytes into PTR from STREAM. Returns the number of bytes read, * and a short count if an eof or non-interrupt error is encountered. */ static size_t safe_fread(void *ptr, size_t nmemb, FILE *stream) @@ -208,6 +119,7 @@ static size_t safe_fread(void *ptr, size_t nmemb, FILE *stream) do { clearerr(stream); + errno = 0; ret = fread(p, 1, nmemb, stream); p += ret; nmemb -= ret; @@ -224,6 +136,7 @@ static char *safe_fgets(char *s, int size, FILE *stream) do { clearerr(stream); + errno = 0; ret = fgets(s, size, stream); } while (ret == NULL && ferror(stream) && errno == EINTR); @@ -242,6 +155,14 @@ static char *base64enc_512(char buf[512], const char *str) } #endif +static char* sanitize_string(char *s) +{ + unsigned char *p = (void *) s; + while (*p >= ' ') + p++; + *p = '\0'; + return s; +} static FILE *open_socket(len_and_sockaddr *lsa) { @@ -256,7 +177,6 @@ static FILE *open_socket(len_and_sockaddr *lsa) return fp; } - static int ftpcmd(const char *s1, const char *s2, FILE *fp, char *buf) { int result; @@ -284,7 +204,6 @@ static int ftpcmd(const char *s1, const char *s2, FILE *fp, char *buf) return result; } - static void parse_url(char *src_url, struct host_info *h) { char *url, *p, *sp; @@ -300,7 +219,7 @@ static void parse_url(char *src_url, struct host_info *h) h->host = url + 6; h->is_ftp = 1; } else - bb_error_msg_and_die("not an http or ftp url: %s", url); + bb_error_msg_and_die("not an http or ftp url: %s", sanitize_string(url)); // FYI: // "Real" wget 'http://busybox.net?var=a/b' sends this request: @@ -332,8 +251,10 @@ static void parse_url(char *src_url, struct host_info *h) h->path = sp; } + // We used to set h->user to NULL here, but this interferes + // with handling of code 302 ("object was moved") + sp = strrchr(h->host, '@'); - h->user = NULL; if (sp != NULL) { h->user = h->host; *sp = '\0'; @@ -343,7 +264,6 @@ static void parse_url(char *src_url, struct host_info *h) sp = h->host; } - static char *gethdr(char *buf, size_t bufsiz, FILE *fp /*, int *istrunc*/) { char *s, *hdrval; @@ -367,7 +287,7 @@ static char *gethdr(char *buf, size_t bufsiz, FILE *fp /*, int *istrunc*/) /* verify we are at the end of the header name */ if (*s != ':') - bb_error_msg_and_die("bad header line: %s", buf); + bb_error_msg_and_die("bad header line: %s", sanitize_string(buf)); /* locate the start of the header value */ *s++ = '\0'; @@ -383,37 +303,224 @@ static char *gethdr(char *buf, size_t bufsiz, FILE *fp /*, int *istrunc*/) return hdrval; } - /* Rats! The buffer isn't big enough to hold the entire header value. */ + /* Rats! The buffer isn't big enough to hold the entire header value */ while (c = getc(fp), c != EOF && c != '\n') continue; /* *istrunc = 1; */ return hdrval; } +#if ENABLE_FEATURE_WGET_LONG_OPTIONS +static char *URL_escape(const char *str) +{ + /* URL encode, see RFC 2396 */ + char *dst; + char *res = dst = xmalloc(strlen(str) * 3 + 1); + unsigned char c; + + while (1) { + c = *str++; + if (c == '\0' + /* || strchr("!&'()*-.=_~", c) - more code */ + || c == '!' + || c == '&' + || c == '\'' + || c == '(' + || c == ')' + || c == '*' + || c == '-' + || c == '.' + || c == '=' + || c == '_' + || c == '~' + || (c >= '0' && c <= '9') + || ((c|0x20) >= 'a' && (c|0x20) <= 'z') + ) { + *dst++ = c; + if (c == '\0') + return res; + } else { + *dst++ = '%'; + *dst++ = bb_hexdigits_upcase[c >> 4]; + *dst++ = bb_hexdigits_upcase[c & 0xf]; + } + } +} +#endif + +static FILE* prepare_ftp_session(FILE **dfpp, struct host_info *target, len_and_sockaddr *lsa) +{ + char buf[512]; + FILE *sfp; + char *str; + int port; + + if (!target->user) + target->user = xstrdup("anonymous:busybox@"); + + sfp = open_socket(lsa); + if (ftpcmd(NULL, NULL, sfp, buf) != 220) + bb_error_msg_and_die("%s", sanitize_string(buf+4)); + + /* + * Splitting username:password pair, + * trying to log in + */ + str = strchr(target->user, ':'); + if (str) + *str++ = '\0'; + switch (ftpcmd("USER ", target->user, sfp, buf)) { + case 230: + break; + case 331: + if (ftpcmd("PASS ", str, sfp, buf) == 230) + break; + /* fall through (failed login) */ + default: + bb_error_msg_and_die("ftp login: %s", sanitize_string(buf+4)); + } + + ftpcmd("TYPE I", NULL, sfp, buf); + + /* + * Querying file size + */ + if (ftpcmd("SIZE ", target->path, sfp, buf) == 213) { + G.content_len = BB_STRTOOFF(buf+4, NULL, 10); + if (G.content_len < 0 || errno) { + bb_error_msg_and_die("SIZE value is garbage"); + } + G.got_clen = 1; + } + + /* + * Entering passive mode + */ + if (ftpcmd("PASV", NULL, sfp, buf) != 227) { + pasv_error: + bb_error_msg_and_die("bad response to %s: %s", "PASV", sanitize_string(buf)); + } + // Response is "227 garbageN1,N2,N3,N4,P1,P2[)garbage] + // Server's IP is N1.N2.N3.N4 (we ignore it) + // Server's port for data connection is P1*256+P2 + str = strrchr(buf, ')'); + if (str) str[0] = '\0'; + str = strrchr(buf, ','); + if (!str) goto pasv_error; + port = xatou_range(str+1, 0, 255); + *str = '\0'; + str = strrchr(buf, ','); + if (!str) goto pasv_error; + port += xatou_range(str+1, 0, 255) * 256; + set_nport(lsa, htons(port)); + + *dfpp = open_socket(lsa); + + if (G.beg_range) { + sprintf(buf, "REST %"OFF_FMT"u", G.beg_range); + if (ftpcmd(buf, NULL, sfp, buf) == 350) + G.content_len -= G.beg_range; + } + + if (ftpcmd("RETR ", target->path, sfp, buf) > 150) + bb_error_msg_and_die("bad response to %s: %s", "RETR", sanitize_string(buf)); + + return sfp; +} + +/* Must match option string! */ +enum { + WGET_OPT_CONTINUE = (1 << 0), + WGET_OPT_SPIDER = (1 << 1), + WGET_OPT_QUIET = (1 << 2), + WGET_OPT_OUTNAME = (1 << 3), + WGET_OPT_PREFIX = (1 << 4), + WGET_OPT_PROXY = (1 << 5), + WGET_OPT_USER_AGENT = (1 << 6), + WGET_OPT_RETRIES = (1 << 7), + WGET_OPT_NETWORK_READ_TIMEOUT = (1 << 8), + WGET_OPT_PASSIVE = (1 << 9), + WGET_OPT_HEADER = (1 << 10) * ENABLE_FEATURE_WGET_LONG_OPTIONS, + WGET_OPT_POST_DATA = (1 << 11) * ENABLE_FEATURE_WGET_LONG_OPTIONS, +}; + +static void NOINLINE retrieve_file_data(FILE *dfp, int output_fd) +{ + char buf[512]; + + if (!(option_mask32 & WGET_OPT_QUIET)) + progress_meter(-1); + + if (G.chunked) + goto get_clen; + + /* Loops only if chunked */ + while (1) { + while (1) { + int n; + unsigned rdsz; + + rdsz = sizeof(buf); + if (G.got_clen) { + if (G.content_len < (off_t)sizeof(buf)) { + if ((int)G.content_len <= 0) + break; + rdsz = (unsigned)G.content_len; + } + } + n = safe_fread(buf, rdsz, dfp); + if (n <= 0) { + if (ferror(dfp)) { + /* perror will not work: ferror doesn't set errno */ + bb_error_msg_and_die(bb_msg_read_error); + } + break; + } + xwrite(output_fd, buf, n); +#if ENABLE_FEATURE_WGET_STATUSBAR + G.transferred += n; +#endif + if (G.got_clen) + G.content_len -= n; + } + + if (!G.chunked) + break; + + safe_fgets(buf, sizeof(buf), dfp); /* This is a newline */ + get_clen: + safe_fgets(buf, sizeof(buf), dfp); + G.content_len = STRTOOFF(buf, NULL, 16); + /* FIXME: error check? */ + if (G.content_len == 0) + break; /* all done! */ + G.got_clen = 1; + } + + if (!(option_mask32 & WGET_OPT_QUIET)) + progress_meter(0); +} int wget_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE; -int wget_main(int argc, char **argv) +int wget_main(int argc UNUSED_PARAM, char **argv) { char buf[512]; struct host_info server, target; len_and_sockaddr *lsa; - int status; - int port; - int try = 5; unsigned opt; - char *str; - char *proxy = 0; + int redir_limit; + char *proxy = NULL; char *dir_prefix = NULL; #if ENABLE_FEATURE_WGET_LONG_OPTIONS + char *post_data; char *extra_headers = NULL; llist_t *headers_llist = NULL; #endif - FILE *sfp = NULL; /* socket to web/ftp server */ + FILE *sfp; /* socket to web/ftp server */ FILE *dfp; /* socket to ftp server (data) */ char *fname_out; /* where to direct output (-O) */ - bool got_clen = 0; /* got content-length: from server */ int output_fd = -1; - bool use_proxy = 1; /* Use proxies if env vars are set */ + bool use_proxy; /* Use proxies if env vars are set */ const char *proxy_flag = "on"; /* Use proxies if env vars are set */ const char *user_agent = "Wget";/* "User-Agent" header field */ @@ -422,17 +529,6 @@ int wget_main(int argc, char **argv) enum { KEY_content_length = 1, KEY_transfer_encoding, KEY_chunked, KEY_location }; - enum { - WGET_OPT_CONTINUE = 0x1, - WGET_OPT_SPIDER = 0x2, - WGET_OPT_QUIET = 0x4, - WGET_OPT_OUTNAME = 0x8, - WGET_OPT_PREFIX = 0x10, - WGET_OPT_PROXY = 0x20, - WGET_OPT_USER_AGENT = 0x40, - WGET_OPT_PASSIVE = 0x80, - WGET_OPT_HEADER = 0x100, - }; #if ENABLE_FEATURE_WGET_LONG_OPTIONS static const char wget_longopts[] ALIGN1 = /* name, has_arg, val */ @@ -443,8 +539,13 @@ int wget_main(int argc, char **argv) "directory-prefix\0" Required_argument "P" "proxy\0" Required_argument "Y" "user-agent\0" Required_argument "U" + /* Ignored: */ + // "tries\0" Required_argument "t" + // "timeout\0" Required_argument "T" + /* Ignored (we always use PASV): */ "passive-ftp\0" No_argument "\xff" "header\0" Required_argument "\xfe" + "post-data\0" Required_argument "\xfd" ; #endif @@ -454,16 +555,15 @@ int wget_main(int argc, char **argv) applet_long_options = wget_longopts; #endif /* server.allocated = target.allocated = NULL; */ - opt_complementary = "-1" USE_FEATURE_WGET_LONG_OPTIONS(":\xfe::"); - opt = getopt32(argv, "csqO:P:Y:U:", + opt_complementary = "-1" IF_FEATURE_WGET_LONG_OPTIONS(":\xfe::"); + opt = getopt32(argv, "csqO:P:Y:U:" /*ignored:*/ "t:T:", &fname_out, &dir_prefix, - &proxy_flag, &user_agent - USE_FEATURE_WGET_LONG_OPTIONS(, &headers_llist) + &proxy_flag, &user_agent, + NULL, /* -t RETRIES */ + NULL /* -T NETWORK_READ_TIMEOUT */ + IF_FEATURE_WGET_LONG_OPTIONS(, &headers_llist) + IF_FEATURE_WGET_LONG_OPTIONS(, &post_data) ); - if (strcmp(proxy_flag, "off") == 0) { - /* Use the proxy if necessary */ - use_proxy = 0; - } #if ENABLE_FEATURE_WGET_LONG_OPTIONS if (headers_llist) { int size = 1; @@ -475,25 +575,37 @@ int wget_main(int argc, char **argv) } extra_headers = cp = xmalloc(size); while (headers_llist) { - cp += sprintf(cp, "%s\r\n", headers_llist->data); - headers_llist = headers_llist->link; + cp += sprintf(cp, "%s\r\n", (char*)llist_pop(&headers_llist)); } } #endif + /* TODO: compat issue: should handle "wget URL1 URL2..." */ + + target.user = NULL; parse_url(argv[optind], &target); - server.host = target.host; - server.port = target.port; /* Use the proxy if necessary */ + use_proxy = (strcmp(proxy_flag, "off") != 0); if (use_proxy) { proxy = getenv(target.is_ftp ? "ftp_proxy" : "http_proxy"); - if (proxy && *proxy) { + if (proxy && proxy[0]) { parse_url(proxy, &server); } else { use_proxy = 0; } } + if (!use_proxy) { + server.port = target.port; + if (ENABLE_FEATURE_IPV6) { + server.host = xstrdup(target.host); + } else { + server.host = target.host; + } + } + + if (ENABLE_FEATURE_IPV6) + strip_ipv6_scope_id(target.host); /* Guess an output filename, if there was no -O FILE */ if (!(opt & WGET_OPT_OUTNAME)) { @@ -512,227 +624,209 @@ int wget_main(int argc, char **argv) } } #if ENABLE_FEATURE_WGET_STATUSBAR - curfile = bb_get_last_path_component_nostrip(fname_out); + G.curfile = bb_get_last_path_component_nostrip(fname_out); #endif /* Impossible? if ((opt & WGET_OPT_CONTINUE) && !fname_out) - bb_error_msg_and_die("cannot specify continue (-c) without a filename (-O)"); */ + bb_error_msg_and_die("can't specify continue (-c) without a filename (-O)"); + */ /* Determine where to start transfer */ if (opt & WGET_OPT_CONTINUE) { output_fd = open(fname_out, O_WRONLY); if (output_fd >= 0) { - beg_range = xlseek(output_fd, 0, SEEK_END); + G.beg_range = xlseek(output_fd, 0, SEEK_END); } /* File doesn't exist. We do not create file here yet. - We are not sure it exists on remove side */ + * We are not sure it exists on remove side */ } - /* We want to do exactly _one_ DNS lookup, since some - * sites (i.e. ftp.us.debian.org) use round-robin DNS - * and we want to connect to only one IP... */ + redir_limit = 5; + resolve_lsa: lsa = xhost2sockaddr(server.host, server.port); if (!(opt & WGET_OPT_QUIET)) { - fprintf(stderr, "Connecting to %s (%s)\n", server.host, - xmalloc_sockaddr2dotted(&lsa->u.sa)); - /* We leak result of xmalloc_sockaddr2dotted */ + char *s = xmalloc_sockaddr2dotted(&lsa->u.sa); + fprintf(stderr, "Connecting to %s (%s)\n", server.host, s); + free(s); } - + establish_session: if (use_proxy || !target.is_ftp) { /* * HTTP session */ - do { - got_clen = 0; - chunked = 0; - - if (!--try) - bb_error_msg_and_die("too many redirections"); - - /* Open socket to http server */ - if (sfp) fclose(sfp); - sfp = open_socket(lsa); - - /* Send HTTP request. */ - if (use_proxy) { - fprintf(sfp, "GET %stp://%s/%s HTTP/1.1\r\n", - target.is_ftp ? "f" : "ht", target.host, - target.path); - } else { + char *str; + int status; + + /* Open socket to http server */ + sfp = open_socket(lsa); + + /* Send HTTP request */ + if (use_proxy) { + fprintf(sfp, "GET %stp://%s/%s HTTP/1.1\r\n", + target.is_ftp ? "f" : "ht", target.host, + target.path); + } else { + if (opt & WGET_OPT_POST_DATA) + fprintf(sfp, "POST /%s HTTP/1.1\r\n", target.path); + else fprintf(sfp, "GET /%s HTTP/1.1\r\n", target.path); - } + } - fprintf(sfp, "Host: %s\r\nUser-Agent: %s\r\n", - target.host, user_agent); + fprintf(sfp, "Host: %s\r\nUser-Agent: %s\r\n", + target.host, user_agent); #if ENABLE_FEATURE_WGET_AUTHENTICATION - if (target.user) { - fprintf(sfp, "Proxy-Authorization: Basic %s\r\n"+6, - base64enc_512(buf, target.user)); - } - if (use_proxy && server.user) { - fprintf(sfp, "Proxy-Authorization: Basic %s\r\n", - base64enc_512(buf, server.user)); - } + if (target.user) { + fprintf(sfp, "Proxy-Authorization: Basic %s\r\n"+6, + base64enc_512(buf, target.user)); + } + if (use_proxy && server.user) { + fprintf(sfp, "Proxy-Authorization: Basic %s\r\n", + base64enc_512(buf, server.user)); + } #endif - if (beg_range) - fprintf(sfp, "Range: bytes=%"OFF_FMT"d-\r\n", beg_range); + if (G.beg_range) + fprintf(sfp, "Range: bytes=%"OFF_FMT"u-\r\n", G.beg_range); #if ENABLE_FEATURE_WGET_LONG_OPTIONS - if (extra_headers) - fputs(extra_headers, sfp); + if (extra_headers) + fputs(extra_headers, sfp); + + if (opt & WGET_OPT_POST_DATA) { + char *estr = URL_escape(post_data); + fprintf(sfp, "Content-Type: application/x-www-form-urlencoded\r\n"); + fprintf(sfp, "Content-Length: %u\r\n" "\r\n" "%s", + (int) strlen(estr), estr); + /*fprintf(sfp, "Connection: Keep-Alive\r\n\r\n");*/ + /*fprintf(sfp, "%s\r\n", estr);*/ + free(estr); + } else #endif - fprintf(sfp, "Connection: close\r\n\r\n"); - - /* - * Retrieve HTTP response line and check for "200" status code. - */ - read_response: - if (fgets(buf, sizeof(buf), sfp) == NULL) - bb_error_msg_and_die("no response from server"); - - str = buf; - str = skip_non_whitespace(str); - str = skip_whitespace(str); - // FIXME: no error check - // xatou wouldn't work: "200 OK" - status = atoi(str); - switch (status) { - case 0: - case 100: - while (gethdr(buf, sizeof(buf), sfp /*, &n*/) != NULL) - /* eat all remaining headers */; - goto read_response; - case 200: - break; - case 300: /* redirection */ - case 301: - case 302: - case 303: - break; - case 206: - if (beg_range) - break; - /*FALLTHRU*/ - default: - /* Show first line only and kill any ESC tricks */ - buf[strcspn(buf, "\n\r\x1b")] = '\0'; - bb_error_msg_and_die("server returned error: %s", buf); - } - - /* - * Retrieve HTTP headers. - */ - while ((str = gethdr(buf, sizeof(buf), sfp /*, &n*/)) != NULL) { - /* gethdr did already convert the "FOO:" string to lowercase */ - smalluint key = index_in_strings(keywords, *&buf) + 1; - if (key == KEY_content_length) { - content_len = BB_STRTOOFF(str, NULL, 10); - if (errno || content_len < 0) { - bb_error_msg_and_die("content-length %s is garbage", str); - } - got_clen = 1; - continue; - } - if (key == KEY_transfer_encoding) { - if (index_in_strings(keywords, str_tolower(str)) + 1 != KEY_chunked) - bb_error_msg_and_die("transfer encoding '%s' is not supported", str); - chunked = got_clen = 1; - } - if (key == KEY_location) { - if (str[0] == '/') - /* free(target.allocated); */ - target.path = /* target.allocated = */ xstrdup(str+1); - else { - parse_url(str, &target); - if (use_proxy == 0) { - server.host = target.host; - server.port = target.port; - } - free(lsa); - lsa = xhost2sockaddr(server.host, server.port); - break; - } - } - } - } while (status >= 300); - - dfp = sfp; - - } else { - - /* - * FTP session - */ - if (!target.user) - target.user = xstrdup("anonymous:busybox@"); - - sfp = open_socket(lsa); - if (ftpcmd(NULL, NULL, sfp, buf) != 220) - bb_error_msg_and_die("%s", buf+4); + { /* If "Connection:" is needed, document why */ + fprintf(sfp, /* "Connection: close\r\n" */ "\r\n"); + } /* - * Splitting username:password pair, - * trying to log in + * Retrieve HTTP response line and check for "200" status code. */ - str = strchr(target.user, ':'); - if (str) - *(str++) = '\0'; - switch (ftpcmd("USER ", target.user, sfp, buf)) { - case 230: + read_response: + if (fgets(buf, sizeof(buf), sfp) == NULL) + bb_error_msg_and_die("no response from server"); + + str = buf; + str = skip_non_whitespace(str); + str = skip_whitespace(str); + // FIXME: no error check + // xatou wouldn't work: "200 OK" + status = atoi(str); + switch (status) { + case 0: + case 100: + while (gethdr(buf, sizeof(buf), sfp /*, &n*/) != NULL) + /* eat all remaining headers */; + goto read_response; + case 200: +/* +Response 204 doesn't say "null file", it says "metadata +has changed but data didn't": + +"10.2.5 204 No Content +The server has fulfilled the request but does not need to return +an entity-body, and might want to return updated metainformation. +The response MAY include new or updated metainformation in the form +of entity-headers, which if present SHOULD be associated with +the requested variant. + +If the client is a user agent, it SHOULD NOT change its document +view from that which caused the request to be sent. This response +is primarily intended to allow input for actions to take place +without causing a change to the user agent's active document view, +although any new or updated metainformation SHOULD be applied +to the document currently in the user agent's active view. + +The 204 response MUST NOT include a message-body, and thus +is always terminated by the first empty line after the header fields." + +However, in real world it was observed that some web servers +(e.g. Boa/0.94.14rc21) simply use code 204 when file size is zero. +*/ + case 204: break; - case 331: - if (ftpcmd("PASS ", str, sfp, buf) == 230) + case 300: /* redirection */ + case 301: + case 302: + case 303: + break; + case 206: + if (G.beg_range) break; - /* FALLTHRU (failed login) */ + /* fall through */ default: - bb_error_msg_and_die("ftp login: %s", buf+4); + bb_error_msg_and_die("server returned error: %s", sanitize_string(buf)); } - ftpcmd("TYPE I", NULL, sfp, buf); - /* - * Querying file size + * Retrieve HTTP headers. */ - if (ftpcmd("SIZE ", target.path, sfp, buf) == 213) { - content_len = BB_STRTOOFF(buf+4, NULL, 10); - if (errno || content_len < 0) { - bb_error_msg_and_die("SIZE value is garbage"); + while ((str = gethdr(buf, sizeof(buf), sfp /*, &n*/)) != NULL) { + /* gethdr converted "FOO:" string to lowercase */ + smalluint key; + /* strip trailing whitespace */ + char *s = strchrnul(str, '\0') - 1; + while (s >= str && (*s == ' ' || *s == '\t')) { + *s = '\0'; + s--; + } + key = index_in_strings(keywords, buf) + 1; + if (key == KEY_content_length) { + G.content_len = BB_STRTOOFF(str, NULL, 10); + if (G.content_len < 0 || errno) { + bb_error_msg_and_die("content-length %s is garbage", sanitize_string(str)); + } + G.got_clen = 1; + continue; + } + if (key == KEY_transfer_encoding) { + if (index_in_strings(keywords, str_tolower(str)) + 1 != KEY_chunked) + bb_error_msg_and_die("transfer encoding '%s' is not supported", sanitize_string(str)); + G.chunked = G.got_clen = 1; + } + if (key == KEY_location && status >= 300) { + if (--redir_limit == 0) + bb_error_msg_and_die("too many redirections"); + fclose(sfp); + G.got_clen = 0; + G.chunked = 0; + if (str[0] == '/') + /* free(target.allocated); */ + target.path = /* target.allocated = */ xstrdup(str+1); + /* lsa stays the same: it's on the same server */ + else { + parse_url(str, &target); + if (!use_proxy) { + server.host = target.host; + /* strip_ipv6_scope_id(target.host); - no! */ + /* we assume remote never gives us IPv6 addr with scope id */ + server.port = target.port; + free(lsa); + goto resolve_lsa; + } /* else: lsa stays the same: we use proxy */ + } + goto establish_session; } - got_clen = 1; } +// if (status >= 300) +// bb_error_msg_and_die("bad redirection (no Location: header from server)"); + + /* For HTTP, data is pumped over the same connection */ + dfp = sfp; + } else { /* - * Entering passive mode + * FTP session */ - if (ftpcmd("PASV", NULL, sfp, buf) != 227) { - pasv_error: - bb_error_msg_and_die("bad response to %s: %s", "PASV", buf); - } - // Response is "227 garbageN1,N2,N3,N4,P1,P2[)garbage] - // Server's IP is N1.N2.N3.N4 (we ignore it) - // Server's port for data connection is P1*256+P2 - str = strrchr(buf, ')'); - if (str) str[0] = '\0'; - str = strrchr(buf, ','); - if (!str) goto pasv_error; - port = xatou_range(str+1, 0, 255); - *str = '\0'; - str = strrchr(buf, ','); - if (!str) goto pasv_error; - port += xatou_range(str+1, 0, 255) * 256; - set_nport(lsa, htons(port)); - dfp = open_socket(lsa); - - if (beg_range) { - sprintf(buf, "REST %"OFF_FMT"d", beg_range); - if (ftpcmd(buf, NULL, sfp, buf) == 350) - content_len -= beg_range; - } - - if (ftpcmd("RETR ", target.path, sfp, buf) > 150) - bb_error_msg_and_die("bad response to %s: %s", "RETR", buf); + sfp = prepare_ftp_session(&dfp, &target, lsa); } if (opt & WGET_OPT_SPIDER) { @@ -741,11 +835,6 @@ int wget_main(int argc, char **argv) return EXIT_SUCCESS; } - /* - * Retrieve file - */ - - /* Do it before progressmeter (want to have nice error message) */ if (output_fd < 0) { int o_flags = O_WRONLY | O_CREAT | O_TRUNC | O_EXCL; /* compat with wget: -O FILE can overwrite */ @@ -754,56 +843,15 @@ int wget_main(int argc, char **argv) output_fd = xopen(fname_out, o_flags); } - if (!(opt & WGET_OPT_QUIET)) - progressmeter(-1); - - if (chunked) - goto get_clen; - - /* Loops only if chunked */ - while (1) { - while (content_len > 0 || !got_clen) { - int n; - unsigned rdsz = sizeof(buf); - - if (content_len < sizeof(buf) && (chunked || got_clen)) - rdsz = (unsigned)content_len; - n = safe_fread(buf, rdsz, dfp); - if (n <= 0) { - if (ferror(dfp)) { - /* perror will not work: ferror doesn't set errno */ - bb_error_msg_and_die(bb_msg_read_error); - } - break; - } - xwrite(output_fd, buf, n); -#if ENABLE_FEATURE_WGET_STATUSBAR - transferred += n; -#endif - if (got_clen) - content_len -= n; - } - - if (!chunked) - break; - - safe_fgets(buf, sizeof(buf), dfp); /* This is a newline */ - get_clen: - safe_fgets(buf, sizeof(buf), dfp); - content_len = STRTOOFF(buf, NULL, 16); - /* FIXME: error check? */ - if (content_len == 0) - break; /* all done! */ - } - - if (!(opt & WGET_OPT_QUIET)) - progressmeter(0); + retrieve_file_data(dfp, output_fd); + xclose(output_fd); - if ((use_proxy == 0) && target.is_ftp) { + if (dfp != sfp) { + /* It's ftp. Close it properly */ fclose(dfp); if (ftpcmd(NULL, NULL, sfp, buf) != 226) - bb_error_msg_and_die("ftp error: %s", buf+4); - ftpcmd("QUIT", NULL, sfp, buf); + bb_error_msg_and_die("ftp error: %s", sanitize_string(buf+4)); + /* ftpcmd("QUIT", NULL, sfp, buf); - why bother? */ } return EXIT_SUCCESS;