Small size optimization from Aaron Lehmann
[oweals/busybox.git] / wget.c
diff --git a/wget.c b/wget.c
index 5bec0ddd5a918dd9d5a31a981e665ee0b56395bd..59373d1d913759728ff02e6e38f189481c2ad434 100644 (file)
--- a/wget.c
+++ b/wget.c
@@ -4,14 +4,6 @@
  *
  * Chip Rosenthal Covad Communications <chip@laserlink.net>
  *
- * Note: According to RFC2616 section 3.6.1, "All HTTP/1.1 applications MUST be
- * able to receive and decode the "chunked" transfer-coding, and MUST ignore
- * chunk-extension extensions they do not understand."  
- *
- * This prevents this particular wget app from completely RFC compliant, and as
- * such, prevents it from being used as a general purpose web browser...  This
- * is a design decision, since it makes the code smaller.
- *
  */
 
 #include <stdio.h>
 #include <arpa/inet.h>
 #include <netdb.h>
 
+#ifndef _GNU_SOURCE
+#define _GNU_SOURCE
+#endif
+#include <getopt.h>
+
 #include "busybox.h"
 
 /* Stupid libc5 doesn't define this... */
@@ -59,14 +56,15 @@ static void parse_url(char *url, struct host_info *h);
 static FILE *open_socket(char *host, int port);
 static char *gethdr(char *buf, size_t bufsiz, FILE *fp, int *istrunc);
 static int ftpcmd(char *s1, char *s2, FILE *fp, char *buf);
-static void progressmeter(int flag);
 
 /* Globals (can be accessed from signal handlers */
 static off_t filesize = 0;             /* content-length of the file */
+static int chunked = 0;                        /* chunked transfer encoding */
 #ifdef BB_FEATURE_WGET_STATUSBAR
+static void progressmeter(int flag);
 static char *curfile;                  /* Name of current file being transferred. */
 static struct timeval start;   /* Time a transfer started. */
-static volatile unsigned long statbytes; /* Number of bytes transferred so far. */
+static volatile unsigned long statbytes = 0; /* Number of bytes transferred so far. */
 /* For progressmeter() -- number of seconds before xfer considered "stalled" */
 static const int STALLTIME = 5;
 #endif
@@ -79,6 +77,50 @@ static void close_and_delete_outfile(FILE* output, char *fname_out, int do_conti
        }
 }
 
+/* Read up to NMEMB elements of SIZE bytes each from STREAM into PTR, retrying
+ * while fread() fails with errno == EINTR.  Returns the number of elements read,
+ * which is short of NMEMB on end-of-file or any other (non-EINTR) error.  */
+static size_t safe_fread(void *ptr, size_t size, size_t nmemb, FILE *stream)
+{
+       size_t ret = 0; /* elements read so far, accumulated across retries */
+
+       do {
+               clearerr(stream); /* reset EOF/error flags so ferror() below reflects this attempt only */
+               ret += fread((char *)ptr + (ret * size), size, nmemb - ret, stream);
+       } while (ret < nmemb && ferror(stream) && errno == EINTR); /* NOTE(review): errno is not cleared before the call; relies on fread() setting it */
+
+       return ret;
+}
+
+/* Write up to NMEMB elements of SIZE bytes each from PTR to STREAM, retrying
+ * while fwrite() fails with errno == EINTR.  Returns the number of elements
+ * written, which is short of NMEMB if fwrite() stops for any other reason.  */
+static size_t safe_fwrite(void *ptr, size_t size, size_t nmemb, FILE *stream)
+{
+       size_t ret = 0; /* elements written so far, accumulated across retries */
+
+       do {
+               clearerr(stream); /* reset error flag so ferror() below reflects this attempt only */
+               ret += fwrite((char *)ptr + (ret * size), size, nmemb - ret, stream);
+       } while (ret < nmemb && ferror(stream) && errno == EINTR); /* resume after the elements already written */
+
+       return ret;
+}
+
+/* Read one line, or at most SIZE - 1 bytes, from STREAM into S, retrying while
+ * fgets() fails with errno == EINTR.  Returns S, or NULL on EOF or any other error.  */
+static char *safe_fgets(char *s, int size, FILE *stream)
+{
+       char *ret; /* result of the latest fgets() call: S or NULL */
+
+       do {
+               clearerr(stream); /* reset EOF/error flags so ferror() below reflects this attempt only */
+               ret = fgets(s, size, stream);
+       } while (ret == NULL && ferror(stream) && errno == EINTR); /* each retry starts again at the beginning of S */
+
+       return ret;
+}
+
 #define close_delete_and_die(s...) { \
        close_and_delete_outfile(output, fname_out, do_continue); \
        error_msg_and_die(s); }
@@ -118,9 +160,13 @@ int wget_main(int argc, char **argv)
        int n, try=5, status;
        int port;
        char *proxy;
+       char *dir_prefix=NULL;
        char *s, buf[512];
        struct stat sbuf;
-
+       char extra_headers[1024];
+       char *extra_headers_ptr = extra_headers;
+       int extra_headers_left = sizeof(extra_headers);
+       int which_long_opt = 0, option_index = -1;
        struct host_info server, target;
 
        FILE *sfp = NULL;                       /* socket to web/ftp server                     */
@@ -132,14 +178,25 @@ int wget_main(int argc, char **argv)
        FILE *output;                           /* socket to web server                         */
        int quiet_flag = FALSE;         /* Be verry, verry quiet...                     */
 
+#define LONG_HEADER    1
+       struct option long_options[] = {
+               { "continue",           0, NULL, 'c' },
+               { "quiet",              0, NULL, 'q' },
+               { "output-document",    1, NULL, 'O' },
+               { "header",             1, &which_long_opt, LONG_HEADER },
+               { 0,                    0, 0, 0 }
+       };
        /*
         * Crack command line.
         */
-       while ((n = getopt(argc, argv, "cqO:")) != EOF) {
+       while ((n = getopt_long(argc, argv, "cqO:P:", long_options, &option_index)) != EOF) {
                switch (n) {
                case 'c':
                        ++do_continue;
                        break;
+               case 'P':
+                       dir_prefix = optarg;
+                       break;
                case 'q':
                        quiet_flag = TRUE;
                        break;
@@ -148,7 +205,23 @@ int wget_main(int argc, char **argv)
                         * this gets interpreted as the auto-gen output filename
                         * case below  - tausq@debian.org
                         */
-                       fname_out = (strcmp(optarg, "-") == 0 ? (char *)1 : optarg);
+                       fname_out = optarg;
+                       break;
+               case 0:
+                       switch (which_long_opt) {
+                               case LONG_HEADER: {
+                                       int arglen = strlen(optarg);
+                                       if(extra_headers_left - arglen - 2 <= 0)
+                                               error_msg_and_die("extra_headers buffer too small(need %i)", extra_headers_left - arglen);
+                                       strcpy(extra_headers_ptr, optarg);
+                                       extra_headers_ptr += arglen;
+                                       extra_headers_left -= ( arglen + 2 );
+                                       *extra_headers_ptr++ = '\r';
+                                       *extra_headers_ptr++ = '\n';
+                                       *(extra_headers_ptr + 1) = 0;
+                                       break;
+                               }
+                       }
                        break;
                default:
                        show_usage();
@@ -183,6 +256,8 @@ int wget_main(int argc, char **argv)
 #endif
                                "index.html";
                }
+               if (dir_prefix != NULL)
+                       fname_out = concat_path_file(dir_prefix, fname_out);
 #ifdef BB_FEATURE_WGET_STATUSBAR
        } else {
                curfile = get_last_path_component(fname_out);
@@ -195,10 +270,11 @@ int wget_main(int argc, char **argv)
        /*
         * Open the output file stream.
         */
-       if (fname_out != (char *)1) {
-               output = xfopen( fname_out, (do_continue ? "a" : "w") );
-       } else {
+       if (strcmp(fname_out, "-") == 0) {
                output = stdout;
+               quiet_flag = TRUE;
+       } else {
+               output = xfopen(fname_out, (do_continue ? "a" : "w"));
        }
 
        /*
@@ -231,11 +307,11 @@ int wget_main(int argc, char **argv)
                         * Send HTTP request.
                         */
                        if (proxy) {
-                               fprintf(sfp, "GET %stp://%s:%d/%s HTTP/1.0\r\n", 
+                               fprintf(sfp, "GET %stp://%s:%d/%s HTTP/1.1\r\n",
                                        target.is_ftp ? "f" : "ht", target.host,
                                        target.port, target.path);
                        } else {
-                               fprintf(sfp, "GET /%s HTTP/1.0\r\n", target.path);
+                               fprintf(sfp, "GET /%s HTTP/1.1\r\n", target.path);
                        }
 
                        fprintf(sfp, "Host: %s\r\nUser-Agent: Wget\r\n", target.host);
@@ -253,12 +329,14 @@ int wget_main(int argc, char **argv)
 
                        if (do_continue)
                                fprintf(sfp, "Range: bytes=%ld-\r\n", beg_range);
+                       if(extra_headers_left < sizeof(extra_headers))
+                               fputs(extra_headers,sfp);
                        fprintf(sfp,"Connection: close\r\n\r\n");
 
                        /*
                        * Retrieve HTTP response line and check for "200" status code.
                        */
-                       if (fgets(buf, sizeof(buf), sfp) == NULL)
+read_response:         if (fgets(buf, sizeof(buf), sfp) == NULL)
                                close_delete_and_die("no response from server");
                                
                        for (s = buf ; *s != '\0' && !isspace(*s) ; ++s)
@@ -267,6 +345,9 @@ int wget_main(int argc, char **argv)
                        ;
                        switch (status = atoi(s)) {
                                case 0:
+                               case 100:
+                                       while (gethdr(buf, sizeof(buf), sfp, &n) != NULL);
+                                       goto read_response;
                                case 200:
                                        if (do_continue && output != stdout)
                                                output = freopen(fname_out, "w", output);
@@ -295,9 +376,13 @@ int wget_main(int argc, char **argv)
                                        got_clen = 1;
                                        continue;
                                }
-                               if (strcasecmp(buf, "transfer-encoding") == 0)
+                               if (strcasecmp(buf, "transfer-encoding") == 0) {
+                                       if (strcasecmp(s, "chunked") == 0) {
+                                               chunked = got_clen = 1;
+                                       } else {
                                        close_delete_and_die("server wants to do %s transfer encoding", s);
-
+                                       }
+                               }
                                if (strcasecmp(buf, "location") == 0) {
                                        if (s[0] == '/')
                                                target.path = xstrdup(s+1);
@@ -386,32 +471,44 @@ int wget_main(int argc, char **argv)
        /*
         * Retrieve file
         */
+       if (chunked) {
+               fgets(buf, sizeof(buf), dfp);
+               filesize = strtol(buf, (char **) NULL, 16);
+       }
 #ifdef BB_FEATURE_WGET_STATUSBAR
-       statbytes=0;
        if (quiet_flag==FALSE)
                progressmeter(-1);
 #endif
-       while ((filesize > 0 || !got_clen) && (n = fread(buf, 1, sizeof(buf), dfp)) > 0) {
-               fwrite(buf, 1, n, output);
+       do {
+               while ((filesize > 0 || !got_clen) && (n = safe_fread(buf, 1, chunked ? (filesize > sizeof(buf) ? sizeof(buf) : filesize) : sizeof(buf), dfp)) > 0) {
+               safe_fwrite(buf, 1, n, output);
 #ifdef BB_FEATURE_WGET_STATUSBAR
                statbytes+=n;
-               if (quiet_flag==FALSE)
-                       progressmeter(1);
 #endif
                if (got_clen)
                        filesize -= n;
        }
 
+               if (chunked) {
+                       safe_fgets(buf, sizeof(buf), dfp); /* This is a newline */
+                       safe_fgets(buf, sizeof(buf), dfp);
+                       filesize = strtol(buf, (char **) NULL, 16);
+                       if (filesize==0) chunked = 0; /* all done! */
+               }
+
        if (n == 0 && ferror(dfp))
                perror_msg_and_die("network read error");
-
+       } while (chunked);
+#ifdef BB_FEATURE_WGET_STATUSBAR
+       if (quiet_flag==FALSE)
+               progressmeter(1);
+#endif
        if (!proxy && target.is_ftp) {
                fclose(dfp);
                if (ftpcmd(NULL, NULL, sfp, buf) != 226)
                        error_msg_and_die("ftp error: %s", buf+4);
                ftpcmd("QUIT", NULL, sfp, buf);
        }
-
        exit(EXIT_SUCCESS);
 }
 
@@ -464,8 +561,7 @@ FILE *open_socket(char *host, int port)
 
        memset(&s_in, 0, sizeof(s_in));
        s_in.sin_family = AF_INET;
-       if ((hp = (struct hostent *) gethostbyname(host)) == NULL)
-               error_msg_and_die("cannot resolve %s", host);
+       hp = xgethostbyname(host);
        memcpy(&s_in.sin_addr, hp->h_addr_list[0], hp->h_length);
        s_in.sin_port = htons(port);
 
@@ -593,7 +689,7 @@ progressmeter(int flag)
 {
        static const char prefixes[] = " KMGTP";
        static struct timeval lastupdate;
-       static off_t lastsize;
+       static off_t lastsize, totalsize;
        struct timeval now, td, wait;
        off_t cursize, abbrevsize;
        double elapsed;
@@ -604,12 +700,13 @@ progressmeter(int flag)
                (void) gettimeofday(&start, (struct timezone *) 0);
                lastupdate = start;
                lastsize = 0;
+               totalsize = filesize; /* as filesize changes.. */
        }
 
        (void) gettimeofday(&now, (struct timezone *) 0);
        cursize = statbytes;
-       if (filesize != 0) {
-               ratio = 100.0 * cursize / filesize;
+       if (totalsize != 0 && !chunked) {
+               ratio = 100.0 * cursize / totalsize;
                ratio = MAX(ratio, 0);
                ratio = MIN(ratio, 100);
        } else
@@ -649,14 +746,14 @@ progressmeter(int flag)
        timersub(&now, &start, &td);
        elapsed = td.tv_sec + (td.tv_usec / 1000000.0);
 
-       if (statbytes <= 0 || elapsed <= 0.0 || cursize > filesize) {
-               snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf),
-                        "   --:-- ETA");
-       } else if (wait.tv_sec >= STALLTIME) {
+       if (wait.tv_sec >= STALLTIME) {
                snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf),
                         " - stalled -");
+       } else if (statbytes <= 0 || elapsed <= 0.0 || cursize > totalsize || chunked) {
+               snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf),
+                        "   --:-- ETA");
        } else {
-               remaining = (int) (filesize / (statbytes / elapsed) - elapsed);
+               remaining = (int) (totalsize / (statbytes / elapsed) - elapsed);
                i = remaining / 3600;
                if (i)
                        snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf),
@@ -680,6 +777,7 @@ progressmeter(int flag)
        } else if (flag == 1) {
                alarmtimer(0);
                statbytes = 0;
+               putc('\n', stderr);
        }
 }
 #endif
@@ -719,7 +817,7 @@ progressmeter(int flag)
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
- *     $Id: wget.c,v 1.31 2001/04/05 21:45:53 andersen Exp $
+ *     $Id: wget.c,v 1.45 2001/07/19 22:28:01 andersen Exp $
  */