/* vi: set sw=4 ts=4: */
/*
* split - split a file into pieces
- * Copyright (c) 2007 Bernhard Fischer
+ * Copyright (c) 2007 Bernhard Reutner-Fischer
*
- * Licensed under GPLv2 or later, see file LICENSE in this tarball for details.
+ * Licensed under GPLv2 or later, see file LICENSE in this source tree.
*/
+//config:config SPLIT
+//config: bool "split (5.4 kb)"
+//config: default y
+//config: help
+//config: Split a file into pieces.
+//config:
+//config:config FEATURE_SPLIT_FANCY
+//config: bool "Fancy extensions"
+//config: default y
+//config: depends on SPLIT
+//config: help
+//config: Add support for features not required by SUSv3.
+//config: Supports additional suffixes 'b' for 512 bytes,
+//config: 'g' for 1GiB for the -b option.
+
+//applet:IF_SPLIT(APPLET(split, BB_DIR_USR_BIN, BB_SUID_DROP))
+
+//kbuild:lib-$(CONFIG_SPLIT) += split.o
+
/* BB_AUDIT: SUSv3 compliant
* SUSv3 requirements:
* http://www.opengroup.org/onlinepubs/009695399/utilities/split.html
*/
-#include "busybox.h"
-static unsigned suffix_len = 2;
-static const struct suffix_mult split_suffices[] = {
+
+//usage:#define split_trivial_usage
+//usage: "[OPTIONS] [INPUT [PREFIX]]"
+//usage:#define split_full_usage "\n\n"
+//usage: " -b N[k|m] Split by N (kilo|mega)bytes"
+//usage: "\n -l N Split by N lines"
+//usage: "\n -a N Use N letters as suffix"
+//usage:
+//usage:#define split_example_usage
+//usage: "$ split TODO foo\n"
+//usage: "$ cat TODO | split -a 2 -l 2 TODO_\n"
+
+#include "libbb.h"
+#include "common_bufsiz.h"
+
#if ENABLE_FEATURE_SPLIT_FANCY
+static const struct suffix_mult split_suffixes[] = {
{ "b", 512 },
-#endif
{ "k", 1024 },
{ "m", 1024*1024 },
-#if ENABLE_FEATURE_SPLIT_FANCY
{ "g", 1024*1024*1024 },
-#endif
- { NULL, 0 }
+ { "", 0 }
};
+#endif
/* Increment the suffix part of the filename.
- * Returns 0 on success and 1 on error (if we are out of files)
+ * Returns NULL if we are out of filenames.
*/
-static bool next_file(char **old)
+static char *next_file(char *old, unsigned suffix_len)
{
- size_t end = strlen(*old);
+ size_t end = strlen(old);
unsigned i = 1;
char *curr;
- do {
- curr = *old + end - i;
+ while (1) {
+ curr = old + end - i;
if (*curr < 'z') {
*curr += 1;
break;
}
i++;
if (i > suffix_len) {
- bb_error_msg("Suffices exhausted");
- return 1;
+ return NULL;
}
*curr = 'a';
- } while (1);
- return 0;
+ }
+
+ return old;
}
+#define read_buffer bb_common_bufsiz1
+enum { READ_BUFFER_SIZE = COMMON_BUFSIZE - 1 };
+
#define SPLIT_OPT_l (1<<0)
#define SPLIT_OPT_b (1<<1)
#define SPLIT_OPT_a (1<<2)
-int split_main(int argc, char **argv);
-int split_main(int argc, char **argv)
+int split_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
+int split_main(int argc UNUSED_PARAM, char **argv)
{
- char *pfx, *buf, *input_file;
- unsigned cnt = 1000, opt;
- bool ret = EXIT_SUCCESS;
- FILE *fp;
- char *count_p, *sfx;
-//XXX: FIXME opt_complementary = "+2"; /* at most 2 non-option arguments */
- opt = getopt32(argc, argv, "l:b:a:", &count_p, &count_p, &sfx);
+ unsigned suffix_len = 2;
+ char *pfx;
+ char *count_p;
+ const char *sfx;
+ off_t cnt = 1000;
+ off_t remaining = 0;
+ unsigned opt;
+ ssize_t bytes_read, to_write;
+ char *src;
+
+ setup_common_bufsiz();
+
+ opt = getopt32(argv, "^"
+ "l:b:a:+" /* -a N */
+ "\0" "?2"/*max 2 args*/,
+ &count_p, &count_p, &suffix_len
+ );
if (opt & SPLIT_OPT_l)
- cnt = xatoi(count_p);
- if (opt & SPLIT_OPT_b)
- cnt = xatoul_sfx(count_p, split_suffices);
- if (opt & SPLIT_OPT_a)
- suffix_len = xatoi(sfx);
+ cnt = XATOOFF(count_p);
+ if (opt & SPLIT_OPT_b) // FIXME: also needs XATOOFF
+ cnt = xatoull_sfx(count_p,
+ IF_FEATURE_SPLIT_FANCY(split_suffixes)
+ IF_NOT_FEATURE_SPLIT_FANCY(km_suffixes)
+ );
+ sfx = "x";
+
argv += optind;
- if (!*argv)
- *--argv = (char*) "-";
- input_file = *argv;
- sfx = *++argv;
+ if (argv[0]) {
+ int fd;
+ if (argv[1])
+ sfx = argv[1];
+ fd = xopen_stdin(argv[0]);
+ xmove_fd(fd, STDIN_FILENO);
+ } else {
+ argv[0] = (char *) bb_msg_standard_input;
+ }
- if (sfx && (NAME_MAX < strlen(sfx) + suffix_len))
- bb_error_msg_and_die("Suffix too long");
+ if (NAME_MAX < strlen(sfx) + suffix_len)
+ bb_error_msg_and_die("suffix too long");
{
- char *char_p = xzalloc(suffix_len);
+ char *char_p = xzalloc(suffix_len + 1);
memset(char_p, 'a', suffix_len);
- pfx = xasprintf("%s%s", sfx ? sfx : "x", char_p);
+ pfx = xasprintf("%s%s", sfx, char_p);
if (ENABLE_FEATURE_CLEAN_UP)
free(char_p);
}
- fp = fopen_or_warn_stdin(input_file);
-//XXX:FIXME: unify those two file-handling schemata below (FILE vs fd) !
- if (opt & SPLIT_OPT_b) {
- ssize_t i;
- ssize_t bytes = 0;
- int inp = fileno(fp);
+ while (1) {
+ bytes_read = safe_read(STDIN_FILENO, read_buffer, READ_BUFFER_SIZE);
+ if (!bytes_read)
+ break;
+ if (bytes_read < 0)
+ bb_simple_perror_msg_and_die(argv[0]);
+ src = read_buffer;
do {
- int out = xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC);
- lseek(inp, bytes, SEEK_SET);
- buf = xzalloc(cnt);
- bytes += i = full_read(inp, buf, cnt);
- xwrite(out, buf, i);
- free(buf);
- close(out);
- if (next_file(&pfx)) {
- ret++;
- goto bail;
+ if (!remaining) {
+ if (!pfx)
+ bb_error_msg_and_die("suffixes exhausted");
+ xmove_fd(xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC), 1);
+ pfx = next_file(pfx, suffix_len);
+ remaining = cnt;
}
- } while (i == cnt); /* if we read less than cnt, then nothing is left */
- } else { /* -l */
- do {
- unsigned i = cnt;
- int out = xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC);
- buf = NULL;
- while (i--) {
- buf = xmalloc_fgets(fp);
- if (buf == NULL)
- break;
- xwrite(out, buf, strlen(buf));
- free(buf);
- };
- close(out);
- if (next_file(&pfx)) {
- ret++;
- goto bail;
+
+ if (opt & SPLIT_OPT_b) {
+ /* split by bytes */
+ to_write = (bytes_read < remaining) ? bytes_read : remaining;
+ remaining -= to_write;
+ } else {
+ /* split by lines */
+ /* can be sped up by using _memrchr_
+ * and writing many lines at once... */
+ char *end = memchr(src, '\n', bytes_read);
+ if (end) {
+ --remaining;
+ to_write = end - src + 1;
+ } else {
+ to_write = bytes_read;
+ }
}
- } while (buf);
- }
-bail:
- if (ENABLE_FEATURE_CLEAN_UP) {
- free(pfx);
- fclose_if_not_stdin(fp);
+
+ xwrite(STDOUT_FILENO, src, to_write);
+ bytes_read -= to_write;
+ src += to_write;
+ } while (bytes_read);
}
- return ret;
+ return EXIT_SUCCESS;
}