2007-03-25 21:50:18 +00:00
|
|
|
/* vi: set sw=4 ts=4: */
|
|
|
|
/*
|
|
|
|
* split - split a file into pieces
|
2008-09-25 12:13:34 +00:00
|
|
|
* Copyright (c) 2007 Bernhard Reutner-Fischer
|
2007-03-25 21:50:18 +00:00
|
|
|
*
|
2010-08-16 18:14:46 +00:00
|
|
|
* Licensed under GPLv2 or later, see file LICENSE in this source tree.
|
2007-03-25 21:50:18 +00:00
|
|
|
*/
|
2007-03-26 14:28:12 +00:00
|
|
|
/* BB_AUDIT: SUSv3 compliant
|
2007-03-25 21:50:18 +00:00
|
|
|
* SUSv3 requirements:
|
|
|
|
* http://www.opengroup.org/onlinepubs/009695399/utilities/split.html
|
|
|
|
*/
|
2011-03-31 12:43:25 +00:00
|
|
|
|
|
|
|
//usage:#define split_trivial_usage
|
|
|
|
//usage: "[OPTIONS] [INPUT [PREFIX]]"
|
|
|
|
//usage:#define split_full_usage "\n\n"
|
2011-06-05 01:58:28 +00:00
|
|
|
//usage: " -b N[k|m] Split by N (kilo|mega)bytes"
|
2011-03-31 12:43:25 +00:00
|
|
|
//usage: "\n -l N Split by N lines"
|
|
|
|
//usage: "\n -a N Use N letters as suffix"
|
|
|
|
//usage:
|
|
|
|
//usage:#define split_example_usage
|
|
|
|
//usage: "$ split TODO foo\n"
|
|
|
|
//usage: "$ cat TODO | split -a 2 -l 2 TODO_\n"
|
|
|
|
|
2007-05-26 19:00:18 +00:00
|
|
|
#include "libbb.h"
|
2007-03-26 20:15:40 +00:00
|
|
|
|
2007-03-28 16:48:40 +00:00
|
|
|
#if ENABLE_FEATURE_SPLIT_FANCY
/* Size suffixes handed to xatoull_sfx() when parsing the -b argument.
 * Each entry pairs a suffix string with its multiplier; the final entry
 * has an empty suffix and a zero multiplier (presumably the table
 * terminator - confirm against struct suffix_mult's users). */
static const struct suffix_mult split_suffixes[] = {
	{ "b", 1 << 9 },	/* 512 */
	{ "k", 1 << 10 },	/* 1024 */
	{ "m", 1 << 20 },	/* 1024*1024 */
	{ "g", 1 << 30 },	/* 1024*1024*1024 */
	{ "", 0 }
};
#endif
|
2007-03-25 21:50:18 +00:00
|
|
|
|
|
|
|
/* Increment the suffix part of the filename.
 *
 * old        - NUL-terminated filename, modified in place; its last
 *              suffix_len characters are the suffix.
 * suffix_len - number of trailing characters that may be changed.
 *
 * The suffix is treated as a counter whose rightmost letter changes
 * fastest: a letter below 'z' is bumped by one, a 'z' is reset to 'a'
 * and the carry moves one position to the left.
 *
 * Returns old on success.
 * Returns NULL if we are out of filenames, i.e. every suffix letter is
 * already 'z' or there is no suffix at all (suffix_len == 0). Characters
 * in front of the suffix are never read or written.
 */
static char *next_file(char *old, unsigned suffix_len)
{
	size_t end = strlen(old);
	size_t i;

	/* The suffix cannot be longer than the string itself; without this
	 * clamp the carry could walk past the start of the buffer. */
	if (suffix_len > end)
		suffix_len = (unsigned)end;

	/* i counts suffix positions from the right, starting at 1.
	 * With suffix_len == 0 the loop body never runs, so the prefix is
	 * left alone and we report exhaustion. */
	for (i = 1; i <= suffix_len; i++) {
		char *curr = old + end - i;

		if (*curr < 'z') {
			*curr += 1;
			return old;
		}
		/* Leftmost suffix letter is 'z' too: nothing left to carry into */
		if (i == suffix_len)
			break;
		*curr = 'a';
	}

	return NULL;
}
|
2007-03-26 14:28:12 +00:00
|
|
|
|
2007-03-26 20:15:40 +00:00
|
|
|
#define read_buffer bb_common_bufsiz1
|
2007-06-04 10:16:52 +00:00
|
|
|
enum { READ_BUFFER_SIZE = COMMON_BUFSIZE - 1 };
|
2007-03-26 20:15:40 +00:00
|
|
|
|
2007-03-25 21:50:18 +00:00
|
|
|
#define SPLIT_OPT_l (1<<0)
|
|
|
|
#define SPLIT_OPT_b (1<<1)
|
2007-03-26 10:46:31 +00:00
|
|
|
#define SPLIT_OPT_a (1<<2)
|
2007-03-25 21:50:18 +00:00
|
|
|
|
2007-10-11 10:05:36 +00:00
|
|
|
int split_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
|
2008-07-05 09:18:54 +00:00
|
|
|
int split_main(int argc UNUSED_PARAM, char **argv)
|
2007-03-25 21:50:18 +00:00
|
|
|
{
|
2007-03-26 20:15:40 +00:00
|
|
|
unsigned suffix_len = 2;
|
|
|
|
char *pfx;
|
|
|
|
char *count_p;
|
|
|
|
const char *sfx;
|
2007-03-28 16:48:40 +00:00
|
|
|
off_t cnt = 1000;
|
|
|
|
off_t remaining = 0;
|
2007-03-26 20:15:40 +00:00
|
|
|
unsigned opt;
|
2007-03-28 16:48:40 +00:00
|
|
|
ssize_t bytes_read, to_write;
|
2007-03-26 20:15:40 +00:00
|
|
|
char *src;
|
|
|
|
|
2008-03-17 09:09:09 +00:00
|
|
|
opt_complementary = "?2:a+"; /* max 2 args; -a N */
|
|
|
|
opt = getopt32(argv, "l:b:a:", &count_p, &count_p, &suffix_len);
|
2007-03-25 21:50:18 +00:00
|
|
|
|
2007-03-26 18:19:29 +00:00
|
|
|
if (opt & SPLIT_OPT_l)
|
2008-03-17 09:09:09 +00:00
|
|
|
cnt = XATOOFF(count_p);
|
|
|
|
if (opt & SPLIT_OPT_b) // FIXME: also needs XATOOFF
|
2013-07-13 21:49:45 +00:00
|
|
|
cnt = xatoull_sfx(count_p,
|
|
|
|
IF_FEATURE_SPLIT_FANCY(split_suffixes)
|
|
|
|
IF_NOT_FEATURE_SPLIT_FANCY(km_suffixes)
|
|
|
|
);
|
2007-03-26 20:15:40 +00:00
|
|
|
sfx = "x";
|
2007-03-28 16:48:40 +00:00
|
|
|
|
|
|
|
argv += optind;
|
2007-03-26 20:15:40 +00:00
|
|
|
if (argv[0]) {
|
2009-11-26 04:43:16 +00:00
|
|
|
int fd;
|
2007-03-26 20:15:40 +00:00
|
|
|
if (argv[1])
|
|
|
|
sfx = argv[1];
|
2010-08-23 01:06:46 +00:00
|
|
|
fd = xopen_stdin(argv[0]);
|
2009-11-26 04:43:16 +00:00
|
|
|
xmove_fd(fd, STDIN_FILENO);
|
2007-03-26 20:15:40 +00:00
|
|
|
} else {
|
|
|
|
argv[0] = (char *) bb_msg_standard_input;
|
|
|
|
}
|
2007-03-26 14:28:12 +00:00
|
|
|
|
2007-03-26 20:15:40 +00:00
|
|
|
if (NAME_MAX < strlen(sfx) + suffix_len)
|
|
|
|
bb_error_msg_and_die("suffix too long");
|
2007-03-25 21:50:18 +00:00
|
|
|
|
|
|
|
{
|
2007-03-26 20:15:40 +00:00
|
|
|
char *char_p = xzalloc(suffix_len + 1);
|
2007-03-25 21:50:18 +00:00
|
|
|
memset(char_p, 'a', suffix_len);
|
2007-03-26 20:15:40 +00:00
|
|
|
pfx = xasprintf("%s%s", sfx, char_p);
|
2007-03-25 21:50:18 +00:00
|
|
|
if (ENABLE_FEATURE_CLEAN_UP)
|
|
|
|
free(char_p);
|
|
|
|
}
|
2007-03-26 14:28:12 +00:00
|
|
|
|
2007-03-26 20:15:40 +00:00
|
|
|
while (1) {
|
2008-05-19 09:48:17 +00:00
|
|
|
bytes_read = safe_read(STDIN_FILENO, read_buffer, READ_BUFFER_SIZE);
|
2007-03-26 20:15:40 +00:00
|
|
|
if (!bytes_read)
|
|
|
|
break;
|
|
|
|
if (bytes_read < 0)
|
2007-10-01 11:58:38 +00:00
|
|
|
bb_simple_perror_msg_and_die(argv[0]);
|
2007-03-26 20:15:40 +00:00
|
|
|
src = read_buffer;
|
2007-03-25 21:50:18 +00:00
|
|
|
do {
|
2007-03-26 20:15:40 +00:00
|
|
|
if (!remaining) {
|
|
|
|
if (!pfx)
|
2007-03-28 16:48:40 +00:00
|
|
|
bb_error_msg_and_die("suffixes exhausted");
|
2007-03-26 20:15:40 +00:00
|
|
|
xmove_fd(xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC), 1);
|
|
|
|
pfx = next_file(pfx, suffix_len);
|
|
|
|
remaining = cnt;
|
2007-03-26 14:28:12 +00:00
|
|
|
}
|
2007-03-26 20:15:40 +00:00
|
|
|
|
|
|
|
if (opt & SPLIT_OPT_b) {
|
|
|
|
/* split by bytes */
|
|
|
|
to_write = (bytes_read < remaining) ? bytes_read : remaining;
|
|
|
|
remaining -= to_write;
|
|
|
|
} else {
|
|
|
|
/* split by lines */
|
|
|
|
/* can be sped up by using _memrchr_
|
|
|
|
* and writing many lines at once... */
|
|
|
|
char *end = memchr(src, '\n', bytes_read);
|
|
|
|
if (end) {
|
|
|
|
--remaining;
|
|
|
|
to_write = end - src + 1;
|
|
|
|
} else {
|
|
|
|
to_write = bytes_read;
|
|
|
|
}
|
2007-03-26 14:28:12 +00:00
|
|
|
}
|
2007-03-26 20:15:40 +00:00
|
|
|
|
2008-05-19 09:48:17 +00:00
|
|
|
xwrite(STDOUT_FILENO, src, to_write);
|
2007-03-26 20:15:40 +00:00
|
|
|
bytes_read -= to_write;
|
|
|
|
src += to_write;
|
|
|
|
} while (bytes_read);
|
2007-03-25 21:50:18 +00:00
|
|
|
}
|
2007-11-16 12:39:16 +00:00
|
|
|
return EXIT_SUCCESS;
|
2007-03-25 21:50:18 +00:00
|
|
|
}
|