summaryrefslogtreecommitdiff
path: root/coreutils/split.c (plain)
blob: 50918a1ceb938532d7469a0a886c7deaa662b676
1/* vi: set sw=4 ts=4: */
2/*
3 * split - split a file into pieces
4 * Copyright (c) 2007 Bernhard Reutner-Fischer
5 *
6 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
7 */
8//config:config SPLIT
9//config: bool "split"
10//config: default y
11//config: help
12//config: split a file into pieces.
13//config:
14//config:config FEATURE_SPLIT_FANCY
15//config: bool "Fancy extensions"
16//config: default y
17//config: depends on SPLIT
18//config: help
19//config: Add support for features not required by SUSv3.
20//config: Supports additional suffixes 'b' for 512 bytes,
21//config: 'g' for 1GiB for the -b option.
22
23//applet:IF_SPLIT(APPLET(split, BB_DIR_USR_BIN, BB_SUID_DROP))
24
25//kbuild:lib-$(CONFIG_SPLIT) += split.o
26
27/* BB_AUDIT: SUSv3 compliant
28 * SUSv3 requirements:
29 * http://www.opengroup.org/onlinepubs/009695399/utilities/split.html
30 */
31
32//usage:#define split_trivial_usage
33//usage: "[OPTIONS] [INPUT [PREFIX]]"
34//usage:#define split_full_usage "\n\n"
35//usage: " -b N[k|m] Split by N (kilo|mega)bytes"
36//usage: "\n -l N Split by N lines"
37//usage: "\n -a N Use N letters as suffix"
38//usage:
39//usage:#define split_example_usage
40//usage: "$ split TODO foo\n"
41//usage: "$ cat TODO | split -a 2 -l 2 TODO_\n"
42
43#include "libbb.h"
44#include "common_bufsiz.h"
45
#if ENABLE_FEATURE_SPLIT_FANCY
/* Multiplier suffixes handed to xatoull_sfx() for the -b count
 * when FEATURE_SPLIT_FANCY is enabled.
 */
static const struct suffix_mult split_suffixes[] = {
	{ "b", 1 << 9 },	/* 512 */
	{ "k", 1 << 10 },	/* 1024 */
	{ "m", 1 << 20 },	/* 1024*1024 */
	{ "g", 1 << 30 },	/* 1024*1024*1024 */
	{ "", 0 }		/* presumably the end-of-table marker */
};
#endif
55
/* Increment the suffix part of the filename, in place.
 *
 * old        - NUL-terminated name; its last suffix_len characters
 *              are the suffix to advance
 * suffix_len - how many trailing characters may be modified
 *
 * The suffix is advanced like an odometer: the last character is bumped
 * by one; a character that is already 'z' (or above) is reset to 'a' and
 * the carry moves one position to the left.
 *
 * Returns old on success.
 * Returns NULL if we are out of filenames, i.e. the carry would leave
 * the suffix (old may have been partially rewritten by then), or if
 * there is no suffix position at all.
 */
static char *next_file(char *old, unsigned suffix_len)
{
	size_t len = strlen(old);
	char *first;
	char *pos;

	/* Never step in front of the string itself */
	if (suffix_len > len)
		suffix_len = len;
	/* With no suffix characters there is exactly one name: do not
	 * touch the prefix (or the byte before an empty string) */
	if (suffix_len == 0)
		return NULL;

	first = old + len - suffix_len;
	for (pos = old + len - 1; ; pos--) {
		if (*pos < 'z') {
			*pos += 1;
			return old;
		}
		/* Leftmost suffix character cannot carry any further */
		if (pos == first)
			return NULL;
		*pos = 'a';
	}
}
80
81#define read_buffer bb_common_bufsiz1
82enum { READ_BUFFER_SIZE = COMMON_BUFSIZE - 1 };
83
84#define SPLIT_OPT_l (1<<0)
85#define SPLIT_OPT_b (1<<1)
86#define SPLIT_OPT_a (1<<2)
87
88int split_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
89int split_main(int argc UNUSED_PARAM, char **argv)
90{
91 unsigned suffix_len = 2;
92 char *pfx;
93 char *count_p;
94 const char *sfx;
95 off_t cnt = 1000;
96 off_t remaining = 0;
97 unsigned opt;
98 ssize_t bytes_read, to_write;
99 char *src;
100
101 setup_common_bufsiz();
102
103 opt_complementary = "?2"; /* max 2 args; -a N */
104 opt = getopt32(argv, "l:b:a:+", &count_p, &count_p, &suffix_len);
105
106 if (opt & SPLIT_OPT_l)
107 cnt = XATOOFF(count_p);
108 if (opt & SPLIT_OPT_b) // FIXME: also needs XATOOFF
109 cnt = xatoull_sfx(count_p,
110 IF_FEATURE_SPLIT_FANCY(split_suffixes)
111 IF_NOT_FEATURE_SPLIT_FANCY(km_suffixes)
112 );
113 sfx = "x";
114
115 argv += optind;
116 if (argv[0]) {
117 int fd;
118 if (argv[1])
119 sfx = argv[1];
120 fd = xopen_stdin(argv[0]);
121 xmove_fd(fd, STDIN_FILENO);
122 } else {
123 argv[0] = (char *) bb_msg_standard_input;
124 }
125
126 if (NAME_MAX < strlen(sfx) + suffix_len)
127 bb_error_msg_and_die("suffix too long");
128
129 {
130 char *char_p = xzalloc(suffix_len + 1);
131 memset(char_p, 'a', suffix_len);
132 pfx = xasprintf("%s%s", sfx, char_p);
133 if (ENABLE_FEATURE_CLEAN_UP)
134 free(char_p);
135 }
136
137 while (1) {
138 bytes_read = safe_read(STDIN_FILENO, read_buffer, READ_BUFFER_SIZE);
139 if (!bytes_read)
140 break;
141 if (bytes_read < 0)
142 bb_simple_perror_msg_and_die(argv[0]);
143 src = read_buffer;
144 do {
145 if (!remaining) {
146 if (!pfx)
147 bb_error_msg_and_die("suffixes exhausted");
148 xmove_fd(xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC), 1);
149 pfx = next_file(pfx, suffix_len);
150 remaining = cnt;
151 }
152
153 if (opt & SPLIT_OPT_b) {
154 /* split by bytes */
155 to_write = (bytes_read < remaining) ? bytes_read : remaining;
156 remaining -= to_write;
157 } else {
158 /* split by lines */
159 /* can be sped up by using _memrchr_
160 * and writing many lines at once... */
161 char *end = memchr(src, '\n', bytes_read);
162 if (end) {
163 --remaining;
164 to_write = end - src + 1;
165 } else {
166 to_write = bytes_read;
167 }
168 }
169
170 xwrite(STDOUT_FILENO, src, to_write);
171 bytes_read -= to_write;
172 src += to_write;
173 } while (bytes_read);
174 }
175 return EXIT_SUCCESS;
176}
177