1*cf5a6c84SAndroid Build Coastguard Worker /* split.c - split a file into smaller files
2*cf5a6c84SAndroid Build Coastguard Worker *
3*cf5a6c84SAndroid Build Coastguard Worker * Copyright 2013 Rob Landley <[email protected]>
4*cf5a6c84SAndroid Build Coastguard Worker *
5*cf5a6c84SAndroid Build Coastguard Worker * See http://pubs.opengroup.org/onlinepubs/9699919799/utilities/split.html
6*cf5a6c84SAndroid Build Coastguard Worker *
7*cf5a6c84SAndroid Build Coastguard Worker * Standard does not cover:
8*cf5a6c84SAndroid Build Coastguard Worker * - should splitting an empty file produce an empty outfile? (Went with "no".)
9*cf5a6c84SAndroid Build Coastguard Worker * - permissions on output file
10*cf5a6c84SAndroid Build Coastguard Worker
11*cf5a6c84SAndroid Build Coastguard Worker USE_SPLIT(NEWTOY(split, ">2a#<1=2>9b#<1l#<1n#<1[!bl][!bn][!ln]", TOYFLAG_USR|TOYFLAG_BIN))
12*cf5a6c84SAndroid Build Coastguard Worker
13*cf5a6c84SAndroid Build Coastguard Worker config SPLIT
14*cf5a6c84SAndroid Build Coastguard Worker bool "split"
15*cf5a6c84SAndroid Build Coastguard Worker default y
16*cf5a6c84SAndroid Build Coastguard Worker help
17*cf5a6c84SAndroid Build Coastguard Worker usage: split [-a SUFFIX_LEN] [-b BYTES] [-l LINES] [-n PARTS] [INPUT [OUTPUT]]
18*cf5a6c84SAndroid Build Coastguard Worker
19*cf5a6c84SAndroid Build Coastguard Worker Copy INPUT (or stdin) data to a series of OUTPUT (or "x") files with
20*cf5a6c84SAndroid Build Coastguard Worker alphabetically increasing suffix (aa, ab, ac... az, ba, bb...).
21*cf5a6c84SAndroid Build Coastguard Worker
22*cf5a6c84SAndroid Build Coastguard Worker -a Suffix length (default 2)
23*cf5a6c84SAndroid Build Coastguard Worker -b BYTES/file (10, 10k, 10m, 10g...)
24*cf5a6c84SAndroid Build Coastguard Worker -l LINES/file (default 1000)
25*cf5a6c84SAndroid Build Coastguard Worker -n PARTS many equal length files
26*cf5a6c84SAndroid Build Coastguard Worker */
27*cf5a6c84SAndroid Build Coastguard Worker
28*cf5a6c84SAndroid Build Coastguard Worker #define FOR_split
29*cf5a6c84SAndroid Build Coastguard Worker #include "toys.h"
30*cf5a6c84SAndroid Build Coastguard Worker
GLOBALS(long n,l,b,a;char * outfile;)31*cf5a6c84SAndroid Build Coastguard Worker GLOBALS(
32*cf5a6c84SAndroid Build Coastguard Worker long n, l, b, a;
33*cf5a6c84SAndroid Build Coastguard Worker
34*cf5a6c84SAndroid Build Coastguard Worker char *outfile;
35*cf5a6c84SAndroid Build Coastguard Worker )
36*cf5a6c84SAndroid Build Coastguard Worker
37*cf5a6c84SAndroid Build Coastguard Worker static void do_split(int infd, char *in)
38*cf5a6c84SAndroid Build Coastguard Worker {
39*cf5a6c84SAndroid Build Coastguard Worker unsigned long bytesleft, linesleft, filenum, len, pos;
40*cf5a6c84SAndroid Build Coastguard Worker int outfd = -1;
41*cf5a6c84SAndroid Build Coastguard Worker struct stat st;
42*cf5a6c84SAndroid Build Coastguard Worker
43*cf5a6c84SAndroid Build Coastguard Worker // posix doesn't cover permissions on output file, so copy input (or 0777)
44*cf5a6c84SAndroid Build Coastguard Worker st.st_mode = 0777;
45*cf5a6c84SAndroid Build Coastguard Worker st.st_size = 0;
46*cf5a6c84SAndroid Build Coastguard Worker fstat(infd, &st);
47*cf5a6c84SAndroid Build Coastguard Worker
48*cf5a6c84SAndroid Build Coastguard Worker if (TT.n && (TT.b = st.st_size/TT.n)<1) return error_msg("%s: no size", in);
49*cf5a6c84SAndroid Build Coastguard Worker len = pos = filenum = bytesleft = linesleft = 0;
50*cf5a6c84SAndroid Build Coastguard Worker for (;;) {
51*cf5a6c84SAndroid Build Coastguard Worker int i, j;
52*cf5a6c84SAndroid Build Coastguard Worker
53*cf5a6c84SAndroid Build Coastguard Worker // Refill toybuf?
54*cf5a6c84SAndroid Build Coastguard Worker if (len == pos) {
55*cf5a6c84SAndroid Build Coastguard Worker if (!(len = xread(infd, toybuf, sizeof(toybuf)))) break;
56*cf5a6c84SAndroid Build Coastguard Worker pos = 0;
57*cf5a6c84SAndroid Build Coastguard Worker }
58*cf5a6c84SAndroid Build Coastguard Worker
59*cf5a6c84SAndroid Build Coastguard Worker // Start new output file?
60*cf5a6c84SAndroid Build Coastguard Worker if ((TT.b && !bytesleft) || (TT.l && !linesleft)) {
61*cf5a6c84SAndroid Build Coastguard Worker char *s = TT.outfile + strlen(TT.outfile);
62*cf5a6c84SAndroid Build Coastguard Worker
63*cf5a6c84SAndroid Build Coastguard Worker j = filenum++;
64*cf5a6c84SAndroid Build Coastguard Worker for (i = 0; i<TT.a; i++) {
65*cf5a6c84SAndroid Build Coastguard Worker *(--s) = 'a'+(j%26);
66*cf5a6c84SAndroid Build Coastguard Worker j /= 26;
67*cf5a6c84SAndroid Build Coastguard Worker }
68*cf5a6c84SAndroid Build Coastguard Worker if (j) error_exit("bad suffix");
69*cf5a6c84SAndroid Build Coastguard Worker bytesleft = TT.b + ((filenum == TT.n) ? st.st_size%TT.n : 0);
70*cf5a6c84SAndroid Build Coastguard Worker linesleft = TT.l;
71*cf5a6c84SAndroid Build Coastguard Worker xclose(outfd);
72*cf5a6c84SAndroid Build Coastguard Worker outfd = xcreate(TT.outfile, O_RDWR|O_CREAT|O_TRUNC, st.st_mode & 0777);
73*cf5a6c84SAndroid Build Coastguard Worker }
74*cf5a6c84SAndroid Build Coastguard Worker
75*cf5a6c84SAndroid Build Coastguard Worker // Write next chunk of output.
76*cf5a6c84SAndroid Build Coastguard Worker if (TT.l) {
77*cf5a6c84SAndroid Build Coastguard Worker for (i = pos; i < len; ) {
78*cf5a6c84SAndroid Build Coastguard Worker if (toybuf[i++] == '\n' && !--linesleft) break;
79*cf5a6c84SAndroid Build Coastguard Worker if (!--bytesleft) break;
80*cf5a6c84SAndroid Build Coastguard Worker }
81*cf5a6c84SAndroid Build Coastguard Worker j = i - pos;
82*cf5a6c84SAndroid Build Coastguard Worker } else {
83*cf5a6c84SAndroid Build Coastguard Worker j = len - pos;
84*cf5a6c84SAndroid Build Coastguard Worker if (j > bytesleft) j = bytesleft;
85*cf5a6c84SAndroid Build Coastguard Worker bytesleft -= j;
86*cf5a6c84SAndroid Build Coastguard Worker }
87*cf5a6c84SAndroid Build Coastguard Worker xwrite(outfd, toybuf+pos, j);
88*cf5a6c84SAndroid Build Coastguard Worker pos += j;
89*cf5a6c84SAndroid Build Coastguard Worker }
90*cf5a6c84SAndroid Build Coastguard Worker
91*cf5a6c84SAndroid Build Coastguard Worker if (CFG_TOYBOX_FREE) {
92*cf5a6c84SAndroid Build Coastguard Worker xclose(outfd);
93*cf5a6c84SAndroid Build Coastguard Worker if (infd) close(infd);
94*cf5a6c84SAndroid Build Coastguard Worker free(TT.outfile);
95*cf5a6c84SAndroid Build Coastguard Worker }
96*cf5a6c84SAndroid Build Coastguard Worker xexit();
97*cf5a6c84SAndroid Build Coastguard Worker }
98*cf5a6c84SAndroid Build Coastguard Worker
split_main(void)99*cf5a6c84SAndroid Build Coastguard Worker void split_main(void)
100*cf5a6c84SAndroid Build Coastguard Worker {
101*cf5a6c84SAndroid Build Coastguard Worker if (!TT.b && !TT.l && !TT.n) TT.l = 1000;
102*cf5a6c84SAndroid Build Coastguard Worker
103*cf5a6c84SAndroid Build Coastguard Worker // Allocate template for output filenames
104*cf5a6c84SAndroid Build Coastguard Worker TT.outfile = xmprintf("%s%*c", (toys.optc == 2) ? toys.optargs[1] : "x",
105*cf5a6c84SAndroid Build Coastguard Worker (int)TT.a, ' ');
106*cf5a6c84SAndroid Build Coastguard Worker
107*cf5a6c84SAndroid Build Coastguard Worker // We only ever use one input, but this handles '-' or no input for us.
108*cf5a6c84SAndroid Build Coastguard Worker loopfiles(toys.optargs, do_split);
109*cf5a6c84SAndroid Build Coastguard Worker }
110