xref: /aosp_15_r20/external/toybox/toys/posix/split.c (revision cf5a6c84e2b8763fc1a7db14496fd4742913b199)
1*cf5a6c84SAndroid Build Coastguard Worker /* split.c - split a file into smaller files
2*cf5a6c84SAndroid Build Coastguard Worker  *
3*cf5a6c84SAndroid Build Coastguard Worker  * Copyright 2013 Rob Landley <[email protected]>
4*cf5a6c84SAndroid Build Coastguard Worker  *
5*cf5a6c84SAndroid Build Coastguard Worker  * See http://pubs.opengroup.org/onlinepubs/9699919799/utilities/split.html
6*cf5a6c84SAndroid Build Coastguard Worker  *
7*cf5a6c84SAndroid Build Coastguard Worker  * Standard does not cover:
8*cf5a6c84SAndroid Build Coastguard Worker  * - should splitting an empty file produce an empty outfile? (Went with "no".)
9*cf5a6c84SAndroid Build Coastguard Worker  * - permissions on output file
10*cf5a6c84SAndroid Build Coastguard Worker 
11*cf5a6c84SAndroid Build Coastguard Worker USE_SPLIT(NEWTOY(split, ">2a#<1=2>9b#<1l#<1n#<1[!bl][!bn][!ln]", TOYFLAG_USR|TOYFLAG_BIN))
12*cf5a6c84SAndroid Build Coastguard Worker 
13*cf5a6c84SAndroid Build Coastguard Worker config SPLIT
14*cf5a6c84SAndroid Build Coastguard Worker   bool "split"
15*cf5a6c84SAndroid Build Coastguard Worker   default y
16*cf5a6c84SAndroid Build Coastguard Worker   help
17*cf5a6c84SAndroid Build Coastguard Worker     usage: split [-a SUFFIX_LEN] [-b BYTES] [-l LINES] [-n PARTS] [INPUT [OUTPUT]]
18*cf5a6c84SAndroid Build Coastguard Worker 
19*cf5a6c84SAndroid Build Coastguard Worker     Copy INPUT (or stdin) data to a series of OUTPUT (or "x") files with
20*cf5a6c84SAndroid Build Coastguard Worker     alphabetically increasing suffix (aa, ab, ac... az, ba, bb...).
21*cf5a6c84SAndroid Build Coastguard Worker 
22*cf5a6c84SAndroid Build Coastguard Worker     -a	Suffix length (default 2)
23*cf5a6c84SAndroid Build Coastguard Worker     -b	BYTES/file (10, 10k, 10m, 10g...)
24*cf5a6c84SAndroid Build Coastguard Worker     -l	LINES/file (default 1000)
25*cf5a6c84SAndroid Build Coastguard Worker     -n	PARTS many equal length files
26*cf5a6c84SAndroid Build Coastguard Worker */
27*cf5a6c84SAndroid Build Coastguard Worker 
28*cf5a6c84SAndroid Build Coastguard Worker #define FOR_split
29*cf5a6c84SAndroid Build Coastguard Worker #include "toys.h"
30*cf5a6c84SAndroid Build Coastguard Worker 
GLOBALS(long n,l,b,a;char * outfile;)31*cf5a6c84SAndroid Build Coastguard Worker GLOBALS(
32*cf5a6c84SAndroid Build Coastguard Worker   long n, l, b, a;
33*cf5a6c84SAndroid Build Coastguard Worker 
34*cf5a6c84SAndroid Build Coastguard Worker   char *outfile;
35*cf5a6c84SAndroid Build Coastguard Worker )
36*cf5a6c84SAndroid Build Coastguard Worker 
37*cf5a6c84SAndroid Build Coastguard Worker static void do_split(int infd, char *in)
38*cf5a6c84SAndroid Build Coastguard Worker {
39*cf5a6c84SAndroid Build Coastguard Worker   unsigned long bytesleft, linesleft, filenum, len, pos;
40*cf5a6c84SAndroid Build Coastguard Worker   int outfd = -1;
41*cf5a6c84SAndroid Build Coastguard Worker   struct stat st;
42*cf5a6c84SAndroid Build Coastguard Worker 
43*cf5a6c84SAndroid Build Coastguard Worker   // posix doesn't cover permissions on output file, so copy input (or 0777)
44*cf5a6c84SAndroid Build Coastguard Worker   st.st_mode = 0777;
45*cf5a6c84SAndroid Build Coastguard Worker   st.st_size = 0;
46*cf5a6c84SAndroid Build Coastguard Worker   fstat(infd, &st);
47*cf5a6c84SAndroid Build Coastguard Worker 
48*cf5a6c84SAndroid Build Coastguard Worker   if (TT.n && (TT.b = st.st_size/TT.n)<1) return error_msg("%s: no size", in);
49*cf5a6c84SAndroid Build Coastguard Worker   len = pos = filenum = bytesleft = linesleft = 0;
50*cf5a6c84SAndroid Build Coastguard Worker   for (;;) {
51*cf5a6c84SAndroid Build Coastguard Worker     int i, j;
52*cf5a6c84SAndroid Build Coastguard Worker 
53*cf5a6c84SAndroid Build Coastguard Worker     // Refill toybuf?
54*cf5a6c84SAndroid Build Coastguard Worker     if (len == pos) {
55*cf5a6c84SAndroid Build Coastguard Worker       if (!(len = xread(infd, toybuf, sizeof(toybuf)))) break;
56*cf5a6c84SAndroid Build Coastguard Worker       pos = 0;
57*cf5a6c84SAndroid Build Coastguard Worker     }
58*cf5a6c84SAndroid Build Coastguard Worker 
59*cf5a6c84SAndroid Build Coastguard Worker     // Start new output file?
60*cf5a6c84SAndroid Build Coastguard Worker     if ((TT.b && !bytesleft) || (TT.l && !linesleft)) {
61*cf5a6c84SAndroid Build Coastguard Worker       char *s = TT.outfile + strlen(TT.outfile);
62*cf5a6c84SAndroid Build Coastguard Worker 
63*cf5a6c84SAndroid Build Coastguard Worker       j = filenum++;
64*cf5a6c84SAndroid Build Coastguard Worker       for (i = 0; i<TT.a; i++) {
65*cf5a6c84SAndroid Build Coastguard Worker         *(--s) = 'a'+(j%26);
66*cf5a6c84SAndroid Build Coastguard Worker         j /= 26;
67*cf5a6c84SAndroid Build Coastguard Worker       }
68*cf5a6c84SAndroid Build Coastguard Worker       if (j) error_exit("bad suffix");
69*cf5a6c84SAndroid Build Coastguard Worker       bytesleft = TT.b + ((filenum == TT.n) ? st.st_size%TT.n : 0);
70*cf5a6c84SAndroid Build Coastguard Worker       linesleft = TT.l;
71*cf5a6c84SAndroid Build Coastguard Worker       xclose(outfd);
72*cf5a6c84SAndroid Build Coastguard Worker       outfd = xcreate(TT.outfile, O_RDWR|O_CREAT|O_TRUNC, st.st_mode & 0777);
73*cf5a6c84SAndroid Build Coastguard Worker     }
74*cf5a6c84SAndroid Build Coastguard Worker 
75*cf5a6c84SAndroid Build Coastguard Worker     // Write next chunk of output.
76*cf5a6c84SAndroid Build Coastguard Worker     if (TT.l) {
77*cf5a6c84SAndroid Build Coastguard Worker       for (i = pos; i < len; ) {
78*cf5a6c84SAndroid Build Coastguard Worker         if (toybuf[i++] == '\n' && !--linesleft) break;
79*cf5a6c84SAndroid Build Coastguard Worker         if (!--bytesleft) break;
80*cf5a6c84SAndroid Build Coastguard Worker       }
81*cf5a6c84SAndroid Build Coastguard Worker       j = i - pos;
82*cf5a6c84SAndroid Build Coastguard Worker     } else {
83*cf5a6c84SAndroid Build Coastguard Worker       j = len - pos;
84*cf5a6c84SAndroid Build Coastguard Worker       if (j > bytesleft) j = bytesleft;
85*cf5a6c84SAndroid Build Coastguard Worker       bytesleft -= j;
86*cf5a6c84SAndroid Build Coastguard Worker     }
87*cf5a6c84SAndroid Build Coastguard Worker     xwrite(outfd, toybuf+pos, j);
88*cf5a6c84SAndroid Build Coastguard Worker     pos += j;
89*cf5a6c84SAndroid Build Coastguard Worker   }
90*cf5a6c84SAndroid Build Coastguard Worker 
91*cf5a6c84SAndroid Build Coastguard Worker   if (CFG_TOYBOX_FREE) {
92*cf5a6c84SAndroid Build Coastguard Worker     xclose(outfd);
93*cf5a6c84SAndroid Build Coastguard Worker     if (infd) close(infd);
94*cf5a6c84SAndroid Build Coastguard Worker     free(TT.outfile);
95*cf5a6c84SAndroid Build Coastguard Worker   }
96*cf5a6c84SAndroid Build Coastguard Worker   xexit();
97*cf5a6c84SAndroid Build Coastguard Worker }
98*cf5a6c84SAndroid Build Coastguard Worker 
split_main(void)99*cf5a6c84SAndroid Build Coastguard Worker void split_main(void)
100*cf5a6c84SAndroid Build Coastguard Worker {
101*cf5a6c84SAndroid Build Coastguard Worker   if (!TT.b && !TT.l && !TT.n) TT.l = 1000;
102*cf5a6c84SAndroid Build Coastguard Worker 
103*cf5a6c84SAndroid Build Coastguard Worker   // Allocate template for output filenames
104*cf5a6c84SAndroid Build Coastguard Worker   TT.outfile = xmprintf("%s%*c", (toys.optc == 2) ? toys.optargs[1] : "x",
105*cf5a6c84SAndroid Build Coastguard Worker     (int)TT.a, ' ');
106*cf5a6c84SAndroid Build Coastguard Worker 
107*cf5a6c84SAndroid Build Coastguard Worker   // We only ever use one input, but this handles '-' or no input for us.
108*cf5a6c84SAndroid Build Coastguard Worker   loopfiles(toys.optargs, do_split);
109*cf5a6c84SAndroid Build Coastguard Worker }
110