2 * Copyright (c) 1987, 1993, 1994
3 * The Regents of the University of California. All rights reserved.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 3. All advertising materials mentioning features or use of this software
14 * must display the following acknowledgement:
15 * This product includes software developed by the University of
16 * California, Berkeley and its contributors.
17 * 4. Neither the name of the University nor the names of its contributors
18 * may be used to endorse or promote products derived from this software
19 * without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * @(#) Copyright (c) 1987, 1993, 1994 The Regents of the University of California. All rights reserved.
34 * @(#)split.c 8.2 (Berkeley) 4/16/94
35 * $FreeBSD: src/usr.bin/split/split.c,v 1.6.2.2 2002/07/25 12:46:36 tjr Exp $
36 * $DragonFly: src/usr.bin/split/split.c,v 1.6 2005/08/30 21:19:13 liamfoy Exp $
39 #include <sys/param.h>
53 #define DEFLINE 1000 /* Default num lines per file. */
55 off_t bytecnt
; /* Byte count to split on. */
56 long numlines
; /* Line count to split on. */
57 int file_open
; /* If a file open. */
58 int ifd
= -1, ofd
= -1; /* Input/output file descriptors. */
59 char *bfr
; /* I/O buffer. */
60 char fname
[MAXPATHLEN
]; /* File name prefix. */
63 long sufflen
= 2; /* File name suffix length. */
68 static void usage(void);
71 main(int argc
, char **argv
)
78 while ((ch
= getopt(argc
, argv
, "0123456789a:b:l:p:")) != -1)
80 case '0': case '1': case '2': case '3': case '4':
81 case '5': case '6': case '7': case '8': case '9':
83 * Undocumented kludge: split was originally designed
84 * to take a number after a dash.
88 if (p
[0] == '-' && p
[1] == ch
&& !p
[2])
89 numlines
= strtol(++p
, &ep
, 10);
92 strtol(argv
[optind
] + 1, &ep
, 10);
93 if (numlines
<= 0 || *ep
)
95 "%s: illegal line count", optarg
);
98 case 'a': /* Suffix length */
99 if ((sufflen
= strtol(optarg
, &ep
, 10)) <= 0 || *ep
)
101 "%s: illegal suffix length", optarg
);
103 case 'b': /* Byte count. */
105 if ((bytecnti
= strtoll(optarg
, &ep
, 10)) <= 0 ||
106 (*ep
!= '\0' && *ep
!= 'k' && *ep
!= 'm') ||
109 "%s: illegal byte count", optarg
);
116 bytecnt
= (off_t
)(bytecnti
* scale
);
118 case 'p' : /* pattern matching. */
119 if (regcomp(&rgx
, optarg
, REG_EXTENDED
|REG_NOSUB
) != 0)
120 errx(EX_USAGE
, "%s: illegal regexp", optarg
);
123 case 'l': /* Line count. */
126 if ((numlines
= strtol(optarg
, &ep
, 10)) <= 0 || *ep
)
128 "%s: illegal line count", optarg
);
137 if (strcmp(*argv
, "-") == 0)
139 else if ((ifd
= open(*argv
, O_RDONLY
, 0)) < 0)
140 err(EX_NOINPUT
, "%s", *argv
);
144 if (*argv
!= NULL
) /* File name prefix. */
145 if (strlcpy(fname
, *argv
++, sizeof(fname
)) >= sizeof(fname
))
146 errx(EX_USAGE
, "file name prefix is too long");
150 if (strlen(fname
) + (unsigned long)sufflen
>= sizeof(fname
))
151 errx(EX_USAGE
, "suffix is too long");
152 if (pflag
&& (numlines
!= 0 || bytecnt
!= 0))
157 else if (bytecnt
!= 0)
160 if (ifd
== -1) /* Stdin by default. */
175 * Split the input by bytes.
184 if((bfr
= (char *)malloc(bytecnt
)) == NULL
)
185 err(EX_OSERR
, "malloc");
188 switch ((len
= read(ifd
, bfr
, bytecnt
))) {
194 err(EX_IOERR
, "read");
199 if (bcnt
+ len
>= bytecnt
) {
200 dist
= bytecnt
- bcnt
;
201 if (write(ofd
, bfr
, dist
) != dist
)
202 err(EX_IOERR
, "write");
204 for (C
= bfr
+ dist
; len
>= bytecnt
;
205 len
-= bytecnt
, C
+= bytecnt
) {
208 C
, (int)bytecnt
) != bytecnt
) {
210 err(EX_IOERR
, "write");
215 if (write(ofd
, C
, len
) != len
) {
217 err(EX_IOERR
, "write");
224 if (write(ofd
, bfr
, len
) != len
) {
226 err(EX_IOERR
, "write");
235 * Split the input by lines.
244 /* Stick a stream on top of input file descriptor */
245 if ((infp
= fdopen(ifd
, "r")) == NULL
)
246 err(EX_NOINPUT
, "fdopen");
248 if((bfr
= (char *)malloc(MAXBSIZE
)) == NULL
)
249 err(EX_OSERR
, "malloc");
251 /* Process input one line at a time */
252 while (fgets(bfr
, MAXBSIZE
, infp
) != NULL
) {
253 const int len
= strlen(bfr
);
255 /* Consider starting a new file only when at beginning of a line */
257 /* Check if we need to start a new file */
262 pmatch
.rm_eo
= len
- 1;
263 if (regexec(&rgx
, bfr
, 0, &pmatch
, REG_STARTEND
) == 0)
265 } else if (lcnt
++ == numlines
) {
271 if (bfr
[len
- 1] != '\n')
276 /* Open output file if needed */
281 if (write(ofd
, bfr
, len
) != len
) {
283 err(EX_IOERR
, "write");
291 err(EX_IOERR
, "read");
298 * Open a new output file.
303 long i
, maxfiles
, tfnum
;
309 if (fname
[0] == '\0') {
314 fpnt
= fname
+ strlen(fname
);
317 ofd
= fileno(stdout
);
320 /* maxfiles = 26^sufflen, but don't use libm. */
321 for (maxfiles
= 1, i
= 0; i
< sufflen
; i
++)
322 if ((maxfiles
*= 26) <= 0)
323 errx(EX_USAGE
, "suffix is too long (max %ld)", i
);
325 if (fnum
== maxfiles
)
326 errx(EX_DATAERR
, "too many files");
328 /* Generate suffix of sufflen letters */
332 fpnt
[i
] = tfnum
% 26 + 'a';
335 fpnt
[sufflen
] = '\0';
338 if (!freopen(fname
, "w", stdout
))
339 err(EX_IOERR
, "%s", fname
);
346 (void)fprintf(stderr
,
347 "usage: split [-a sufflen] [-b byte_count] [-l line_count] [-p pattern]\n");
348 (void)fprintf(stderr
,
349 " [file [prefix]]\n");