docs/cut

changeset 14:21ad1c1548c4

Code ausgewaehlter Implementierungen eingefuegt Das Datum entspricht dem Dateiaenderungsdatum.
author markus schnalke <meillo@marmaro.de>
date Tue, 12 May 2015 06:46:59 +0200 (2015-05-12)
parents bf5e41260f89
children 77d1f55bba08
files code/cut.c__4.3bsd-reno.1990-06-25 code/cut.c__4.3bsd-uwisc.1986-11-07 code/cut.c__freebsd.1994-05-27 code/cut.c__freebsd.2012-11-24 code/cut.c__gnu.1992-11-08 code/cut.c__gnu.2015-05-01 code/cut.c__heirloom.2012-05-20 code/cut.c__netbsd.1993-03-21 code/cut.c__netbsd.2014-02-03 code/cut.c__openbsd.2008-06-27 code/cut.c__system_iii.1980-04-11
diffstat 11 files changed, 3966 insertions(+), 0 deletions(-) [+]
line diff
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/code/cut.c__4.3bsd-reno.1990-06-25	Tue May 12 06:46:59 2015 +0200
     1.3 @@ -0,0 +1,256 @@
     1.4 +/*
     1.5 + * Copyright (c) 1989 The Regents of the University of California.
     1.6 + * All rights reserved.
     1.7 + *
     1.8 + * This code is derived from software contributed to Berkeley by
     1.9 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
    1.10 + *
    1.11 + * Redistribution and use in source and binary forms are permitted provided
    1.12 + * that: (1) source distributions retain this entire copyright notice and
    1.13 + * comment, and (2) distributions including binaries display the following
    1.14 + * acknowledgement:  ``This product includes software developed by the
    1.15 + * University of California, Berkeley and its contributors'' in the
    1.16 + * documentation or other materials provided with the distribution and in
    1.17 + * all advertising materials mentioning features or use of this software.
    1.18 + * Neither the name of the University nor the names of its contributors may
    1.19 + * be used to endorse or promote products derived from this software without
    1.20 + * specific prior written permission.
    1.21 + * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
    1.22 + * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
    1.23 + * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
    1.24 + */
    1.25 +
    1.26 +#ifndef lint
    1.27 +char copyright[] =
    1.28 +"@(#) Copyright (c) 1989 The Regents of the University of California.\n\
    1.29 + All rights reserved.\n";
    1.30 +#endif /* not lint */
    1.31 +
    1.32 +#ifndef lint
    1.33 +static char sccsid[] = "@(#)cut.c	5.3 (Berkeley) 6/24/90";
    1.34 +#endif /* not lint */
    1.35 +
    1.36 +#include <limits.h>
    1.37 +#include <stdio.h>
    1.38 +#include <ctype.h>
    1.39 +
    1.40 +int	cflag;
    1.41 +char	dchar;
    1.42 +int	dflag;
    1.43 +int	fflag;
    1.44 +int	sflag;
    1.45 +
    1.46 +main(argc, argv)
    1.47 +	int argc;
    1.48 +	char **argv;
    1.49 +{
    1.50 +	extern char *optarg;
    1.51 +	extern int errno, optind;
    1.52 +	FILE *fp;
    1.53 +	int ch, (*fcn)(), c_cut(), f_cut();
    1.54 +	char *strerror();
    1.55 +
    1.56 +	dchar = '\t';			/* default delimiter is \t */
    1.57 +
    1.58 +	while ((ch = getopt(argc, argv, "c:d:f:s")) != EOF)
    1.59 +		switch(ch) {
    1.60 +		case 'c':
    1.61 +			fcn = c_cut;
    1.62 +			get_list(optarg);
    1.63 +			cflag = 1;
    1.64 +			break;
    1.65 +		case 'd':
    1.66 +			dchar = *optarg;
    1.67 +			dflag = 1;
    1.68 +			break;
    1.69 +		case 'f':
    1.70 +			get_list(optarg);
    1.71 +			fcn = f_cut;
    1.72 +			fflag = 1;
    1.73 +			break;
    1.74 +		case 's':
    1.75 +			sflag = 1;
    1.76 +			break;
    1.77 +		case '?':
    1.78 +		default:
    1.79 +			usage();
    1.80 +		}
    1.81 +	argc -= optind;
    1.82 +	argv += optind;
    1.83 +
    1.84 +	if (fflag) {
    1.85 +		if (cflag)
    1.86 +			usage();
    1.87 +	} else if (!cflag || dflag || sflag)
    1.88 +		usage();
    1.89 +
    1.90 +	if (*argv)
    1.91 +		for (; *argv; ++argv) {
    1.92 +			if (!(fp = fopen(*argv, "r"))) {
    1.93 +				(void)fprintf(stderr,
    1.94 +				    "cut: %s: %s\n", *argv, strerror(errno));
    1.95 +				exit(1);
    1.96 +			}
    1.97 +			fcn(fp, *argv);
    1.98 +		}
    1.99 +	else
   1.100 +		fcn(stdin, "stdin");
   1.101 +	exit(0);
   1.102 +}
   1.103 +
   1.104 +int autostart, autostop, maxval;
   1.105 +
   1.106 +char positions[_BSD_LINE_MAX + 1];
   1.107 +
   1.108 +get_list(list)
   1.109 +	char *list;
   1.110 +{
   1.111 +	register char *pos;
   1.112 +	register int setautostart, start, stop;
   1.113 +	char *p, *strtok();
   1.114 +
   1.115 +	/*
   1.116 +	 * set a byte in the positions array to indicate if a field or
   1.117 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
   1.118 +	 * This parser is less restrictive than the Draft 9 POSIX spec.
   1.119 +	 * POSIX doesn't allow lists that aren't in increasing order or
   1.120 +	 * overlapping lists.  We also handle "-3-5" although there's no
   1.121 +	 * real reason too.
   1.122 +	 */
   1.123 +	for (; p = strtok(list, ", \t"); list = NULL) {
   1.124 +		setautostart = start = stop = 0;
   1.125 +		if (*p == '-') {
   1.126 +			++p;
   1.127 +			setautostart = 1;
   1.128 +		}
   1.129 +		if (isdigit(*p)) {
   1.130 +			start = stop = strtol(p, &p, 10);
   1.131 +			if (setautostart && start > autostart)
   1.132 +				autostart = start;
   1.133 +		}
   1.134 +		if (*p == '-') {
   1.135 +			if (isdigit(p[1]))
   1.136 +				stop = strtol(p + 1, &p, 10);
   1.137 +			if (*p == '-') {
   1.138 +				++p;
   1.139 +				if (!autostop || autostop > stop)
   1.140 +					autostop = stop;
   1.141 +			}
   1.142 +		}
   1.143 +		if (*p)
   1.144 +			badlist("illegal list value");
   1.145 +		if (!stop || !start)
   1.146 +			badlist("values may not include zero");
   1.147 +		if (stop > _BSD_LINE_MAX) {
   1.148 +			/* positions used rather than allocate a new buffer */
   1.149 +			(void)sprintf(positions, "%d too large (max %d)",
   1.150 +			    stop, _BSD_LINE_MAX);
   1.151 +			badlist(positions);
   1.152 +		}
   1.153 +		if (maxval < stop)
   1.154 +			maxval = stop;
   1.155 +		for (pos = positions + start; start++ <= stop; *pos++ = 1);
   1.156 +	}
   1.157 +
   1.158 +	/* overlapping ranges */
   1.159 +	if (autostop && maxval > autostop)
   1.160 +		maxval = autostop;
   1.161 +
   1.162 +	/* set autostart */
   1.163 +	if (autostart)
   1.164 +		memset(positions + 1, '1', autostart);
   1.165 +}
   1.166 +
   1.167 +/* ARGSUSED */
   1.168 +c_cut(fp, fname)
   1.169 +	FILE *fp;
   1.170 +	char *fname;
   1.171 +{
   1.172 +	register int ch, col;
   1.173 +	register char *pos;
   1.174 +
   1.175 +	for (;;) {
   1.176 +		pos = positions + 1;
   1.177 +		for (col = maxval; col; --col) {
   1.178 +			if ((ch = getc(fp)) == EOF)
   1.179 +				return;
   1.180 +			if (ch == '\n')
   1.181 +				break;
   1.182 +			if (*pos++)
   1.183 +				putchar(ch);
   1.184 +		}
   1.185 +		if (ch != '\n')
   1.186 +			if (autostop)
   1.187 +				while ((ch = getc(fp)) != EOF && ch != '\n')
   1.188 +					putchar(ch);
   1.189 +			else
   1.190 +				while ((ch = getc(fp)) != EOF && ch != '\n');
   1.191 +		putchar('\n');
   1.192 +	}
   1.193 +}
   1.194 +
   1.195 +f_cut(fp, fname)
   1.196 +	FILE *fp;
   1.197 +	char *fname;
   1.198 +{
   1.199 +	register int ch, field, isdelim;
   1.200 +	register char *pos, *p, sep;
   1.201 +	int output;
   1.202 +	char lbuf[_BSD_LINE_MAX + 1];
   1.203 +
   1.204 +	for (sep = dchar, output = 0; fgets(lbuf, sizeof(lbuf), fp);) {
   1.205 +		for (isdelim = 0, p = lbuf;; ++p) {
   1.206 +			if (!(ch = *p)) {
   1.207 +				(void)fprintf(stderr,
   1.208 +				    "cut: %s: line too long.\n", fname);
   1.209 +				exit(1);
   1.210 +			}
   1.211 +			/* this should work if newline is delimiter */
   1.212 +			if (ch == sep)
   1.213 +				isdelim = 1;
   1.214 +			if (ch == '\n') {
   1.215 +				if (!isdelim && !sflag)
   1.216 +					(void)printf("%s", lbuf);
   1.217 +				break;
   1.218 +			}
   1.219 +		}
   1.220 +		if (!isdelim)
   1.221 +			continue;
   1.222 +
   1.223 +		pos = positions + 1;
   1.224 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
   1.225 +			if (*pos) {
   1.226 +				if (output++)
   1.227 +					putchar(sep);
   1.228 +				while ((ch = *p++) != '\n' && ch != sep)
   1.229 +					putchar(ch);
   1.230 +			} else
   1.231 +				while ((ch = *p++) != '\n' && ch != sep);
   1.232 +			if (ch == '\n')
   1.233 +				break;
   1.234 +		}
   1.235 +		if (ch != '\n')
   1.236 +			if (autostop) {
   1.237 +				if (output)
   1.238 +					putchar(sep);
   1.239 +				for (; (ch = *p) != '\n'; ++p)
   1.240 +					putchar(ch);
   1.241 +			} else
   1.242 +				for (; (ch = *p) != '\n'; ++p);
   1.243 +		putchar('\n');
   1.244 +	}
   1.245 +}
   1.246 +
   1.247 +badlist(msg)
   1.248 +	char *msg;
   1.249 +{
   1.250 +	(void)fprintf(stderr, "cut: [-cf] list: %s.\n", msg);
   1.251 +	exit(1);
   1.252 +}
   1.253 +
   1.254 +usage()
   1.255 +{
   1.256 +	(void)fprintf(stderr,
   1.257 +"usage:\tcut -c list [file1 ...]\n\tcut -f list [-s] [-d delim] [file ...]\n");
   1.258 +	exit(1);
   1.259 +}
     2.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     2.2 +++ b/code/cut.c__4.3bsd-uwisc.1986-11-07	Tue May 12 06:46:59 2015 +0200
     2.3 @@ -0,0 +1,125 @@
     2.4 +static char sccsid[] = "@(#)cut.c	1.3";
     2.5 +#
     2.6 +/* cut : cut and paste columns of a table (projection of a relation) */
     2.7 +/* Release 1.5; handles single backspaces as produced by nroff    */
     2.8 +# include <stdio.h>	/* make: cc cut.c */
     2.9 +# define NFIELDS 512	/* max no of fields or resulting line length */
    2.10 +# define BACKSPACE 8
    2.11 +main(argc, argv)
    2.12 +int argc; char **argv;
    2.13 +{
    2.14 +	int del = '\t';
    2.15 +	int i, j, count, poscnt, r, s, t;
    2.16 +	int endflag, supflag, cflag, fflag, backflag, filenr;
    2.17 +	int sel[NFIELDS];
    2.18 +	register int c;
    2.19 +	register char *p1;
    2.20 +	char *p2, outbuf[NFIELDS];
    2.21 +	FILE *inptr;
    2.22 +	endflag = supflag = cflag = fflag = 0;
    2.23 + 
    2.24 + 
    2.25 +while (argc > 1 && argv[1][0] == '-'){
    2.26 +	for (i = 1; (c = argv[1][i]) != '\0'; i++) {
    2.27 +		switch(c) {
    2.28 +			case 'd' : del = argv[1][++i];
    2.29 +				if (del == '\0') diag("no delimiter\n");
    2.30 +				break;
    2.31 +			case 's': supflag++ ;
    2.32 +				break;
    2.33 +			case 'c': cflag++ ;
    2.34 +				break;
    2.35 +			case 'f': fflag++ ;
    2.36 +				break;
    2.37 +			default : diag("Usage: cut [-s] [-d<char>] {-c<list> | -f<list>} file ...\n");
    2.38 +				break;
    2.39 +		}
    2.40 +		if (!endflag && (cflag || fflag)) {
    2.41 +			endflag = 1;
    2.42 +			r = s = t = 0;
    2.43 +			do {	c = argv[1][++i];
    2.44 +				switch(c) {
    2.45 +					case '-' : if (r) diagl();
    2.46 +						r = 1;
    2.47 +						if (t == 0)  s = 1;
    2.48 +						else {s = t; t = 0;}
    2.49 +						continue;
    2.50 +					case '\0' :
    2.51 +					case ','  : if (t >= NFIELDS) diagl();
    2.52 +						if (r) { if (t == 0) t = NFIELDS - 1;
    2.53 +							if (t<s) diagl();
    2.54 +							for(j = s; j <= t; j++) sel[j] = 1;
    2.55 +							}
    2.56 +						else sel[t] = (t > 0 ? 1 : 0);
    2.57 +						r = s = t = 0;
    2.58 +						if (c == '\0') {i--; break;}
    2.59 +						continue;
    2.60 +					default :
    2.61 +						if (c< '0' || c> '9') diagl();
    2.62 +						t = 10*t + c - '0';
    2.63 +						continue;
    2.64 +				}
    2.65 +				for (j = t = 0; j < NFIELDS; j++) t += sel[j];
    2.66 +				if (t == 0) diag("no fields\n");
    2.67 +			} while (c != '\0');
    2.68 +		}
    2.69 +	}
    2.70 +	--argc;
    2.71 +	++argv;
    2.72 +} /* end options */
    2.73 +if (!(cflag || fflag)) diagl();
    2.74 +
    2.75 +--argc;
    2.76 +filenr = 1;
    2.77 +do {	/* for all input files */
    2.78 +	if (argc > 0) inptr = fopen(argv[filenr], "r");
    2.79 +	else inptr = stdin;
    2.80 +  
    2.81 +	if (inptr == NULL) {
    2.82 +		write(2,"Cannot open :",14);
    2.83 +		diag(argv[filenr]);
    2.84 +	}
    2.85 +	endflag = 0;
    2.86 +	do {	/* for all lines of a file */
    2.87 +		count = poscnt = backflag = 0;
    2.88 +		p1 = &outbuf[0] - 1 ;
    2.89 +		p2 = p1;
    2.90 +		do { 	/* for all char of the line */
    2.91 +			c = fgetc(inptr);
    2.92 +			if (c == EOF) {
    2.93 +				endflag = 1;
    2.94 +				break;
    2.95 +				}
    2.96 +			if (count == NFIELDS - 1) diag("line too long\n");
    2.97 +			if (c != '\n') *++p1 = c;
    2.98 +			if (cflag && (c == BACKSPACE)) backflag++ ; else 
    2.99 +				{ if ( !backflag ) poscnt += 1 ; else backflag-- ;}
   2.100 +			if ( backflag > 1 ) diag("cannot handle multiple adjacent backspaces\n");
   2.101 +			if ( ((c == '\n') && count > 0)  || c == del || cflag) {
   2.102 +				count += 1;
   2.103 +				if (fflag) poscnt = count  ;
   2.104 +				if (sel[poscnt]) p2 = p1; else p1 = p2;
   2.105 +			}
   2.106 +		}while (c != '\n');
   2.107 +		if ( !endflag && (count > 0 || !supflag)) {
   2.108 +			if (*p1 == del) *p1 = '\0';
   2.109 +				else *++p1 = '\0'; /*suppress trailing delimiter*/
   2.110 +			puts(outbuf);
   2.111 +			}
   2.112 +	} while (!endflag) ;
   2.113 +fclose(inptr);
   2.114 +} while(++filenr <= argc);
   2.115 +}
   2.116 +
   2.117 +diag(s)
   2.118 +char *s;
   2.119 +{
   2.120 +	write(2, "cut : ", 6);
   2.121 +	while(*s)
   2.122 +		write(2,s++,1);
   2.123 +	exit(2);
   2.124 +}
   2.125 +diagl()
   2.126 +{
   2.127 +diag("bad list for c/f option\n");
   2.128 +}
     3.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     3.2 +++ b/code/cut.c__freebsd.1994-05-27	Tue May 12 06:46:59 2015 +0200
     3.3 @@ -0,0 +1,296 @@
     3.4 +/*
     3.5 + * Copyright (c) 1989, 1993
     3.6 + *	The Regents of the University of California.  All rights reserved.
     3.7 + *
     3.8 + * This code is derived from software contributed to Berkeley by
     3.9 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
    3.10 + *
    3.11 + * Redistribution and use in source and binary forms, with or without
    3.12 + * modification, are permitted provided that the following conditions
    3.13 + * are met:
    3.14 + * 1. Redistributions of source code must retain the above copyright
    3.15 + *    notice, this list of conditions and the following disclaimer.
    3.16 + * 2. Redistributions in binary form must reproduce the above copyright
    3.17 + *    notice, this list of conditions and the following disclaimer in the
    3.18 + *    documentation and/or other materials provided with the distribution.
    3.19 + * 3. All advertising materials mentioning features or use of this software
    3.20 + *    must display the following acknowledgement:
    3.21 + *	This product includes software developed by the University of
    3.22 + *	California, Berkeley and its contributors.
    3.23 + * 4. Neither the name of the University nor the names of its contributors
    3.24 + *    may be used to endorse or promote products derived from this software
    3.25 + *    without specific prior written permission.
    3.26 + *
    3.27 + * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
    3.28 + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
    3.29 + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    3.30 + * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
    3.31 + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
    3.32 + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
    3.33 + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
    3.34 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
    3.35 + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
    3.36 + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
    3.37 + * SUCH DAMAGE.
    3.38 + */
    3.39 +
    3.40 +#ifndef lint
    3.41 +static char copyright[] =
    3.42 +"@(#) Copyright (c) 1989, 1993\n\
    3.43 +	The Regents of the University of California.  All rights reserved.\n";
    3.44 +#endif /* not lint */
    3.45 +
    3.46 +#ifndef lint
    3.47 +static char sccsid[] = "@(#)cut.c	8.1 (Berkeley) 6/6/93";
    3.48 +#endif /* not lint */
    3.49 +
    3.50 +#include <ctype.h>
    3.51 +#include <errno.h>
    3.52 +#include <limits.h>
    3.53 +#include <stdio.h>
    3.54 +#include <stdlib.h>
    3.55 +#include <string.h>
    3.56 +
    3.57 +int	cflag;
    3.58 +char	dchar;
    3.59 +int	dflag;
    3.60 +int	fflag;
    3.61 +int	sflag;
    3.62 +
    3.63 +void	c_cut __P((FILE *, char *));
    3.64 +void	err __P((const char *, ...));
    3.65 +void	f_cut __P((FILE *, char *));
    3.66 +void	get_list __P((char *));
    3.67 +void	usage __P((void));
    3.68 +
    3.69 +int
    3.70 +main(argc, argv)
    3.71 +	int argc;
    3.72 +	char *argv[];
    3.73 +{
    3.74 +	FILE *fp;
    3.75 +	void (*fcn) __P((FILE *, char *));
    3.76 +	int ch;
    3.77 +
    3.78 +	dchar = '\t';			/* default delimiter is \t */
    3.79 +
    3.80 +	while ((ch = getopt(argc, argv, "c:d:f:s")) != EOF)
    3.81 +		switch(ch) {
    3.82 +		case 'c':
    3.83 +			fcn = c_cut;
    3.84 +			get_list(optarg);
    3.85 +			cflag = 1;
    3.86 +			break;
    3.87 +		case 'd':
    3.88 +			dchar = *optarg;
    3.89 +			dflag = 1;
    3.90 +			break;
    3.91 +		case 'f':
    3.92 +			get_list(optarg);
    3.93 +			fcn = f_cut;
    3.94 +			fflag = 1;
    3.95 +			break;
    3.96 +		case 's':
    3.97 +			sflag = 1;
    3.98 +			break;
    3.99 +		case '?':
   3.100 +		default:
   3.101 +			usage();
   3.102 +		}
   3.103 +	argc -= optind;
   3.104 +	argv += optind;
   3.105 +
   3.106 +	if (fflag) {
   3.107 +		if (cflag)
   3.108 +			usage();
   3.109 +	} else if (!cflag || dflag || sflag)
   3.110 +		usage();
   3.111 +
   3.112 +	if (*argv)
   3.113 +		for (; *argv; ++argv) {
   3.114 +			if (!(fp = fopen(*argv, "r")))
   3.115 +				err("%s: %s\n", *argv, strerror(errno));
   3.116 +			fcn(fp, *argv);
   3.117 +			(void)fclose(fp);
   3.118 +		}
   3.119 +	else
   3.120 +		fcn(stdin, "stdin");
   3.121 +	exit(0);
   3.122 +}
   3.123 +
   3.124 +int autostart, autostop, maxval;
   3.125 +
   3.126 +char positions[_POSIX2_LINE_MAX + 1];
   3.127 +
   3.128 +void
   3.129 +get_list(list)
   3.130 +	char *list;
   3.131 +{
   3.132 +	register int setautostart, start, stop;
   3.133 +	register char *pos;
   3.134 +	char *p;
   3.135 +
   3.136 +	/*
   3.137 +	 * set a byte in the positions array to indicate if a field or
   3.138 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
   3.139 +	 * This parser is less restrictive than the Draft 9 POSIX spec.
   3.140 +	 * POSIX doesn't allow lists that aren't in increasing order or
   3.141 +	 * overlapping lists.  We also handle "-3-5" although there's no
   3.142 +	 * real reason too.
   3.143 +	 */
   3.144 +	for (; p = strtok(list, ", \t"); list = NULL) {
   3.145 +		setautostart = start = stop = 0;
   3.146 +		if (*p == '-') {
   3.147 +			++p;
   3.148 +			setautostart = 1;
   3.149 +		}
   3.150 +		if (isdigit(*p)) {
   3.151 +			start = stop = strtol(p, &p, 10);
   3.152 +			if (setautostart && start > autostart)
   3.153 +				autostart = start;
   3.154 +		}
   3.155 +		if (*p == '-') {
   3.156 +			if (isdigit(p[1]))
   3.157 +				stop = strtol(p + 1, &p, 10);
   3.158 +			if (*p == '-') {
   3.159 +				++p;
   3.160 +				if (!autostop || autostop > stop)
   3.161 +					autostop = stop;
   3.162 +			}
   3.163 +		}
   3.164 +		if (*p)
   3.165 +			err("[-cf] list: illegal list value\n");
   3.166 +		if (!stop || !start)
   3.167 +			err("[-cf] list: values may not include zero\n");
   3.168 +		if (stop > _POSIX2_LINE_MAX)
   3.169 +			err("[-cf] list: %d too large (max %d)\n",
   3.170 +			    stop, _POSIX2_LINE_MAX);
   3.171 +		if (maxval < stop)
   3.172 +			maxval = stop;
   3.173 +		for (pos = positions + start; start++ <= stop; *pos++ = 1);
   3.174 +	}
   3.175 +
   3.176 +	/* overlapping ranges */
   3.177 +	if (autostop && maxval > autostop)
   3.178 +		maxval = autostop;
   3.179 +
   3.180 +	/* set autostart */
   3.181 +	if (autostart)
   3.182 +		memset(positions + 1, '1', autostart);
   3.183 +}
   3.184 +
   3.185 +/* ARGSUSED */
   3.186 +void
   3.187 +c_cut(fp, fname)
   3.188 +	FILE *fp;
   3.189 +	char *fname;
   3.190 +{
   3.191 +	register int ch, col;
   3.192 +	register char *pos;
   3.193 +
   3.194 +	for (;;) {
   3.195 +		pos = positions + 1;
   3.196 +		for (col = maxval; col; --col) {
   3.197 +			if ((ch = getc(fp)) == EOF)
   3.198 +				return;
   3.199 +			if (ch == '\n')
   3.200 +				break;
   3.201 +			if (*pos++)
   3.202 +				(void)putchar(ch);
   3.203 +		}
   3.204 +		if (ch != '\n')
   3.205 +			if (autostop)
   3.206 +				while ((ch = getc(fp)) != EOF && ch != '\n')
   3.207 +					(void)putchar(ch);
   3.208 +			else
   3.209 +				while ((ch = getc(fp)) != EOF && ch != '\n');
   3.210 +		(void)putchar('\n');
   3.211 +	}
   3.212 +}
   3.213 +
   3.214 +void
   3.215 +f_cut(fp, fname)
   3.216 +	FILE *fp;
   3.217 +	char *fname;
   3.218 +{
   3.219 +	register int ch, field, isdelim;
   3.220 +	register char *pos, *p, sep;
   3.221 +	int output;
   3.222 +	char lbuf[_POSIX2_LINE_MAX + 1];
   3.223 +
   3.224 +	for (sep = dchar, output = 0; fgets(lbuf, sizeof(lbuf), fp);) {
   3.225 +		for (isdelim = 0, p = lbuf;; ++p) {
   3.226 +			if (!(ch = *p))
   3.227 +				err("%s: line too long.\n", fname);
   3.228 +			/* this should work if newline is delimiter */
   3.229 +			if (ch == sep)
   3.230 +				isdelim = 1;
   3.231 +			if (ch == '\n') {
   3.232 +				if (!isdelim && !sflag)
   3.233 +					(void)printf("%s", lbuf);
   3.234 +				break;
   3.235 +			}
   3.236 +		}
   3.237 +		if (!isdelim)
   3.238 +			continue;
   3.239 +
   3.240 +		pos = positions + 1;
   3.241 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
   3.242 +			if (*pos) {
   3.243 +				if (output++)
   3.244 +					(void)putchar(sep);
   3.245 +				while ((ch = *p++) != '\n' && ch != sep)
   3.246 +					(void)putchar(ch);
   3.247 +			} else
   3.248 +				while ((ch = *p++) != '\n' && ch != sep);
   3.249 +			if (ch == '\n')
   3.250 +				break;
   3.251 +		}
   3.252 +		if (ch != '\n')
   3.253 +			if (autostop) {
   3.254 +				if (output)
   3.255 +					(void)putchar(sep);
   3.256 +				for (; (ch = *p) != '\n'; ++p)
   3.257 +					(void)putchar(ch);
   3.258 +			} else
   3.259 +				for (; (ch = *p) != '\n'; ++p);
   3.260 +		(void)putchar('\n');
   3.261 +	}
   3.262 +}
   3.263 +
   3.264 +void
   3.265 +usage()
   3.266 +{
   3.267 +	(void)fprintf(stderr,
   3.268 +"usage:\tcut -c list [file1 ...]\n\tcut -f list [-s] [-d delim] [file ...]\n");
   3.269 +	exit(1);
   3.270 +}
   3.271 +
   3.272 +#if __STDC__
   3.273 +#include <stdarg.h>
   3.274 +#else
   3.275 +#include <varargs.h>
   3.276 +#endif
   3.277 +
   3.278 +void
   3.279 +#if __STDC__
   3.280 +err(const char *fmt, ...)
   3.281 +#else
   3.282 +err(fmt, va_alist)
   3.283 +	char *fmt;
   3.284 +        va_dcl
   3.285 +#endif
   3.286 +{
   3.287 +	va_list ap;
   3.288 +#if __STDC__
   3.289 +	va_start(ap, fmt);
   3.290 +#else
   3.291 +	va_start(ap);
   3.292 +#endif
   3.293 +	(void)fprintf(stderr, "cut: ");
   3.294 +	(void)vfprintf(stderr, fmt, ap);
   3.295 +	va_end(ap);
   3.296 +	(void)fprintf(stderr, "\n");
   3.297 +	exit(1);
   3.298 +	/* NOTREACHED */
   3.299 +}
     4.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     4.2 +++ b/code/cut.c__freebsd.2012-11-24	Tue May 12 06:46:59 2015 +0200
     4.3 @@ -0,0 +1,479 @@
     4.4 +/*
     4.5 + * Copyright (c) 1989, 1993
     4.6 + *	The Regents of the University of California.  All rights reserved.
     4.7 + *
     4.8 + * This code is derived from software contributed to Berkeley by
     4.9 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
    4.10 + *
    4.11 + * Redistribution and use in source and binary forms, with or without
    4.12 + * modification, are permitted provided that the following conditions
    4.13 + * are met:
    4.14 + * 1. Redistributions of source code must retain the above copyright
    4.15 + *    notice, this list of conditions and the following disclaimer.
    4.16 + * 2. Redistributions in binary form must reproduce the above copyright
    4.17 + *    notice, this list of conditions and the following disclaimer in the
    4.18 + *    documentation and/or other materials provided with the distribution.
    4.19 + * 4. Neither the name of the University nor the names of its contributors
    4.20 + *    may be used to endorse or promote products derived from this software
    4.21 + *    without specific prior written permission.
    4.22 + *
    4.23 + * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
    4.24 + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
    4.25 + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    4.26 + * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
    4.27 + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
    4.28 + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
    4.29 + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
    4.30 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
    4.31 + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
    4.32 + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
    4.33 + * SUCH DAMAGE.
    4.34 + */
    4.35 +
    4.36 +#ifndef lint
    4.37 +static const char copyright[] =
    4.38 +"@(#) Copyright (c) 1989, 1993\n\
    4.39 +	The Regents of the University of California.  All rights reserved.\n";
    4.40 +static const char sccsid[] = "@(#)cut.c	8.3 (Berkeley) 5/4/95";
    4.41 +#endif /* not lint */
    4.42 +#include <sys/cdefs.h>
    4.43 +__FBSDID("$FreeBSD$");
    4.44 +
    4.45 +#include <ctype.h>
    4.46 +#include <err.h>
    4.47 +#include <errno.h>
    4.48 +#include <limits.h>
    4.49 +#include <locale.h>
    4.50 +#include <stdio.h>
    4.51 +#include <stdlib.h>
    4.52 +#include <string.h>
    4.53 +#include <unistd.h>
    4.54 +#include <wchar.h>
    4.55 +
    4.56 +static int	bflag;
    4.57 +static int	cflag;
    4.58 +static wchar_t	dchar;
    4.59 +static char	dcharmb[MB_LEN_MAX + 1];
    4.60 +static int	dflag;
    4.61 +static int	fflag;
    4.62 +static int	nflag;
    4.63 +static int	sflag;
    4.64 +static int	wflag;
    4.65 +
    4.66 +static size_t	autostart, autostop, maxval;
    4.67 +static char *	positions;
    4.68 +
    4.69 +static int	b_cut(FILE *, const char *);
    4.70 +static int	b_n_cut(FILE *, const char *);
    4.71 +static int	c_cut(FILE *, const char *);
    4.72 +static int	f_cut(FILE *, const char *);
    4.73 +static void	get_list(char *);
    4.74 +static int	is_delim(wchar_t);
    4.75 +static void	needpos(size_t);
    4.76 +static void	usage(void);
    4.77 +
    4.78 +int
    4.79 +main(int argc, char *argv[])
    4.80 +{
    4.81 +	FILE *fp;
    4.82 +	int (*fcn)(FILE *, const char *);
    4.83 +	int ch, rval;
    4.84 +	size_t n;
    4.85 +
    4.86 +	setlocale(LC_ALL, "");
    4.87 +
    4.88 +	fcn = NULL;
    4.89 +	dchar = '\t';			/* default delimiter is \t */
    4.90 +	strcpy(dcharmb, "\t");
    4.91 +
    4.92 +	while ((ch = getopt(argc, argv, "b:c:d:f:snw")) != -1)
    4.93 +		switch(ch) {
    4.94 +		case 'b':
    4.95 +			get_list(optarg);
    4.96 +			bflag = 1;
    4.97 +			break;
    4.98 +		case 'c':
    4.99 +			get_list(optarg);
   4.100 +			cflag = 1;
   4.101 +			break;
   4.102 +		case 'd':
   4.103 +			n = mbrtowc(&dchar, optarg, MB_LEN_MAX, NULL);
   4.104 +			if (dchar == '\0' || n != strlen(optarg))
   4.105 +				errx(1, "bad delimiter");
   4.106 +			strcpy(dcharmb, optarg);
   4.107 +			dflag = 1;
   4.108 +			break;
   4.109 +		case 'f':
   4.110 +			get_list(optarg);
   4.111 +			fflag = 1;
   4.112 +			break;
   4.113 +		case 's':
   4.114 +			sflag = 1;
   4.115 +			break;
   4.116 +		case 'n':
   4.117 +			nflag = 1;
   4.118 +			break;
   4.119 +		case 'w':
   4.120 +			wflag = 1;
   4.121 +			break;
   4.122 +		case '?':
   4.123 +		default:
   4.124 +			usage();
   4.125 +		}
   4.126 +	argc -= optind;
   4.127 +	argv += optind;
   4.128 +
   4.129 +	if (fflag) {
   4.130 +		if (bflag || cflag || nflag || (wflag && dflag))
   4.131 +			usage();
   4.132 +	} else if (!(bflag || cflag) || dflag || sflag || wflag)
   4.133 +		usage();
   4.134 +	else if (!bflag && nflag)
   4.135 +		usage();
   4.136 +
   4.137 +	if (fflag)
   4.138 +		fcn = f_cut;
   4.139 +	else if (cflag)
   4.140 +		fcn = MB_CUR_MAX > 1 ? c_cut : b_cut;
   4.141 +	else if (bflag)
   4.142 +		fcn = nflag && MB_CUR_MAX > 1 ? b_n_cut : b_cut;
   4.143 +
   4.144 +	rval = 0;
   4.145 +	if (*argv)
   4.146 +		for (; *argv; ++argv) {
   4.147 +			if (strcmp(*argv, "-") == 0)
   4.148 +				rval |= fcn(stdin, "stdin");
   4.149 +			else {
   4.150 +				if (!(fp = fopen(*argv, "r"))) {
   4.151 +					warn("%s", *argv);
   4.152 +					rval = 1;
   4.153 +					continue;
   4.154 +				}
   4.155 +				fcn(fp, *argv);
   4.156 +				(void)fclose(fp);
   4.157 +			}
   4.158 +		}
   4.159 +	else
   4.160 +		rval = fcn(stdin, "stdin");
   4.161 +	exit(rval);
   4.162 +}
   4.163 +
   4.164 +static void
   4.165 +get_list(char *list)
   4.166 +{
   4.167 +	size_t setautostart, start, stop;
   4.168 +	char *pos;
   4.169 +	char *p;
   4.170 +
   4.171 +	/*
   4.172 +	 * set a byte in the positions array to indicate if a field or
   4.173 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
   4.174 +	 * Numbers and number ranges may be overlapping, repeated, and in
   4.175 +	 * any order. We handle "-3-5" although there's no real reason to.
   4.176 +	 */
   4.177 +	for (; (p = strsep(&list, ", \t")) != NULL;) {
   4.178 +		setautostart = start = stop = 0;
   4.179 +		if (*p == '-') {
   4.180 +			++p;
   4.181 +			setautostart = 1;
   4.182 +		}
   4.183 +		if (isdigit((unsigned char)*p)) {
   4.184 +			start = stop = strtol(p, &p, 10);
   4.185 +			if (setautostart && start > autostart)
   4.186 +				autostart = start;
   4.187 +		}
   4.188 +		if (*p == '-') {
   4.189 +			if (isdigit((unsigned char)p[1]))
   4.190 +				stop = strtol(p + 1, &p, 10);
   4.191 +			if (*p == '-') {
   4.192 +				++p;
   4.193 +				if (!autostop || autostop > stop)
   4.194 +					autostop = stop;
   4.195 +			}
   4.196 +		}
   4.197 +		if (*p)
   4.198 +			errx(1, "[-bcf] list: illegal list value");
   4.199 +		if (!stop || !start)
   4.200 +			errx(1, "[-bcf] list: values may not include zero");
   4.201 +		if (maxval < stop) {
   4.202 +			maxval = stop;
   4.203 +			needpos(maxval + 1);
   4.204 +		}
   4.205 +		for (pos = positions + start; start++ <= stop; *pos++ = 1);
   4.206 +	}
   4.207 +
   4.208 +	/* overlapping ranges */
   4.209 +	if (autostop && maxval > autostop) {
   4.210 +		maxval = autostop;
   4.211 +		needpos(maxval + 1);
   4.212 +	}
   4.213 +
   4.214 +	/* set autostart */
   4.215 +	if (autostart)
   4.216 +		memset(positions + 1, '1', autostart);
   4.217 +}
   4.218 +
   4.219 +static void
   4.220 +needpos(size_t n)
   4.221 +{
   4.222 +	static size_t npos;
   4.223 +	size_t oldnpos;
   4.224 +
   4.225 +	/* Grow the positions array to at least the specified size. */
   4.226 +	if (n > npos) {
   4.227 +		oldnpos = npos;
   4.228 +		if (npos == 0)
   4.229 +			npos = n;
   4.230 +		while (n > npos)
   4.231 +			npos *= 2;
   4.232 +		if ((positions = realloc(positions, npos)) == NULL)
   4.233 +			err(1, "realloc");
   4.234 +		memset((char *)positions + oldnpos, 0, npos - oldnpos);
   4.235 +	}
   4.236 +}
   4.237 +
   4.238 +static int
   4.239 +b_cut(FILE *fp, const char *fname __unused)
   4.240 +{
   4.241 +	int ch, col;
   4.242 +	char *pos;
   4.243 +
   4.244 +	ch = 0;
   4.245 +	for (;;) {
   4.246 +		pos = positions + 1;
   4.247 +		for (col = maxval; col; --col) {
   4.248 +			if ((ch = getc(fp)) == EOF)
   4.249 +				return (0);
   4.250 +			if (ch == '\n')
   4.251 +				break;
   4.252 +			if (*pos++)
   4.253 +				(void)putchar(ch);
   4.254 +		}
   4.255 +		if (ch != '\n') {
   4.256 +			if (autostop)
   4.257 +				while ((ch = getc(fp)) != EOF && ch != '\n')
   4.258 +					(void)putchar(ch);
   4.259 +			else
   4.260 +				while ((ch = getc(fp)) != EOF && ch != '\n');
   4.261 +		}
   4.262 +		(void)putchar('\n');
   4.263 +	}
   4.264 +	return (0);
   4.265 +}
   4.266 +
   4.267 +/*
   4.268 + * Cut based on byte positions, taking care not to split multibyte characters.
   4.269 + * Although this function also handles the case where -n is not specified,
   4.270 + * b_cut() ought to be much faster.
   4.271 + */
   4.272 +static int
   4.273 +b_n_cut(FILE *fp, const char *fname)
   4.274 +{
   4.275 +	size_t col, i, lbuflen;
   4.276 +	char *lbuf;
   4.277 +	int canwrite, clen, warned;
   4.278 +	mbstate_t mbs;
   4.279 +
   4.280 +	memset(&mbs, 0, sizeof(mbs));
   4.281 +	warned = 0;
   4.282 +	while ((lbuf = fgetln(fp, &lbuflen)) != NULL) {
   4.283 +		for (col = 0; lbuflen > 0; col += clen) {
   4.284 +			if ((clen = mbrlen(lbuf, lbuflen, &mbs)) < 0) {
   4.285 +				if (!warned) {
   4.286 +					warn("%s", fname);
   4.287 +					warned = 1;
   4.288 +				}
   4.289 +				memset(&mbs, 0, sizeof(mbs));
   4.290 +				clen = 1;
   4.291 +			}
   4.292 +			if (clen == 0 || *lbuf == '\n')
   4.293 +				break;
   4.294 +			if (col < maxval && !positions[1 + col]) {
   4.295 +				/*
   4.296 +				 * Print the character if (1) after an initial
   4.297 +				 * segment of un-selected bytes, the rest of
   4.298 +				 * it is selected, and (2) the last byte is
   4.299 +				 * selected.
   4.300 +				 */
   4.301 +				i = col;
   4.302 +				while (i < col + clen && i < maxval &&
   4.303 +				    !positions[1 + i])
   4.304 +					i++;
   4.305 +				canwrite = i < col + clen;
   4.306 +				for (; i < col + clen && i < maxval; i++)
   4.307 +					canwrite &= positions[1 + i];
   4.308 +				if (canwrite)
   4.309 +					fwrite(lbuf, 1, clen, stdout);
   4.310 +			} else {
   4.311 +				/*
   4.312 +				 * Print the character if all of it has
   4.313 +				 * been selected.
   4.314 +				 */
   4.315 +				canwrite = 1;
   4.316 +				for (i = col; i < col + clen; i++)
   4.317 +					if ((i >= maxval && !autostop) ||
   4.318 +					    (i < maxval && !positions[1 + i])) {
   4.319 +						canwrite = 0;
   4.320 +						break;
   4.321 +					}
   4.322 +				if (canwrite)
   4.323 +					fwrite(lbuf, 1, clen, stdout);
   4.324 +			}
   4.325 +			lbuf += clen;
   4.326 +			lbuflen -= clen;
   4.327 +		}
   4.328 +		if (lbuflen > 0)
   4.329 +			putchar('\n');
   4.330 +	}
   4.331 +	return (warned);
   4.332 +}
   4.333 +
   4.334 +static int
   4.335 +c_cut(FILE *fp, const char *fname)
   4.336 +{
   4.337 +	wint_t ch;
   4.338 +	int col;
   4.339 +	char *pos;
   4.340 +
   4.341 +	ch = 0;
   4.342 +	for (;;) {
   4.343 +		pos = positions + 1;
   4.344 +		for (col = maxval; col; --col) {
   4.345 +			if ((ch = getwc(fp)) == WEOF)
   4.346 +				goto out;
   4.347 +			if (ch == '\n')
   4.348 +				break;
   4.349 +			if (*pos++)
   4.350 +				(void)putwchar(ch);
   4.351 +		}
   4.352 +		if (ch != '\n') {
   4.353 +			if (autostop)
   4.354 +				while ((ch = getwc(fp)) != WEOF && ch != '\n')
   4.355 +					(void)putwchar(ch);
   4.356 +			else
   4.357 +				while ((ch = getwc(fp)) != WEOF && ch != '\n');
   4.358 +		}
   4.359 +		(void)putwchar('\n');
   4.360 +	}
   4.361 +out:
   4.362 +	if (ferror(fp)) {
   4.363 +		warn("%s", fname);
   4.364 +		return (1);
   4.365 +	}
   4.366 +	return (0);
   4.367 +}
   4.368 +
   4.369 +static int
   4.370 +is_delim(wchar_t ch)
   4.371 +{
   4.372 +	if (wflag) {
   4.373 +		if (ch == ' ' || ch == '\t')
   4.374 +			return 1;
   4.375 +	} else {
   4.376 +		if (ch == dchar)
   4.377 +			return 1;
   4.378 +	}
   4.379 +	return 0;
   4.380 +}
   4.381 +
   4.382 +static int
   4.383 +f_cut(FILE *fp, const char *fname)
   4.384 +{
   4.385 +	wchar_t ch;
   4.386 +	int field, i, isdelim;
   4.387 +	char *pos, *p;
   4.388 +	int output;
   4.389 +	char *lbuf, *mlbuf;
   4.390 +	size_t clen, lbuflen, reallen;
   4.391 +
   4.392 +	mlbuf = NULL;
   4.393 +	while ((lbuf = fgetln(fp, &lbuflen)) != NULL) {
   4.394 +		reallen = lbuflen;
   4.395 +		/* Assert EOL has a newline. */
   4.396 +		if (*(lbuf + lbuflen - 1) != '\n') {
   4.397 +			/* Can't have > 1 line with no trailing newline. */
   4.398 +			mlbuf = malloc(lbuflen + 1);
   4.399 +			if (mlbuf == NULL)
   4.400 +				err(1, "malloc");
   4.401 +			memcpy(mlbuf, lbuf, lbuflen);
   4.402 +			*(mlbuf + lbuflen) = '\n';
   4.403 +			lbuf = mlbuf;
   4.404 +			reallen++;
   4.405 +		}
   4.406 +		output = 0;
   4.407 +		for (isdelim = 0, p = lbuf;; p += clen) {
   4.408 +			clen = mbrtowc(&ch, p, lbuf + reallen - p, NULL);
   4.409 +			if (clen == (size_t)-1 || clen == (size_t)-2) {
   4.410 +				warnc(EILSEQ, "%s", fname);
   4.411 +				free(mlbuf);
   4.412 +				return (1);
   4.413 +			}
   4.414 +			if (clen == 0)
   4.415 +				clen = 1;
   4.416 +			/* this should work if newline is delimiter */
   4.417 +			if (is_delim(ch))
   4.418 +				isdelim = 1;
   4.419 +			if (ch == '\n') {
   4.420 +				if (!isdelim && !sflag)
   4.421 +					(void)fwrite(lbuf, lbuflen, 1, stdout);
   4.422 +				break;
   4.423 +			}
   4.424 +		}
   4.425 +		if (!isdelim)
   4.426 +			continue;
   4.427 +
   4.428 +		pos = positions + 1;
   4.429 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
   4.430 +			if (*pos && output++)
   4.431 +				for (i = 0; dcharmb[i] != '\0'; i++)
   4.432 +					putchar(dcharmb[i]);
   4.433 +			for (;;) {
   4.434 +				clen = mbrtowc(&ch, p, lbuf + reallen - p,
   4.435 +				    NULL);
   4.436 +				if (clen == (size_t)-1 || clen == (size_t)-2) {
   4.437 +					warnc(EILSEQ, "%s", fname);
   4.438 +					free(mlbuf);
   4.439 +					return (1);
   4.440 +				}
   4.441 +				if (clen == 0)
   4.442 +					clen = 1;
   4.443 +				p += clen;
   4.444 +				if (ch == '\n' || is_delim(ch)) {
   4.445 +					/* compress whitespace */
   4.446 +					if (wflag && ch != '\n')
   4.447 +						while (is_delim(*p))
   4.448 +							p++;
   4.449 +					break;
   4.450 +				}
   4.451 +				if (*pos)
   4.452 +					for (i = 0; i < (int)clen; i++)
   4.453 +						putchar(p[i - clen]);
   4.454 +			}
   4.455 +			if (ch == '\n')
   4.456 +				break;
   4.457 +		}
   4.458 +		if (ch != '\n') {
   4.459 +			if (autostop) {
   4.460 +				if (output)
   4.461 +					for (i = 0; dcharmb[i] != '\0'; i++)
   4.462 +						putchar(dcharmb[i]);
   4.463 +				for (; (ch = *p) != '\n'; ++p)
   4.464 +					(void)putchar(ch);
   4.465 +			} else
   4.466 +				for (; (ch = *p) != '\n'; ++p);
   4.467 +		}
   4.468 +		(void)putchar('\n');
   4.469 +	}
   4.470 +	free(mlbuf);
   4.471 +	return (0);
   4.472 +}
   4.473 +
   4.474 +static void
   4.475 +usage(void)
   4.476 +{
   4.477 +	(void)fprintf(stderr, "%s\n%s\n%s\n",
   4.478 +		"usage: cut -b list [-n] [file ...]",
   4.479 +		"       cut -c list [file ...]",
   4.480 +		"       cut -f list [-s] [-w | -d delim] [file ...]");
   4.481 +	exit(1);
   4.482 +}
     5.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     5.2 +++ b/code/cut.c__gnu.1992-11-08	Tue May 12 06:46:59 2015 +0200
     5.3 @@ -0,0 +1,586 @@
     5.4 +/* cut - remove parts of lines of files
     5.5 +   Copyright (C) 1984 by David M. Ihnat
     5.6 + 
     5.7 +   This program is a total rewrite of the Bell Laboratories Unix(Tm)
     5.8 +   command of the same name, as of System V.  It contains no proprietary
     5.9 +   code, and therefore may be used without violation of any proprietary
    5.10 +   agreements whatsoever.  However, you will notice that the program is
    5.11 +   copyrighted by me.  This is to assure the program does *not* fall
    5.12 +   into the public domain.  Thus, I may specify just what I am now:
    5.13 +   This program may be freely copied and distributed, provided this notice
    5.14 +   remains; it may not be sold for profit without express written consent of
    5.15 +   the author.
    5.16 +   Please note that I recreated the behavior of the Unix(Tm) 'cut' command
    5.17 +   as faithfully as possible; however, I haven't run a full set of regression
    5.18 +   tests.  Thus, the user of this program accepts full responsibility for any
    5.19 +   effects or loss; in particular, the author is not responsible for any losses,
    5.20 +   explicit or incidental, that may be incurred through use of this program.
    5.21 +
    5.22 +   I ask that any bugs (and, if possible, fixes) be reported to me when
    5.23 +   possible.  -David Ihnat (312) 784-4544 ignatz@homebru.chi.il.us
    5.24 +
    5.25 +   POSIX changes, bug fixes, long-named options, and cleanup
    5.26 +   by David MacKenzie <djm@ai.mit.edu>.
    5.27 +
    5.28 +   Options:
    5.29 +   --bytes=byte-list
    5.30 +   -b byte-list			Print only the bytes in positions listed
    5.31 +				in BYTE-LIST.
    5.32 +				Tabs and backspaces are treated like any
    5.33 +				other character; they take up 1 byte.
    5.34 +
    5.35 +   --characters=character-list
    5.36 +   -c character-list		Print only characters in positions listed
    5.37 +				in CHARACTER-LIST.
    5.38 +				The same as -b for now, but
    5.39 +				internationalization will change that.
    5.40 +				Tabs and backspaces are treated like any
    5.41 +				other character; they take up 1 character.
    5.42 +
    5.43 +   --fields=field-list
    5.44 +   -f field-list		Print only the fields listed in FIELD-LIST.
    5.45 +				Fields are separated by a TAB by default.
    5.46 +
    5.47 +   --delimiter=delim
    5.48 +   -d delim			For -f, fields are separated by the first
    5.49 +				character in DELIM instead of TAB.
    5.50 +
    5.51 +   -n				Do not split multibyte chars (no-op for now).
    5.52 +
    5.53 +   --only-delimited
    5.54 +   -s				For -f, do not print lines that do not contain
    5.55 +				the field separator character.
    5.56 +
    5.57 +   The BYTE-LIST, CHARACTER-LIST, and FIELD-LIST are one or more numbers
    5.58 +   or ranges separated by commas.  The first byte, character, and field
    5.59 +   are numbered 1.
    5.60 +
    5.61 +   A FILE of `-' means standard input. */
    5.62 +
    5.63 +#define _GNU_SOURCE
    5.64 +#include <ctype.h>
    5.65 +#ifndef isblank
    5.66 +#define isblank(c) ((c) == ' ' || (c) == '\t')
    5.67 +#endif
    5.68 +#include <stdio.h>
    5.69 +#include <getopt.h>
    5.70 +#include <sys/types.h>
    5.71 +#include "system.h"
    5.72 +
    5.73 +#ifdef isascii
    5.74 +#define ISDIGIT(c) (isascii ((c)) && isdigit ((c)))
    5.75 +#else
    5.76 +#define ISDIGIT(c) (isdigit ((c)))
    5.77 +#endif
    5.78 +
    5.79 +char *xmalloc ();
    5.80 +char *xrealloc ();
    5.81 +int set_fields ();
    5.82 +int cut_file ();
    5.83 +void cut_stream ();
    5.84 +void cut_bytes ();
    5.85 +void cut_fields ();
    5.86 +void enlarge_line ();
    5.87 +void error ();
    5.88 +void invalid_list ();
    5.89 +void usage ();
    5.90 +
    5.91 +/* The number of elements allocated for the input line
    5.92 +   and the byte or field number.
    5.93 +   Enlarged as necessary. */
    5.94 +int line_size;
    5.95 +
    5.96 +/* Processed output buffer. */
    5.97 +char *outbuf;
    5.98 +
    5.99 +/* Where to save next char to output. */
   5.100 +char *outbufptr;
   5.101 +
   5.102 +/* Raw line buffer for field mode. */
   5.103 +char *inbuf;
   5.104 +
   5.105 +/* Where to save next input char. */
   5.106 +char *inbufptr;
   5.107 +
   5.108 +/* What can be done about a byte or field. */
   5.109 +enum field_action
   5.110 +{
   5.111 +  field_omit,
   5.112 +  field_output
   5.113 +};
   5.114 +
   5.115 +/* In byte mode, which bytes to output.
   5.116 +   In field mode, which `delim'-separated fields to output.
   5.117 +   Both bytes and fields are numbered starting with 1,
   5.118 +   so the first element of `fields' is unused. */
   5.119 +enum field_action *fields;
   5.120 +
   5.121 +enum operating_mode
   5.122 +{
   5.123 +  undefined_mode,
   5.124 +
   5.125 +  /* Output characters that are in the given bytes. */
   5.126 +  byte_mode,
   5.127 +
   5.128 +  /* Output the given delimeter-separated fields. */
   5.129 +  field_mode
   5.130 +};
   5.131 +
   5.132 +enum operating_mode operating_mode;
   5.133 +
   5.134 +/* If nonzero,
   5.135 +   for field mode, do not output lines containing no delimeter characters. */
   5.136 +int delimited_lines_only;
   5.137 +
   5.138 +/* The delimeter character for field mode. */
   5.139 +unsigned char delim;
   5.140 +
   5.141 +/* Nonzero if we have ever read standard input. */
   5.142 +int have_read_stdin;
   5.143 +
   5.144 +/* The name this program was run with. */
   5.145 +char *program_name;
   5.146 +
   5.147 +struct option longopts[] =
   5.148 +{
   5.149 +  {"bytes", 1, 0, 'b'},
   5.150 +  {"characters", 1, 0, 'c'},
   5.151 +  {"fields", 1, 0, 'f'},
   5.152 +  {"delimiter", 1, 0, 'd'},
   5.153 +  {"only-delimited", 0, 0, 's'},
   5.154 +  {0, 0, 0, 0}
   5.155 +};
   5.156 +
   5.157 +void
   5.158 +main (argc, argv)
   5.159 +     int argc;
   5.160 +     char **argv;
   5.161 +{
   5.162 +  int optc, exit_status = 0;
   5.163 +
   5.164 +  program_name = argv[0];
   5.165 +
   5.166 +  line_size = 512;
   5.167 +  operating_mode = undefined_mode;
   5.168 +  delimited_lines_only = 0;
   5.169 +  delim = '\0';
   5.170 +  have_read_stdin = 0;
   5.171 +
   5.172 +  fields = (enum field_action *)
   5.173 +    xmalloc (line_size * sizeof (enum field_action));
   5.174 +  outbuf = (char *) xmalloc (line_size);
   5.175 +  inbuf = (char *) xmalloc (line_size);
   5.176 +
   5.177 +  for (optc = 0; optc < line_size; optc++)
   5.178 +    fields[optc] = field_omit;
   5.179 +
   5.180 +  while ((optc = getopt_long (argc, argv, "b:c:d:f:ns", longopts, (int *) 0))
   5.181 +	 != EOF)
   5.182 +    {
   5.183 +      switch (optc)
   5.184 +	{
   5.185 +	case 'b':
   5.186 +	case 'c':
   5.187 +	  /* Build the byte list. */
   5.188 +	  if (operating_mode != undefined_mode)
   5.189 +	    usage ();
   5.190 +	  operating_mode = byte_mode;
   5.191 +	  if (set_fields (optarg) == 0)
   5.192 +	    error (2, 0, "no fields given");
   5.193 +	  break;
   5.194 +
   5.195 +	case 'f':
   5.196 +	  /* Build the field list. */
   5.197 +	  if (operating_mode != undefined_mode)
   5.198 +	    usage ();
   5.199 +	  operating_mode = field_mode;
   5.200 +	  if (set_fields (optarg) == 0)
   5.201 +	    error (2, 0, "no fields given");
   5.202 +	  break;
   5.203 +
   5.204 +	case 'd':
   5.205 +	  /* New delimiter. */
   5.206 +	  if (optarg[0] == '\0')
   5.207 +	    error (2, 0, "no delimiter given");
   5.208 +	  if (optarg[1] != '\0')
   5.209 +	    error (2, 0, "delimiter must be a single character");
   5.210 +	  delim = optarg[0];
   5.211 +	  break;
   5.212 +
   5.213 +	case 'n':
   5.214 +	  break;
   5.215 +
   5.216 +	case 's':
   5.217 +	  delimited_lines_only++;
   5.218 +	  break;
   5.219 +
   5.220 +	default:
   5.221 +	  usage ();
   5.222 +	}
   5.223 +    }
   5.224 +
   5.225 +  if (operating_mode == undefined_mode)
   5.226 +    usage ();
   5.227 +
   5.228 +  if ((delimited_lines_only || delim != '\0') && operating_mode != field_mode)
   5.229 +    usage ();
   5.230 +
   5.231 +  if (delim == '\0')
   5.232 +    delim = '\t';
   5.233 +
   5.234 +  if (optind == argc)
   5.235 +    exit_status |= cut_file ("-");
   5.236 +  else
   5.237 +    for (; optind < argc; optind++)
   5.238 +      exit_status |= cut_file (argv[optind]);
   5.239 +
   5.240 +  if (have_read_stdin && fclose (stdin) == EOF)
   5.241 +    {
   5.242 +      error (0, errno, "-");
   5.243 +      exit_status = 1;
   5.244 +    }
   5.245 +  if (ferror (stdout) || fclose (stdout) == EOF)
   5.246 +    error (1, 0, "write error");
   5.247 +
   5.248 +  exit (exit_status);
   5.249 +}
   5.250 +
   5.251 +/* Select for printing the positions in `fields' that are listed in
   5.252 +   byte or field specification FIELDSTR.  FIELDSTR should be
   5.253 +   composed of one or more numbers or ranges of numbers, separated by
   5.254 +   blanks or commas.  Incomplete ranges may be given: `-m' means
   5.255 +   `1-m'; `n-' means `n' through end of line or last field.
   5.256 +
   5.257 +   Return the number of fields selected. */
   5.258 +
   5.259 +int
   5.260 +set_fields (fieldstr)
   5.261 +     char *fieldstr;
   5.262 +{
   5.263 +  int initial = 1;		/* Value of first number in a range. */
   5.264 +  int dash_found = 0;		/* Nonzero if a '-' is found in this field. */
   5.265 +  int value = 0;		/* If nonzero, a number being accumulated. */
   5.266 +  int fields_selected = 0;	/* Number of fields selected so far. */
   5.267 +  /* If nonzero, index of first field in a range that goes to end of line. */
   5.268 +  int eol_range_start = 0;
   5.269 +
   5.270 +  for (;;)
   5.271 +    {
   5.272 +      if (*fieldstr == '-')
   5.273 +	{
   5.274 +	  /* Starting a range. */
   5.275 +	  if (dash_found)
   5.276 +	    invalid_list ();
   5.277 +	  dash_found++;
   5.278 +	  fieldstr++;
   5.279 +
   5.280 +	  if (value)
   5.281 +	    {
   5.282 +	      if (value >= line_size)
   5.283 +		enlarge_line (value);
   5.284 +	      initial = value;
   5.285 +	      value = 0;
   5.286 +	    }
   5.287 +	  else
   5.288 +	    initial = 1;
   5.289 +	}
   5.290 +      else if (*fieldstr == ',' || isblank (*fieldstr) || *fieldstr == '\0')
   5.291 +	{
   5.292 +	  /* Ending the string, or this field/byte sublist. */
   5.293 +	  if (dash_found)
   5.294 +	    {
   5.295 +	      dash_found = 0;
   5.296 +
   5.297 +	      /* A range.  Possibilites: -n, m-n, n-.
   5.298 +		 In any case, `initial' contains the start of the range. */
   5.299 +	      if (value == 0)
   5.300 +		{
   5.301 +		  /* `n-'.  From `initial' to end of line. */
   5.302 +		  eol_range_start = initial;
   5.303 +		  fields_selected++;
   5.304 +		}
   5.305 +	      else
   5.306 +		{
   5.307 +		  /* `m-n' or `-n' (1-n). */
   5.308 +		  if (value < initial)
   5.309 +		    invalid_list ();
   5.310 +
   5.311 +		  if (value >= line_size)
   5.312 +		    enlarge_line (value);
   5.313 +
   5.314 +		  /* Is there already a range going to end of line? */
   5.315 +		  if (eol_range_start != 0)
   5.316 +		    {
   5.317 +		      /* Yes.  Is the new sequence already contained
   5.318 +			 in the old one?  If so, no processing is
   5.319 +			 necessary. */
   5.320 +		      if (initial < eol_range_start)
   5.321 +			{
   5.322 +			  /* No, the new sequence starts before the
   5.323 +			     old.  Does the old range going to end of line
   5.324 +			     extend into the new range?  */
   5.325 +			  if (eol_range_start < value)
   5.326 +			    /* Yes.  Simply move the end of line marker. */
   5.327 +			    eol_range_start = initial;
   5.328 +			  else
   5.329 +			    {
   5.330 +			      /* No.  A simple range, before and disjoint from
   5.331 +				 the range going to end of line.  Fill it. */
   5.332 +			      for (; initial <= value; initial++)
   5.333 +				fields[initial] = field_output;
   5.334 +			    }
   5.335 +
   5.336 +			  /* In any case, some fields were selected. */
   5.337 +			  fields_selected++;
   5.338 +			}
   5.339 +		    }
   5.340 +		  else
   5.341 +		    {
   5.342 +		      /* There is no range going to end of line. */
   5.343 +		      for (; initial <= value; initial++)
   5.344 +			fields[initial] = field_output;
   5.345 +		      fields_selected++;
   5.346 +		    }
   5.347 +		  value = 0;
   5.348 +		}
   5.349 +	    }
   5.350 +	  else if (value != 0)
   5.351 +	    {
   5.352 +	      /* A simple field number, not a range. */
   5.353 +	      if (value >= line_size)
   5.354 +		enlarge_line (value);
   5.355 +
   5.356 +	      fields[value] = field_output;
   5.357 +	      value = 0;
   5.358 +	      fields_selected++;
   5.359 +	    }
   5.360 +
   5.361 +	  if (*fieldstr == '\0')
   5.362 +	    {
   5.363 +	      /* If there was a range going to end of line, fill the
   5.364 +		 array from the end of line point.  */
   5.365 +	      if (eol_range_start)
   5.366 +		for (initial = eol_range_start; initial < line_size; initial++)
   5.367 +		  fields[initial] = field_output;
   5.368 +
   5.369 +	      return fields_selected;
   5.370 +	    }
   5.371 +
   5.372 +	  fieldstr++;
   5.373 +	}
   5.374 +      else if (ISDIGIT (*fieldstr))
   5.375 +	{
   5.376 +	  value = 10 * value + *fieldstr - '0';
   5.377 +	  fieldstr++;
   5.378 +	}
   5.379 +      else
   5.380 +	invalid_list ();
   5.381 +    }
   5.382 +}
   5.383 +
   5.384 +/* Process file FILE to standard output.
   5.385 +   Return 0 if successful, 1 if not. */
   5.386 +
   5.387 +int
   5.388 +cut_file (file)
   5.389 +     char *file;
   5.390 +{
   5.391 +  FILE *stream;
   5.392 +
   5.393 +  if (!strcmp (file, "-"))
   5.394 +    {
   5.395 +      have_read_stdin = 1;
   5.396 +      stream = stdin;
   5.397 +    }
   5.398 +  else
   5.399 +    {
   5.400 +      stream = fopen (file, "r");
   5.401 +      if (stream == NULL)
   5.402 +	{
   5.403 +	  error (0, errno, "%s", file);
   5.404 +	  return 1;
   5.405 +	}
   5.406 +    }
   5.407 +
   5.408 +  cut_stream (stream);
   5.409 +
   5.410 +  if (ferror (stream))
   5.411 +    {
   5.412 +      error (0, errno, "%s", file);
   5.413 +      return 1;
   5.414 +    }
   5.415 +  if (!strcmp (file, "-"))
   5.416 +    clearerr (stream);		/* Also clear EOF. */
   5.417 +  else if (fclose (stream) == EOF)
   5.418 +    {
   5.419 +      error (0, errno, "%s", file);
   5.420 +      return 1;
   5.421 +    }
   5.422 +  return 0;
   5.423 +}
   5.424 +
   5.425 +void
   5.426 +cut_stream (stream)
   5.427 +     FILE *stream;
   5.428 +{
   5.429 +  if (operating_mode == byte_mode)
   5.430 +    cut_bytes (stream);
   5.431 +  else
   5.432 +    cut_fields (stream);
   5.433 +}
   5.434 +
   5.435 +/* Print the file open for reading on stream STREAM
   5.436 +   with the bytes marked `field_omit' in `fields' removed from each line. */
   5.437 +
   5.438 +void
   5.439 +cut_bytes (stream)
   5.440 +     FILE *stream;
   5.441 +{
   5.442 +  register int c;		/* Each character from the file. */
   5.443 +  int doneflag = 0;		/* Nonzero if EOF reached. */
   5.444 +  int char_count;		/* Number of chars in the line so far. */
   5.445 +
   5.446 +  while (doneflag == 0)
   5.447 +    {
   5.448 +      /* Start processing a line. */
   5.449 +      outbufptr = outbuf;
   5.450 +      char_count = 0;
   5.451 +
   5.452 +      do
   5.453 +	{
   5.454 +	  c = getc (stream);
   5.455 +	  if (c == EOF)
   5.456 +	    {
   5.457 +	      doneflag++;
   5.458 +	      break;
   5.459 +	    }
   5.460 +
   5.461 +	  /* If this character is to be sent, stow it in the outbuffer. */
   5.462 +
   5.463 +	  if (++char_count == line_size - 1)
   5.464 +	    enlarge_line (char_count);
   5.465 +
   5.466 +	  if (fields[char_count] == field_output || c == '\n')
   5.467 +	    *outbufptr++ = c;
   5.468 +	}
   5.469 +      while (c != '\n');
   5.470 +
   5.471 +      if (char_count)
   5.472 +	fwrite (outbuf, sizeof (char), outbufptr - outbuf, stdout);
   5.473 +    }
   5.474 +}
   5.475 +
   5.476 +/* Print the file open for reading on stream STREAM
   5.477 +   with the fields marked `field_omit' in `fields' removed from each line.
   5.478 +   All characters are initially stowed in the raw input buffer, until
   5.479 +   at least one field has been found. */
   5.480 +
   5.481 +void
   5.482 +cut_fields (stream)
   5.483 +     FILE *stream;
   5.484 +{
   5.485 +  register int c;		/* Each character from the file. */
   5.486 +  int doneflag = 0;		/* Nonzero if EOF reached. */
   5.487 +  int char_count;		/* Number of chars in line before any delim. */
   5.488 +  int fieldfound;		/* Nonzero if any fields to print found. */
   5.489 +  int curr_field;		/* Current index in `fields'. */
   5.490 +
   5.491 +  while (doneflag == 0)
   5.492 +    {
   5.493 +      char_count = 0;
   5.494 +      fieldfound = 0;
   5.495 +      curr_field = 1;
   5.496 +      outbufptr = outbuf;
   5.497 +      inbufptr = inbuf;
   5.498 +
   5.499 +      do
   5.500 +	{
   5.501 +	  c = getc (stream);
   5.502 +	  if (c == EOF)
   5.503 +	    {
   5.504 +	      doneflag++;
   5.505 +	      break;
   5.506 +	    }
   5.507 +
   5.508 +	  if (fields[curr_field] == field_output && c != '\n')
   5.509 +	    {
   5.510 +	      /* Working on a field.  It, and its terminating
   5.511 +		 delimiter, go only into the processed buffer. */
   5.512 +	      fieldfound = 1;
   5.513 +	      if (outbufptr - outbuf == line_size - 2)
   5.514 +		enlarge_line (outbufptr - outbuf);
   5.515 +	      *outbufptr++ = c;
   5.516 +	    }
   5.517 +	  else if (fieldfound == 0)
   5.518 +	    {
   5.519 +	      if (++char_count == line_size - 1)
   5.520 +		enlarge_line (char_count);
   5.521 +	      *inbufptr++ = c;
   5.522 +	    }
   5.523 +
   5.524 +	  if (c == delim && ++curr_field == line_size - 1)
   5.525 +	    enlarge_line (curr_field);
   5.526 +	}
   5.527 +      while (c != '\n');
   5.528 +
   5.529 +      if (fieldfound)
   5.530 +	{
   5.531 +	  /* Something was found. Print it. */
   5.532 +	  if (outbufptr[-1] == delim)
   5.533 +	    --outbufptr;	/* Suppress trailing delimiter. */
   5.534 +
   5.535 +	  fwrite (outbuf, sizeof (char), outbufptr - outbuf, stdout);
   5.536 +	  if (c == '\n')
   5.537 +	    putc (c, stdout);
   5.538 +	}
   5.539 +      else if (!delimited_lines_only && char_count)
   5.540 +	/* A line with some characters, no delimiters, and no
   5.541 +	   suppression.  Print it. */
   5.542 +	fwrite (inbuf, sizeof (char), inbufptr - inbuf, stdout);
   5.543 +    }
   5.544 +}
   5.545 +
   5.546 +/* Extend the buffers to accomodate at least NEW_SIZE characters. */
   5.547 +
   5.548 +void
   5.549 +enlarge_line (new_size)
   5.550 +     int new_size;
   5.551 +{
   5.552 +  char *newp;
   5.553 +  int i;
   5.554 +
   5.555 +  new_size += 256;		/* Leave some room to grow. */
   5.556 +
   5.557 +  fields = (enum field_action *)
   5.558 +    xrealloc (fields, new_size * sizeof (enum field_action));
   5.559 +
   5.560 +  newp = (char *) xrealloc (outbuf, new_size);
   5.561 +  outbufptr += newp - outbuf;
   5.562 +  outbuf = newp;
   5.563 +
   5.564 +  newp = (char *) xrealloc (inbuf, new_size);
   5.565 +  inbufptr += newp - inbuf;
   5.566 +  inbuf = newp;
   5.567 +
   5.568 +  for (i = line_size; i < new_size; i++)
   5.569 +    fields[i] = field_omit;
   5.570 +  line_size = new_size;
   5.571 +}
   5.572 +
   5.573 +void
   5.574 +invalid_list ()
   5.575 +{
   5.576 +  error (2, 0, "invalid byte or field list");
   5.577 +}
   5.578 +
   5.579 +void
   5.580 +usage ()
   5.581 +{
   5.582 +  fprintf (stderr, "\
   5.583 +Usage: %s {-b byte-list,--bytes=byte-list} [-n] [file...]\n\
   5.584 +       %s {-c character-list,--characters=character-list} [file...]\n\
   5.585 +       %s {-f field-list,--fields=field-list} [-d delim] [-s]\n\
   5.586 +       [--delimiter=delim] [--only-delimited] [file...]\n",
   5.587 +	   program_name, program_name, program_name);
   5.588 +  exit (2);
   5.589 +}
     6.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     6.2 +++ b/code/cut.c__gnu.2015-05-01	Tue May 12 06:46:59 2015 +0200
     6.3 @@ -0,0 +1,830 @@
     6.4 +/* cut - remove parts of lines of files
     6.5 +   Copyright (C) 1997-2015 Free Software Foundation, Inc.
     6.6 +   Copyright (C) 1984 David M. Ihnat
     6.7 +
     6.8 +   This program is free software: you can redistribute it and/or modify
     6.9 +   it under the terms of the GNU General Public License as published by
    6.10 +   the Free Software Foundation, either version 3 of the License, or
    6.11 +   (at your option) any later version.
    6.12 +
    6.13 +   This program is distributed in the hope that it will be useful,
    6.14 +   but WITHOUT ANY WARRANTY; without even the implied warranty of
    6.15 +   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    6.16 +   GNU General Public License for more details.
    6.17 +
    6.18 +   You should have received a copy of the GNU General Public License
    6.19 +   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
    6.20 +
    6.21 +/* Written by David Ihnat.  */
    6.22 +
    6.23 +/* POSIX changes, bug fixes, long-named options, and cleanup
    6.24 +   by David MacKenzie <djm@gnu.ai.mit.edu>.
    6.25 +
    6.26 +   Rewrite cut_fields and cut_bytes -- Jim Meyering.  */
    6.27 +
    6.28 +#include <config.h>
    6.29 +
    6.30 +#include <stdio.h>
    6.31 +#include <assert.h>
    6.32 +#include <getopt.h>
    6.33 +#include <sys/types.h>
    6.34 +#include "system.h"
    6.35 +
    6.36 +#include "error.h"
    6.37 +#include "fadvise.h"
    6.38 +#include "getndelim2.h"
    6.39 +#include "hash.h"
    6.40 +#include "quote.h"
    6.41 +#include "xstrndup.h"
    6.42 +
    6.43 +/* The official name of this program (e.g., no 'g' prefix).  */
    6.44 +#define PROGRAM_NAME "cut"
    6.45 +
    6.46 +#define AUTHORS \
    6.47 +  proper_name ("David M. Ihnat"), \
    6.48 +  proper_name ("David MacKenzie"), \
    6.49 +  proper_name ("Jim Meyering")
    6.50 +
    6.51 +#define FATAL_ERROR(Message)						\
    6.52 +  do									\
    6.53 +    {									\
    6.54 +      error (0, 0, (Message));						\
    6.55 +      usage (EXIT_FAILURE);						\
    6.56 +    }									\
    6.57 +  while (0)
    6.58 +
    6.59 +
    6.60 +struct range_pair
    6.61 +  {
    6.62 +    size_t lo;
    6.63 +    size_t hi;
    6.64 +  };
    6.65 +
    6.66 +/* Array of `struct range_pair' holding all the finite ranges. */
    6.67 +static struct range_pair *rp;
    6.68 +
    6.69 +/* Pointer inside RP.  When checking if a byte or field is selected
    6.70 +   by a finite range, we check if it is between CURRENT_RP.LO
    6.71 +   and CURRENT_RP.HI.  If the byte or field index is greater than
    6.72 +   CURRENT_RP.HI then we make CURRENT_RP to point to the next range pair. */
    6.73 +static struct range_pair *current_rp;
    6.74 +
    6.75 +/* Number of finite ranges specified by the user. */
    6.76 +static size_t n_rp;
    6.77 +
    6.78 +/* Number of `struct range_pair's allocated. */
    6.79 +static size_t n_rp_allocated;
    6.80 +
    6.81 +
    6.82 +/* Append LOW, HIGH to the list RP of range pairs, allocating additional
    6.83 +   space if necessary.  Update global variable N_RP.  When allocating,
    6.84 +   update global variable N_RP_ALLOCATED.  */
    6.85 +
    6.86 +static void
    6.87 +add_range_pair (size_t lo, size_t hi)
    6.88 +{
    6.89 +  if (n_rp == n_rp_allocated)
    6.90 +    rp = X2NREALLOC (rp, &n_rp_allocated);
    6.91 +  rp[n_rp].lo = lo;
    6.92 +  rp[n_rp].hi = hi;
    6.93 +  ++n_rp;
    6.94 +}
    6.95 +
    6.96 +/* This buffer is used to support the semantics of the -s option
    6.97 +   (or lack of same) when the specified field list includes (does
    6.98 +   not include) the first field.  In both of those cases, the entire
    6.99 +   first field must be read into this buffer to determine whether it
   6.100 +   is followed by a delimiter or a newline before any of it may be
   6.101 +   output.  Otherwise, cut_fields can do the job without using this
   6.102 +   buffer.  */
   6.103 +static char *field_1_buffer;
   6.104 +
   6.105 +/* The number of bytes allocated for FIELD_1_BUFFER.  */
   6.106 +static size_t field_1_bufsize;
   6.107 +
   6.108 +enum operating_mode
   6.109 +  {
   6.110 +    undefined_mode,
   6.111 +
   6.112 +    /* Output characters that are in the given bytes. */
   6.113 +    byte_mode,
   6.114 +
   6.115 +    /* Output the given delimiter-separated fields. */
   6.116 +    field_mode
   6.117 +  };
   6.118 +
   6.119 +static enum operating_mode operating_mode;
   6.120 +
   6.121 +/* If true do not output lines containing no delimiter characters.
   6.122 +   Otherwise, all such lines are printed.  This option is valid only
   6.123 +   with field mode.  */
   6.124 +static bool suppress_non_delimited;
   6.125 +
   6.126 +/* If true, print all bytes, characters, or fields _except_
   6.127 +   those that were specified.  */
   6.128 +static bool complement;
   6.129 +
   6.130 +/* The delimiter character for field mode. */
   6.131 +static unsigned char delim;
   6.132 +
   6.133 +/* True if the --output-delimiter=STRING option was specified.  */
   6.134 +static bool output_delimiter_specified;
   6.135 +
   6.136 +/* The length of output_delimiter_string.  */
   6.137 +static size_t output_delimiter_length;
   6.138 +
   6.139 +/* The output field separator string.  Defaults to the 1-character
   6.140 +   string consisting of the input delimiter.  */
   6.141 +static char *output_delimiter_string;
   6.142 +
   6.143 +/* True if we have ever read standard input. */
   6.144 +static bool have_read_stdin;
   6.145 +
   6.146 +/* For long options that have no equivalent short option, use a
   6.147 +   non-character as a pseudo short option, starting with CHAR_MAX + 1.  */
   6.148 +enum
   6.149 +{
   6.150 +  OUTPUT_DELIMITER_OPTION = CHAR_MAX + 1,
   6.151 +  COMPLEMENT_OPTION
   6.152 +};
   6.153 +
   6.154 +static struct option const longopts[] =
   6.155 +{
   6.156 +  {"bytes", required_argument, NULL, 'b'},
   6.157 +  {"characters", required_argument, NULL, 'c'},
   6.158 +  {"fields", required_argument, NULL, 'f'},
   6.159 +  {"delimiter", required_argument, NULL, 'd'},
   6.160 +  {"only-delimited", no_argument, NULL, 's'},
   6.161 +  {"output-delimiter", required_argument, NULL, OUTPUT_DELIMITER_OPTION},
   6.162 +  {"complement", no_argument, NULL, COMPLEMENT_OPTION},
   6.163 +  {GETOPT_HELP_OPTION_DECL},
   6.164 +  {GETOPT_VERSION_OPTION_DECL},
   6.165 +  {NULL, 0, NULL, 0}
   6.166 +};
   6.167 +
   6.168 +void
   6.169 +usage (int status)
   6.170 +{
   6.171 +  if (status != EXIT_SUCCESS)
   6.172 +    emit_try_help ();
   6.173 +  else
   6.174 +    {
   6.175 +      printf (_("\
   6.176 +Usage: %s OPTION... [FILE]...\n\
   6.177 +"),
   6.178 +              program_name);
   6.179 +      fputs (_("\
   6.180 +Print selected parts of lines from each FILE to standard output.\n\
   6.181 +"), stdout);
   6.182 +
   6.183 +      emit_stdin_note ();
   6.184 +      emit_mandatory_arg_note ();
   6.185 +
   6.186 +      fputs (_("\
   6.187 +  -b, --bytes=LIST        select only these bytes\n\
   6.188 +  -c, --characters=LIST   select only these characters\n\
   6.189 +  -d, --delimiter=DELIM   use DELIM instead of TAB for field delimiter\n\
   6.190 +"), stdout);
   6.191 +      fputs (_("\
   6.192 +  -f, --fields=LIST       select only these fields;  also print any line\n\
   6.193 +                            that contains no delimiter character, unless\n\
   6.194 +                            the -s option is specified\n\
   6.195 +  -n                      (ignored)\n\
   6.196 +"), stdout);
   6.197 +      fputs (_("\
   6.198 +      --complement        complement the set of selected bytes, characters\n\
   6.199 +                            or fields\n\
   6.200 +"), stdout);
   6.201 +      fputs (_("\
   6.202 +  -s, --only-delimited    do not print lines not containing delimiters\n\
   6.203 +      --output-delimiter=STRING  use STRING as the output delimiter\n\
   6.204 +                            the default is to use the input delimiter\n\
   6.205 +"), stdout);
   6.206 +      fputs (HELP_OPTION_DESCRIPTION, stdout);
   6.207 +      fputs (VERSION_OPTION_DESCRIPTION, stdout);
   6.208 +      fputs (_("\
   6.209 +\n\
   6.210 +Use one, and only one of -b, -c or -f.  Each LIST is made up of one\n\
   6.211 +range, or many ranges separated by commas.  Selected input is written\n\
   6.212 +in the same order that it is read, and is written exactly once.\n\
   6.213 +"), stdout);
   6.214 +      fputs (_("\
   6.215 +Each range is one of:\n\
   6.216 +\n\
   6.217 +  N     N'th byte, character or field, counted from 1\n\
   6.218 +  N-    from N'th byte, character or field, to end of line\n\
   6.219 +  N-M   from N'th to M'th (included) byte, character or field\n\
   6.220 +  -M    from first to M'th (included) byte, character or field\n\
   6.221 +"), stdout);
   6.222 +      emit_ancillary_info (PROGRAM_NAME);
   6.223 +    }
   6.224 +  exit (status);
   6.225 +}
   6.226 +
   6.227 +/* Comparison function for qsort to order the list of
   6.228 +   struct range_pairs.  */
   6.229 +static int
   6.230 +compare_ranges (const void *a, const void *b)
   6.231 +{
   6.232 +  int a_start = ((const struct range_pair *) a)->lo;
   6.233 +  int b_start = ((const struct range_pair *) b)->lo;
   6.234 +  return a_start < b_start ? -1 : a_start > b_start;
   6.235 +}
   6.236 +
   6.237 +/* Reallocate Range Pair entries, with corresponding
   6.238 +   entries outside the range of each specified entry.  */
   6.239 +
   6.240 +static void
   6.241 +complement_rp (void)
   6.242 +{
   6.243 +  if (complement)
   6.244 +    {
   6.245 +      struct range_pair *c = rp;
   6.246 +      size_t n = n_rp;
   6.247 +      size_t i;
   6.248 +
   6.249 +      rp = NULL;
   6.250 +      n_rp = 0;
   6.251 +      n_rp_allocated = 0;
   6.252 +
   6.253 +      if (c[0].lo > 1)
   6.254 +        add_range_pair (1, c[0].lo - 1);
   6.255 +
   6.256 +      for (i = 1; i < n; ++i)
   6.257 +        {
   6.258 +          if (c[i-1].hi + 1 == c[i].lo)
   6.259 +            continue;
   6.260 +
   6.261 +          add_range_pair (c[i-1].hi + 1, c[i].lo - 1);
   6.262 +        }
   6.263 +
   6.264 +      if (c[n-1].hi < SIZE_MAX)
   6.265 +        add_range_pair (c[n-1].hi + 1, SIZE_MAX);
   6.266 +
   6.267 +      free (c);
   6.268 +    }
   6.269 +}
   6.270 +
   6.271 +/* Given the list of field or byte range specifications FIELDSTR,
   6.272 +   allocate and initialize the RP array. FIELDSTR should
   6.273 +   be composed of one or more numbers or ranges of numbers, separated
   6.274 +   by blanks or commas.  Incomplete ranges may be given: '-m' means '1-m';
   6.275 +   'n-' means 'n' through end of line.
   6.276 +   Return true if FIELDSTR contains at least one field specification,
   6.277 +   false otherwise.  */
   6.278 +
   6.279 +static bool
   6.280 +set_fields (const char *fieldstr)
   6.281 +{
   6.282 +  size_t initial = 1;		/* Value of first number in a range.  */
   6.283 +  size_t value = 0;		/* If nonzero, a number being accumulated.  */
   6.284 +  bool lhs_specified = false;
   6.285 +  bool rhs_specified = false;
   6.286 +  bool dash_found = false;	/* True if a '-' is found in this field.  */
   6.287 +  bool field_found = false;	/* True if at least one field spec
   6.288 +                                   has been processed.  */
   6.289 +
   6.290 +  size_t i;
   6.291 +  bool in_digits = false;
   6.292 +
   6.293 +  /* Collect and store in RP the range end points. */
   6.294 +
   6.295 +  while (true)
   6.296 +    {
   6.297 +      if (*fieldstr == '-')
   6.298 +        {
   6.299 +          in_digits = false;
   6.300 +          /* Starting a range. */
   6.301 +          if (dash_found)
   6.302 +            FATAL_ERROR (_("invalid byte, character or field list"));
   6.303 +          dash_found = true;
   6.304 +          fieldstr++;
   6.305 +
   6.306 +          if (lhs_specified && !value)
   6.307 +            FATAL_ERROR (_("fields and positions are numbered from 1"));
   6.308 +
   6.309 +          initial = (lhs_specified ? value : 1);
   6.310 +          value = 0;
   6.311 +        }
   6.312 +      else if (*fieldstr == ','
   6.313 +               || isblank (to_uchar (*fieldstr)) || *fieldstr == '\0')
   6.314 +        {
   6.315 +          in_digits = false;
   6.316 +          /* Ending the string, or this field/byte sublist. */
   6.317 +          if (dash_found)
   6.318 +            {
   6.319 +              dash_found = false;
   6.320 +
   6.321 +              if (!lhs_specified && !rhs_specified)
   6.322 +                FATAL_ERROR (_("invalid range with no endpoint: -"));
   6.323 +
   6.324 +              /* A range.  Possibilities: -n, m-n, n-.
   6.325 +                 In any case, 'initial' contains the start of the range. */
   6.326 +              if (!rhs_specified)
   6.327 +                {
   6.328 +                  /* 'n-'.  From 'initial' to end of line. */
   6.329 +                  add_range_pair (initial, SIZE_MAX);
   6.330 +                  field_found = true;
   6.331 +                }
   6.332 +              else
   6.333 +                {
   6.334 +                  /* 'm-n' or '-n' (1-n). */
   6.335 +                  if (value < initial)
   6.336 +                    FATAL_ERROR (_("invalid decreasing range"));
   6.337 +
   6.338 +                  add_range_pair (initial, value);
   6.339 +                  field_found = true;
   6.340 +                }
   6.341 +              value = 0;
   6.342 +            }
   6.343 +          else
   6.344 +            {
   6.345 +              /* A simple field number, not a range. */
   6.346 +              if (value == 0)
   6.347 +                FATAL_ERROR (_("fields and positions are numbered from 1"));
   6.348 +              add_range_pair (value, value);
   6.349 +              value = 0;
   6.350 +              field_found = true;
   6.351 +            }
   6.352 +
   6.353 +          if (*fieldstr == '\0')
   6.354 +            break;
   6.355 +
   6.356 +          fieldstr++;
   6.357 +          lhs_specified = false;
   6.358 +          rhs_specified = false;
   6.359 +        }
   6.360 +      else if (ISDIGIT (*fieldstr))
   6.361 +        {
   6.362 +          /* Record beginning of digit string, in case we have to
   6.363 +             complain about it.  */
   6.364 +          static char const *num_start;
   6.365 +          if (!in_digits || !num_start)
   6.366 +            num_start = fieldstr;
   6.367 +          in_digits = true;
   6.368 +
   6.369 +          if (dash_found)
   6.370 +            rhs_specified = 1;
   6.371 +          else
   6.372 +            lhs_specified = 1;
   6.373 +
   6.374 +          /* Detect overflow.  */
   6.375 +          if (!DECIMAL_DIGIT_ACCUMULATE (value, *fieldstr - '0', size_t)
   6.376 +              || value == SIZE_MAX)
   6.377 +            {
   6.378 +              /* In case the user specified -c$(echo 2^64|bc),22,
   6.379 +                 complain only about the first number.  */
   6.380 +              /* Determine the length of the offending number.  */
   6.381 +              size_t len = strspn (num_start, "0123456789");
   6.382 +              char *bad_num = xstrndup (num_start, len);
   6.383 +              if (operating_mode == byte_mode)
   6.384 +                error (0, 0,
   6.385 +                       _("byte offset %s is too large"), quote (bad_num));
   6.386 +              else
   6.387 +                error (0, 0,
   6.388 +                       _("field number %s is too large"), quote (bad_num));
   6.389 +              free (bad_num);
   6.390 +              exit (EXIT_FAILURE);
   6.391 +            }
   6.392 +
   6.393 +          fieldstr++;
   6.394 +        }
   6.395 +      else
   6.396 +        FATAL_ERROR (_("invalid byte, character or field list"));
   6.397 +    }
   6.398 +
   6.399 +  qsort (rp, n_rp, sizeof (rp[0]), compare_ranges);
   6.400 +
   6.401 +  /* Merge range pairs (e.g. `2-5,3-4' becomes `2-5'). */
   6.402 +  for (i = 0; i < n_rp; ++i)
   6.403 +    {
   6.404 +      for (size_t j = i + 1; j < n_rp; ++j)
   6.405 +        {
   6.406 +          if (rp[j].lo <= rp[i].hi)
   6.407 +            {
   6.408 +              rp[i].hi = MAX (rp[j].hi, rp[i].hi);
   6.409 +              memmove (rp + j, rp + j + 1, (n_rp - j - 1) * sizeof *rp);
   6.410 +              n_rp--;
   6.411 +              j--;
   6.412 +            }
   6.413 +          else
   6.414 +            break;
   6.415 +        }
   6.416 +    }
   6.417 +
   6.418 +  complement_rp ();
   6.419 +
   6.420 +  /* After merging, reallocate RP so we release memory to the system.
   6.421 +     Also add a sentinel at the end of RP, to avoid out of bounds access
   6.422 +     and for performance reasons.  */
   6.423 +  ++n_rp;
   6.424 +  rp = xrealloc (rp, n_rp * sizeof (struct range_pair));
   6.425 +  rp[n_rp - 1].lo = rp[n_rp - 1].hi = SIZE_MAX;
   6.426 +
   6.427 +  return field_found;
   6.428 +}
   6.429 +
   6.430 +/* Increment *ITEM_IDX (i.e., a field or byte index),
   6.431 +   and if required CURRENT_RP.  */
   6.432 +
   6.433 +static inline void
   6.434 +next_item (size_t *item_idx)
   6.435 +{
   6.436 +  (*item_idx)++;
   6.437 +  if ((*item_idx) > current_rp->hi)
   6.438 +    current_rp++;
   6.439 +}
   6.440 +
   6.441 +/* Return nonzero if the K'th field or byte is printable. */
   6.442 +
   6.443 +static inline bool
   6.444 +print_kth (size_t k)
   6.445 +{
   6.446 +  return current_rp->lo <= k;
   6.447 +}
   6.448 +
   6.449 +/* Return nonzero if K'th byte is the beginning of a range. */
   6.450 +
   6.451 +static inline bool
   6.452 +is_range_start_index (size_t k)
   6.453 +{
   6.454 +  return k == current_rp->lo;
   6.455 +}
   6.456 +
   6.457 +/* Read from stream STREAM, printing to standard output any selected bytes.  */
   6.458 +
   6.459 +static void
   6.460 +cut_bytes (FILE *stream)
   6.461 +{
   6.462 +  size_t byte_idx;	/* Number of bytes in the line so far. */
   6.463 +  /* Whether to begin printing delimiters between ranges for the current line.
   6.464 +     Set after we've begun printing data corresponding to the first range.  */
   6.465 +  bool print_delimiter;
   6.466 +
   6.467 +  byte_idx = 0;
   6.468 +  print_delimiter = false;
   6.469 +  current_rp = rp;
   6.470 +  while (true)
   6.471 +    {
   6.472 +      int c;		/* Each character from the file. */
   6.473 +
   6.474 +      c = getc (stream);
   6.475 +
   6.476 +      if (c == '\n')
   6.477 +        {
   6.478 +          putchar ('\n');
   6.479 +          byte_idx = 0;
   6.480 +          print_delimiter = false;
   6.481 +          current_rp = rp;
   6.482 +        }
   6.483 +      else if (c == EOF)
   6.484 +        {
   6.485 +          if (byte_idx > 0)
   6.486 +            putchar ('\n');
   6.487 +          break;
   6.488 +        }
   6.489 +      else
   6.490 +        {
   6.491 +          next_item (&byte_idx);
   6.492 +          if (print_kth (byte_idx))
   6.493 +            {
   6.494 +              if (output_delimiter_specified)
   6.495 +                {
   6.496 +                  if (print_delimiter && is_range_start_index (byte_idx))
   6.497 +                    {
   6.498 +                      fwrite (output_delimiter_string, sizeof (char),
   6.499 +                              output_delimiter_length, stdout);
   6.500 +                    }
   6.501 +                  print_delimiter = true;
   6.502 +                }
   6.503 +
   6.504 +              putchar (c);
   6.505 +            }
   6.506 +        }
   6.507 +    }
   6.508 +}
   6.509 +
   6.510 +/* Read from stream STREAM, printing to standard output any selected fields.  */
   6.511 +
   6.512 +static void
   6.513 +cut_fields (FILE *stream)
   6.514 +{
   6.515 +  int c;
   6.516 +  size_t field_idx = 1;
   6.517 +  bool found_any_selected_field = false;
   6.518 +  bool buffer_first_field;
   6.519 +
   6.520 +  current_rp = rp;
   6.521 +
   6.522 +  c = getc (stream);
   6.523 +  if (c == EOF)
   6.524 +    return;
   6.525 +
   6.526 +  ungetc (c, stream);
   6.527 +  c = 0;
   6.528 +
   6.529 +  /* To support the semantics of the -s flag, we may have to buffer
   6.530 +     all of the first field to determine whether it is 'delimited.'
   6.531 +     But that is unnecessary if all non-delimited lines must be printed
   6.532 +     and the first field has been selected, or if non-delimited lines
   6.533 +     must be suppressed and the first field has *not* been selected.
   6.534 +     That is because a non-delimited line has exactly one field.  */
   6.535 +  buffer_first_field = (suppress_non_delimited ^ !print_kth (1));
   6.536 +
   6.537 +  while (1)
   6.538 +    {
   6.539 +      if (field_idx == 1 && buffer_first_field)
   6.540 +        {
   6.541 +          ssize_t len;
   6.542 +          size_t n_bytes;
   6.543 +
   6.544 +          len = getndelim2 (&field_1_buffer, &field_1_bufsize, 0,
   6.545 +                            GETNLINE_NO_LIMIT, delim, '\n', stream);
   6.546 +          if (len < 0)
   6.547 +            {
   6.548 +              free (field_1_buffer);
   6.549 +              field_1_buffer = NULL;
   6.550 +              if (ferror (stream) || feof (stream))
   6.551 +                break;
   6.552 +              xalloc_die ();
   6.553 +            }
   6.554 +
   6.555 +          n_bytes = len;
   6.556 +          assert (n_bytes != 0);
   6.557 +
   6.558 +          c = 0;
   6.559 +
   6.560 +          /* If the first field extends to the end of line (it is not
   6.561 +             delimited) and we are printing all non-delimited lines,
   6.562 +             print this one.  */
   6.563 +          if (to_uchar (field_1_buffer[n_bytes - 1]) != delim)
   6.564 +            {
   6.565 +              if (suppress_non_delimited)
   6.566 +                {
   6.567 +                  /* Empty.  */
   6.568 +                }
   6.569 +              else
   6.570 +                {
   6.571 +                  fwrite (field_1_buffer, sizeof (char), n_bytes, stdout);
   6.572 +                  /* Make sure the output line is newline terminated.  */
   6.573 +                  if (field_1_buffer[n_bytes - 1] != '\n')
   6.574 +                    putchar ('\n');
   6.575 +                  c = '\n';
   6.576 +                }
   6.577 +              continue;
   6.578 +            }
   6.579 +          if (print_kth (1))
   6.580 +            {
   6.581 +              /* Print the field, but not the trailing delimiter.  */
   6.582 +              fwrite (field_1_buffer, sizeof (char), n_bytes - 1, stdout);
   6.583 +
   6.584 +              /* With -d$'\n' don't treat the last '\n' as a delimiter.  */
   6.585 +              if (delim == '\n')
   6.586 +                {
   6.587 +                  int last_c = getc (stream);
   6.588 +                  if (last_c != EOF)
   6.589 +                    {
   6.590 +                      ungetc (last_c, stream);
   6.591 +                      found_any_selected_field = true;
   6.592 +                    }
   6.593 +                }
   6.594 +              else
   6.595 +                found_any_selected_field = true;
   6.596 +            }
   6.597 +          next_item (&field_idx);
   6.598 +        }
   6.599 +
   6.600 +      int prev_c = c;
   6.601 +
   6.602 +      if (print_kth (field_idx))
   6.603 +        {
   6.604 +          if (found_any_selected_field)
   6.605 +            {
   6.606 +              fwrite (output_delimiter_string, sizeof (char),
   6.607 +                      output_delimiter_length, stdout);
   6.608 +            }
   6.609 +          found_any_selected_field = true;
   6.610 +
   6.611 +          while ((c = getc (stream)) != delim && c != '\n' && c != EOF)
   6.612 +            {
   6.613 +              putchar (c);
   6.614 +              prev_c = c;
   6.615 +            }
   6.616 +        }
   6.617 +      else
   6.618 +        {
   6.619 +          while ((c = getc (stream)) != delim && c != '\n' && c != EOF)
   6.620 +            {
   6.621 +              prev_c = c;
   6.622 +            }
   6.623 +        }
   6.624 +
   6.625 +      /* With -d$'\n' don't treat the last '\n' as a delimiter.  */
   6.626 +      if (delim == '\n' && c == delim)
   6.627 +        {
   6.628 +          int last_c = getc (stream);
   6.629 +          if (last_c != EOF)
   6.630 +            ungetc (last_c, stream);
   6.631 +          else
   6.632 +            c = last_c;
   6.633 +        }
   6.634 +
   6.635 +      if (c == delim)
   6.636 +        next_item (&field_idx);
   6.637 +      else if (c == '\n' || c == EOF)
   6.638 +        {
   6.639 +          if (found_any_selected_field
   6.640 +              || !(suppress_non_delimited && field_idx == 1))
   6.641 +            {
   6.642 +              if (c == '\n' || prev_c != '\n' || delim == '\n')
   6.643 +                putchar ('\n');
   6.644 +            }
   6.645 +          if (c == EOF)
   6.646 +            break;
   6.647 +          field_idx = 1;
   6.648 +          current_rp = rp;
   6.649 +          found_any_selected_field = false;
   6.650 +        }
   6.651 +    }
   6.652 +}
   6.653 +
   6.654 +static void
   6.655 +cut_stream (FILE *stream)
   6.656 +{
   6.657 +  if (operating_mode == byte_mode)
   6.658 +    cut_bytes (stream);
   6.659 +  else
   6.660 +    cut_fields (stream);
   6.661 +}
   6.662 +
   6.663 +/* Process file FILE to standard output.
   6.664 +   Return true if successful.  */
   6.665 +
   6.666 +static bool
   6.667 +cut_file (char const *file)
   6.668 +{
   6.669 +  FILE *stream;
   6.670 +
   6.671 +  if (STREQ (file, "-"))
   6.672 +    {
   6.673 +      have_read_stdin = true;
   6.674 +      stream = stdin;
   6.675 +    }
   6.676 +  else
   6.677 +    {
   6.678 +      stream = fopen (file, "r");
   6.679 +      if (stream == NULL)
   6.680 +        {
   6.681 +          error (0, errno, "%s", file);
   6.682 +          return false;
   6.683 +        }
   6.684 +    }
   6.685 +
   6.686 +  fadvise (stream, FADVISE_SEQUENTIAL);
   6.687 +
   6.688 +  cut_stream (stream);
   6.689 +
   6.690 +  if (ferror (stream))
   6.691 +    {
   6.692 +      error (0, errno, "%s", file);
   6.693 +      return false;
   6.694 +    }
   6.695 +  if (STREQ (file, "-"))
   6.696 +    clearerr (stream);		/* Also clear EOF. */
   6.697 +  else if (fclose (stream) == EOF)
   6.698 +    {
   6.699 +      error (0, errno, "%s", file);
   6.700 +      return false;
   6.701 +    }
   6.702 +  return true;
   6.703 +}
   6.704 +
   6.705 +int
   6.706 +main (int argc, char **argv)
   6.707 +{
   6.708 +  int optc;
   6.709 +  bool ok;
   6.710 +  bool delim_specified = false;
   6.711 +  char *spec_list_string IF_LINT ( = NULL);
   6.712 +
   6.713 +  initialize_main (&argc, &argv);
   6.714 +  set_program_name (argv[0]);
   6.715 +  setlocale (LC_ALL, "");
   6.716 +  bindtextdomain (PACKAGE, LOCALEDIR);
   6.717 +  textdomain (PACKAGE);
   6.718 +
   6.719 +  atexit (close_stdout);
   6.720 +
   6.721 +  operating_mode = undefined_mode;
   6.722 +
   6.723 +  /* By default, all non-delimited lines are printed.  */
   6.724 +  suppress_non_delimited = false;
   6.725 +
   6.726 +  delim = '\0';
   6.727 +  have_read_stdin = false;
   6.728 +
   6.729 +  while ((optc = getopt_long (argc, argv, "b:c:d:f:ns", longopts, NULL)) != -1)
   6.730 +    {
   6.731 +      switch (optc)
   6.732 +        {
   6.733 +        case 'b':
   6.734 +        case 'c':
   6.735 +          /* Build the byte list. */
   6.736 +          if (operating_mode != undefined_mode)
   6.737 +            FATAL_ERROR (_("only one type of list may be specified"));
   6.738 +          operating_mode = byte_mode;
   6.739 +          spec_list_string = optarg;
   6.740 +          break;
   6.741 +
   6.742 +        case 'f':
   6.743 +          /* Build the field list. */
   6.744 +          if (operating_mode != undefined_mode)
   6.745 +            FATAL_ERROR (_("only one type of list may be specified"));
   6.746 +          operating_mode = field_mode;
   6.747 +          spec_list_string = optarg;
   6.748 +          break;
   6.749 +
   6.750 +        case 'd':
   6.751 +          /* New delimiter. */
   6.752 +          /* Interpret -d '' to mean 'use the NUL byte as the delimiter.'  */
   6.753 +          if (optarg[0] != '\0' && optarg[1] != '\0')
   6.754 +            FATAL_ERROR (_("the delimiter must be a single character"));
   6.755 +          delim = optarg[0];
   6.756 +          delim_specified = true;
   6.757 +          break;
   6.758 +
   6.759 +        case OUTPUT_DELIMITER_OPTION:
   6.760 +          output_delimiter_specified = true;
   6.761 +          /* Interpret --output-delimiter='' to mean
   6.762 +             'use the NUL byte as the delimiter.'  */
   6.763 +          output_delimiter_length = (optarg[0] == '\0'
   6.764 +                                     ? 1 : strlen (optarg));
   6.765 +          output_delimiter_string = xstrdup (optarg);
   6.766 +          break;
   6.767 +
   6.768 +        case 'n':
   6.769 +          break;
   6.770 +
   6.771 +        case 's':
   6.772 +          suppress_non_delimited = true;
   6.773 +          break;
   6.774 +
   6.775 +        case COMPLEMENT_OPTION:
   6.776 +          complement = true;
   6.777 +          break;
   6.778 +
   6.779 +        case_GETOPT_HELP_CHAR;
   6.780 +
   6.781 +        case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
   6.782 +
   6.783 +        default:
   6.784 +          usage (EXIT_FAILURE);
   6.785 +        }
   6.786 +    }
   6.787 +
   6.788 +  if (operating_mode == undefined_mode)
   6.789 +    FATAL_ERROR (_("you must specify a list of bytes, characters, or fields"));
   6.790 +
   6.791 +  if (delim_specified && operating_mode != field_mode)
   6.792 +    FATAL_ERROR (_("an input delimiter may be specified only\
   6.793 + when operating on fields"));
   6.794 +
   6.795 +  if (suppress_non_delimited && operating_mode != field_mode)
   6.796 +    FATAL_ERROR (_("suppressing non-delimited lines makes sense\n\
   6.797 +\tonly when operating on fields"));
   6.798 +
   6.799 +  if (! set_fields (spec_list_string))
   6.800 +    {
   6.801 +      if (operating_mode == field_mode)
   6.802 +        FATAL_ERROR (_("missing list of fields"));
   6.803 +      else
   6.804 +        FATAL_ERROR (_("missing list of positions"));
   6.805 +    }
   6.806 +
   6.807 +  if (!delim_specified)
   6.808 +    delim = '\t';
   6.809 +
   6.810 +  if (output_delimiter_string == NULL)
   6.811 +    {
   6.812 +      static char dummy[2];
   6.813 +      dummy[0] = delim;
   6.814 +      dummy[1] = '\0';
   6.815 +      output_delimiter_string = dummy;
   6.816 +      output_delimiter_length = 1;
   6.817 +    }
   6.818 +
   6.819 +  if (optind == argc)
   6.820 +    ok = cut_file ("-");
   6.821 +  else
   6.822 +    for (ok = true; optind < argc; optind++)
   6.823 +      ok &= cut_file (argv[optind]);
   6.824 +
   6.825 +
   6.826 +  if (have_read_stdin && fclose (stdin) == EOF)
   6.827 +    {
   6.828 +      error (0, errno, "-");
   6.829 +      ok = false;
   6.830 +    }
   6.831 +
   6.832 +  return ok ? EXIT_SUCCESS : EXIT_FAILURE;
   6.833 +}
     7.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     7.2 +++ b/code/cut.c__heirloom.2012-05-20	Tue May 12 06:46:59 2015 +0200
     7.3 @@ -0,0 +1,405 @@
     7.4 +/*
     7.5 + * cut - cut out fields of lines of files
     7.6 + *
     7.7 + * Gunnar Ritter, Freiburg i. Br., Germany, December 2002.
     7.8 + */
     7.9 +/*
    7.10 + * Copyright (c) 2003 Gunnar Ritter
    7.11 + *
    7.12 + * This software is provided 'as-is', without any express or implied
    7.13 + * warranty. In no event will the authors be held liable for any damages
    7.14 + * arising from the use of this software.
    7.15 + *
    7.16 + * Permission is granted to anyone to use this software for any purpose,
    7.17 + * including commercial applications, and to alter it and redistribute
    7.18 + * it freely, subject to the following restrictions:
    7.19 + *
    7.20 + * 1. The origin of this software must not be misrepresented; you must not
    7.21 + *    claim that you wrote the original software. If you use this software
    7.22 + *    in a product, an acknowledgment in the product documentation would be
    7.23 + *    appreciated but is not required.
    7.24 + *
    7.25 + * 2. Altered source versions must be plainly marked as such, and must not be
    7.26 + *    misrepresented as being the original software.
    7.27 + *
    7.28 + * 3. This notice may not be removed or altered from any source distribution.
    7.29 + */
    7.30 +
    7.31 +#if __GNUC__ >= 3 && __GNUC_MINOR__ >= 4 || __GNUC__ >= 4
    7.32 +#define	USED	__attribute__ ((used))
    7.33 +#elif defined __GNUC__
    7.34 +#define	USED	__attribute__ ((unused))
    7.35 +#else
    7.36 +#define	USED
    7.37 +#endif
    7.38 +static const char sccsid[] USED = "@(#)cut.sl	1.20 (gritter) 5/29/05";
    7.39 +
    7.40 +#include	<sys/types.h>
    7.41 +#include	<sys/stat.h>
    7.42 +#include	<fcntl.h>
    7.43 +#include	<unistd.h>
    7.44 +#include	<stdio.h>
    7.45 +#include	<string.h>
    7.46 +#include	<stdlib.h>
    7.47 +#include	<errno.h>
    7.48 +#include	<libgen.h>
    7.49 +#include	<limits.h>
    7.50 +#include	<wchar.h>
    7.51 +#include	<ctype.h>
    7.52 +#include	<locale.h>
    7.53 +
    7.54 +#include	"iblok.h"
    7.55 +
    7.56 +#if defined (__GLIBC__) && defined (_IO_putc_unlocked)
    7.57 +#undef	putc
    7.58 +#define	putc(c, f)	_IO_putc_unlocked(c, f)
    7.59 +#endif
    7.60 +
    7.61 +struct	range {
    7.62 +	struct range	*r_nxt;
    7.63 +	long	r_min;
    7.64 +	long	r_max;
    7.65 +};
    7.66 +
    7.67 +static unsigned	errcnt;			/* count of errors */
    7.68 +static int	method;			/* one of b, c, f */
    7.69 +static int	nflag;			/* character boundary bytes */
    7.70 +static int	sflag;			/* suppress lines w/o delimiters */
    7.71 +static char	*progname;		/* argv[0] to main() */
    7.72 +static wchar_t	wcdelim = '\t';		/* delimiter character */
    7.73 +static const char	*mbdelim = "\t";/* delimiter character */
    7.74 +struct range	*fields;		/* range list */
    7.75 +static int	multibyte;		/* multibyte LC_CTYPE */
    7.76 +
    7.77 +#define	next(wc, s)	(multibyte ? mbtowc(&(wc), s, MB_LEN_MAX) :\
    7.78 +				((wc) = *(s) & 0377, (wc) != 0))
    7.79 +
    7.80 +void *
    7.81 +lrealloc(void *vp, size_t nbytes)
    7.82 +{
    7.83 +	void	*p;
    7.84 +
    7.85 +	if ((p = realloc(vp, nbytes)) == NULL) {
    7.86 +		write(2, "line too long\n", 14);
    7.87 +		exit(076);
    7.88 +	}
    7.89 +	return p;
    7.90 +}
    7.91 +
    7.92 +void *
    7.93 +smalloc(size_t nbytes)
    7.94 +{
    7.95 +	void	*p;
    7.96 +
    7.97 +	if ((p = malloc(nbytes)) == NULL) {
    7.98 +		write(2, "no memory\n", 11);
    7.99 +		exit(077);
   7.100 +	}
   7.101 +	return p;
   7.102 +}
   7.103 +
   7.104 +static void
   7.105 +error(const char *s)
   7.106 +{
   7.107 +	fprintf(stderr, "%s: ERROR: %s\n", progname, s);
   7.108 +	exit(2);
   7.109 +}
   7.110 +
   7.111 +static void
   7.112 +usage(void)
   7.113 +{
   7.114 +	error("Usage: cut [-s] [-d<char>] {-c<list> | -f<list>} file ...");
   7.115 +}
   7.116 +
   7.117 +static void
   7.118 +badlist(void)
   7.119 +{
   7.120 +	error(method == 'b' ? "bad list for b/c/f option" : 
   7.121 +			"bad list for c/f option");
   7.122 +}
   7.123 +
   7.124 +static void
   7.125 +setdelim(const char *s)
   7.126 +{
   7.127 +	int	n;
   7.128 +
   7.129 +	if ((n = next(wcdelim, s)) < 0 || (n > 0 && s[n] != '\0'))
   7.130 +		error("no delimiter");
   7.131 +	mbdelim = s;
   7.132 +}
   7.133 +
   7.134 +static void
   7.135 +addrange(long m, long n)
   7.136 +{
   7.137 +	struct range	*rp, *rq;
   7.138 +
   7.139 +	rp = smalloc(sizeof *rp);
   7.140 +	rp->r_nxt = NULL;
   7.141 +	rp->r_min = m;
   7.142 +	rp->r_max = n ? n : m;
   7.143 +	if (fields) {
   7.144 +		for (rq = fields; rq->r_nxt; rq = rq->r_nxt);
   7.145 +		rq->r_nxt = rp;
   7.146 +	} else
   7.147 +		fields = rp;
   7.148 +}
   7.149 +
   7.150 +static int
   7.151 +have(long i)
   7.152 +{
   7.153 +	struct range	*rp;
   7.154 +
   7.155 +	for (rp = fields; rp; rp = rp->r_nxt)
   7.156 +		if (i >= rp->r_min && i <= rp->r_max)
   7.157 +			return 1;
   7.158 +	return 0;
   7.159 +}
   7.160 +
   7.161 +#define	mnreset()	m = 0, n = 0, lp = &m
   7.162 +
   7.163 +static void
   7.164 +setlist(const char *s)
   7.165 +{
   7.166 +	char	*cbuf, *cp;
   7.167 +	long	m, n;
   7.168 +	long	*lp;
   7.169 +
   7.170 +	fields = NULL;
   7.171 +	cbuf = smalloc(strlen(s) + 1);
   7.172 +	mnreset();
   7.173 +	for (;;) {
   7.174 +		if (*s == '-') {
   7.175 +			if (m == 0)
   7.176 +				m = 1;
   7.177 +			n = LONG_MAX;
   7.178 +			lp = &n;
   7.179 +			s++;
   7.180 +		} else if (*s == ',' || *s == ' ' || *s == '\t' || *s == '\0') {
   7.181 +			if (m)
   7.182 +				addrange(m, n);
   7.183 +			mnreset();
   7.184 +			if (*s == '\0')
   7.185 +				break;
   7.186 +			s++;
   7.187 +		} else if (isdigit(*s & 0377)) {
   7.188 +			cp = cbuf;
   7.189 +			do
   7.190 +				*cp++ = *s++;
   7.191 +			while (isdigit(*s & 0377));
   7.192 +			*cp = '\0';
   7.193 +			*lp = strtol(cbuf, NULL, 10);
   7.194 +		} else
   7.195 +			badlist();
   7.196 +	}
   7.197 +	if (fields == NULL)
   7.198 +		error("no fields");
   7.199 +	free(cbuf);
   7.200 +}
   7.201 +
   7.202 +static void
   7.203 +cutb(struct iblok *ip)
   7.204 +{
   7.205 +	int	c, i;
   7.206 +
   7.207 +	i = 1;
   7.208 +	while ((c = ib_get(ip)) != EOF) {
   7.209 +		if (c == '\n') {
   7.210 +			i = 1;
   7.211 +			putc(c, stdout);
   7.212 +		} else if (have(i++))
   7.213 +			putc(c, stdout);
   7.214 +	}
   7.215 +}
   7.216 +
   7.217 +static void
   7.218 +cutbn(struct iblok *ip)
   7.219 +{
   7.220 +	char	*cp;
   7.221 +	int	i, m, n;
   7.222 +	wint_t	wc;
   7.223 +
   7.224 +	i = 1;
   7.225 +	while ((cp = ib_getw(ip, &wc, &n)) != NULL) {
   7.226 +		if (wc == '\n') {
   7.227 +			i = 1;
   7.228 +			putc('\n', stdout);
   7.229 +		} else {
   7.230 +			if (have(i + n - 1))
   7.231 +				for (m = 0; m < n; m++)
   7.232 +					putc(cp[m], stdout);
   7.233 +			i += n;
   7.234 +		}
   7.235 +	}
   7.236 +}
   7.237 +
   7.238 +static void
   7.239 +cutc(struct iblok *ip)
   7.240 +{
   7.241 +	char	*cp;
   7.242 +	int	i, n, m;
   7.243 +	wint_t	wc;
   7.244 +
   7.245 +	i = 1;
   7.246 +	while ((cp = ib_getw(ip, &wc, &n)) != NULL) {
   7.247 +		if (wc == '\n') {
   7.248 +			i = 1;
   7.249 +			putc('\n', stdout);
   7.250 +		} else if (wc != WEOF && have(i++)) {
   7.251 +			for (m = 0; m < n; m++)
   7.252 +				putc(cp[m], stdout);
   7.253 +		}
   7.254 +	}
   7.255 +}
   7.256 +
   7.257 +static void
   7.258 +cutf(struct iblok *ip)
   7.259 +{
   7.260 +	static char	*line;
   7.261 +	static size_t	linesize;
   7.262 +	char	*cp, *lp, *lq;
   7.263 +	int	c, i, n, m, gotcha;
   7.264 +	char	b;
   7.265 +	wint_t	wc;
   7.266 +	const int	incr = 128;
   7.267 +
   7.268 +	if (linesize == 0)
   7.269 +		line = smalloc(linesize = incr);
   7.270 +	lp = line;
   7.271 +	gotcha = 0;
   7.272 +	i = 1;
   7.273 +	do {
   7.274 +		if (multibyte)
   7.275 +			cp = ib_getw(ip, &wc, &n);
   7.276 +		else {
   7.277 +			if ((c = ib_get(ip)) != EOF) {
   7.278 +				wc = c;
   7.279 +				b = (char)c;
   7.280 +				cp = &b;
   7.281 +			} else {
   7.282 +				wc = WEOF;
   7.283 +				cp = NULL;
   7.284 +			}
   7.285 +			n = 1;
   7.286 +		}
   7.287 +		if (cp == NULL || wc == '\n' || wc == wcdelim) {
   7.288 +			if (have(i) && (!sflag || gotcha || wc == wcdelim) ||
   7.289 +					(!sflag && i == 1 &&
   7.290 +						(cp == NULL || wc == '\n'))) {
   7.291 +				if (gotcha)
   7.292 +					for (m = 0; mbdelim[m]; m++)
   7.293 +						putc(mbdelim[m], stdout);
   7.294 +				for (lq = line; lq < lp; lq++)
   7.295 +					putc(*lq, stdout);
   7.296 +				gotcha = 1;
   7.297 +			}
   7.298 +			if (wc == '\n') {
   7.299 +				if (gotcha)
   7.300 +					putc('\n', stdout);
   7.301 +				i = 1;
   7.302 +				gotcha = 0;
   7.303 +			} else
   7.304 +				i++;
   7.305 +			lp = line;
   7.306 +		} else {
   7.307 +			for (m = 0; m < n; m++) {
   7.308 +				if (lp >= &line[linesize]) {
   7.309 +					size_t	diff = lp - line;
   7.310 +					line = lrealloc(line, linesize += incr);
   7.311 +					lp = &line[diff];
   7.312 +				}
   7.313 +				*lp++ = cp[m];
   7.314 +			}
   7.315 +		}
   7.316 +	} while (cp != NULL);
   7.317 +}
   7.318 +
   7.319 +static int
   7.320 +fdcut(int fd)
   7.321 +{
   7.322 +	struct iblok	*ip;
   7.323 +
   7.324 +	ip = ib_alloc(fd, 0);
   7.325 +	switch (method) {
   7.326 +	case 'b':
   7.327 +		if (nflag && multibyte)
   7.328 +			cutbn(ip);
   7.329 +		else
   7.330 +			cutb(ip);
   7.331 +		break;
   7.332 +	case 'c':
   7.333 +		if (multibyte)
   7.334 +			cutc(ip);
   7.335 +		else
   7.336 +			cutb(ip);
   7.337 +		break;
   7.338 +	case 'f':
   7.339 +		cutf(ip);
   7.340 +		break;
   7.341 +	}
   7.342 +	ib_free(ip);
   7.343 +	return 0;
   7.344 +}
   7.345 +
   7.346 +static int
   7.347 +fncut(const char *fn)
   7.348 +{
   7.349 +	int	fd, res;
   7.350 +
   7.351 +	if (fn[0] == '-' && fn[1] == '\0')
   7.352 +		fd = 0;
   7.353 +	else if ((fd = open(fn, O_RDONLY)) < 0) {
   7.354 +		fprintf(stderr, "%s: WARNING: cannot open %s\n", progname, fn);
   7.355 +		return 1;
   7.356 +	}
   7.357 +	res = fdcut(fd);
   7.358 +	if (fd)
   7.359 +		close(fd);
   7.360 +	return res;
   7.361 +}
   7.362 +
   7.363 +int
   7.364 +main(int argc, char **argv)
   7.365 +{
   7.366 +	const char	optstring[] = "b:c:d:f:ns";
   7.367 +	int	i;
   7.368 +
   7.369 +	progname = basename(argv[0]);
   7.370 +	setlocale(LC_CTYPE, "");
   7.371 +	multibyte = MB_CUR_MAX > 1;
   7.372 +#ifdef	__GLIBC__
   7.373 +	putenv("POSIXLY_CORRECT=1");
   7.374 +#endif
   7.375 +	while ((i = getopt(argc, argv, optstring)) != EOF) {
   7.376 +		switch (i) {
   7.377 +		case 'b':
   7.378 +		case 'c':
   7.379 +		case 'f':
   7.380 +			if (method && method != i)
   7.381 +				usage();
   7.382 +			method = i;
   7.383 +			setlist(optarg);
   7.384 +			break;
   7.385 +		case 'd':
   7.386 +			setdelim(optarg);
   7.387 +			break;
   7.388 +		case 'n':
   7.389 +			nflag = 1;
   7.390 +			break;
   7.391 +		case 's':
   7.392 +			sflag = 1;
   7.393 +			break;
   7.394 +		default:
   7.395 +			usage();
   7.396 +		}
   7.397 +	}
   7.398 +	/*if ((sflag && method != 'f') || (nflag && method != 'b'))
   7.399 +		usage();*/
   7.400 +	if (method == 0)
   7.401 +		badlist();
   7.402 +	if (argv[optind]) {
   7.403 +		for (i = optind; argv[i]; i++)
   7.404 +			errcnt |= fncut(argv[i]);
   7.405 +	} else
   7.406 +		errcnt |= fdcut(0);
   7.407 +	return errcnt;
   7.408 +}
     8.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     8.2 +++ b/code/cut.c__netbsd.1993-03-21	Tue May 12 06:46:59 2015 +0200
     8.3 @@ -0,0 +1,270 @@
     8.4 +/*
     8.5 + * Copyright (c) 1989 The Regents of the University of California.
     8.6 + * All rights reserved.
     8.7 + *
     8.8 + * This code is derived from software contributed to Berkeley by
     8.9 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
    8.10 + *
    8.11 + * Redistribution and use in source and binary forms, with or without
    8.12 + * modification, are permitted provided that the following conditions
    8.13 + * are met:
    8.14 + * 1. Redistributions of source code must retain the above copyright
    8.15 + *    notice, this list of conditions and the following disclaimer.
    8.16 + * 2. Redistributions in binary form must reproduce the above copyright
    8.17 + *    notice, this list of conditions and the following disclaimer in the
    8.18 + *    documentation and/or other materials provided with the distribution.
    8.19 + * 3. All advertising materials mentioning features or use of this software
    8.20 + *    must display the following acknowledgement:
    8.21 + *	This product includes software developed by the University of
    8.22 + *	California, Berkeley and its contributors.
    8.23 + * 4. Neither the name of the University nor the names of its contributors
    8.24 + *    may be used to endorse or promote products derived from this software
    8.25 + *    without specific prior written permission.
    8.26 + *
    8.27 + * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
    8.28 + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
    8.29 + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    8.30 + * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
    8.31 + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
    8.32 + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
    8.33 + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
    8.34 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
    8.35 + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
    8.36 + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
    8.37 + * SUCH DAMAGE.
    8.38 + */
    8.39 +
    8.40 +#ifndef lint
    8.41 +char copyright[] =
    8.42 +"@(#) Copyright (c) 1989 The Regents of the University of California.\n\
    8.43 + All rights reserved.\n";
    8.44 +#endif /* not lint */
    8.45 +
    8.46 +#ifndef lint
    8.47 +static char sccsid[] = "@(#)cut.c	5.4 (Berkeley) 10/30/90";
    8.48 +#endif /* not lint */
    8.49 +
    8.50 +#include <limits.h>
    8.51 +#include <stdio.h>
    8.52 +#include <ctype.h>
    8.53 +
    8.54 +int	cflag;
    8.55 +char	dchar;
    8.56 +int	dflag;
    8.57 +int	fflag;
    8.58 +int	sflag;
    8.59 +
    8.60 +main(argc, argv)
    8.61 +	int argc;
    8.62 +	char **argv;
    8.63 +{
    8.64 +	extern char *optarg;
    8.65 +	extern int errno, optind;
    8.66 +	FILE *fp;
    8.67 +	int ch, (*fcn)(), c_cut(), f_cut();
    8.68 +	char *strerror();
    8.69 +
    8.70 +	dchar = '\t';			/* default delimiter is \t */
    8.71 +
    8.72 +	while ((ch = getopt(argc, argv, "c:d:f:s")) != EOF)
    8.73 +		switch(ch) {
    8.74 +		case 'c':
    8.75 +			fcn = c_cut;
    8.76 +			get_list(optarg);
    8.77 +			cflag = 1;
    8.78 +			break;
    8.79 +		case 'd':
    8.80 +			dchar = *optarg;
    8.81 +			dflag = 1;
    8.82 +			break;
    8.83 +		case 'f':
    8.84 +			get_list(optarg);
    8.85 +			fcn = f_cut;
    8.86 +			fflag = 1;
    8.87 +			break;
    8.88 +		case 's':
    8.89 +			sflag = 1;
    8.90 +			break;
    8.91 +		case '?':
    8.92 +		default:
    8.93 +			usage();
    8.94 +		}
    8.95 +	argc -= optind;
    8.96 +	argv += optind;
    8.97 +
    8.98 +	if (fflag) {
    8.99 +		if (cflag)
   8.100 +			usage();
   8.101 +	} else if (!cflag || dflag || sflag)
   8.102 +		usage();
   8.103 +
   8.104 +	if (*argv)
   8.105 +		for (; *argv; ++argv) {
   8.106 +			if (!(fp = fopen(*argv, "r"))) {
   8.107 +				(void)fprintf(stderr,
   8.108 +				    "cut: %s: %s\n", *argv, strerror(errno));
   8.109 +				exit(1);
   8.110 +			}
   8.111 +			fcn(fp, *argv);
   8.112 +		}
   8.113 +	else
   8.114 +		fcn(stdin, "stdin");
   8.115 +	exit(0);
   8.116 +}
   8.117 +
   8.118 +int autostart, autostop, maxval;
   8.119 +
   8.120 +char positions[_POSIX2_LINE_MAX + 1];
   8.121 +
   8.122 +get_list(list)
   8.123 +	char *list;
   8.124 +{
   8.125 +	register char *pos;
   8.126 +	register int setautostart, start, stop;
   8.127 +	char *p, *strtok();
   8.128 +
   8.129 +	/*
   8.130 +	 * set a byte in the positions array to indicate if a field or
   8.131 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
   8.132 +	 * This parser is less restrictive than the Draft 9 POSIX spec.
   8.133 +	 * POSIX doesn't allow lists that aren't in increasing order or
   8.134 +	 * overlapping lists.  We also handle "-3-5" although there's no
   8.135 +	 * real reason too.
   8.136 +	 */
   8.137 +	for (; p = strtok(list, ", \t"); list = NULL) {
   8.138 +		setautostart = start = stop = 0;
   8.139 +		if (*p == '-') {
   8.140 +			++p;
   8.141 +			setautostart = 1;
   8.142 +		}
   8.143 +		if (isdigit(*p)) {
   8.144 +			start = stop = strtol(p, &p, 10);
   8.145 +			if (setautostart && start > autostart)
   8.146 +				autostart = start;
   8.147 +		}
   8.148 +		if (*p == '-') {
   8.149 +			if (isdigit(p[1]))
   8.150 +				stop = strtol(p + 1, &p, 10);
   8.151 +			if (*p == '-') {
   8.152 +				++p;
   8.153 +				if (!autostop || autostop > stop)
   8.154 +					autostop = stop;
   8.155 +			}
   8.156 +		}
   8.157 +		if (*p)
   8.158 +			badlist("illegal list value");
   8.159 +		if (!stop || !start)
   8.160 +			badlist("values may not include zero");
   8.161 +		if (stop > _POSIX2_LINE_MAX) {
   8.162 +			/* positions used rather than allocate a new buffer */
   8.163 +			(void)sprintf(positions, "%d too large (max %d)",
   8.164 +			    stop, _POSIX2_LINE_MAX);
   8.165 +			badlist(positions);
   8.166 +		}
   8.167 +		if (maxval < stop)
   8.168 +			maxval = stop;
   8.169 +		for (pos = positions + start; start++ <= stop; *pos++ = 1);
   8.170 +	}
   8.171 +
   8.172 +	/* overlapping ranges */
   8.173 +	if (autostop && maxval > autostop)
   8.174 +		maxval = autostop;
   8.175 +
   8.176 +	/* set autostart */
   8.177 +	if (autostart)
   8.178 +		memset(positions + 1, '1', autostart);
   8.179 +}
   8.180 +
   8.181 +/* ARGSUSED */
   8.182 +c_cut(fp, fname)
   8.183 +	FILE *fp;
   8.184 +	char *fname;
   8.185 +{
   8.186 +	register int ch, col;
   8.187 +	register char *pos;
   8.188 +
   8.189 +	for (;;) {
   8.190 +		pos = positions + 1;
   8.191 +		for (col = maxval; col; --col) {
   8.192 +			if ((ch = getc(fp)) == EOF)
   8.193 +				return;
   8.194 +			if (ch == '\n')
   8.195 +				break;
   8.196 +			if (*pos++)
   8.197 +				putchar(ch);
   8.198 +		}
   8.199 +		if (ch != '\n')
   8.200 +			if (autostop)
   8.201 +				while ((ch = getc(fp)) != EOF && ch != '\n')
   8.202 +					putchar(ch);
   8.203 +			else
   8.204 +				while ((ch = getc(fp)) != EOF && ch != '\n');
   8.205 +		putchar('\n');
   8.206 +	}
   8.207 +}
   8.208 +
   8.209 +f_cut(fp, fname)
   8.210 +	FILE *fp;
   8.211 +	char *fname;
   8.212 +{
   8.213 +	register int ch, field, isdelim;
   8.214 +	register char *pos, *p, sep;
   8.215 +	int output;
   8.216 +	char lbuf[_POSIX2_LINE_MAX + 1];
   8.217 +
   8.218 +	for (sep = dchar, output = 0; fgets(lbuf, sizeof(lbuf), fp);) {
   8.219 +		for (isdelim = 0, p = lbuf;; ++p) {
   8.220 +			if (!(ch = *p)) {
   8.221 +				(void)fprintf(stderr,
   8.222 +				    "cut: %s: line too long.\n", fname);
   8.223 +				exit(1);
   8.224 +			}
   8.225 +			/* this should work if newline is delimiter */
   8.226 +			if (ch == sep)
   8.227 +				isdelim = 1;
   8.228 +			if (ch == '\n') {
   8.229 +				if (!isdelim && !sflag)
   8.230 +					(void)printf("%s", lbuf);
   8.231 +				break;
   8.232 +			}
   8.233 +		}
   8.234 +		if (!isdelim)
   8.235 +			continue;
   8.236 +
   8.237 +		pos = positions + 1;
   8.238 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
   8.239 +			if (*pos) {
   8.240 +				if (output++)
   8.241 +					putchar(sep);
   8.242 +				while ((ch = *p++) != '\n' && ch != sep)
   8.243 +					putchar(ch);
   8.244 +			} else
   8.245 +				while ((ch = *p++) != '\n' && ch != sep);
   8.246 +			if (ch == '\n')
   8.247 +				break;
   8.248 +		}
   8.249 +		if (ch != '\n')
   8.250 +			if (autostop) {
   8.251 +				if (output)
   8.252 +					putchar(sep);
   8.253 +				for (; (ch = *p) != '\n'; ++p)
   8.254 +					putchar(ch);
   8.255 +			} else
   8.256 +				for (; (ch = *p) != '\n'; ++p);
   8.257 +		putchar('\n');
   8.258 +	}
   8.259 +}
   8.260 +
   8.261 +badlist(msg)
   8.262 +	char *msg;
   8.263 +{
   8.264 +	(void)fprintf(stderr, "cut: [-cf] list: %s.\n", msg);
   8.265 +	exit(1);
   8.266 +}
   8.267 +
   8.268 +usage()
   8.269 +{
   8.270 +	(void)fprintf(stderr,
   8.271 +"usage:\tcut -c list [file1 ...]\n\tcut -f list [-s] [-d delim] [file ...]\n");
   8.272 +	exit(1);
   8.273 +}
     9.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     9.2 +++ b/code/cut.c__netbsd.2014-02-03	Tue May 12 06:46:59 2015 +0200
     9.3 @@ -0,0 +1,306 @@
     9.4 +/*	$NetBSD: cut.c,v 1.29 2014/02/03 20:22:19 wiz Exp $	*/
     9.5 +
     9.6 +/*
     9.7 + * Copyright (c) 1989, 1993
     9.8 + *	The Regents of the University of California.  All rights reserved.
     9.9 + *
    9.10 + * This code is derived from software contributed to Berkeley by
    9.11 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
    9.12 + *
    9.13 + * Redistribution and use in source and binary forms, with or without
    9.14 + * modification, are permitted provided that the following conditions
    9.15 + * are met:
    9.16 + * 1. Redistributions of source code must retain the above copyright
    9.17 + *    notice, this list of conditions and the following disclaimer.
    9.18 + * 2. Redistributions in binary form must reproduce the above copyright
    9.19 + *    notice, this list of conditions and the following disclaimer in the
    9.20 + *    documentation and/or other materials provided with the distribution.
    9.21 + * 3. Neither the name of the University nor the names of its contributors
    9.22 + *    may be used to endorse or promote products derived from this software
    9.23 + *    without specific prior written permission.
    9.24 + *
    9.25 + * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
    9.26 + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
    9.27 + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    9.28 + * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
    9.29 + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
    9.30 + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
    9.31 + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
    9.32 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
    9.33 + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
    9.34 + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
    9.35 + * SUCH DAMAGE.
    9.36 + */
    9.37 +
    9.38 +#include <sys/cdefs.h>
    9.39 +#ifndef lint
    9.40 +__COPYRIGHT("@(#) Copyright (c) 1989, 1993\
    9.41 + The Regents of the University of California.  All rights reserved.");
    9.42 +#endif /* not lint */
    9.43 +
    9.44 +#ifndef lint
    9.45 +#if 0
    9.46 +static char sccsid[] = "@(#)cut.c	8.3 (Berkeley) 5/4/95";
    9.47 +#endif
    9.48 +__RCSID("$NetBSD: cut.c,v 1.29 2014/02/03 20:22:19 wiz Exp $");
    9.49 +#endif /* not lint */
    9.50 +
    9.51 +#include <ctype.h>
    9.52 +#include <err.h>
    9.53 +#include <errno.h>
    9.54 +#include <limits.h>
    9.55 +#include <locale.h>
    9.56 +#include <stdio.h>
    9.57 +#include <stdlib.h>
    9.58 +#include <string.h>
    9.59 +#include <unistd.h>
    9.60 +#include <util.h>
    9.61 +#include <wchar.h>
    9.62 +#include <sys/param.h>
    9.63 +
    9.64 +static int bflag;
    9.65 +static int	cflag;
    9.66 +static char	dchar;
    9.67 +static int	dflag;
    9.68 +static int	fflag;
    9.69 +static int	sflag;
    9.70 +
    9.71 +static void	b_cut(FILE *, const char *);
    9.72 +static void	c_cut(FILE *, const char *);
    9.73 +static void	f_cut(FILE *, const char *);
    9.74 +static void	get_list(char *);
    9.75 +static void	usage(void) __dead;
    9.76 +
    9.77 +int
    9.78 +main(int argc, char *argv[])
    9.79 +{
    9.80 +	FILE *fp;
    9.81 +	void (*fcn)(FILE *, const char *);
    9.82 +	int ch, rval;
    9.83 +
    9.84 +	fcn = NULL;
    9.85 +	(void)setlocale(LC_ALL, "");
    9.86 +
    9.87 +	dchar = '\t';			/* default delimiter is \t */
    9.88 +
    9.89 +	/* Since we don't support multi-byte characters, the -c and -b
    9.90 +	   options are equivalent, and the -n option is meaningless. */
    9.91 +	while ((ch = getopt(argc, argv, "b:c:d:f:sn")) != -1)
    9.92 +		switch(ch) {
    9.93 +		case 'b':
    9.94 +			fcn = b_cut;
    9.95 +			get_list(optarg);
    9.96 +			bflag = 1;
    9.97 +			break;
    9.98 +		case 'c':
    9.99 +			fcn = c_cut;
   9.100 +			get_list(optarg);
   9.101 +			cflag = 1;
   9.102 +			break;
   9.103 +		case 'd':
   9.104 +			dchar = *optarg;
   9.105 +			dflag = 1;
   9.106 +			break;
   9.107 +		case 'f':
   9.108 +			get_list(optarg);
   9.109 +			fcn = f_cut;
   9.110 +			fflag = 1;
   9.111 +			break;
   9.112 +		case 's':
   9.113 +			sflag = 1;
   9.114 +			break;
   9.115 +		case 'n':
   9.116 +			break;
   9.117 +		case '?':
   9.118 +		default:
   9.119 +			usage();
   9.120 +		}
   9.121 +	argc -= optind;
   9.122 +	argv += optind;
   9.123 +
   9.124 +	if (fflag) {
   9.125 +		if (cflag || bflag)
   9.126 +			usage();
   9.127 +	} else if ((!cflag && !bflag) || dflag || sflag)
   9.128 +		usage();
   9.129 +	else if (bflag && cflag)
   9.130 +		usage();
   9.131 +
   9.132 +	rval = 0;
   9.133 +	if (*argv)
   9.134 +		for (; *argv; ++argv) {
   9.135 +			if (strcmp(*argv, "-") == 0)
   9.136 +				fcn(stdin, "stdin");
   9.137 +			else {
   9.138 +				if ((fp = fopen(*argv, "r"))) {
   9.139 +					fcn(fp, *argv);
   9.140 +					(void)fclose(fp);
   9.141 +				} else {
   9.142 +					rval = 1;
   9.143 +					warn("%s", *argv);
   9.144 +				}
   9.145 +			}
   9.146 +		}
   9.147 +	else
   9.148 +		fcn(stdin, "stdin");
   9.149 +	return(rval);
   9.150 +}
   9.151 +
   9.152 +static size_t autostart, autostop, maxval;
   9.153 +
   9.154 +static char *positions = NULL;
   9.155 +static size_t numpositions = 0;
   9.156 +#define ALLOC_CHUNK	_POSIX2_LINE_MAX	/* malloc granularity */
   9.157 +
   9.158 +static void
   9.159 +get_list(char *list)
   9.160 +{
   9.161 +	size_t setautostart, start, stop;
   9.162 +	char *pos;
   9.163 +	char *p;
   9.164 +
   9.165 +	if (positions == NULL) {
   9.166 +		numpositions = ALLOC_CHUNK;
   9.167 +		positions = ecalloc(numpositions, sizeof(*positions));
   9.168 +	}
   9.169 +
   9.170 +	/*
   9.171 +	 * set a byte in the positions array to indicate if a field or
   9.172 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
   9.173 +	 * This parser is less restrictive than the Draft 9 POSIX spec.
   9.174 +	 * POSIX doesn't allow lists that aren't in increasing order or
   9.175 +	 * overlapping lists.  We also handle "-3-5" although there's no
   9.176 +	 * real reason to.
   9.177 +	 */
   9.178 +	for (; (p = strtok(list, ", \t")) != NULL; list = NULL) {
   9.179 +		setautostart = start = stop = 0;
   9.180 +		if (*p == '-') {
   9.181 +			++p;
   9.182 +			setautostart = 1;
   9.183 +		}
   9.184 +		if (isdigit((unsigned char)*p)) {
   9.185 +			start = stop = strtol(p, &p, 10);
   9.186 +			if (setautostart && start > autostart)
   9.187 +				autostart = start;
   9.188 +		}
   9.189 +		if (*p == '-') {
   9.190 +			if (isdigit((unsigned char)p[1]))
   9.191 +				stop = strtol(p + 1, &p, 10);
   9.192 +			if (*p == '-') {
   9.193 +				++p;
   9.194 +				if (!autostop || autostop > stop)
   9.195 +					autostop = stop;
   9.196 +			}
   9.197 +		}
   9.198 +		if (*p)
   9.199 +			errx(1, "[-bcf] list: illegal list value");
   9.200 +		if (!stop || !start)
   9.201 +			errx(1, "[-bcf] list: values may not include zero");
   9.202 +		if (stop + 1 > numpositions) {
   9.203 +			size_t newsize;
   9.204 +			newsize = roundup(stop + 1, ALLOC_CHUNK);
   9.205 +			positions = erealloc(positions, newsize);
   9.206 +			(void)memset(positions + numpositions, 0,
   9.207 +			    newsize - numpositions);
   9.208 +			numpositions = newsize;
   9.209 +		}
   9.210 +		if (maxval < stop)
   9.211 +			maxval = stop;
   9.212 +		for (pos = positions + start; start++ <= stop; pos++)
   9.213 +			*pos = 1;
   9.214 +	}
   9.215 +
   9.216 +	/* overlapping ranges */
   9.217 +	if (autostop && maxval > autostop)
   9.218 +		maxval = autostop;
   9.219 +
   9.220 +	/* set autostart */
   9.221 +	if (autostart)
   9.222 +		(void)memset(positions + 1, '1', autostart);
   9.223 +}
   9.224 +
   9.225 +static void
   9.226 +/*ARGSUSED*/
   9.227 +f_cut(FILE *fp, const char *fname __unused)
   9.228 +{
   9.229 +	int ch, field, isdelim;
   9.230 +	char *pos, *p, sep;
   9.231 +	int output;
   9.232 +	size_t len;
   9.233 +	char *lbuf, *tbuf;
   9.234 +
   9.235 +	for (sep = dchar, tbuf = NULL; (lbuf = fgetln(fp, &len)) != NULL;) {
   9.236 +		output = 0;
   9.237 +		if (lbuf[len - 1] != '\n') {
   9.238 +			/* no newline at the end of the last line so add one */
   9.239 +			if ((tbuf = (char *)malloc(len + 1)) == NULL)
   9.240 +				err(1, NULL);
   9.241 +			(void)memcpy(tbuf, lbuf, len);
   9.242 +			tbuf[len++] = '\n';
   9.243 +			lbuf = tbuf;
   9.244 +		}
   9.245 +		for (isdelim = 0, p = lbuf;; ++p) {
   9.246 +			ch = *p;
   9.247 +			/* this should work if newline is delimiter */
   9.248 +			if (ch == sep)
   9.249 +				isdelim = 1;
   9.250 +			if (ch == '\n') {
   9.251 +				if (!isdelim && !sflag)
   9.252 +					(void)fwrite(lbuf, len, 1, stdout);
   9.253 +				break;
   9.254 +			}
   9.255 +		}
   9.256 +		if (!isdelim)
   9.257 +			continue;
   9.258 +
   9.259 +		pos = positions + 1;
   9.260 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
   9.261 +			if (*pos) {
   9.262 +				if (output++)
   9.263 +					(void)putchar(sep);
   9.264 +				while ((ch = *p++) != '\n' && ch != sep)
   9.265 +					(void)putchar(ch);
   9.266 +			} else {
   9.267 +				while ((ch = *p++) != '\n' && ch != sep)
   9.268 +					continue;
   9.269 +			}
   9.270 +			if (ch == '\n')
   9.271 +				break;
   9.272 +		}
   9.273 +		if (ch != '\n') {
   9.274 +			if (autostop) {
   9.275 +				if (output)
   9.276 +					(void)putchar(sep);
   9.277 +				for (; (ch = *p) != '\n'; ++p)
   9.278 +					(void)putchar(ch);
   9.279 +			} else
   9.280 +				for (; (ch = *p) != '\n'; ++p);
   9.281 +		}
   9.282 +		(void)putchar('\n');
   9.283 +		if (tbuf) {
   9.284 +			free(tbuf);
   9.285 +			tbuf = NULL;
   9.286 +		}
   9.287 +	}
   9.288 +	if (tbuf)
   9.289 +		free(tbuf);
   9.290 +}
   9.291 +
   9.292 +static void
   9.293 +usage(void)
   9.294 +{
   9.295 +	(void)fprintf(stderr, "usage:\tcut -b list [-n] [file ...]\n"
   9.296 +	    "\tcut -c list [file ...]\n"
   9.297 +	    "\tcut -f list [-d string] [-s] [file ...]\n");
   9.298 +	exit(1);
   9.299 +}
   9.300 +
   9.301 +/* make b_put(): */
   9.302 +#define CUT_BYTE 1
   9.303 +#include "x_cut.c"
   9.304 +#undef CUT_BYTE
   9.305 +
   9.306 +/* make c_put(): */
   9.307 +#define CUT_BYTE 0
   9.308 +#include "x_cut.c"
   9.309 +#undef CUT_BYTE
    10.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
    10.2 +++ b/code/cut.c__openbsd.2008-06-27	Tue May 12 06:46:59 2015 +0200
    10.3 @@ -0,0 +1,290 @@
    10.4 +/*	$OpenBSD: cut.c,v 1.13 2008/06/27 08:02:13 sobrado Exp $	*/
    10.5 +/*	$NetBSD: cut.c,v 1.9 1995/09/02 05:59:23 jtc Exp $	*/
    10.6 +
    10.7 +/*
    10.8 + * Copyright (c) 1989, 1993
    10.9 + *	The Regents of the University of California.  All rights reserved.
   10.10 + *
   10.11 + * This code is derived from software contributed to Berkeley by
   10.12 + * Adam S. Moskowitz of Menlo Consulting and Marciano Pitargue.
   10.13 + *
   10.14 + * Redistribution and use in source and binary forms, with or without
   10.15 + * modification, are permitted provided that the following conditions
   10.16 + * are met:
   10.17 + * 1. Redistributions of source code must retain the above copyright
   10.18 + *    notice, this list of conditions and the following disclaimer.
   10.19 + * 2. Redistributions in binary form must reproduce the above copyright
   10.20 + *    notice, this list of conditions and the following disclaimer in the
   10.21 + *    documentation and/or other materials provided with the distribution.
   10.22 + * 3. Neither the name of the University nor the names of its contributors
   10.23 + *    may be used to endorse or promote products derived from this software
   10.24 + *    without specific prior written permission.
   10.25 + *
   10.26 + * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
   10.27 + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
   10.28 + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
   10.29 + * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
   10.30 + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
   10.31 + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
   10.32 + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
   10.33 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
   10.34 + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
   10.35 + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
   10.36 + * SUCH DAMAGE.
   10.37 + */
   10.38 +
   10.39 +#ifndef lint
   10.40 +static char copyright[] =
   10.41 +"@(#) Copyright (c) 1989, 1993\n\
   10.42 +	The Regents of the University of California.  All rights reserved.\n";
   10.43 +#endif /* not lint */
   10.44 +
   10.45 +#ifndef lint
   10.46 +#if 0
   10.47 +static char sccsid[] = "@(#)cut.c	8.3 (Berkeley) 5/4/95";
   10.48 +#endif
   10.49 +static char rcsid[] = "$OpenBSD: cut.c,v 1.13 2008/06/27 08:02:13 sobrado Exp $";
   10.50 +#endif /* not lint */
   10.51 +
   10.52 +#include <ctype.h>
   10.53 +#include <err.h>
   10.54 +#include <errno.h>
   10.55 +#include <limits.h>
   10.56 +#include <locale.h>
   10.57 +#include <stdio.h>
   10.58 +#include <stdlib.h>
   10.59 +#include <string.h>
   10.60 +#include <unistd.h>
   10.61 +
   10.62 +int	cflag;
   10.63 +char	dchar;
   10.64 +int	dflag;
   10.65 +int	fflag;
   10.66 +int	sflag;
   10.67 +
   10.68 +void	c_cut(FILE *, char *);
   10.69 +void	f_cut(FILE *, char *);
   10.70 +void	get_list(char *);
   10.71 +void	usage(void);
   10.72 +
   10.73 +int
   10.74 +main(int argc, char *argv[])
   10.75 +{
   10.76 +	FILE *fp;
   10.77 +	void (*fcn)(FILE *, char *);
   10.78 +	int ch;
   10.79 +
   10.80 +	setlocale (LC_ALL, "");
   10.81 +
   10.82 +	dchar = '\t';			/* default delimiter is \t */
   10.83 +
   10.84 +	/* Since we don't support multi-byte characters, the -c and -b 
   10.85 +	   options are equivalent, and the -n option is meaningless. */
   10.86 +	while ((ch = getopt(argc, argv, "b:c:d:f:sn")) != -1)
   10.87 +		switch(ch) {
   10.88 +		case 'b':
   10.89 +		case 'c':
   10.90 +			fcn = c_cut;
   10.91 +			get_list(optarg);
   10.92 +			cflag = 1;
   10.93 +			break;
   10.94 +		case 'd':
   10.95 +			dchar = *optarg;
   10.96 +			dflag = 1;
   10.97 +			break;
   10.98 +		case 'f':
   10.99 +			get_list(optarg);
  10.100 +			fcn = f_cut;
  10.101 +			fflag = 1;
  10.102 +			break;
  10.103 +		case 's':
  10.104 +			sflag = 1;
  10.105 +			break;
  10.106 +		case 'n':
  10.107 +			break;
  10.108 +		case '?':
  10.109 +		default:
  10.110 +			usage();
  10.111 +		}
  10.112 +	argc -= optind;
  10.113 +	argv += optind;
  10.114 +
  10.115 +	if (fflag) {
  10.116 +		if (cflag)
  10.117 +			usage();
  10.118 +	} else if (!cflag || dflag || sflag)
  10.119 +		usage();
  10.120 +
  10.121 +	if (*argv)
  10.122 +		for (; *argv; ++argv) {
  10.123 +			if (!(fp = fopen(*argv, "r")))
  10.124 +				err(1, "%s", *argv);
  10.125 +			fcn(fp, *argv);
  10.126 +			(void)fclose(fp);
  10.127 +		}
  10.128 +	else
  10.129 +		fcn(stdin, "stdin");
  10.130 +	exit(0);
  10.131 +}
  10.132 +
  10.133 +int autostart, autostop, maxval;
  10.134 +
  10.135 +char positions[_POSIX2_LINE_MAX + 1];
  10.136 +
  10.137 +void
  10.138 +get_list(char *list)
  10.139 +{
  10.140 +	int setautostart, start, stop;
  10.141 +	char *pos;
  10.142 +	char *p;
  10.143 +
  10.144 +	/*
  10.145 +	 * set a byte in the positions array to indicate if a field or
  10.146 +	 * column is to be selected; use +1, it's 1-based, not 0-based.
  10.147 +	 * This parser is less restrictive than the Draft 9 POSIX spec.
  10.148 +	 * POSIX doesn't allow lists that aren't in increasing order or
  10.149 +	 * overlapping lists.  We also handle "-3-5" although there's no
  10.150 +	 * real reason too.
  10.151 +	 */
  10.152 +	while ((p = strsep(&list, ", \t"))) {
  10.153 +		setautostart = start = stop = 0;
  10.154 +		if (*p == '-') {
  10.155 +			++p;
  10.156 +			setautostart = 1;
  10.157 +		}
  10.158 +		if (isdigit(*p)) {
  10.159 +			start = stop = strtol(p, &p, 10);
  10.160 +			if (setautostart && start > autostart)
  10.161 +				autostart = start;
  10.162 +		}
  10.163 +		if (*p == '-') {
  10.164 +			if (isdigit(p[1]))
  10.165 +				stop = strtol(p + 1, &p, 10);
  10.166 +			if (*p == '-') {
  10.167 +				++p;
  10.168 +				if (!autostop || autostop > stop)
  10.169 +					autostop = stop;
  10.170 +			}
  10.171 +		}
  10.172 +		if (*p)
  10.173 +			errx(1, "[-cf] list: illegal list value");
  10.174 +		if (!stop || !start)
  10.175 +			errx(1, "[-cf] list: values may not include zero");
  10.176 +		if (stop > _POSIX2_LINE_MAX)
  10.177 +			errx(1, "[-cf] list: %d too large (max %d)",
  10.178 +			    stop, _POSIX2_LINE_MAX);
  10.179 +		if (maxval < stop)
  10.180 +			maxval = stop;
  10.181 +		for (pos = positions + start; start++ <= stop; *pos++ = 1)
  10.182 +			;
  10.183 +	}
  10.184 +
  10.185 +	/* overlapping ranges */
  10.186 +	if (autostop && maxval > autostop)
  10.187 +		maxval = autostop;
  10.188 +
  10.189 +	/* set autostart */
  10.190 +	if (autostart)
  10.191 +		memset(positions + 1, '1', autostart);
  10.192 +}
  10.193 +
  10.194 +/* ARGSUSED */
  10.195 +void
  10.196 +c_cut(FILE *fp, char *fname)
  10.197 +{
  10.198 +	int ch, col;
  10.199 +	char *pos;
  10.200 +
  10.201 +	for (;;) {
  10.202 +		pos = positions + 1;
  10.203 +		for (col = maxval; col; --col) {
  10.204 +			if ((ch = getc(fp)) == EOF)
  10.205 +				return;
  10.206 +			if (ch == '\n')
  10.207 +				break;
  10.208 +			if (*pos++)
  10.209 +				(void)putchar(ch);
  10.210 +		}
  10.211 +		if (ch != '\n') {
  10.212 +			if (autostop)
  10.213 +				while ((ch = getc(fp)) != EOF && ch != '\n')
  10.214 +					(void)putchar(ch);
  10.215 +			else
  10.216 +				while ((ch = getc(fp)) != EOF && ch != '\n')
  10.217 +					;
  10.218 +		}
  10.219 +		(void)putchar('\n');
  10.220 +	}
  10.221 +}
  10.222 +
  10.223 +void
  10.224 +f_cut(FILE *fp, char *fname)
  10.225 +{
  10.226 +	int ch, field, isdelim;
  10.227 +	char *pos, *p, sep;
  10.228 +	int output;
  10.229 +	size_t len;
  10.230 +	char *lbuf, *tbuf;
  10.231 +
  10.232 +	for (sep = dchar, tbuf = NULL; (lbuf = fgetln(fp, &len));) {
  10.233 +		output = 0;
  10.234 +		if (lbuf[len - 1] != '\n') {
  10.235 +			/* no newline at the end of the last line so add one */
  10.236 +			if ((tbuf = (char *)malloc(len + 1)) == NULL)
  10.237 +				err(1, NULL);
  10.238 +			memcpy(tbuf, lbuf, len);
  10.239 +			tbuf[len] = '\n';
  10.240 +			lbuf = tbuf;
  10.241 +		}
  10.242 +		for (isdelim = 0, p = lbuf;; ++p) {
  10.243 +			ch = *p;
  10.244 +			/* this should work if newline is delimiter */
  10.245 +			if (ch == sep)
  10.246 +				isdelim = 1;
  10.247 +			if (ch == '\n') {
  10.248 +				if (!isdelim && !sflag)
  10.249 +					(void)fwrite(lbuf, len, 1, stdout);
  10.250 +				break;
  10.251 +			}
  10.252 +		}
  10.253 +		if (!isdelim)
  10.254 +			continue;
  10.255 +
  10.256 +		pos = positions + 1;
  10.257 +		for (field = maxval, p = lbuf; field; --field, ++pos) {
  10.258 +			if (*pos) {
  10.259 +				if (output++)
  10.260 +					(void)putchar(sep);
  10.261 +				while ((ch = *p++) != '\n' && ch != sep)
  10.262 +					(void)putchar(ch);
  10.263 +			} else
  10.264 +				while ((ch = *p++) != '\n' && ch != sep)
  10.265 +					;
  10.266 +			if (ch == '\n')
  10.267 +				break;
  10.268 +		}
  10.269 +		if (ch != '\n') {
  10.270 +			if (autostop) {
  10.271 +				if (output)
  10.272 +					(void)putchar(sep);
  10.273 +				for (; (ch = *p) != '\n'; ++p)
  10.274 +					(void)putchar(ch);
  10.275 +			} else
  10.276 +				for (; (ch = *p) != '\n'; ++p)
  10.277 +					;
  10.278 +		}
  10.279 +		(void)putchar('\n');
  10.280 +	}
  10.281 +	if (tbuf)
  10.282 +		free(tbuf);
  10.283 +}
  10.284 +
  10.285 +void
  10.286 +usage(void)
  10.287 +{
  10.288 +	(void)fprintf(stderr,
  10.289 +	    "usage: cut -b list [-n] [file ...]\n"
  10.290 +	    "       cut -c list [file ...]\n"
  10.291 +	    "       cut -f list [-s] [-d delim] [file ...]\n");
  10.292 +	exit(1);
  10.293 +}
    11.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
    11.2 +++ b/code/cut.c__system_iii.1980-04-11	Tue May 12 06:46:59 2015 +0200
    11.3 @@ -0,0 +1,123 @@
    11.4 +#
    11.5 +/* cut : cut and paste columns of a table (projection of a relation)  (GWRL) */
    11.6 +/* Release 1.5; handles single backspaces as produced by nroff    */
    11.7 +# include <stdio.h>	/* make: cc cut.c */
    11.8 +# define NFIELDS 512	/* max no of fields or resulting line length */
    11.9 +# define BACKSPACE 8
   11.10 +main(argc, argv)
   11.11 +int argc; char **argv;
   11.12 +{
   11.13 +	int del = '\t';
   11.14 +	int i, j, count, poscnt, r, s, t;
   11.15 +	int endflag, supflag, cflag, fflag, backflag, filenr;
   11.16 +	int sel[NFIELDS];
   11.17 +	register int c;
   11.18 +	register char *p1;
   11.19 +	char *p2, outbuf[NFIELDS];
   11.20 +	FILE *inptr;
   11.21 + 
   11.22 + 
   11.23 +while (argc > 1 && argv[1][0] == '-'){
   11.24 +	for (i = 1; (c = argv[1][i]) != '\0'; i++) {
   11.25 +		switch(c) {
   11.26 +			case 'd' : del = argv[1][++i];
   11.27 +				if (del == '\0') diag("no delimiter\n");
   11.28 +				break;
   11.29 +			case 's': supflag++ ;
   11.30 +				break;
   11.31 +			case 'c': cflag++ ;
   11.32 +				break;
   11.33 +			case 'f': fflag++ ;
   11.34 +				break;
   11.35 +			default : diag("Usage: cut [-s] [-d<char>] {-c<list> | -f<list>} file ...\n");
   11.36 +				break;
   11.37 +		}
   11.38 +		if (!endflag && (cflag || fflag)) {
   11.39 +			endflag = 1;
   11.40 +			r = s = t = 0;
   11.41 +			do {	c = argv[1][++i];
   11.42 +				switch(c) {
   11.43 +					case '-' : if (r) diagl();
   11.44 +						r = 1;
   11.45 +						if (t == 0)  s = 1;
   11.46 +						else {s = t; t = 0;}
   11.47 +						continue;
   11.48 +					case '\0' :
   11.49 +					case ','  : if (t >= NFIELDS) diagl();
   11.50 +						if (r) { if (t == 0) t = NFIELDS - 1;
   11.51 +							if (t<s) diagl();
   11.52 +							for(j = s; j <= t; j++) sel[j] = 1;
   11.53 +							}
   11.54 +						else sel[t] = (t > 0 ? 1 : 0);
   11.55 +						r = s = t = 0;
   11.56 +						if (c == '\0') {i--; break;}
   11.57 +						continue;
   11.58 +					default :
   11.59 +						if (c< '0' || c> '9') diagl();
   11.60 +						t = 10*t + c - '0';
   11.61 +						continue;
   11.62 +				}
   11.63 +				for (j = t = 0; j < NFIELDS; j++) t += sel[j];
   11.64 +				if (t == 0) diag("no fields\n");
   11.65 +			} while (c != '\0');
   11.66 +		}
   11.67 +	}
   11.68 +	--argc;
   11.69 +	++argv;
   11.70 +} /* end options */
   11.71 +if (!(cflag || fflag)) diagl();
   11.72 +
   11.73 +--argc;
   11.74 +filenr = 1;
   11.75 +do {	/* for all input files */
   11.76 +	if (argc > 0) inptr = fopen(argv[filenr], "r");
   11.77 +	else inptr = stdin;
   11.78 +  
   11.79 +	if (inptr == NULL) {
   11.80 +		write(2,"Cannot open :",14);
   11.81 +		diag(argv[filenr]);
   11.82 +	}
   11.83 +	endflag = 0;
   11.84 +	do {	/* for all lines of a file */
   11.85 +		count = poscnt = backflag = 0;
   11.86 +		p1 = &outbuf[0] - 1 ;
   11.87 +		p2 = p1;
   11.88 +		do { 	/* for all char of the line */
   11.89 +			c = fgetc(inptr);
   11.90 +			if (c == EOF) {
   11.91 +				endflag = 1;
   11.92 +				break;
   11.93 +				}
   11.94 +			if (count == NFIELDS - 1) diag("line too long\n");
   11.95 +			if (c != '\n') *++p1 = c;
   11.96 +			if (cflag && (c == BACKSPACE)) backflag++ ; else 
   11.97 +				{ if ( !backflag ) poscnt += 1 ; else backflag-- ;}
   11.98 +			if ( backflag > 1 ) diag("cannot handle multiple adjacent backspaces\n");
   11.99 +			if ( ((c == '\n') && count > 0)  || c == del || cflag) {
  11.100 +				count += 1;
  11.101 +				if (fflag) poscnt = count  ;
  11.102 +				if (sel[poscnt]) p2 = p1; else p1 = p2;
  11.103 +			}
  11.104 +		}while (c != '\n');
  11.105 +		if ( !endflag && (count > 0 || !supflag)) {
  11.106 +			if (*p1 == del) *p1 = '\0';
  11.107 +				else *++p1 = '\0'; /*suppress trailing delimiter*/
  11.108 +			puts(outbuf);
  11.109 +			}
  11.110 +	} while (!endflag) ;
  11.111 +fclose(inptr);
  11.112 +} while(++filenr <= argc);
  11.113 +}
  11.114 +
  11.115 +diag(s)
  11.116 +char *s;
  11.117 +{
  11.118 +	write(2, "cut : ", 6);
  11.119 +	while(*s)
  11.120 +		write(2,s++,1);
  11.121 +	exit(2);
  11.122 +}
  11.123 +diagl()
  11.124 +{
  11.125 +diag("bad list for c/f option\n");
  11.126 +}