File: [local] / src / usr.bin / rs / rs.c (download)
Revision 1.30, Thu Dec 3 12:23:15 2015 UTC (8 years, 5 months ago) by schwarze
Branch: MAIN
CVS Tags: OPENBSD_7_5_BASE, OPENBSD_7_5, OPENBSD_7_4_BASE, OPENBSD_7_4, OPENBSD_7_3_BASE, OPENBSD_7_3, OPENBSD_7_2_BASE, OPENBSD_7_2, OPENBSD_7_1_BASE, OPENBSD_7_1, OPENBSD_7_0_BASE, OPENBSD_7_0, OPENBSD_6_9_BASE, OPENBSD_6_9, OPENBSD_6_8_BASE, OPENBSD_6_8, OPENBSD_6_7_BASE, OPENBSD_6_7, OPENBSD_6_6_BASE, OPENBSD_6_6, OPENBSD_6_5_BASE, OPENBSD_6_5, OPENBSD_6_4_BASE, OPENBSD_6_4, OPENBSD_6_3_BASE, OPENBSD_6_3, OPENBSD_6_2_BASE, OPENBSD_6_2, OPENBSD_6_1_BASE, OPENBSD_6_1, OPENBSD_6_0_BASE, OPENBSD_6_0, OPENBSD_5_9_BASE, OPENBSD_5_9, HEAD Changes since 1.29: +69 -71 lines
UTF-8 support: In a UTF-8 locale, properly align columns in the
presence of zero-width and double-width characters and replace
non-printable codepoints and invalid bytes with ASCII question
marks. No change in the C/POSIX locale.
As a side effect, get rid of all pointer to pointer variables
and simplify some of the code.
Partially based on ideas from tedu@.
Feedback and OK czarkoff@, OK tedu@.
|
/* $OpenBSD: rs.c,v 1.30 2015/12/03 12:23:15 schwarze Exp $ */
/*-
* Copyright (c) 1993
* The Regents of the University of California. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* rs - reshape a data array
* Author: John Kunze, Office of Comp. Affairs, UCB
* BEWARE: lots of unfinished edges
*/
#include <ctype.h>
#include <err.h>
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
struct entry {
int w; /* Display width. */
char *s; /* Multibyte string. */
};
long flags;
#define TRANSPOSE 000001
#define MTRANSPOSE 000002
#define ONEPERLINE 000004
#define ONEISEPONLY 000010
#define ONEOSEPONLY 000020
#define NOTRIMENDCOL 000040
#define SQUEEZE 000100
#define SHAPEONLY 000200
#define DETAILSHAPE 000400
#define RIGHTADJUST 001000
#define NULLPAD 002000
#define RECYCLE 004000
#define SKIPPRINT 010000
#define ONEPERCHAR 0100000
#define NOARGS 0200000
short *colwidths;
int nelem;
struct entry *elem;
struct entry *endelem;
char *curline;
int allocsize = BUFSIZ;
int irows, icols;
int orows, ocols;
int maxwidth;
int skip;
int propgutter;
char isep = ' ', osep = ' ';
int owidth = 80, gutter = 2;
int mbsavis(char **, const char *);
void usage(void);
void getargs(int, char *[]);
void getfile(void);
int get_line(void);
struct entry *getptrs(struct entry *);
void prepfile(void);
void prints(struct entry *, int);
void putfile(void);
#define INCR(ep) do { \
if (++ep >= endelem) \
ep = getptrs(ep); \
} while(0)
int
main(int argc, char *argv[])
{
setlocale(LC_CTYPE, "");
if (pledge("stdio", NULL) == -1)
err(1, "pledge");
getargs(argc, argv);
getfile();
if (flags & SHAPEONLY) {
printf("%d %d\n", irows, icols);
exit(0);
}
prepfile();
putfile();
exit(0);
}
void
getfile(void)
{
const char delim[2] = { isep, '\0' };
char *p;
struct entry *ep;
int multisep = (flags & ONEISEPONLY ? 0 : 1);
int nullpad = flags & NULLPAD;
struct entry *padto;
curline = NULL;
while (skip--) {
if (get_line() == EOF)
return;
if (flags & SKIPPRINT)
puts(curline);
}
if (get_line() == EOF)
return;
if (flags & NOARGS && strlen(curline) < (size_t)owidth)
flags |= ONEPERLINE;
if (flags & ONEPERLINE)
icols = 1;
else /* count cols on first line */
for (p = curline; *p != '\0'; p++) {
if (*p == isep && multisep)
continue;
icols++;
while (*p && *p != isep)
p++;
}
ep = getptrs(NULL);
p = curline;
do {
if (flags & ONEPERLINE) {
ep->w = mbsavis(&ep->s, curline);
if (maxwidth < ep->w)
maxwidth = ep->w;
INCR(ep); /* prepare for next entry */
irows++;
continue;
}
p = curline;
while (p != NULL && *p != '\0') {
if (*p == isep) {
p++;
if (multisep)
continue;
ep->s = ""; /* empty column */
ep->w = 0;
} else
ep->w = mbsavis(&ep->s, strsep(&p, delim));
if (maxwidth < ep->w)
maxwidth = ep->w;
INCR(ep); /* prepare for next entry */
}
irows++; /* update row count */
if (nullpad) { /* pad missing entries */
padto = elem + irows * icols;
while (ep < padto) {
ep->s = "";
ep->w = 0;
INCR(ep);
}
}
} while (get_line() != EOF);
nelem = ep - elem;
}
void
putfile(void)
{
struct entry *ep;
int i, j, n;
ep = elem;
if (flags & TRANSPOSE) {
for (i = 0; i < orows; i++) {
for (j = i; j < nelem; j += orows)
prints(ep + j, (j - i) / orows);
putchar('\n');
}
} else {
for (n = 0, i = 0; i < orows && n < nelem; i++) {
for (j = 0; j < ocols; j++) {
if (n++ >= nelem)
break;
prints(ep++, j);
}
putchar('\n');
}
}
}
void
prints(struct entry *ep, int col)
{
int n;
n = (flags & ONEOSEPONLY ? 1 : colwidths[col] - ep->w);
if (flags & RIGHTADJUST)
while (n-- > 0)
putchar(osep);
fputs(ep->s, stdout);
while (n-- > 0)
putchar(osep);
}
void
usage(void)
{
extern char *__progname;
fprintf(stderr,
"usage: %s [-CcSs[x]] [-GgKkw N] [-EeHhjmnTtyz] [rows [cols]]\n",
__progname);
exit(1);
}
void
prepfile(void)
{
struct entry *ep;
int i;
int j;
struct entry *lp;
int colw;
int max = 0;
int n;
if (!nelem)
exit(0);
gutter += maxwidth * propgutter / 100.0;
colw = maxwidth + gutter;
if (flags & MTRANSPOSE) {
orows = icols;
ocols = irows;
}
else if (orows == 0 && ocols == 0) { /* decide rows and cols */
ocols = owidth / colw;
if (ocols == 0) {
warnx("Display width %d is less than column width %d",
owidth, colw);
ocols = 1;
}
if (ocols > nelem)
ocols = nelem;
orows = nelem / ocols + (nelem % ocols ? 1 : 0);
}
else if (orows == 0) /* decide on rows */
orows = nelem / ocols + (nelem % ocols ? 1 : 0);
else if (ocols == 0) /* decide on cols */
ocols = nelem / orows + (nelem % orows ? 1 : 0);
while ((lp = elem + orows * ocols) > endelem)
(void)getptrs(NULL);
if (flags & RECYCLE) {
for (ep = elem + nelem; ep < lp; ep++)
memcpy(ep, ep - nelem, sizeof(*ep));
nelem = lp - elem;
}
if (!(colwidths = calloc(ocols, sizeof(short))))
errx(1, "malloc: No gutter space");
if (flags & SQUEEZE) {
for (ep = elem, i = 0; i < ocols; i++) {
max = 0;
if (flags & TRANSPOSE) {
for (j = 0; j < orows; j++, ep++)
if (ep->w > max)
max = ep->w;
} else {
for (j = i; j < nelem; j += ocols)
if (ep[j].w > max)
max = ep[j].w;
}
colwidths[i] = max + gutter;
}
} else {
for (i = 0; i < ocols; i++)
colwidths[i] = colw;
}
if (!(flags & NOTRIMENDCOL)) {
if (flags & RIGHTADJUST)
colwidths[0] -= gutter;
else
colwidths[ocols - 1] = 0;
}
n = orows * ocols;
if (n > nelem && (flags & RECYCLE))
nelem = n;
}
int
get_line(void)
{
static size_t cursz;
static ssize_t curlen;
if (irows > 0 && flags & DETAILSHAPE)
printf(" %zd line %d\n", curlen, irows);
if ((curlen = getline(&curline, &cursz, stdin)) == EOF) {
if (ferror(stdin))
err(1, NULL);
return EOF;
}
if (curlen > 0 && curline[curlen - 1] == '\n')
curline[--curlen] = '\0';
return 0;
}
struct entry *
getptrs(struct entry *sp)
{
struct entry *p;
int newsize;
newsize = allocsize * 2;
p = reallocarray(elem, newsize, sizeof(*p));
if (p == NULL)
err(1, "no memory");
allocsize = newsize;
sp = sp == NULL ? p : p + (sp - elem);
elem = p;
endelem = elem + allocsize;
return(sp);
}
void
getargs(int ac, char *av[])
{
int ch;
const char *errstr;
if (ac == 1)
flags |= NOARGS | TRANSPOSE;
while ((ch = getopt(ac, av, "c::C::s::S::k:K:g:G:w:tTeEnyjhHmz")) != -1) {
switch (ch) {
case 'T':
flags |= MTRANSPOSE;
/* FALLTHROUGH */
case 't':
flags |= TRANSPOSE;
break;
case 'c': /* input col. separator */
flags |= ONEISEPONLY;
/* FALLTHROUGH */
case 's': /* one or more allowed */
if (optarg == NULL)
isep = '\t'; /* default is ^I */
else if (optarg[1] != '\0')
usage(); /* single char only */
else
isep = *optarg;
break;
case 'C':
flags |= ONEOSEPONLY;
/* FALLTHROUGH */
case 'S':
if (optarg == NULL)
osep = '\t'; /* default is ^I */
else if (optarg[1] != '\0')
usage(); /* single char only */
else
osep = *optarg;
break;
case 'w': /* window width, default 80 */
owidth = strtonum(optarg, 1, INT_MAX, &errstr);
if (errstr) {
warnx("width %s", errstr);
usage();
}
break;
case 'K': /* skip N lines */
flags |= SKIPPRINT;
/* FALLTHROUGH */
case 'k': /* skip, do not print */
skip = strtonum(optarg, 0, INT_MAX, &errstr);
if (errstr) {
warnx("skip value %s", errstr);
usage();
}
if (skip == 0)
skip = 1;
break;
case 'm':
flags |= NOTRIMENDCOL;
break;
case 'g': /* gutter width */
gutter = strtonum(optarg, 0, INT_MAX, &errstr);
if (errstr) {
warnx("gutter width %s", errstr);
usage();
}
break;
case 'G':
propgutter = strtonum(optarg, 0, INT_MAX, &errstr);
if (errstr) {
warnx("gutter proportion %s", errstr);
usage();
}
break;
case 'e': /* each line is an entry */
flags |= ONEPERLINE;
break;
case 'E':
flags |= ONEPERCHAR;
break;
case 'j': /* right adjust */
flags |= RIGHTADJUST;
break;
case 'n': /* null padding for missing values */
flags |= NULLPAD;
break;
case 'y':
flags |= RECYCLE;
break;
case 'H': /* print shape only */
flags |= DETAILSHAPE;
/* FALLTHROUGH */
case 'h':
flags |= SHAPEONLY;
break;
case 'z': /* squeeze col width */
flags |= SQUEEZE;
break;
default:
usage();
}
}
ac -= optind;
av += optind;
switch (ac) {
case 2:
ocols = strtonum(av[1], 0, INT_MAX, &errstr);
if (errstr) {
warnx("columns value %s", errstr);
usage();
}
/* FALLTHROUGH */
case 1:
orows = strtonum(av[0], 0, INT_MAX, &errstr);
if (errstr) {
warnx("columns value %s", errstr);
usage();
}
/* FALLTHROUGH */
case 0:
break;
default:
usage();
}
}