Annotation of src/usr.bin/less/line.c, Revision 1.35
1.1 etheisen 1: /*
1.12 shadchin 2: * Copyright (C) 1984-2012 Mark Nudelman
1.14 nicm 3: * Modified for use with illumos by Garrett D'Amore.
4: * Copyright 2014 Garrett D'Amore <garrett@damore.org>
1.1 etheisen 5: *
1.5 millert 6: * You may distribute under the terms of either the GNU General Public
7: * License or the Less License, as specified in the README file.
1.1 etheisen 8: *
1.12 shadchin 9: * For more information, see the README file.
1.13 nicm 10: */
1.1 etheisen 11:
12: /*
13: * Routines to manipulate the "line buffer".
14: * The line buffer holds a line of output as it is being built
15: * in preparation for output to the screen.
16: */
17:
1.23 schwarze 18: #include <wchar.h>
1.28 schwarze 19: #include <wctype.h>
1.23 schwarze 20:
1.19 mmcc 21: #include "charset.h"
1.1 etheisen 22: #include "less.h"
23:
1.10 shadchin 24: static char *linebuf = NULL; /* Buffer which holds the current output line */
1.5 millert 25: static char *attr = NULL; /* Extension of linebuf to hold attributes */
1.13 nicm 26: int size_linebuf = 0; /* Size of line buffer (and attr buffer) */
1.5 millert 27:
1.10 shadchin 28: static int cshift; /* Current left-shift of output line buffer */
1.13 nicm 29: int hshift; /* Desired left-shift of output line buffer */
30: int tabstops[TABSTOP_MAX] = { 0 }; /* Custom tabstops */
31: int ntabstops = 1; /* Number of tabstops */
32: int tabdefault = 8; /* Default repeated tabstops */
33: off_t highest_hilite; /* Pos of last hilite in file found so far */
1.1 etheisen 34:
1.30 schwarze 35: static int curr; /* Total number of bytes in linebuf */
36: static int column; /* Display columns needed to show linebuf */
1.1 etheisen 37: static int overstrike; /* Next char should overstrike previous char */
38: static int is_null_line; /* There is no current line */
1.30 schwarze 39: static int lmargin; /* Index in linebuf of start of content */
1.1 etheisen 40: static char pendc;
1.13 nicm 41: static off_t pendpos;
1.5 millert 42: static char *end_ansi_chars;
1.10 shadchin 43: static char *mid_ansi_chars;
1.1 etheisen 44:
1.13 nicm 45: static int attr_swidth(int);
46: static int attr_ewidth(int);
47: static int do_append(LWCHAR, char *, off_t);
1.1 etheisen 48:
49: extern int bs_mode;
50: extern int linenums;
51: extern int ctldisp;
52: extern int twiddle;
53: extern int binattr;
1.5 millert 54: extern int status_col;
1.1 etheisen 55: extern int auto_wrap, ignaw;
56: extern int bo_s_width, bo_e_width;
57: extern int ul_s_width, ul_e_width;
58: extern int bl_s_width, bl_e_width;
59: extern int so_s_width, so_e_width;
60: extern int sc_width, sc_height;
1.5 millert 61: extern int utf_mode;
1.13 nicm 62: extern off_t start_attnpos;
63: extern off_t end_attnpos;
1.5 millert 64:
1.10 shadchin 65: static char mbc_buf[MAX_UTF_CHAR_LEN];
66: static int mbc_buf_index = 0;
1.13 nicm 67: static off_t mbc_pos;
1.10 shadchin 68:
1.5 millert 69: /*
70: * Initialize from environment variables.
71: */
1.13 nicm 72: void
73: init_line(void)
1.5 millert 74: {
75: end_ansi_chars = lgetenv("LESSANSIENDCHARS");
76: if (end_ansi_chars == NULL || *end_ansi_chars == '\0')
77: end_ansi_chars = "m";
1.10 shadchin 78:
79: mid_ansi_chars = lgetenv("LESSANSIMIDCHARS");
80: if (mid_ansi_chars == NULL || *mid_ansi_chars == '\0')
81: mid_ansi_chars = "0123456789;[?!\"'#%()*+ ";
82:
1.13 nicm 83: linebuf = ecalloc(LINEBUF_SIZE, sizeof (char));
84: attr = ecalloc(LINEBUF_SIZE, sizeof (char));
1.5 millert 85: size_linebuf = LINEBUF_SIZE;
86: }
87:
88: /*
89: * Expand the line buffer.
90: */
1.13 nicm 91: static int
92: expand_linebuf(void)
1.5 millert 93: {
1.10 shadchin 94: /* Double the size of the line buffer. */
1.7 millert 95: int new_size = size_linebuf * 2;
1.10 shadchin 96:
97: /* Just realloc to expand the buffer, if we can. */
1.22 deraadt 98: char *new_buf = recallocarray(linebuf, size_linebuf, new_size, 1);
1.35 ! tobias 99: if (new_buf != NULL) {
! 100: char *new_attr = recallocarray(attr, size_linebuf, new_size, 1);
! 101: linebuf = new_buf;
! 102: if (new_attr != NULL) {
! 103: attr = new_attr;
! 104: size_linebuf = new_size;
! 105: return (0);
! 106: }
1.5 millert 107: }
1.35 ! tobias 108: return (1);
1.5 millert 109: }
1.1 etheisen 110:
111: /*
1.10 shadchin 112: * Is a character ASCII?
113: */
1.25 schwarze 114: static int
1.13 nicm 115: is_ascii_char(LWCHAR ch)
1.10 shadchin 116: {
117: return (ch <= 0x7F);
118: }
119:
120: /*
1.1 etheisen 121: * Rewind the line buffer.
122: */
1.13 nicm 123: void
124: prewind(void)
1.1 etheisen 125: {
126: curr = 0;
127: column = 0;
1.10 shadchin 128: cshift = 0;
1.1 etheisen 129: overstrike = 0;
130: is_null_line = 0;
131: pendc = '\0';
1.5 millert 132: lmargin = 0;
133: if (status_col)
134: lmargin += 1;
1.1 etheisen 135: }
136:
137: /*
138: * Insert the line number (of the given position) into the line buffer.
139: */
1.13 nicm 140: void
141: plinenum(off_t pos)
1.1 etheisen 142: {
1.16 mmcc 143: off_t linenum = 0;
1.13 nicm 144: int i;
1.5 millert 145:
1.13 nicm 146: if (linenums == OPT_ONPLUS) {
1.5 millert 147: /*
148: * Get the line number and put it in the current line.
149: * {{ Note: since find_linenum calls forw_raw_line,
1.13 nicm 150: * it may seek in the input file, requiring the caller
1.5 millert 151: * of plinenum to re-seek if necessary. }}
152: * {{ Since forw_raw_line modifies linebuf, we must
153: * do this first, before storing anything in linebuf. }}
154: */
155: linenum = find_linenum(pos);
156: }
1.1 etheisen 157:
158: /*
1.5 millert 159: * Display a status column if the -J option is set.
1.1 etheisen 160: */
1.13 nicm 161: if (status_col) {
1.5 millert 162: linebuf[curr] = ' ';
1.13 nicm 163: if (start_attnpos != -1 &&
1.5 millert 164: pos >= start_attnpos && pos < end_attnpos)
1.10 shadchin 165: attr[curr] = AT_NORMAL|AT_HILITE;
1.5 millert 166: else
1.10 shadchin 167: attr[curr] = AT_NORMAL;
1.5 millert 168: curr++;
169: column++;
170: }
1.1 etheisen 171: /*
1.5 millert 172: * Display the line number at the start of each line
173: * if the -N option is set.
1.1 etheisen 174: */
1.13 nicm 175: if (linenums == OPT_ONPLUS) {
1.18 mmcc 176: char buf[23];
1.5 millert 177: int n;
1.1 etheisen 178:
1.17 mmcc 179: postoa(linenum, buf, sizeof(buf));
1.5 millert 180: n = strlen(buf);
181: if (n < MIN_LINENUM_WIDTH)
182: n = MIN_LINENUM_WIDTH;
1.6 millert 183: snprintf(linebuf+curr, size_linebuf-curr, "%*s ", n, buf);
1.21 deraadt 184: n++; /* One space after the line number. */
1.5 millert 185: for (i = 0; i < n; i++)
186: attr[curr+i] = AT_NORMAL;
187: curr += n;
188: column += n;
189: lmargin += n;
190: }
1.1 etheisen 191:
192: /*
1.5 millert 193: * Append enough spaces to bring us to the lmargin.
1.1 etheisen 194: */
1.13 nicm 195: while (column < lmargin) {
1.1 etheisen 196: linebuf[curr] = ' ';
197: attr[curr++] = AT_NORMAL;
198: column++;
1.5 millert 199: }
200: }
201:
202: /*
1.10 shadchin 203: * Shift the input line left.
1.30 schwarze 204: * Starting at lmargin, some bytes are discarded from the linebuf,
205: * until the number of display columns needed to show these bytes
206: * would exceed the argument.
1.5 millert 207: */
1.13 nicm 208: static void
209: pshift(int shift)
1.10 shadchin 210: {
1.30 schwarze 211: int shifted = 0; /* Number of display columns already discarded. */
212: int from; /* Index in linebuf of the current character. */
213: int to; /* Index in linebuf to move this character to. */
214: int len; /* Number of bytes in this character. */
215: int width = 0; /* Display columns needed for this character. */
216: int prev_attr; /* Attributes of the preceding character. */
217: int next_attr; /* Attributes of the following character. */
218: unsigned char c; /* First byte of current character. */
1.10 shadchin 219:
220: if (shift > column - lmargin)
221: shift = column - lmargin;
222: if (shift > curr - lmargin)
223: shift = curr - lmargin;
1.5 millert 224:
1.10 shadchin 225: to = from = lmargin;
1.5 millert 226: /*
1.10 shadchin 227: * We keep on going when shifted == shift
228: * to get all combining chars.
1.5 millert 229: */
1.13 nicm 230: while (shifted <= shift && from < curr) {
1.10 shadchin 231: c = linebuf[from];
1.24 schwarze 232: if (ctldisp == OPT_ONPLUS && c == ESC) {
1.10 shadchin 233: /* Keep cumulative effect. */
234: linebuf[to] = c;
235: attr[to++] = attr[from++];
1.13 nicm 236: while (from < curr && linebuf[from]) {
1.10 shadchin 237: linebuf[to] = linebuf[from];
238: attr[to++] = attr[from];
239: if (!is_ansi_middle(linebuf[from++]))
240: break;
1.13 nicm 241: }
1.10 shadchin 242: continue;
243: }
1.31 schwarze 244: if (utf_mode && !isascii(c)) {
1.30 schwarze 245: wchar_t ch;
246: /*
247: * Before this point, UTF-8 validity was already
248: * checked, but for additional safety, treat
249: * invalid bytes as single-width characters
250: * if they ever make it here. Similarly, treat
251: * non-printable characters as width 1.
252: */
253: len = mbtowc(&ch, linebuf + from, curr - from);
254: if (len == -1)
255: len = width = 1;
256: else if ((width = wcwidth(ch)) == -1)
257: width = 1;
1.13 nicm 258: } else {
1.10 shadchin 259: len = 1;
260: if (c == '\b')
261: /* XXX - Incorrect if several '\b' in a row. */
1.30 schwarze 262: width = width > 0 ? -width : -1;
263: else
264: width = iscntrl(c) ? 0 : 1;
1.10 shadchin 265: }
266:
267: if (width == 2 && shift - shifted == 1) {
268: /*
1.30 schwarze 269: * Move the first half of a double-width character
270: * off screen. Print a space instead of the second
271: * half. This should never happen when called
272: * by pshift_all().
1.10 shadchin 273: */
1.30 schwarze 274: attr[to] = attr[from];
275: linebuf[to++] = ' ';
1.10 shadchin 276: from += len;
277: shifted++;
1.30 schwarze 278: break;
1.10 shadchin 279: }
280:
281: /* Adjust width for magic cookies. */
282: prev_attr = (to > 0) ? attr[to-1] : AT_NORMAL;
283: next_attr = (from + len < curr) ? attr[from + len] : prev_attr;
1.13 nicm 284: if (!is_at_equiv(attr[from], prev_attr) &&
285: !is_at_equiv(attr[from], next_attr)) {
1.10 shadchin 286: width += attr_swidth(attr[from]);
287: if (from + len < curr)
288: width += attr_ewidth(attr[from]);
1.13 nicm 289: if (is_at_equiv(prev_attr, next_attr)) {
1.10 shadchin 290: width += attr_ewidth(prev_attr);
291: if (from + len < curr)
292: width += attr_swidth(next_attr);
1.5 millert 293: }
294: }
295:
1.10 shadchin 296: if (shift - shifted < width)
297: break;
298: from += len;
299: shifted += width;
300: if (shifted < 0)
301: shifted = 0;
302: }
1.13 nicm 303: while (from < curr) {
1.10 shadchin 304: linebuf[to] = linebuf[from];
305: attr[to++] = attr[from++];
306: }
307: curr = to;
308: column -= shifted;
309: cshift += shifted;
1.5 millert 310: }
311:
312: /*
1.10 shadchin 313: *
1.5 millert 314: */
1.13 nicm 315: void
316: pshift_all(void)
1.5 millert 317: {
1.10 shadchin 318: pshift(column);
1.1 etheisen 319: }
320:
321: /*
322: * Return the printing width of the start (enter) sequence
323: * for a given character attribute.
324: */
1.13 nicm 325: static int
326: attr_swidth(int a)
1.1 etheisen 327: {
1.10 shadchin 328: int w = 0;
329:
330: a = apply_at_specials(a);
331:
332: if (a & AT_UNDERLINE)
333: w += ul_s_width;
334: if (a & AT_BOLD)
335: w += bo_s_width;
336: if (a & AT_BLINK)
337: w += bl_s_width;
338: if (a & AT_STANDOUT)
339: w += so_s_width;
340:
1.13 nicm 341: return (w);
1.1 etheisen 342: }
343:
344: /*
345: * Return the printing width of the end (exit) sequence
346: * for a given character attribute.
347: */
1.13 nicm 348: static int
349: attr_ewidth(int a)
1.1 etheisen 350: {
1.10 shadchin 351: int w = 0;
352:
353: a = apply_at_specials(a);
354:
355: if (a & AT_UNDERLINE)
356: w += ul_e_width;
357: if (a & AT_BOLD)
358: w += bo_e_width;
359: if (a & AT_BLINK)
360: w += bl_e_width;
361: if (a & AT_STANDOUT)
362: w += so_e_width;
363:
1.13 nicm 364: return (w);
1.1 etheisen 365: }
366:
367: /*
368: * Return the printing width of a given character and attribute,
369: * if the character were added to the current position in the line buffer.
370: * Adding a character with a given attribute may cause an enter or exit
371: * attribute sequence to be inserted, so this must be taken into account.
372: */
1.13 nicm 373: static int
1.23 schwarze 374: pwidth(wchar_t ch, int a, wchar_t prev_ch)
1.1 etheisen 375: {
1.10 shadchin 376: int w;
1.1 etheisen 377:
1.23 schwarze 378: /*
379: * In case of a backspace, back up by the width of the previous
380: * character. If that is non-printable (for example another
381: * backspace) or zero width (for example a combining accent),
382: * the terminal may actually back up to a character even further
383: * back, but we no longer know how wide that may have been.
384: * The best guess possible at this point is that it was
385: * hopefully width one.
386: */
387: if (ch == L'\b') {
388: w = wcwidth(prev_ch);
389: if (w <= 0)
390: w = 1;
391: return (-w);
392: }
393:
394: w = wcwidth(ch);
395:
396: /*
397: * Non-printable characters can get here if the -r flag is in
398: * effect, and possibly in some other situations (XXX check that!).
399: * Treat them as zero width.
400: * That may not always match their actual behaviour,
401: * but there is no reasonable way to be more exact.
402: */
403: if (w == -1)
404: w = 0;
1.13 nicm 405:
1.23 schwarze 406: /*
407: * Combining accents take up no space.
408: * Some terminals, upon failure to compose them with the
409: * characters that precede them, will actually take up one column
410: * for the combining accent; there isn't much we could do short
411: * of testing the (complex) composition process ourselves and
412: * printing a binary representation when it fails.
413: */
414: if (w == 0)
415: return (0);
1.1 etheisen 416:
417: /*
1.10 shadchin 418: * Other characters take one or two columns,
1.1 etheisen 419: * plus the width of any attribute enter/exit sequence.
420: */
1.10 shadchin 421: if (curr > 0 && !is_at_equiv(attr[curr-1], a))
1.1 etheisen 422: w += attr_ewidth(attr[curr-1]);
1.10 shadchin 423: if ((apply_at_specials(a) != AT_NORMAL) &&
424: (curr == 0 || !is_at_equiv(attr[curr-1], a)))
1.1 etheisen 425: w += attr_swidth(a);
426: return (w);
427: }
428:
429: /*
1.10 shadchin 430: * Delete to the previous base character in the line buffer.
431: * Return 1 if one is found.
1.1 etheisen 432: */
1.13 nicm 433: static int
434: backc(void)
1.1 etheisen 435: {
1.27 schwarze 436: wchar_t ch, prev_ch;
1.34 kn 437: int len, width;
1.27 schwarze 438:
1.32 schwarze 439: if ((len = mbtowc_left(&ch, linebuf + curr, curr)) <= 0)
1.27 schwarze 440: return (0);
1.32 schwarze 441: curr -= len;
1.10 shadchin 442:
443: /* This assumes that there is no '\b' in linebuf. */
1.32 schwarze 444: while (curr >= lmargin && column > lmargin &&
445: !(attr[curr] & (AT_ANSI|AT_BINARY))) {
446: if ((len = mbtowc_left(&prev_ch, linebuf + curr, curr)) <= 0)
1.27 schwarze 447: prev_ch = L'\0';
1.10 shadchin 448: width = pwidth(ch, attr[curr], prev_ch);
449: column -= width;
450: if (width > 0)
1.13 nicm 451: return (1);
1.32 schwarze 452: curr -= len;
1.27 schwarze 453: if (prev_ch == L'\0')
454: return (0);
1.10 shadchin 455: ch = prev_ch;
456: }
1.13 nicm 457: return (0);
1.1 etheisen 458: }
459:
460: /*
1.25 schwarze 461: * Is a character the end of an ANSI escape sequence?
1.5 millert 462: */
1.13 nicm 463: static int
464: is_ansi_end(LWCHAR ch)
1.10 shadchin 465: {
466: if (!is_ascii_char(ch))
467: return (0);
1.13 nicm 468: return (strchr(end_ansi_chars, (char)ch) != NULL);
1.10 shadchin 469: }
470:
471: /*
472: *
473: */
1.13 nicm 474: int
475: is_ansi_middle(LWCHAR ch)
1.5 millert 476: {
1.10 shadchin 477: if (!is_ascii_char(ch))
478: return (0);
479: if (is_ansi_end(ch))
480: return (0);
1.13 nicm 481: return (strchr(mid_ansi_chars, (char)ch) != NULL);
1.5 millert 482: }
483:
484: /*
1.1 etheisen 485: * Append a character and attribute to the line buffer.
486: */
1.13 nicm 487: static int
488: store_char(LWCHAR ch, char a, char *rep, off_t pos)
1.1 etheisen 489: {
1.25 schwarze 490: int i;
1.10 shadchin 491: int w;
492: int replen;
493: char cs;
1.13 nicm 494: int matches;
1.10 shadchin 495:
1.13 nicm 496: if (is_hilited(pos, pos+1, 0, &matches)) {
497: /*
498: * This character should be highlighted.
499: * Override the attribute passed in.
500: */
501: if (a != AT_ANSI) {
502: if (highest_hilite != -1 && pos > highest_hilite)
503: highest_hilite = pos;
504: a |= AT_HILITE;
1.10 shadchin 505: }
1.5 millert 506: }
1.10 shadchin 507:
1.25 schwarze 508: w = -1;
509: if (ctldisp == OPT_ONPLUS) {
510: /*
511: * Set i to the beginning of an ANSI escape sequence
512: * that was begun and not yet ended, or to -1 otherwise.
513: */
514: for (i = curr - 1; i >= 0; i--) {
515: if (linebuf[i] == ESC)
516: break;
517: if (!is_ansi_middle(linebuf[i]))
518: i = 0;
519: }
520: if (i >= 0 && !is_ansi_end(ch) && !is_ansi_middle(ch)) {
1.10 shadchin 521: /* Remove whole unrecognized sequence. */
1.25 schwarze 522: curr = i;
1.13 nicm 523: return (0);
1.10 shadchin 524: }
1.25 schwarze 525: if (i >= 0 || ch == ESC) {
526: a = AT_ANSI; /* Will force re-AT_'ing around it. */
527: w = 0;
528: }
529: }
530: if (w == -1) {
531: wchar_t prev_ch;
1.32 schwarze 532: if (mbtowc_left(&prev_ch, linebuf + curr, curr) <= 0)
533: prev_ch = L' ';
1.10 shadchin 534: w = pwidth(ch, a, prev_ch);
535: }
536:
1.5 millert 537: if (ctldisp != OPT_ON && column + w + attr_ewidth(a) > sc_width)
1.1 etheisen 538: /*
539: * Won't fit on screen.
540: */
541: return (1);
542:
1.13 nicm 543: if (rep == NULL) {
544: cs = (char)ch;
1.10 shadchin 545: rep = &cs;
546: replen = 1;
1.13 nicm 547: } else {
1.10 shadchin 548: replen = utf_len(rep[0]);
549: }
1.13 nicm 550: if (curr + replen >= size_linebuf-6) {
1.1 etheisen 551: /*
552: * Won't fit in line buffer.
1.5 millert 553: * Try to expand it.
1.1 etheisen 554: */
1.5 millert 555: if (expand_linebuf())
556: return (1);
557: }
1.1 etheisen 558:
1.13 nicm 559: while (replen-- > 0) {
1.10 shadchin 560: linebuf[curr] = *rep++;
561: attr[curr] = a;
562: curr++;
1.1 etheisen 563: }
564: column += w;
565: return (0);
566: }
567:
568: /*
1.5 millert 569: * Append a tab to the line buffer.
570: * Store spaces to represent the tab.
571: */
1.13 nicm 572: static int
573: store_tab(int attr, off_t pos)
1.5 millert 574: {
575: int to_tab = column + cshift - lmargin;
576: int i;
577:
578: if (ntabstops < 2 || to_tab >= tabstops[ntabstops-1])
579: to_tab = tabdefault -
1.13 nicm 580: ((to_tab - tabstops[ntabstops-1]) % tabdefault);
581: else {
1.21 deraadt 582: for (i = ntabstops - 2; i >= 0; i--)
1.5 millert 583: if (to_tab >= tabstops[i])
584: break;
585: to_tab = tabstops[i+1] - to_tab;
586: }
587:
1.13 nicm 588: if (column + to_tab - 1 + pwidth(' ', attr, 0) +
589: attr_ewidth(attr) > sc_width)
590: return (1);
1.10 shadchin 591:
1.5 millert 592: do {
1.26 schwarze 593: if (store_char(' ', attr, " ", pos))
594: return (1);
1.5 millert 595: } while (--to_tab > 0);
1.13 nicm 596: return (0);
1.5 millert 597: }
598:
1.13 nicm 599: static int
600: store_prchar(char c, off_t pos)
1.10 shadchin 601: {
602: char *s;
603:
604: /*
605: * Convert to printable representation.
606: */
607: s = prchar(c);
608:
609: /*
610: * Make sure we can get the entire representation
611: * of the character on this line.
612: */
1.13 nicm 613: if (column + (int)strlen(s) - 1 +
614: pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
615: return (1);
1.10 shadchin 616:
1.13 nicm 617: for (; *s != 0; s++) {
1.26 schwarze 618: if (store_char(*s, AT_BINARY, NULL, pos))
619: return (1);
1.13 nicm 620: }
621: return (0);
1.10 shadchin 622: }
623:
1.13 nicm 624: static int
625: flush_mbc_buf(off_t pos)
1.10 shadchin 626: {
627: int i;
628:
1.26 schwarze 629: for (i = 0; i < mbc_buf_index; i++) {
1.10 shadchin 630: if (store_prchar(mbc_buf[i], pos))
1.13 nicm 631: return (mbc_buf_index - i);
1.26 schwarze 632: }
1.13 nicm 633: return (0);
1.10 shadchin 634: }
635:
1.5 millert 636: /*
1.1 etheisen 637: * Append a character to the line buffer.
638: * Expand tabs into spaces, handle underlining, boldfacing, etc.
639: * Returns 0 if ok, 1 if couldn't fit in buffer.
640: */
1.13 nicm 641: int
642: pappend(char c, off_t pos)
1.1 etheisen 643: {
1.29 schwarze 644: mbstate_t mbs;
645: size_t sz;
646: wchar_t ch;
1.5 millert 647: int r;
648:
1.13 nicm 649: if (pendc) {
1.10 shadchin 650: if (do_append(pendc, NULL, pendpos))
1.1 etheisen 651: /*
652: * Oops. We've probably lost the char which
653: * was in pendc, since caller won't back up.
654: */
655: return (1);
656: pendc = '\0';
657: }
658:
1.13 nicm 659: if (c == '\r' && bs_mode == BS_SPECIAL) {
1.29 schwarze 660: if (mbc_buf_index > 0) /* utf_mode must be on. */ {
1.10 shadchin 661: /* Flush incomplete (truncated) sequence. */
662: r = flush_mbc_buf(mbc_pos);
1.29 schwarze 663: mbc_buf_index = 0;
1.10 shadchin 664: if (r)
1.29 schwarze 665: return (r + 1);
1.10 shadchin 666: }
667:
1.1 etheisen 668: /*
1.13 nicm 669: * Don't put the CR into the buffer until we see
1.1 etheisen 670: * the next char. If the next char is a newline,
671: * discard the CR.
672: */
673: pendc = c;
674: pendpos = pos;
675: return (0);
676: }
677:
1.13 nicm 678: if (!utf_mode) {
1.10 shadchin 679: r = do_append((LWCHAR) c, NULL, pos);
1.13 nicm 680: } else {
1.29 schwarze 681: for (;;) {
682: if (mbc_buf_index == 0)
1.10 shadchin 683: mbc_pos = pos;
1.29 schwarze 684: mbc_buf[mbc_buf_index++] = c;
685: memset(&mbs, 0, sizeof(mbs));
686: sz = mbrtowc(&ch, mbc_buf, mbc_buf_index, &mbs);
1.33 deraadt 687:
1.29 schwarze 688: /* Incomplete UTF-8: wait for more bytes. */
689: if (sz == (size_t)-2)
1.10 shadchin 690: return (0);
1.29 schwarze 691:
692: /* Valid UTF-8: use the character. */
693: if (sz != (size_t)-1) {
694: r = do_append(ch, mbc_buf, mbc_pos) ?
695: mbc_buf_index : 0;
696: break;
697: }
698:
699: /* Invalid start byte: encode it. */
700: if (mbc_buf_index == 1) {
701: r = store_prchar(c, pos);
702: break;
1.13 nicm 703: }
1.29 schwarze 704:
705: /*
706: * Invalid continuation.
707: * Encode the preceding bytes.
708: * If they fit, handle the interrupting byte.
709: * Otherwise, tell the caller to back up
710: * by the number of bytes that do not fit,
711: * plus one for the new byte.
712: */
713: mbc_buf_index--;
714: if ((r = flush_mbc_buf(mbc_pos) + 1) == 1)
715: mbc_buf_index = 0;
1.10 shadchin 716: else
1.29 schwarze 717: break;
1.13 nicm 718: }
1.10 shadchin 719: }
720:
1.5 millert 721: /*
722: * If we need to shift the line, do it.
723: * But wait until we get to at least the middle of the screen,
724: * so shifting it doesn't affect the chars we're currently
725: * pappending. (Bold & underline can get messed up otherwise.)
726: */
1.13 nicm 727: if (cshift < hshift && column > sc_width / 2) {
1.5 millert 728: linebuf[curr] = '\0';
729: pshift(hshift - cshift);
730: }
1.29 schwarze 731: mbc_buf_index = 0;
1.5 millert 732: return (r);
1.1 etheisen 733: }
734:
1.13 nicm 735: static int
736: do_append(LWCHAR ch, char *rep, off_t pos)
1.1 etheisen 737: {
1.28 schwarze 738: wchar_t prev_ch;
1.13 nicm 739: int a;
1.1 etheisen 740:
1.10 shadchin 741: a = AT_NORMAL;
1.1 etheisen 742:
1.13 nicm 743: if (ch == '\b') {
1.10 shadchin 744: if (bs_mode == BS_CONTROL)
1.5 millert 745: goto do_control_char;
1.10 shadchin 746:
747: /*
748: * A better test is needed here so we don't
749: * backspace over part of the printed
750: * representation of a binary character.
751: */
1.13 nicm 752: if (curr <= lmargin ||
753: column <= lmargin ||
754: (attr[curr - 1] & (AT_ANSI|AT_BINARY))) {
1.26 schwarze 755: if (store_prchar('\b', pos))
756: return (1);
1.13 nicm 757: } else if (bs_mode == BS_NORMAL) {
1.26 schwarze 758: if (store_char(ch, AT_NORMAL, NULL, pos))
759: return (1);
1.13 nicm 760: } else if (bs_mode == BS_SPECIAL) {
1.10 shadchin 761: overstrike = backc();
1.13 nicm 762: }
1.10 shadchin 763:
1.13 nicm 764: return (0);
1.10 shadchin 765: }
766:
1.13 nicm 767: if (overstrike > 0) {
1.1 etheisen 768: /*
769: * Overstrike the character at the current position
1.13 nicm 770: * in the line buffer. This will cause either
771: * underline (if a "_" is overstruck),
1.1 etheisen 772: * bold (if an identical character is overstruck),
773: * or just deletion of the character in the buffer.
774: */
1.10 shadchin 775: overstrike = utf_mode ? -1 : 0;
776: /* To be correct, this must be a base character. */
1.28 schwarze 777: if (mbtowc(&prev_ch, linebuf + curr, MB_CUR_MAX) == -1) {
778: (void)mbtowc(NULL, NULL, MB_CUR_MAX);
779: prev_ch = L'\0';
780: }
1.10 shadchin 781: a = attr[curr];
1.13 nicm 782: if (ch == prev_ch) {
1.5 millert 783: /*
784: * Overstriking a char with itself means make it bold.
785: * But overstriking an underscore with itself is
786: * ambiguous. It could mean make it bold, or
787: * it could mean make it underlined.
788: * Use the previous overstrike to resolve it.
789: */
1.13 nicm 790: if (ch == '_') {
1.10 shadchin 791: if ((a & (AT_BOLD|AT_UNDERLINE)) != AT_NORMAL)
792: a |= (AT_BOLD|AT_UNDERLINE);
1.20 natano 793: else if (curr > 0 && attr[curr - 1] & AT_UNDERLINE)
794: a |= AT_UNDERLINE;
795: else if (curr > 0 && attr[curr - 1] & AT_BOLD)
796: a |= AT_BOLD;
1.10 shadchin 797: else
1.20 natano 798: a |= AT_INDET;
1.13 nicm 799: } else {
1.10 shadchin 800: a |= AT_BOLD;
1.13 nicm 801: }
1.28 schwarze 802: } else if (ch == '_' && prev_ch != L'\0') {
1.10 shadchin 803: a |= AT_UNDERLINE;
804: ch = prev_ch;
805: rep = linebuf + curr;
1.13 nicm 806: } else if (prev_ch == '_') {
1.10 shadchin 807: a |= AT_UNDERLINE;
808: }
809: /* Else we replace prev_ch, but we keep its attributes. */
1.13 nicm 810: } else if (overstrike < 0) {
1.28 schwarze 811: if (wcwidth(ch) == 0) {
1.10 shadchin 812: /* Continuation of the same overstrike. */
1.20 natano 813: if (curr > 0)
814: a = attr[curr - 1] & (AT_UNDERLINE | AT_BOLD);
815: else
816: a = AT_NORMAL;
817: } else
1.10 shadchin 818: overstrike = 0;
819: }
820:
1.13 nicm 821: if (ch == '\t') {
1.5 millert 822: /*
823: * Expand a tab into spaces.
824: */
1.13 nicm 825: switch (bs_mode) {
1.1 etheisen 826: case BS_CONTROL:
827: goto do_control_char;
1.5 millert 828: case BS_NORMAL:
1.1 etheisen 829: case BS_SPECIAL:
1.26 schwarze 830: if (store_tab(a, pos))
831: return (1);
1.1 etheisen 832: break;
833: }
1.28 schwarze 834: } else if ((!utf_mode || is_ascii_char(ch)) &&
835: !isprint((unsigned char)ch)) {
1.13 nicm 836: do_control_char:
837: if (ctldisp == OPT_ON ||
1.24 schwarze 838: (ctldisp == OPT_ONPLUS && ch == ESC)) {
1.1 etheisen 839: /*
840: * Output as a normal character.
841: */
1.26 schwarze 842: if (store_char(ch, AT_NORMAL, rep, pos))
843: return (1);
1.13 nicm 844: } else {
1.26 schwarze 845: if (store_prchar(ch, pos))
846: return (1);
1.10 shadchin 847: }
1.28 schwarze 848: } else if (utf_mode && ctldisp != OPT_ON && !iswprint(ch)) {
1.10 shadchin 849: char *s;
850:
851: s = prutfchar(ch);
1.1 etheisen 852:
1.13 nicm 853: if (column + (int)strlen(s) - 1 +
1.10 shadchin 854: pwidth(' ', binattr, 0) + attr_ewidth(binattr) > sc_width)
855: return (1);
1.1 etheisen 856:
1.26 schwarze 857: for (; *s != 0; s++) {
858: if (store_char(*s, AT_BINARY, NULL, pos))
859: return (1);
860: }
1.13 nicm 861: } else {
1.26 schwarze 862: if (store_char(ch, a, rep, pos))
863: return (1);
1.1 etheisen 864: }
1.13 nicm 865: return (0);
1.10 shadchin 866: }
867:
868: /*
869: *
870: */
1.13 nicm 871: int
872: pflushmbc(void)
1.10 shadchin 873: {
874: int r = 0;
1.1 etheisen 875:
1.29 schwarze 876: if (mbc_buf_index > 0) {
1.10 shadchin 877: /* Flush incomplete (truncated) sequence. */
878: r = flush_mbc_buf(mbc_pos);
1.29 schwarze 879: mbc_buf_index = 0;
1.10 shadchin 880: }
1.13 nicm 881: return (r);
1.1 etheisen 882: }
883:
884: /*
885: * Terminate the line in the line buffer.
886: */
1.13 nicm 887: void
888: pdone(int endline, int forw)
1.1 etheisen 889: {
1.20 natano 890: int i;
891:
1.10 shadchin 892: (void) pflushmbc();
893:
1.1 etheisen 894: if (pendc && (pendc != '\r' || !endline))
895: /*
896: * If we had a pending character, put it in the buffer.
897: * But discard a pending CR if we are at end of line
898: * (that is, discard the CR in a CR/LF sequence).
899: */
1.10 shadchin 900: (void) do_append(pendc, NULL, pendpos);
1.20 natano 901:
902: for (i = curr - 1; i >= 0; i--) {
903: if (attr[i] & AT_INDET) {
904: attr[i] &= ~AT_INDET;
905: if (i < curr - 1 && attr[i + 1] & AT_BOLD)
906: attr[i] |= AT_BOLD;
907: else
908: attr[i] |= AT_UNDERLINE;
909: }
910: }
1.1 etheisen 911:
912: /*
1.5 millert 913: * Make sure we've shifted the line, if we need to.
914: */
915: if (cshift < hshift)
916: pshift(hshift - cshift);
917:
1.13 nicm 918: if (ctldisp == OPT_ONPLUS && is_ansi_end('m')) {
1.10 shadchin 919: /* Switch to normal attribute at end of line. */
920: char *p = "\033[m";
1.13 nicm 921: for (; *p != '\0'; p++) {
1.10 shadchin 922: linebuf[curr] = *p;
923: attr[curr++] = AT_ANSI;
924: }
925: }
926:
1.5 millert 927: /*
1.1 etheisen 928: * Add a newline if necessary,
929: * and append a '\0' to the end of the line.
1.10 shadchin 930: * We output a newline if we're not at the right edge of the screen,
931: * or if the terminal doesn't auto wrap,
932: * or if this is really the end of the line AND the terminal ignores
933: * a newline at the right edge.
1.13 nicm 934: * (In the last case we don't want to output a newline if the terminal
1.10 shadchin 935: * doesn't ignore it since that would produce an extra blank line.
936: * But we do want to output a newline if the terminal ignores it in case
937: * the next line is blank. In that case the single newline output for
938: * that blank line would be ignored!)
1.1 etheisen 939: */
1.13 nicm 940: if (column < sc_width || !auto_wrap || (endline && ignaw) ||
941: ctldisp == OPT_ON) {
1.1 etheisen 942: linebuf[curr] = '\n';
943: attr[curr] = AT_NORMAL;
944: curr++;
1.13 nicm 945: } else if (ignaw && column >= sc_width && forw) {
1.10 shadchin 946: /*
947: * Terminals with "ignaw" don't wrap until they *really* need
948: * to, i.e. when the character *after* the last one to fit on a
949: * line is output. But they are too hard to deal with when they
950: * get in the state where a full screen width of characters
951: * have been output but the cursor is sitting on the right edge
952: * instead of at the start of the next line.
1.13 nicm 953: * So we nudge them into wrapping by outputting a space
954: * character plus a backspace. But do this only if moving
1.10 shadchin 955: * forward; if we're moving backward and drawing this line at
956: * the top of the screen, the space would overwrite the first
1.13 nicm 957: * char on the next line. We don't need to do this "nudge"
1.10 shadchin 958: * at the top of the screen anyway.
959: */
960: linebuf[curr] = ' ';
961: attr[curr++] = AT_NORMAL;
1.13 nicm 962: linebuf[curr] = '\b';
1.10 shadchin 963: attr[curr++] = AT_NORMAL;
1.1 etheisen 964: }
965: linebuf[curr] = '\0';
966: attr[curr] = AT_NORMAL;
1.10 shadchin 967: }
1.5 millert 968:
1.10 shadchin 969: /*
970: *
971: */
1.13 nicm 972: void
973: set_status_col(char c)
1.10 shadchin 974: {
975: linebuf[0] = c;
976: attr[0] = AT_NORMAL|AT_HILITE;
1.1 etheisen 977: }
978:
979: /*
980: * Get a character from the current line.
981: * Return the character as the function return value,
982: * and the character attribute in *ap.
983: */
1.13 nicm 984: int
985: gline(int i, int *ap)
1.1 etheisen 986: {
1.13 nicm 987: if (is_null_line) {
1.1 etheisen 988: /*
989: * If there is no current line, we pretend the line is
990: * either "~" or "", depending on the "twiddle" flag.
991: */
1.13 nicm 992: if (twiddle) {
993: if (i == 0) {
1.10 shadchin 994: *ap = AT_BOLD;
1.13 nicm 995: return ('~');
1.10 shadchin 996: }
997: --i;
998: }
999: /* Make sure we're back to AT_NORMAL before the '\n'. */
1000: *ap = AT_NORMAL;
1.13 nicm 1001: return (i ? '\0' : '\n');
1.1 etheisen 1002: }
1003:
1004: *ap = attr[i];
1.10 shadchin 1005: return (linebuf[i] & 0xFF);
1.1 etheisen 1006: }
1007:
1008: /*
1009: * Indicate that there is no current line.
1010: */
1.13 nicm 1011: void
1012: null_line(void)
1.1 etheisen 1013: {
1014: is_null_line = 1;
1.5 millert 1015: cshift = 0;
1.1 etheisen 1016: }
1017:
1018: /*
1019: * Analogous to forw_line(), but deals with "raw lines":
1020: * lines which are not split for screen width.
1021: * {{ This is supposed to be more efficient than forw_line(). }}
1022: */
1.13 nicm 1023: off_t
1024: forw_raw_line(off_t curr_pos, char **linep, int *line_lenp)
1025: {
1026: int n;
1027: int c;
1028: off_t new_pos;
1029:
1030: if (curr_pos == -1 || ch_seek(curr_pos) ||
1031: (c = ch_forw_get()) == EOI)
1032: return (-1);
1.1 etheisen 1033:
1.5 millert 1034: n = 0;
1.13 nicm 1035: for (;;) {
1.33 deraadt 1036: if (c == '\n' || c == EOI || abort_sigs()) {
1.1 etheisen 1037: new_pos = ch_tell();
1038: break;
1039: }
1.13 nicm 1040: if (n >= size_linebuf-1) {
1041: if (expand_linebuf()) {
1.5 millert 1042: /*
1043: * Overflowed the input buffer.
1044: * Pretend the line ended here.
1045: */
1046: new_pos = ch_tell() - 1;
1047: break;
1048: }
1.1 etheisen 1049: }
1.13 nicm 1050: linebuf[n++] = (char)c;
1.1 etheisen 1051: c = ch_forw_get();
1052: }
1.5 millert 1053: linebuf[n] = '\0';
1.1 etheisen 1054: if (linep != NULL)
1055: *linep = linebuf;
1.10 shadchin 1056: if (line_lenp != NULL)
1057: *line_lenp = n;
1.1 etheisen 1058: return (new_pos);
1059: }
1060:
1061: /*
1062: * Analogous to back_line(), but deals with "raw lines".
1063: * {{ This is supposed to be more efficient than back_line(). }}
1064: */
1.13 nicm 1065: off_t
1066: back_raw_line(off_t curr_pos, char **linep, int *line_lenp)
1067: {
1068: int n;
1069: int c;
1070: off_t new_pos;
1071:
1072: if (curr_pos == -1 || curr_pos <= ch_zero() || ch_seek(curr_pos - 1))
1073: return (-1);
1.1 etheisen 1074:
1.5 millert 1075: n = size_linebuf;
1076: linebuf[--n] = '\0';
1.13 nicm 1077: for (;;) {
1.1 etheisen 1078: c = ch_back_get();
1.33 deraadt 1079: if (c == '\n' || abort_sigs()) {
1.1 etheisen 1080: /*
1081: * This is the newline ending the previous line.
1082: * We have hit the beginning of the line.
1083: */
1084: new_pos = ch_tell() + 1;
1085: break;
1086: }
1.13 nicm 1087: if (c == EOI) {
1.1 etheisen 1088: /*
1089: * We have hit the beginning of the file.
1090: * This must be the first line in the file.
1091: * This must, of course, be the beginning of the line.
1092: */
1093: new_pos = ch_zero();
1094: break;
1095: }
1.13 nicm 1096: if (n <= 0) {
1.5 millert 1097: int old_size_linebuf = size_linebuf;
1.13 nicm 1098: if (expand_linebuf()) {
1.5 millert 1099: /*
1100: * Overflowed the input buffer.
1101: * Pretend the line ended here.
1102: */
1103: new_pos = ch_tell() + 1;
1104: break;
1105: }
1.1 etheisen 1106: /*
1.5 millert 1107: * Shift the data to the end of the new linebuf.
1.1 etheisen 1108: */
1.5 millert 1109: n = size_linebuf - old_size_linebuf;
1.8 millert 1110: memmove(linebuf + n, linebuf, old_size_linebuf);
1.1 etheisen 1111: }
1.5 millert 1112: linebuf[--n] = c;
1.1 etheisen 1113: }
1114: if (linep != NULL)
1.5 millert 1115: *linep = &linebuf[n];
1.10 shadchin 1116: if (line_lenp != NULL)
1117: *line_lenp = size_linebuf - 1 - n;
1.1 etheisen 1118: return (new_pos);
1119: }