Annotation of src/usr.bin/mandoc/term.c, Revision 1.125
1.125 ! schwarze 1: /* $OpenBSD: term.c,v 1.124 2017/06/04 22:43:50 schwarze Exp $ */
1.1 kristaps 2: /*
1.59 schwarze 3: * Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
1.119 schwarze 4: * Copyright (c) 2010-2017 Ingo Schwarze <schwarze@openbsd.org>
1.1 kristaps 5: *
6: * Permission to use, copy, modify, and distribute this software for any
1.2 schwarze 7: * purpose with or without fee is hereby granted, provided that the above
8: * copyright notice and this permission notice appear in all copies.
1.1 kristaps 9: *
1.106 schwarze 10: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES
1.2 schwarze 11: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
1.106 schwarze 12: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
1.2 schwarze 13: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
14: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
15: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
16: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
1.1 kristaps 17: */
1.20 schwarze 18: #include <sys/types.h>
19:
1.1 kristaps 20: #include <assert.h>
1.20 schwarze 21: #include <ctype.h>
1.1 kristaps 22: #include <stdio.h>
23: #include <stdlib.h>
24: #include <string.h>
25:
1.34 schwarze 26: #include "mandoc.h"
1.79 schwarze 27: #include "mandoc_aux.h"
1.16 schwarze 28: #include "out.h"
1.1 kristaps 29: #include "term.h"
1.16 schwarze 30: #include "main.h"
1.1 kristaps 31:
/* Prototypes of the helpers private to this file. */
static void	 adjbuf(struct termp *p, size_t);
static void	 bufferc(struct termp *, char);
static size_t	 cond_width(const struct termp *, int, int *);
static void	 encode(struct termp *, const char *, size_t);
static void	 encode1(struct termp *, int);
static void	 endline(struct termp *);
1.1 kristaps 38:
1.83 schwarze 39:
1.37 schwarze 40: void
41: term_free(struct termp *p)
1.1 kristaps 42: {
43:
1.91 schwarze 44: free(p->buf);
1.98 schwarze 45: free(p->fontq);
1.37 schwarze 46: free(p);
1.1 kristaps 47: }
48:
1.13 schwarze 49: void
1.83 schwarze 50: term_begin(struct termp *p, term_margin head,
1.106 schwarze 51: term_margin foot, const struct roff_meta *arg)
1.1 kristaps 52: {
53:
1.37 schwarze 54: p->headf = head;
55: p->footf = foot;
56: p->argf = arg;
57: (*p->begin)(p);
1.1 kristaps 58: }
59:
1.37 schwarze 60: void
61: term_end(struct termp *p)
1.1 kristaps 62: {
63:
1.37 schwarze 64: (*p->end)(p);
1.1 kristaps 65: }
66:
67: /*
1.82 schwarze 68: * Flush a chunk of text. By default, break the output line each time
69: * the right margin is reached, and continue output on the next line
70: * at the same offset as the chunk itself. By default, also break the
71: * output line at the end of the chunk.
1.27 schwarze 72: * The following flags may be specified:
1.1 kristaps 73: *
1.82 schwarze 74: * - TERMP_NOBREAK: Do not break the output line at the right margin,
75: * but only at the max right margin. Also, do not break the output
76: * line at the end of the chunk, such that the next call can pad to
77: * the next column. However, if less than p->trailspace blanks,
78: * which can be 0, 1, or 2, remain to the right margin, the line
79: * will be broken.
1.110 schwarze 80: * - TERMP_BRTRSP: Consider trailing whitespace significant
81: * when deciding whether the chunk fits or not.
1.82 schwarze 82: * - TERMP_BRIND: If the chunk does not fit and the output line has
83: * to be broken, start the next line at the right margin instead
84: * of at the offset. Used together with TERMP_NOBREAK for the tags
85: * in various kinds of tagged lists.
1.123 schwarze 86: * - TERMP_HANG: Do not break the output line at the right margin,
1.82 schwarze 87: * append the next chunk after it even if this one is too long.
88: * To be used together with TERMP_NOBREAK.
1.123 schwarze 89: * - TERMP_NOPAD: Start writing at the current position,
90: * do not pad with blank characters up to the offset.
1.1 kristaps 91: */
92: void
93: term_flushln(struct termp *p)
94: {
1.71 schwarze 95: size_t i; /* current input position in p->buf */
1.66 schwarze 96: int ntab; /* number of tabs to prepend */
1.19 schwarze 97: size_t vis; /* current visual position on output */
98: size_t vbl; /* number of blanks to prepend to output */
1.33 schwarze 99: size_t vend; /* end of word visual position on output */
1.19 schwarze 100: size_t bp; /* visual right border position */
1.51 schwarze 101: size_t dv; /* temporary for visual pos calculations */
1.71 schwarze 102: size_t j; /* temporary loop index for p->buf */
103: size_t jhy; /* last hyph before overflow w/r/t j */
1.42 schwarze 104: size_t maxvis; /* output position of visible boundary */
1.1 kristaps 105:
1.123 schwarze 106: vbl = (p->flags & TERMP_NOPAD) || p->offset < p->viscol ? 0 :
107: p->offset - p->viscol;
108: if (p->minbl && vbl < p->minbl)
109: vbl = p->minbl;
110: maxvis = p->rmargin > p->viscol + vbl ?
111: p->rmargin - p->viscol - vbl : 0;
112: bp = !(p->flags & TERMP_NOBREAK) ? maxvis :
113: p->maxrmargin > p->viscol + vbl ?
114: p->maxrmargin - p->viscol - vbl : 0;
1.53 schwarze 115: vis = vend = 0;
116: i = 0;
1.19 schwarze 117:
1.125 ! schwarze 118: while (i < p->lastcol) {
1.22 schwarze 119: /*
1.42 schwarze 120: * Handle literal tab characters: collapse all
121: * subsequent tabs into a single huge set of spaces.
1.30 schwarze 122: */
1.66 schwarze 123: ntab = 0;
1.125 ! schwarze 124: while (i < p->lastcol && p->buf[i] == '\t') {
1.120 schwarze 125: vend = term_tab_next(vis);
1.30 schwarze 126: vbl += vend - vis;
127: vis = vend;
1.66 schwarze 128: ntab++;
1.49 schwarze 129: i++;
1.30 schwarze 130: }
1.22 schwarze 131:
1.1 kristaps 132: /*
133: * Count up visible word characters. Control sequences
134: * (starting with the CSI) aren't counted. A space
135: * generates a non-printing word, which is valid (the
136: * space is printed according to regular spacing rules).
137: */
138:
1.125 ! schwarze 139: for (j = i, jhy = 0; j < p->lastcol; j++) {
1.69 schwarze 140: if (' ' == p->buf[j] || '\t' == p->buf[j])
1.1 kristaps 141: break;
1.42 schwarze 142:
1.117 krw 143: /* Back over the last printed character. */
1.42 schwarze 144: if (8 == p->buf[j]) {
145: assert(j);
146: vend -= (*p->width)(p, p->buf[j - 1]);
147: continue;
148: }
149:
150: /* Regular word. */
151: /* Break at the hyphen point if we overrun. */
1.83 schwarze 152: if (vend > vis && vend < bp &&
1.77 schwarze 153: (ASCII_HYPH == p->buf[j] ||
154: ASCII_BREAK == p->buf[j]))
1.42 schwarze 155: jhy = j;
156:
1.78 schwarze 157: /*
158: * Hyphenation now decided, put back a real
159: * hyphen such that we get the correct width.
160: */
161: if (ASCII_HYPH == p->buf[j])
162: p->buf[j] = '-';
163:
1.42 schwarze 164: vend += (*p->width)(p, p->buf[j]);
1.1 kristaps 165: }
166:
167: /*
1.5 schwarze 168: * Find out whether we would exceed the right margin.
1.33 schwarze 169: * If so, break to the next line.
1.5 schwarze 170: */
1.124 schwarze 171: if (vend > bp && 0 == jhy && vis > 0 &&
172: (p->flags & TERMP_BRNEVER) == 0) {
1.22 schwarze 173: vend -= vis;
1.124 schwarze 174: endline(p);
1.66 schwarze 175:
1.120 schwarze 176: /* Use pending tabs on the new line. */
177:
178: vbl = 0;
179: while (ntab--)
180: vbl = term_tab_next(vbl);
181:
182: /* Re-establish indentation. */
1.66 schwarze 183:
1.123 schwarze 184: if (p->flags & TERMP_BRIND)
1.120 schwarze 185: vbl += p->rmargin;
1.123 schwarze 186: else
1.120 schwarze 187: vbl += p->offset;
1.123 schwarze 188: maxvis = p->rmargin > vbl ? p->rmargin - vbl : 0;
189: bp = !(p->flags & TERMP_NOBREAK) ? maxvis :
190: p->maxrmargin > vbl ? p->maxrmargin - vbl : 0;
1.1 kristaps 191: }
1.30 schwarze 192:
1.33 schwarze 193: /* Write out the [remaining] word. */
1.125 ! schwarze 194: for ( ; i < p->lastcol; i++) {
1.25 schwarze 195: if (vend > bp && jhy > 0 && i > jhy)
1.30 schwarze 196: break;
197: if ('\t' == p->buf[i])
1.1 kristaps 198: break;
1.22 schwarze 199: if (' ' == p->buf[i]) {
1.46 schwarze 200: j = i;
1.125 ! schwarze 201: while (i < p->lastcol && ' ' == p->buf[i])
1.33 schwarze 202: i++;
1.71 schwarze 203: dv = (i - j) * (*p->width)(p, ' ');
1.51 schwarze 204: vbl += dv;
205: vend += dv;
1.22 schwarze 206: break;
207: }
1.33 schwarze 208: if (ASCII_NBRSP == p->buf[i]) {
1.42 schwarze 209: vbl += (*p->width)(p, ' ');
1.33 schwarze 210: continue;
211: }
1.77 schwarze 212: if (ASCII_BREAK == p->buf[i])
213: continue;
1.33 schwarze 214:
215: /*
216: * Now we definitely know there will be
217: * printable characters to output,
218: * so write preceding white space now.
219: */
220: if (vbl) {
1.37 schwarze 221: (*p->advance)(p, vbl);
1.33 schwarze 222: p->viscol += vbl;
223: vbl = 0;
1.61 schwarze 224: }
225:
226: (*p->letter)(p, p->buf[i]);
227: if (8 == p->buf[i])
228: p->viscol -= (*p->width)(p, p->buf[i-1]);
1.83 schwarze 229: else
1.42 schwarze 230: p->viscol += (*p->width)(p, p->buf[i]);
1.1 kristaps 231: }
1.22 schwarze 232: vis = vend;
1.1 kristaps 233: }
1.48 schwarze 234:
235: /*
236: * If there was trailing white space, it was not printed;
237: * so reset the cursor position accordingly.
238: */
1.95 schwarze 239: if (vis > vbl)
1.61 schwarze 240: vis -= vbl;
1.95 schwarze 241: else
242: vis = 0;
1.18 schwarze 243:
1.125 ! schwarze 244: p->col = p->lastcol = 0;
1.124 schwarze 245: p->minbl = p->trailspace;
1.123 schwarze 246: p->flags &= ~(TERMP_BACKAFTER | TERMP_BACKBEFORE | TERMP_NOPAD);
1.1 kristaps 247:
1.110 schwarze 248: /* Trailing whitespace is significant in some columns. */
249: if (vis && vbl && (TERMP_BRTRSP & p->flags))
250: vis += vbl;
1.1 kristaps 251:
1.61 schwarze 252: /* If the column was overrun, break the line. */
1.124 schwarze 253: if ((p->flags & TERMP_NOBREAK) == 0 ||
254: ((p->flags & TERMP_HANG) == 0 &&
255: vis + p->trailspace * (*p->width)(p, ' ') > maxvis))
256: endline(p);
257: }
258:
259: static void
260: endline(struct termp *p)
261: {
262: if ((p->flags & (TERMP_NEWMC | TERMP_ENDMC)) == TERMP_ENDMC) {
263: p->mc = NULL;
264: p->flags &= ~TERMP_ENDMC;
265: }
266: if (p->mc != NULL) {
267: if (p->viscol && p->maxrmargin >= p->viscol)
268: (*p->advance)(p, p->maxrmargin - p->viscol + 1);
269: p->flags |= TERMP_NOBUF | TERMP_NOSPACE;
270: term_word(p, p->mc);
271: p->flags &= ~(TERMP_NOBUF | TERMP_NEWMC);
272: }
273: p->viscol = 0;
274: p->minbl = 0;
275: (*p->endline)(p);
1.1 kristaps 276: }
277:
1.83 schwarze 278: /*
1.1 kristaps 279: * A newline only breaks an existing line; it won't assert vertical
280: * space. All data in the output buffer is flushed prior to the newline
281: * assertion.
282: */
283: void
284: term_newln(struct termp *p)
285: {
286:
287: p->flags |= TERMP_NOSPACE;
1.125 ! schwarze 288: if (p->lastcol || p->viscol)
1.61 schwarze 289: term_flushln(p);
1.1 kristaps 290: }
291:
292: /*
293: * Asserts a vertical space (a full, empty line-break between lines).
294: * Note that if used twice, this will cause two blank spaces and so on.
295: * All data in the output buffer is flushed prior to the newline
296: * assertion.
297: */
298: void
299: term_vspace(struct termp *p)
300: {
301:
302: term_newln(p);
1.29 schwarze 303: p->viscol = 0;
1.124 schwarze 304: p->minbl = 0;
1.63 schwarze 305: if (0 < p->skipvsp)
306: p->skipvsp--;
307: else
308: (*p->endline)(p);
1.1 kristaps 309: }
310:
1.98 schwarze 311: /* Swap current and previous font; for \fP and .ft P */
1.20 schwarze 312: void
313: term_fontlast(struct termp *p)
314: {
315: enum termfont f;
1.11 schwarze 316:
1.20 schwarze 317: f = p->fontl;
318: p->fontl = p->fontq[p->fonti];
319: p->fontq[p->fonti] = f;
320: }
321:
1.98 schwarze 322: /* Set font, save current, discard previous; for \f, .ft, .B etc. */
1.20 schwarze 323: void
324: term_fontrepl(struct termp *p, enum termfont f)
325: {
326:
327: p->fontl = p->fontq[p->fonti];
328: p->fontq[p->fonti] = f;
1.1 kristaps 329: }
330:
1.98 schwarze 331: /* Set font, save previous. */
1.20 schwarze 332: void
333: term_fontpush(struct termp *p, enum termfont f)
1.1 kristaps 334: {
1.7 schwarze 335:
1.20 schwarze 336: p->fontl = p->fontq[p->fonti];
1.98 schwarze 337: if (++p->fonti == p->fontsz) {
338: p->fontsz += 8;
339: p->fontq = mandoc_reallocarray(p->fontq,
1.116 schwarze 340: p->fontsz, sizeof(*p->fontq));
1.98 schwarze 341: }
342: p->fontq[p->fonti] = f;
1.20 schwarze 343: }
1.1 kristaps 344:
1.98 schwarze 345: /* Flush to make the saved pointer current again. */
1.20 schwarze 346: void
1.104 schwarze 347: term_fontpopq(struct termp *p, int i)
1.20 schwarze 348: {
1.1 kristaps 349:
1.104 schwarze 350: assert(i >= 0);
351: if (p->fonti > i)
352: p->fonti = i;
1.20 schwarze 353: }
1.1 kristaps 354:
1.98 schwarze 355: /* Pop one font off the stack. */
1.20 schwarze 356: void
357: term_fontpop(struct termp *p)
358: {
1.1 kristaps 359:
1.20 schwarze 360: assert(p->fonti);
361: p->fonti--;
1.1 kristaps 362: }
363:
364: /*
365: * Handle pwords, partial words, which may be either a single word or a
366: * phrase that cannot be broken down (such as a literal string). This
367: * handles word styling.
368: */
1.7 schwarze 369: void
370: term_word(struct termp *p, const char *word)
1.1 kristaps 371: {
1.121 schwarze 372: struct roffsu su;
1.75 schwarze 373: const char nbrsp[2] = { ASCII_NBRSP, 0 };
1.59 schwarze 374: const char *seq, *cp;
375: int sz, uc;
1.122 schwarze 376: size_t csz, lsz, ssz;
1.59 schwarze 377: enum mandoc_esc esc;
1.1 kristaps 378:
1.124 schwarze 379: if ((p->flags & TERMP_NOBUF) == 0) {
380: if ((p->flags & TERMP_NOSPACE) == 0) {
381: if ((p->flags & TERMP_KEEP) == 0) {
1.40 schwarze 382: bufferc(p, ' ');
1.124 schwarze 383: if (p->flags & TERMP_SENTENCE)
384: bufferc(p, ' ');
385: } else
386: bufferc(p, ASCII_NBRSP);
387: }
388: if (p->flags & TERMP_PREKEEP)
389: p->flags |= TERMP_KEEP;
390: if (p->flags & TERMP_NONOSPACE)
391: p->flags |= TERMP_NOSPACE;
392: else
393: p->flags &= ~TERMP_NOSPACE;
394: p->flags &= ~(TERMP_SENTENCE | TERMP_NONEWLINE);
395: p->skipvsp = 0;
1.31 schwarze 396: }
397:
1.59 schwarze 398: while ('\0' != *word) {
1.64 schwarze 399: if ('\\' != *word) {
1.75 schwarze 400: if (TERMP_NBRWORD & p->flags) {
401: if (' ' == *word) {
402: encode(p, nbrsp, 1);
403: word++;
404: continue;
405: }
406: ssz = strcspn(word, "\\ ");
407: } else
408: ssz = strcspn(word, "\\");
1.45 schwarze 409: encode(p, word, ssz);
1.64 schwarze 410: word += (int)ssz;
1.20 schwarze 411: continue;
1.64 schwarze 412: }
1.20 schwarze 413:
1.59 schwarze 414: word++;
415: esc = mandoc_escape(&word, &seq, &sz);
416: if (ESCAPE_ERROR == esc)
1.85 schwarze 417: continue;
1.59 schwarze 418:
419: switch (esc) {
1.83 schwarze 420: case ESCAPE_UNICODE:
1.89 schwarze 421: uc = mchars_num2uc(seq + 1, sz - 1);
1.56 schwarze 422: break;
1.83 schwarze 423: case ESCAPE_NUMBERED:
1.93 schwarze 424: uc = mchars_num2char(seq, sz);
425: if (uc < 0)
426: continue;
1.20 schwarze 427: break;
1.83 schwarze 428: case ESCAPE_SPECIAL:
1.89 schwarze 429: if (p->enc == TERMENC_ASCII) {
1.114 schwarze 430: cp = mchars_spec2str(seq, sz, &ssz);
1.92 schwarze 431: if (cp != NULL)
1.89 schwarze 432: encode(p, cp, ssz);
433: } else {
1.114 schwarze 434: uc = mchars_spec2cp(seq, sz);
1.90 schwarze 435: if (uc > 0)
436: encode1(p, uc);
1.89 schwarze 437: }
1.93 schwarze 438: continue;
1.83 schwarze 439: case ESCAPE_FONTBOLD:
1.20 schwarze 440: term_fontrepl(p, TERMFONT_BOLD);
1.93 schwarze 441: continue;
1.83 schwarze 442: case ESCAPE_FONTITALIC:
1.20 schwarze 443: term_fontrepl(p, TERMFONT_UNDER);
1.93 schwarze 444: continue;
1.83 schwarze 445: case ESCAPE_FONTBI:
1.70 schwarze 446: term_fontrepl(p, TERMFONT_BI);
1.93 schwarze 447: continue;
1.83 schwarze 448: case ESCAPE_FONT:
449: case ESCAPE_FONTROMAN:
1.20 schwarze 450: term_fontrepl(p, TERMFONT_NONE);
1.93 schwarze 451: continue;
1.83 schwarze 452: case ESCAPE_FONTPREV:
1.20 schwarze 453: term_fontlast(p);
1.93 schwarze 454: continue;
1.83 schwarze 455: case ESCAPE_NOSPACE:
1.108 schwarze 456: if (p->flags & TERMP_BACKAFTER)
457: p->flags &= ~TERMP_BACKAFTER;
458: else if (*word == '\0')
1.97 schwarze 459: p->flags |= (TERMP_NOSPACE | TERMP_NONEWLINE);
1.121 schwarze 460: continue;
461: case ESCAPE_HORIZ:
462: if (a2roffsu(seq, &su, SCALE_EM) == 0)
463: continue;
464: uc = term_hspan(p, &su) / 24;
465: if (uc > 0)
466: while (uc-- > 0)
467: bufferc(p, ASCII_NBRSP);
468: else if (p->col > (size_t)(-uc))
469: p->col += uc;
470: else {
471: uc += p->col;
472: p->col = 0;
473: if (p->offset > (size_t)(-uc)) {
474: p->ti += uc;
475: p->offset += uc;
476: } else {
477: p->ti -= p->offset;
478: p->offset = 0;
479: }
1.122 schwarze 480: }
481: continue;
482: case ESCAPE_HLINE:
483: if (a2roffsu(seq, &su, SCALE_EM) == 0)
484: continue;
485: uc = term_hspan(p, &su) / 24;
486: if (uc <= 0) {
487: if (p->rmargin <= p->offset)
488: continue;
489: lsz = p->rmargin - p->offset;
490: } else
491: lsz = uc;
492: while (sz &&
493: strchr(" %&()*+-./0123456789:<=>", *seq)) {
494: seq++;
495: sz--;
496: }
497: if (sz && strchr("cifMmnPpuv", *seq)) {
498: seq++;
499: sz--;
500: }
501: if (sz == 0)
502: uc = -1;
503: else if (*seq == '\\') {
504: seq++;
505: esc = mandoc_escape(&seq, &cp, &sz);
506: switch (esc) {
507: case ESCAPE_UNICODE:
508: uc = mchars_num2uc(cp + 1, sz - 1);
509: break;
510: case ESCAPE_NUMBERED:
511: uc = mchars_num2char(cp, sz);
512: break;
513: case ESCAPE_SPECIAL:
514: uc = mchars_spec2cp(cp, sz);
515: break;
516: default:
517: uc = -1;
518: break;
519: }
520: } else
521: uc = *seq;
522: if (uc < 0x20 || (uc > 0x7E && uc < 0xA0))
523: uc = '_';
524: if (p->enc == TERMENC_ASCII) {
525: cp = ascii_uc2str(uc);
526: csz = term_strlen(p, cp);
527: ssz = strlen(cp);
528: } else
529: csz = (*p->width)(p, uc);
530: while (lsz >= csz) {
531: if (p->enc == TERMENC_ASCII)
532: encode(p, cp, ssz);
533: else
534: encode1(p, uc);
535: lsz -= csz;
1.121 schwarze 536: }
1.93 schwarze 537: continue;
1.83 schwarze 538: case ESCAPE_SKIPCHAR:
1.108 schwarze 539: p->flags |= TERMP_BACKAFTER;
1.93 schwarze 540: continue;
1.103 schwarze 541: case ESCAPE_OVERSTRIKE:
542: cp = seq + sz;
543: while (seq < cp) {
544: if (*seq == '\\') {
545: mandoc_escape(&seq, NULL, NULL);
546: continue;
547: }
548: encode1(p, *seq++);
1.108 schwarze 549: if (seq < cp) {
550: if (p->flags & TERMP_BACKBEFORE)
551: p->flags |= TERMP_BACKAFTER;
552: else
553: p->flags |= TERMP_BACKBEFORE;
554: }
1.103 schwarze 555: }
1.109 schwarze 556: /* Trim trailing backspace/blank pair. */
1.125 ! schwarze 557: if (p->lastcol > 2 &&
! 558: (p->buf[p->lastcol - 1] == ' ' ||
! 559: p->buf[p->lastcol - 1] == '\t'))
! 560: p->lastcol -= 2;
! 561: if (p->col > p->lastcol)
! 562: p->col = p->lastcol;
1.108 schwarze 563: continue;
1.20 schwarze 564: default:
1.93 schwarze 565: continue;
566: }
567:
568: /*
569: * Common handling for Unicode and numbered
570: * character escape sequences.
571: */
572:
573: if (p->enc == TERMENC_ASCII) {
574: cp = ascii_uc2str(uc);
575: encode(p, cp, strlen(cp));
576: } else {
577: if ((uc < 0x20 && uc != 0x09) ||
578: (uc > 0x7E && uc < 0xA0))
579: uc = 0xFFFD;
580: encode1(p, uc);
1.20 schwarze 581: }
582: }
1.75 schwarze 583: p->flags &= ~TERMP_NBRWORD;
1.1 kristaps 584: }
585:
586: static void
1.71 schwarze 587: adjbuf(struct termp *p, size_t sz)
1.1 kristaps 588: {
589:
1.20 schwarze 590: if (0 == p->maxcols)
591: p->maxcols = 1024;
592: while (sz >= p->maxcols)
593: p->maxcols <<= 2;
594:
1.84 schwarze 595: p->buf = mandoc_reallocarray(p->buf, p->maxcols, sizeof(int));
1.1 kristaps 596: }
597:
1.4 schwarze 598: static void
1.20 schwarze 599: bufferc(struct termp *p, char c)
600: {
1.124 schwarze 601: if (p->flags & TERMP_NOBUF) {
602: (*p->letter)(p, c);
603: return;
604: }
1.20 schwarze 605: if (p->col + 1 >= p->maxcols)
606: adjbuf(p, p->col + 1);
1.125 ! schwarze 607: if (p->lastcol <= p->col || (c != ' ' && c != ASCII_NBRSP))
! 608: p->buf[p->col] = c;
! 609: if (p->lastcol < ++p->col)
! 610: p->lastcol = p->col;
1.20 schwarze 611: }
612:
1.59 schwarze 613: /*
614: * See encode().
615: * Do this for a single (probably unicode) value.
616: * Does not check for non-decorated glyphs.
617: */
618: static void
619: encode1(struct termp *p, int c)
620: {
621: enum termfont f;
622:
1.124 schwarze 623: if (p->flags & TERMP_NOBUF) {
624: (*p->letter)(p, c);
625: return;
626: }
627:
1.108 schwarze 628: if (p->col + 7 >= p->maxcols)
629: adjbuf(p, p->col + 7);
1.59 schwarze 630:
1.115 schwarze 631: f = (c == ASCII_HYPH || c > 127 || isgraph(c)) ?
1.108 schwarze 632: p->fontq[p->fonti] : TERMFONT_NONE;
1.59 schwarze 633:
1.108 schwarze 634: if (p->flags & TERMP_BACKBEFORE) {
1.118 schwarze 635: if (p->buf[p->col - 1] == ' ' || p->buf[p->col - 1] == '\t')
1.109 schwarze 636: p->col--;
637: else
638: p->buf[p->col++] = 8;
1.108 schwarze 639: p->flags &= ~TERMP_BACKBEFORE;
640: }
1.70 schwarze 641: if (TERMFONT_UNDER == f || TERMFONT_BI == f) {
1.59 schwarze 642: p->buf[p->col++] = '_';
1.70 schwarze 643: p->buf[p->col++] = 8;
644: }
645: if (TERMFONT_BOLD == f || TERMFONT_BI == f) {
646: if (ASCII_HYPH == c)
647: p->buf[p->col++] = '-';
648: else
649: p->buf[p->col++] = c;
650: p->buf[p->col++] = 8;
651: }
1.125 ! schwarze 652: if (p->lastcol <= p->col || (c != ' ' && c != ASCII_NBRSP))
! 653: p->buf[p->col] = c;
! 654: if (p->lastcol < ++p->col)
! 655: p->lastcol = p->col;
1.108 schwarze 656: if (p->flags & TERMP_BACKAFTER) {
657: p->flags |= TERMP_BACKBEFORE;
658: p->flags &= ~TERMP_BACKAFTER;
659: }
1.59 schwarze 660: }
1.20 schwarze 661:
662: static void
663: encode(struct termp *p, const char *word, size_t sz)
1.4 schwarze 664: {
1.71 schwarze 665: size_t i;
1.124 schwarze 666:
667: if (p->flags & TERMP_NOBUF) {
668: for (i = 0; i < sz; i++)
669: (*p->letter)(p, word[i]);
670: return;
671: }
1.59 schwarze 672:
1.108 schwarze 673: if (p->col + 2 + (sz * 5) >= p->maxcols)
674: adjbuf(p, p->col + 2 + (sz * 5));
1.46 schwarze 675:
1.71 schwarze 676: for (i = 0; i < sz; i++) {
1.70 schwarze 677: if (ASCII_HYPH == word[i] ||
678: isgraph((unsigned char)word[i]))
679: encode1(p, word[i]);
1.119 schwarze 680: else {
1.125 ! schwarze 681: if (p->lastcol <= p->col ||
! 682: (word[i] != ' ' && word[i] != ASCII_NBRSP))
! 683: p->buf[p->col] = word[i];
! 684: p->col++;
1.119 schwarze 685:
686: /*
687: * Postpone the effect of \z while handling
688: * an overstrike sequence from ascii_uc2str().
689: */
690:
691: if (word[i] == '\b' &&
692: (p->flags & TERMP_BACKBEFORE)) {
693: p->flags &= ~TERMP_BACKBEFORE;
694: p->flags |= TERMP_BACKAFTER;
695: }
696: }
1.4 schwarze 697: }
1.125 ! schwarze 698: if (p->lastcol < p->col)
! 699: p->lastcol = p->col;
1.80 schwarze 700: }
701:
702: void
703: term_setwidth(struct termp *p, const char *wstr)
704: {
705: struct roffsu su;
1.107 schwarze 706: int iop, width;
1.80 schwarze 707:
1.81 schwarze 708: iop = 0;
709: width = 0;
1.80 schwarze 710: if (NULL != wstr) {
711: switch (*wstr) {
1.83 schwarze 712: case '+':
1.80 schwarze 713: iop = 1;
714: wstr++;
715: break;
1.83 schwarze 716: case '-':
1.80 schwarze 717: iop = -1;
718: wstr++;
719: break;
720: default:
721: break;
722: }
1.81 schwarze 723: if (a2roffsu(wstr, &su, SCALE_MAX))
724: width = term_hspan(p, &su);
725: else
1.80 schwarze 726: iop = 0;
727: }
728: (*p->setwidth)(p, iop, width);
1.4 schwarze 729: }
1.16 schwarze 730:
731: size_t
1.39 schwarze 732: term_len(const struct termp *p, size_t sz)
733: {
734:
1.112 schwarze 735: return (*p->width)(p, ' ') * sz;
1.39 schwarze 736: }
737:
1.64 schwarze 738: static size_t
739: cond_width(const struct termp *p, int c, int *skip)
740: {
741:
742: if (*skip) {
743: (*skip) = 0;
1.112 schwarze 744: return 0;
1.64 schwarze 745: } else
1.112 schwarze 746: return (*p->width)(p, c);
1.64 schwarze 747: }
1.39 schwarze 748:
749: size_t
750: term_strlen(const struct termp *p, const char *cp)
751: {
1.59 schwarze 752: size_t sz, rsz, i;
1.93 schwarze 753: int ssz, skip, uc;
1.50 schwarze 754: const char *seq, *rhs;
1.59 schwarze 755: enum mandoc_esc esc;
1.77 schwarze 756: static const char rej[] = { '\\', ASCII_NBRSP, ASCII_HYPH,
757: ASCII_BREAK, '\0' };
1.59 schwarze 758:
759: /*
760: * Account for escaped sequences within string length
761: * calculations. This follows the logic in term_word() as we
762: * must calculate the width of produced strings.
763: */
764:
765: sz = 0;
1.64 schwarze 766: skip = 0;
1.59 schwarze 767: while ('\0' != *cp) {
768: rsz = strcspn(cp, rej);
769: for (i = 0; i < rsz; i++)
1.64 schwarze 770: sz += cond_width(p, *cp++, &skip);
1.59 schwarze 771:
772: switch (*cp) {
1.83 schwarze 773: case '\\':
1.59 schwarze 774: cp++;
775: esc = mandoc_escape(&cp, &seq, &ssz);
776: if (ESCAPE_ERROR == esc)
1.85 schwarze 777: continue;
1.59 schwarze 778:
779: rhs = NULL;
1.50 schwarze 780:
1.59 schwarze 781: switch (esc) {
1.83 schwarze 782: case ESCAPE_UNICODE:
1.94 schwarze 783: uc = mchars_num2uc(seq + 1, ssz - 1);
1.59 schwarze 784: break;
1.83 schwarze 785: case ESCAPE_NUMBERED:
1.93 schwarze 786: uc = mchars_num2char(seq, ssz);
787: if (uc < 0)
788: continue;
1.50 schwarze 789: break;
1.83 schwarze 790: case ESCAPE_SPECIAL:
1.93 schwarze 791: if (p->enc == TERMENC_ASCII) {
1.114 schwarze 792: rhs = mchars_spec2str(seq, ssz, &rsz);
1.93 schwarze 793: if (rhs != NULL)
794: break;
795: } else {
1.114 schwarze 796: uc = mchars_spec2cp(seq, ssz);
1.93 schwarze 797: if (uc > 0)
798: sz += cond_width(p, uc, &skip);
1.89 schwarze 799: }
1.93 schwarze 800: continue;
1.83 schwarze 801: case ESCAPE_SKIPCHAR:
1.64 schwarze 802: skip = 1;
1.103 schwarze 803: continue;
804: case ESCAPE_OVERSTRIKE:
805: rsz = 0;
806: rhs = seq + ssz;
807: while (seq < rhs) {
808: if (*seq == '\\') {
809: mandoc_escape(&seq, NULL, NULL);
810: continue;
811: }
812: i = (*p->width)(p, *seq++);
813: if (rsz < i)
814: rsz = i;
815: }
816: sz += rsz;
1.93 schwarze 817: continue;
1.50 schwarze 818: default:
1.93 schwarze 819: continue;
1.50 schwarze 820: }
1.39 schwarze 821:
1.93 schwarze 822: /*
823: * Common handling for Unicode and numbered
824: * character escape sequences.
825: */
826:
827: if (rhs == NULL) {
828: if (p->enc == TERMENC_ASCII) {
829: rhs = ascii_uc2str(uc);
830: rsz = strlen(rhs);
831: } else {
832: if ((uc < 0x20 && uc != 0x09) ||
833: (uc > 0x7E && uc < 0xA0))
834: uc = 0xFFFD;
835: sz += cond_width(p, uc, &skip);
836: continue;
837: }
838: }
1.59 schwarze 839:
1.64 schwarze 840: if (skip) {
841: skip = 0;
842: break;
843: }
1.93 schwarze 844:
845: /*
846: * Common handling for all escape sequences
847: * printing more than one character.
848: */
1.64 schwarze 849:
1.59 schwarze 850: for (i = 0; i < rsz; i++)
851: sz += (*p->width)(p, *rhs++);
852: break;
1.83 schwarze 853: case ASCII_NBRSP:
1.64 schwarze 854: sz += cond_width(p, ' ', &skip);
1.55 schwarze 855: cp++;
1.59 schwarze 856: break;
1.83 schwarze 857: case ASCII_HYPH:
1.64 schwarze 858: sz += cond_width(p, '-', &skip);
1.55 schwarze 859: cp++;
1.59 schwarze 860: break;
861: default:
862: break;
863: }
864: }
1.39 schwarze 865:
1.112 schwarze 866: return sz;
1.39 schwarze 867: }
868:
1.100 schwarze 869: int
1.39 schwarze 870: term_vspan(const struct termp *p, const struct roffsu *su)
1.16 schwarze 871: {
872: double r;
1.101 schwarze 873: int ri;
1.16 schwarze 874:
875: switch (su->unit) {
1.99 schwarze 876: case SCALE_BU:
877: r = su->scale / 40.0;
878: break;
1.83 schwarze 879: case SCALE_CM:
1.99 schwarze 880: r = su->scale * 6.0 / 2.54;
881: break;
882: case SCALE_FS:
883: r = su->scale * 65536.0 / 40.0;
1.16 schwarze 884: break;
1.83 schwarze 885: case SCALE_IN:
1.86 schwarze 886: r = su->scale * 6.0;
1.16 schwarze 887: break;
1.99 schwarze 888: case SCALE_MM:
889: r = su->scale * 0.006;
890: break;
1.83 schwarze 891: case SCALE_PC:
1.16 schwarze 892: r = su->scale;
893: break;
1.83 schwarze 894: case SCALE_PT:
1.99 schwarze 895: r = su->scale / 12.0;
1.16 schwarze 896: break;
1.99 schwarze 897: case SCALE_EN:
898: case SCALE_EM:
899: r = su->scale * 0.6;
1.16 schwarze 900: break;
1.83 schwarze 901: case SCALE_VS:
1.16 schwarze 902: r = su->scale;
903: break;
904: default:
1.99 schwarze 905: abort();
1.16 schwarze 906: }
1.101 schwarze 907: ri = r > 0.0 ? r + 0.4995 : r - 0.4995;
1.112 schwarze 908: return ri < 66 ? ri : 1;
1.16 schwarze 909: }
910:
1.107 schwarze 911: /*
912: * Convert a scaling width to basic units, rounding down.
913: */
1.100 schwarze 914: int
1.39 schwarze 915: term_hspan(const struct termp *p, const struct roffsu *su)
1.16 schwarze 916: {
917:
1.112 schwarze 918: return (*p->hspan)(p, su);
1.16 schwarze 919: }