[BACK]Return to term.c CVS log [TXT][DIR] Up to [cvsweb.bsd.lv] / mandoc

Annotation of mandoc/term.c, Revision 1.84

1.84    ! kristaps    1: /*     $Id: term.c,v 1.83 2009/06/22 13:13:10 kristaps Exp $ */
1.1       kristaps    2: /*
1.75      kristaps    3:  * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se>
1.1       kristaps    4:  *
                      5:  * Permission to use, copy, modify, and distribute this software for any
1.74      kristaps    6:  * purpose with or without fee is hereby granted, provided that the above
                      7:  * copyright notice and this permission notice appear in all copies.
1.1       kristaps    8:  *
1.74      kristaps    9:  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
                     10:  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
                     11:  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
                     12:  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
                     13:  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
                     14:  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
                     15:  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
1.1       kristaps   16:  */
                     17: #include <assert.h>
1.23      kristaps   18: #include <err.h>
1.22      kristaps   19: #include <stdio.h>
1.1       kristaps   20: #include <stdlib.h>
                     21: #include <string.h>
                     22:
1.71      kristaps   23: #include "term.h"
                     24: #include "man.h"
                     25: #include "mdoc.h"
1.1       kristaps   26:
1.71      kristaps   27: extern int               man_run(struct termp *,
                     28:                                const struct man *);
                     29: extern int               mdoc_run(struct termp *,
                     30:                                const struct mdoc *);
1.1       kristaps   31:
1.71      kristaps   32: static struct termp     *term_alloc(enum termenc);
                     33: static void              term_free(struct termp *);
                     34: static void              term_pword(struct termp *, const char *, int);
                     35: static void              term_pescape(struct termp *,
                     36:                                const char *, int *, int);
                     37: static void              term_nescape(struct termp *,
                     38:                                const char *, size_t);
                     39: static void              term_chara(struct termp *, char);
1.79      kristaps   40: static void              term_encodea(struct termp *, char);
1.71      kristaps   41: static int               term_isopendelim(const char *, int);
                     42: static int               term_isclosedelim(const char *, int);
1.1       kristaps   43:
                     44:
1.71      kristaps   45: void *
                     46: ascii_alloc(void)
1.10      kristaps   47: {
1.1       kristaps   48:
1.71      kristaps   49:        return(term_alloc(TERMENC_ASCII));
1.1       kristaps   50: }
                     51:
                     52:
1.71      kristaps   53: int
1.72      kristaps   54: terminal_man(void *arg, const struct man *man)
1.1       kristaps   55: {
1.71      kristaps   56:        struct termp    *p;
1.1       kristaps   57:
1.71      kristaps   58:        p = (struct termp *)arg;
                     59:        if (NULL == p->symtab)
                     60:                p->symtab = term_ascii2htab();
1.2       kristaps   61:
1.72      kristaps   62:        return(man_run(p, man));
                     63: }
                     64:
                     65:
                     66: int
                     67: terminal_mdoc(void *arg, const struct mdoc *mdoc)
                     68: {
                     69:        struct termp    *p;
                     70:
                     71:        p = (struct termp *)arg;
                     72:        if (NULL == p->symtab)
                     73:                p->symtab = term_ascii2htab();
1.2       kristaps   74:
1.72      kristaps   75:        return(mdoc_run(p, mdoc));
1.1       kristaps   76: }
                     77:
                     78:
1.71      kristaps   79: void
                     80: terminal_free(void *arg)
1.11      kristaps   81: {
                     82:
1.71      kristaps   83:        term_free((struct termp *)arg);
1.11      kristaps   84: }
                     85:
                     86:
1.71      kristaps   87: static void
                     88: term_free(struct termp *p)
1.14      kristaps   89: {
                     90:
1.71      kristaps   91:        if (p->buf)
                     92:                free(p->buf);
                     93:        if (TERMENC_ASCII == p->enc && p->symtab)
                     94:                term_asciifree(p->symtab);
1.14      kristaps   95:
1.71      kristaps   96:        free(p);
1.14      kristaps   97: }
                     98:
                     99:
1.71      kristaps  100: static struct termp *
                    101: term_alloc(enum termenc enc)
1.14      kristaps  102: {
1.71      kristaps  103:        struct termp *p;
1.14      kristaps  104:
1.71      kristaps  105:        if (NULL == (p = malloc(sizeof(struct termp))))
                    106:                err(1, "malloc");
                    107:        bzero(p, sizeof(struct termp));
1.80      kristaps  108:        p->maxrmargin = 78;
1.71      kristaps  109:        p->enc = enc;
                    110:        return(p);
1.14      kristaps  111: }
                    112:
                    113:
                    114: static int
1.71      kristaps  115: term_isclosedelim(const char *p, int len)
1.14      kristaps  116: {
                    117:
1.71      kristaps  118:        if (1 != len)
                    119:                return(0);
1.14      kristaps  120:
1.71      kristaps  121:        switch (*p) {
                    122:        case('.'):
                    123:                /* FALLTHROUGH */
                    124:        case(','):
                    125:                /* FALLTHROUGH */
                    126:        case(';'):
                    127:                /* FALLTHROUGH */
                    128:        case(':'):
                    129:                /* FALLTHROUGH */
                    130:        case('?'):
                    131:                /* FALLTHROUGH */
                    132:        case('!'):
                    133:                /* FALLTHROUGH */
                    134:        case(')'):
                    135:                /* FALLTHROUGH */
                    136:        case(']'):
                    137:                /* FALLTHROUGH */
                    138:        case('}'):
                    139:                return(1);
                    140:        default:
                    141:                break;
                    142:        }
1.14      kristaps  143:
1.71      kristaps  144:        return(0);
1.30      kristaps  145: }
                    146:
                    147:
1.14      kristaps  148: static int
1.71      kristaps  149: term_isopendelim(const char *p, int len)
1.14      kristaps  150: {
1.43      kristaps  151:
1.71      kristaps  152:        if (1 != len)
                    153:                return(0);
1.14      kristaps  154:
1.71      kristaps  155:        switch (*p) {
                    156:        case('('):
                    157:                /* FALLTHROUGH */
                    158:        case('['):
                    159:                /* FALLTHROUGH */
                    160:        case('{'):
                    161:                return(1);
                    162:        default:
                    163:                break;
                    164:        }
1.43      kristaps  165:
1.14      kristaps  166:        return(0);
                    167: }
1.15      kristaps  168:
                    169:
1.71      kristaps  170: /*
                    171:  * Flush a line of text.  A "line" is loosely defined as being something
                    172:  * that should be followed by a newline, regardless of whether it's
                    173:  * broken apart by newlines getting there.  A line can also be a
                    174:  * fragment of a columnar list.
                    175:  *
                    176:  * Specifically, a line is whatever's in p->buf of length p->col, which
                    177:  * is zeroed after this function returns.
                    178:  *
1.84    ! kristaps  179:  * The usage of termp:flags is as follows:
1.71      kristaps  180:  *
                    181:  *  - TERMP_NOLPAD: when beginning to write the line, don't left-pad the
                    182:  *    offset value.  This is useful when doing columnar lists where the
                    183:  *    prior column has right-padded.
                    184:  *
                    185:  *  - TERMP_NOBREAK: this is the most important and is used when making
                    186:  *    columns.  In short: don't print a newline and instead pad to the
                    187:  *    right margin.  Used in conjunction with TERMP_NOLPAD.
                    188:  *
1.84    ! kristaps  189:  *  - TERMP_DANGLE: don't newline when TERMP_NOBREAK is specified and
        !           190:  *    the line is overrun, and don't pad-right if it's underrun.
        !           191:  *
        !           192:  *  - TERMP_HANG: like TERMP_DANGLE, but doesn't newline when
        !           193:  *    overruning, instead save the position and continue at that point
        !           194:  *    when the next invocation.
1.71      kristaps  195:  *
                    196:  *  In-line line breaking:
                    197:  *
                    198:  *  If TERMP_NOBREAK is specified and the line overruns the right
                    199:  *  margin, it will break and pad-right to the right margin after
                    200:  *  writing.  If maxrmargin is violated, it will break and continue
                    201:  *  writing from the right-margin, which will lead to the above
                    202:  *  scenario upon exit.
                    203:  *
                    204:  *  Otherwise, the line will break at the right margin.  Extremely long
                    205:  *  lines will cause the system to emit a warning (TODO: hyphenate, if
                    206:  *  possible).
1.82      kristaps  207:  *
                    208:  *  FIXME: newline breaks occur (in groff) also occur when a single
                    209:  *  space follows a NOBREAK!
1.71      kristaps  210:  */
                    211: void
                    212: term_flushln(struct termp *p)
1.53      kristaps  213: {
1.71      kristaps  214:        int              i, j;
1.81      kristaps  215:        size_t           vbl, vsz, vis, maxvis, mmax, bp;
1.84    ! kristaps  216:        static int       sv = -1;
1.53      kristaps  217:
1.71      kristaps  218:        /*
                    219:         * First, establish the maximum columns of "visible" content.
                    220:         * This is usually the difference between the right-margin and
                    221:         * an indentation, but can be, for tagged lists or columns, a
                    222:         * small set of values.
                    223:         */
1.53      kristaps  224:
1.71      kristaps  225:        assert(p->offset < p->rmargin);
                    226:        maxvis = p->rmargin - p->offset;
                    227:        mmax = p->maxrmargin - p->offset;
                    228:        bp = TERMP_NOBREAK & p->flags ? mmax : maxvis;
                    229:        vis = 0;
1.53      kristaps  230:
1.84    ! kristaps  231:        if (sv >= 0) {
        !           232:                vis = (size_t)sv;
        !           233:                sv = -1;
        !           234:        }
        !           235:
1.71      kristaps  236:        /*
                    237:         * If in the standard case (left-justified), then begin with our
                    238:         * indentation, otherwise (columns, etc.) just start spitting
                    239:         * out text.
                    240:         */
1.53      kristaps  241:
1.71      kristaps  242:        if ( ! (p->flags & TERMP_NOLPAD))
                    243:                /* LINTED */
                    244:                for (j = 0; j < (int)p->offset; j++)
                    245:                        putchar(' ');
                    246:
                    247:        for (i = 0; i < (int)p->col; i++) {
                    248:                /*
                    249:                 * Count up visible word characters.  Control sequences
                    250:                 * (starting with the CSI) aren't counted.  A space
                    251:                 * generates a non-printing word, which is valid (the
                    252:                 * space is printed according to regular spacing rules).
                    253:                 */
                    254:
                    255:                /* LINTED */
                    256:                for (j = i, vsz = 0; j < (int)p->col; j++) {
                    257:                        if (' ' == p->buf[j])
                    258:                                break;
                    259:                        else if (8 == p->buf[j])
                    260:                                j += 1;
                    261:                        else
                    262:                                vsz++;
                    263:                }
1.53      kristaps  264:
1.71      kristaps  265:                /*
1.81      kristaps  266:                 * Choose the number of blanks to prepend: no blank at the
                    267:                 * beginning of a line, one between words -- but do not
                    268:                 * actually write them yet.
1.71      kristaps  269:                 */
1.81      kristaps  270:                vbl = (size_t)(0 == vis ? 0 : 1);
1.71      kristaps  271:
1.81      kristaps  272:                /*
                    273:                 * Find out whether we would exceed the right margin.
                    274:                 * If so, break to the next line.  (TODO: hyphenate)
                    275:                 * Otherwise, write the chosen number of blanks now.
                    276:                 */
                    277:                if (vis && vis + vbl + vsz > bp) {
                    278:                        putchar('\n');
                    279:                        if (TERMP_NOBREAK & p->flags) {
                    280:                                for (j = 0; j < (int)p->rmargin; j++)
                    281:                                        putchar(' ');
                    282:                                vis = p->rmargin - p->offset;
                    283:                        } else {
1.71      kristaps  284:                                for (j = 0; j < (int)p->offset; j++)
                    285:                                        putchar(' ');
                    286:                                vis = 0;
1.81      kristaps  287:                        }
                    288:                } else {
                    289:                        for (j = 0; j < (int)vbl; j++)
1.71      kristaps  290:                                putchar(' ');
1.81      kristaps  291:                        vis += vbl;
1.71      kristaps  292:                }
1.53      kristaps  293:
1.78      kristaps  294:                /*
1.81      kristaps  295:                 * Finally, write out the word.
1.71      kristaps  296:                 */
                    297:                for ( ; i < (int)p->col; i++) {
                    298:                        if (' ' == p->buf[i])
                    299:                                break;
                    300:                        putchar(p->buf[i]);
                    301:                }
                    302:                vis += vsz;
                    303:        }
1.15      kristaps  304:
1.71      kristaps  305:        /*
                    306:         * If we've overstepped our maximum visible no-break space, then
                    307:         * cause a newline and offset at the right margin.
                    308:         */
1.15      kristaps  309:
1.81      kristaps  310:        if ((TERMP_NOBREAK & p->flags) && vis >= maxvis) {
1.84    ! kristaps  311:                if ( ! (TERMP_DANGLE & p->flags) &&
        !           312:                                ! (TERMP_HANG & p->flags)) {
1.71      kristaps  313:                        putchar('\n');
                    314:                        for (i = 0; i < (int)p->rmargin; i++)
                    315:                                putchar(' ');
                    316:                }
1.84    ! kristaps  317:                if (TERMP_HANG & p->flags)
        !           318:                        sv = vis - maxvis;
1.71      kristaps  319:                p->col = 0;
1.15      kristaps  320:                return;
1.71      kristaps  321:        }
1.15      kristaps  322:
1.71      kristaps  323:        /*
                    324:         * If we're not to right-marginalise it (newline), then instead
                    325:         * pad to the right margin and stay off.
                    326:         */
1.15      kristaps  327:
1.71      kristaps  328:        if (p->flags & TERMP_NOBREAK) {
1.84    ! kristaps  329:                if ( ! (TERMP_DANGLE & p->flags))
1.81      kristaps  330:                        for ( ; vis < maxvis; vis++)
1.71      kristaps  331:                                putchar(' ');
                    332:        } else
                    333:                putchar('\n');
1.15      kristaps  334:
1.71      kristaps  335:        p->col = 0;
1.15      kristaps  336: }
                    337:
                    338:
1.71      kristaps  339: /*
                    340:  * A newline only breaks an existing line; it won't assert vertical
                    341:  * space.  All data in the output buffer is flushed prior to the newline
                    342:  * assertion.
                    343:  */
                    344: void
                    345: term_newln(struct termp *p)
1.15      kristaps  346: {
                    347:
1.71      kristaps  348:        p->flags |= TERMP_NOSPACE;
                    349:        if (0 == p->col) {
                    350:                p->flags &= ~TERMP_NOLPAD;
1.15      kristaps  351:                return;
1.16      kristaps  352:        }
1.71      kristaps  353:        term_flushln(p);
                    354:        p->flags &= ~TERMP_NOLPAD;
1.16      kristaps  355: }
                    356:
                    357:
1.71      kristaps  358: /*
                    359:  * Asserts a vertical space (a full, empty line-break between lines).
                    360:  * Note that if used twice, this will cause two blank spaces and so on.
                    361:  * All data in the output buffer is flushed prior to the newline
                    362:  * assertion.
                    363:  */
                    364: void
                    365: term_vspace(struct termp *p)
1.16      kristaps  366: {
                    367:
1.62      kristaps  368:        term_newln(p);
1.71      kristaps  369:        putchar('\n');
1.16      kristaps  370: }
                    371:
                    372:
1.71      kristaps  373: /*
                    374:  * Break apart a word into "pwords" (partial-words, usually from
                    375:  * breaking up a phrase into individual words) and, eventually, put them
                    376:  * into the output buffer.  If we're a literal word, then don't break up
                    377:  * the word and put it verbatim into the output buffer.
                    378:  */
                    379: void
                    380: term_word(struct termp *p, const char *word)
1.17      kristaps  381: {
1.71      kristaps  382:        int              i, j, len;
1.17      kristaps  383:
1.71      kristaps  384:        len = (int)strlen(word);
1.17      kristaps  385:
1.71      kristaps  386:        if (p->flags & TERMP_LITERAL) {
                    387:                term_pword(p, word, len);
                    388:                return;
                    389:        }
1.17      kristaps  390:
1.71      kristaps  391:        /* LINTED */
                    392:        for (j = i = 0; i < len; i++) {
                    393:                if (' ' != word[i]) {
                    394:                        j++;
                    395:                        continue;
                    396:                }
                    397:
                    398:                /* Escaped spaces don't delimit... */
                    399:                if (i && ' ' == word[i] && '\\' == word[i - 1]) {
                    400:                        j++;
                    401:                        continue;
                    402:                }
1.17      kristaps  403:
1.71      kristaps  404:                if (0 == j)
                    405:                        continue;
                    406:                assert(i >= j);
                    407:                term_pword(p, &word[i - j], j);
                    408:                j = 0;
                    409:        }
                    410:        if (j > 0) {
                    411:                assert(i >= j);
                    412:                term_pword(p, &word[i - j], j);
                    413:        }
1.17      kristaps  414: }
                    415:
                    416:
1.71      kristaps  417: /*
                    418:  * Determine the symbol indicated by an escape sequences, that is, one
                    419:  * starting with a backslash.  Once done, we pass this value into the
                    420:  * output buffer by way of the symbol table.
                    421:  */
                    422: static void
                    423: term_nescape(struct termp *p, const char *word, size_t len)
1.17      kristaps  424: {
1.71      kristaps  425:        const char      *rhs;
                    426:        size_t           sz;
1.79      kristaps  427:        int              i;
1.17      kristaps  428:
1.83      kristaps  429:        rhs = term_a2ascii(p->symtab, word, len, &sz);
                    430:        if (rhs)
1.79      kristaps  431:                for (i = 0; i < (int)sz; i++)
                    432:                        term_encodea(p, rhs[i]);
1.17      kristaps  433: }
                    434:
                    435:
1.71      kristaps  436: /*
                    437:  * Handle an escape sequence: determine its length and pass it to the
                    438:  * escape-symbol look table.  Note that we assume mdoc(3) has validated
                    439:  * the escape sequence (we assert upon badly-formed escape sequences).
                    440:  */
                    441: static void
                    442: term_pescape(struct termp *p, const char *word, int *i, int len)
1.17      kristaps  443: {
1.71      kristaps  444:        int              j;
1.17      kristaps  445:
1.71      kristaps  446:        if (++(*i) >= len)
                    447:                return;
1.17      kristaps  448:
1.71      kristaps  449:        if ('(' == word[*i]) {
                    450:                (*i)++;
                    451:                if (*i + 1 >= len)
                    452:                        return;
1.22      kristaps  453:
1.71      kristaps  454:                term_nescape(p, &word[*i], 2);
                    455:                (*i)++;
                    456:                return;
1.22      kristaps  457:
1.71      kristaps  458:        } else if ('*' == word[*i]) {
                    459:                (*i)++;
                    460:                if (*i >= len)
                    461:                        return;
1.22      kristaps  462:
1.71      kristaps  463:                switch (word[*i]) {
                    464:                case ('('):
                    465:                        (*i)++;
                    466:                        if (*i + 1 >= len)
                    467:                                return;
1.65      kristaps  468:
1.71      kristaps  469:                        term_nescape(p, &word[*i], 2);
                    470:                        (*i)++;
                    471:                        return;
                    472:                case ('['):
                    473:                        break;
                    474:                default:
                    475:                        term_nescape(p, &word[*i], 1);
                    476:                        return;
                    477:                }
                    478:
                    479:        } else if ('f' == word[*i]) {
                    480:                (*i)++;
                    481:                if (*i >= len)
                    482:                        return;
                    483:                switch (word[*i]) {
                    484:                case ('B'):
                    485:                        p->flags |= TERMP_BOLD;
                    486:                        break;
                    487:                case ('I'):
                    488:                        p->flags |= TERMP_UNDER;
                    489:                        break;
                    490:                case ('P'):
                    491:                        /* FALLTHROUGH */
                    492:                case ('R'):
                    493:                        p->flags &= ~TERMP_STYLE;
                    494:                        break;
                    495:                default:
                    496:                        break;
                    497:                }
                    498:                return;
1.22      kristaps  499:
1.71      kristaps  500:        } else if ('[' != word[*i]) {
                    501:                term_nescape(p, &word[*i], 1);
                    502:                return;
                    503:        }
1.28      kristaps  504:
1.71      kristaps  505:        (*i)++;
                    506:        for (j = 0; word[*i] && ']' != word[*i]; (*i)++, j++)
                    507:                /* Loop... */ ;
1.28      kristaps  508:
1.71      kristaps  509:        if (0 == word[*i])
                    510:                return;
1.48      kristaps  511:
1.71      kristaps  512:        term_nescape(p, &word[*i - j], (size_t)j);
1.48      kristaps  513: }
                    514:
                    515:
1.71      kristaps  516: /*
                    517:  * Handle pwords, partial words, which may be either a single word or a
                    518:  * phrase that cannot be broken down (such as a literal string).  This
                    519:  * handles word styling.
                    520:  */
                    521: static void
                    522: term_pword(struct termp *p, const char *word, int len)
1.65      kristaps  523: {
1.71      kristaps  524:        int              i;
                    525:
                    526:        if (term_isclosedelim(word, len))
                    527:                if ( ! (TERMP_IGNDELIM & p->flags))
                    528:                        p->flags |= TERMP_NOSPACE;
1.65      kristaps  529:
1.71      kristaps  530:        if ( ! (TERMP_NOSPACE & p->flags))
                    531:                term_chara(p, ' ');
1.65      kristaps  532:
1.71      kristaps  533:        if ( ! (p->flags & TERMP_NONOSPACE))
                    534:                p->flags &= ~TERMP_NOSPACE;
1.65      kristaps  535:
1.71      kristaps  536:        /*
                    537:         * If ANSI (word-length styling), then apply our style now,
                    538:         * before the word.
                    539:         */
1.28      kristaps  540:
1.79      kristaps  541:        for (i = 0; i < len; i++)
                    542:                if ('\\' == word[i])
1.71      kristaps  543:                        term_pescape(p, word, &i, len);
1.79      kristaps  544:                else
                    545:                        term_encodea(p, word[i]);
1.65      kristaps  546:
1.71      kristaps  547:        if (term_isopendelim(word, len))
                    548:                p->flags |= TERMP_NOSPACE;
1.65      kristaps  549: }
                    550:
                    551:
1.71      kristaps  552: /*
                    553:  * Insert a single character into the line-buffer.  If the buffer's
                    554:  * space is exceeded, then allocate more space by doubling the buffer
                    555:  * size.
                    556:  */
                    557: static void
                    558: term_chara(struct termp *p, char c)
1.51      kristaps  559: {
1.71      kristaps  560:        size_t           s;
1.51      kristaps  561:
1.71      kristaps  562:        if (p->col + 1 >= p->maxcols) {
                    563:                if (0 == p->maxcols)
                    564:                        p->maxcols = 256;
                    565:                s = p->maxcols * 2;
                    566:                p->buf = realloc(p->buf, s);
                    567:                if (NULL == p->buf)
                    568:                        err(1, "realloc");
                    569:                p->maxcols = s;
                    570:        }
                    571:        p->buf[(int)(p->col)++] = c;
1.51      kristaps  572: }
                    573:
1.79      kristaps  574:
                    575: static void
                    576: term_encodea(struct termp *p, char c)
                    577: {
                    578:
                    579:        if (TERMP_STYLE & p->flags) {
                    580:                if (TERMP_BOLD & p->flags) {
                    581:                        term_chara(p, c);
                    582:                        term_chara(p, 8);
                    583:                }
                    584:                if (TERMP_UNDER & p->flags) {
                    585:                        term_chara(p, '_');
                    586:                        term_chara(p, 8);
                    587:                }
                    588:        }
                    589:        term_chara(p, c);
                    590: }

CVSweb