diff options
author | Kristaps Dzonsons <kristaps@bsd.lv> | 2010-05-07 15:49:36 +0000 |
---|---|---|
committer | Kristaps Dzonsons <kristaps@bsd.lv> | 2010-05-07 15:49:36 +0000 |
commit | 0f679b197ab273ae0779713155a8a455d4a770fe (patch) | |
tree | aff454adb0052ff2632ea4814e8e19e9cc7dd9f1 /mdoc.c | |
parent | 14c096e3772b640b87176e27eaa291c9fefbe0de (diff) | |
download | mandoc-0f679b197ab273ae0779713155a8a455d4a770fe.tar.gz |
Removed the chunking of free-form text from the parsers: each text line is now kept whole instead of being split into space-separated words. This is a significant change (and I don't really like it), but it's what groff does.
Distinction of ARGS_PHRASE and ARGS_PPHRASE in backend (not yet used).
Diffstat (limited to 'mdoc.c')
-rw-r--r-- | mdoc.c | 93 |
1 files changed, 28 insertions, 65 deletions
@@ -154,8 +154,7 @@ static int node_append(struct mdoc *, static int mdoc_ptext(struct mdoc *, int, char *); static int mdoc_pmacro(struct mdoc *, int, char *); static int macrowarn(struct mdoc *, int, const char *); -static int pstring(struct mdoc *, int, int, - const char *, size_t); + const struct mdoc_node * mdoc_node(const struct mdoc *m) @@ -535,11 +534,13 @@ mdoc_elem_alloc(struct mdoc *m, int line, int pos, } -static int -pstring(struct mdoc *m, int line, int pos, const char *p, size_t len) +int +mdoc_word_alloc(struct mdoc *m, int line, int pos, const char *p) { struct mdoc_node *n; - size_t sv; + size_t sv, len; + + len = strlen(p); n = node_alloc(m, line, pos, -1, MDOC_TEXT); n->string = mandoc_malloc(len + 1); @@ -550,19 +551,12 @@ pstring(struct mdoc *m, int line, int pos, const char *p, size_t len) if ( ! node_append(m, n)) return(0); + m->next = MDOC_NEXT_SIBLING; return(1); } -int -mdoc_word_alloc(struct mdoc *m, int line, int pos, const char *p) -{ - - return(pstring(m, line, pos, p, strlen(p))); -} - - void mdoc_node_free(struct mdoc_node *p) { @@ -633,88 +627,57 @@ mdoc_node_delete(struct mdoc *m, struct mdoc_node *p) static int mdoc_ptext(struct mdoc *m, int line, char *buf) { - int i, j; - char sv; + int i; /* Ignore bogus comments. */ if ('\\' == buf[0] && '.' == buf[1] && '\"' == buf[2]) return(mdoc_pwarn(m, line, 0, EBADCOMMENT)); + /* No text before an initial macro. */ + if (SEC_NONE == m->lastnamed) return(mdoc_perr(m, line, 0, ETEXTPROL)); - - /* - * If in literal mode, then pass the buffer directly to the - * back-end, as it should be preserved as a single term. - */ + /* Literal just gets pulled in as-is. */ + if (MDOC_LITERAL & m->flags) return(mdoc_word_alloc(m, line, 0, buf)); - /* Disallow blank/white-space lines in non-literal mode. */ + /* Check for a blank line, which may also consist of spaces. */ for (i = 0; ' ' == buf[i]; i++) - /* Skip leading whitespace. */ ; + /* Skip to first non-space. */ ; if ('\0' == buf[i]) { if ( ! 
mdoc_pwarn(m, line, 0, ENOBLANK)) return(0); + /* - * Assume that a `Pp' should be inserted in the case of - * a blank line. Technically, blank lines aren't - * allowed, but enough manuals assume this behaviour - * that we want to work around it. + * Insert a `Pp' in the case of a blank line. Technically, + * blank lines aren't allowed, but enough manuals assume this + * behaviour that we want to work around it. */ if ( ! mdoc_elem_alloc(m, line, 0, MDOC_Pp, NULL)) return(0); - } - - /* - * Break apart a free-form line into tokens. Spaces are - * stripped out of the input. - */ - for (j = i; buf[i]; i++) { - if (' ' != buf[i]) - continue; - - /* Escaped whitespace. */ - if (i && ' ' == buf[i] && '\\' == buf[i - 1]) - continue; - - sv = buf[i]; - buf[i++] = '\0'; - - if ( ! pstring(m, line, j, &buf[j], (size_t)(i - j))) - return(0); - - /* Trailing whitespace? Check at overwritten byte. */ - - if (' ' == sv && '\0' == buf[i]) - if ( ! mdoc_pwarn(m, line, i - 1, ETAILWS)) - return(0); - - for ( ; ' ' == buf[i]; i++) - /* Skip trailing whitespace. */ ; + m->next = MDOC_NEXT_SIBLING; + return(1); + } - j = i; + /* Warn if the last un-escaped character is whitespace. */ - /* Trailing whitespace? */ + i = (int)strlen(buf); + assert(i); - if (' ' == buf[i - 1] && '\0' == buf[i]) + if (' ' == buf[i - 1] || '\t' == buf[i - 1]) + if (1 == i || ('\\' != buf[i - 2])) if ( ! mdoc_pwarn(m, line, i - 1, ETAILWS)) return(0); - if ('\0' == buf[i]) - break; - } - - if (j != i && ! pstring(m, line, j, &buf[j], (size_t)(i - j))) - return(0); + /* Allocate the whole word. */ - m->next = MDOC_NEXT_SIBLING; - return(1); + return(mdoc_word_alloc(m, line, 0, buf)); } |