/* * man page backend for Halibut */ #include #include #include #include "halibut.h" static void man_text(FILE *, word *, int newline, int quote_props, int charset); static void man_codepara(FILE *, word *, int charset); static int man_convert(wchar_t const *s, int maxlen, char **result, int quote_props, int charset, charset_state *state); typedef struct { wchar_t *th; int headnumbers; int mindepth; char *filename; int charset; } manconfig; static manconfig man_configure(paragraph *source) { manconfig ret; /* * Defaults. */ ret.th = NULL; ret.headnumbers = FALSE; ret.mindepth = 0; ret.filename = dupstr("output.1"); ret.charset = CS_ASCII; for (; source; source = source->next) { if (source->type == para_Config) { if (!ustricmp(source->keyword, L"man-identity")) { wchar_t *wp, *ep; wp = uadv(source->keyword); ep = wp; while (*ep) ep = uadv(ep); sfree(ret.th); ret.th = mknewa(wchar_t, ep - wp + 1); memcpy(ret.th, wp, (ep - wp + 1) * sizeof(wchar_t)); } else if (!ustricmp(source->keyword, L"man-charset")) { char *csname = utoa_dup(uadv(source->keyword), CS_ASCII); ret.charset = charset_from_localenc(csname); sfree(csname); } else if (!ustricmp(source->keyword, L"man-headnumbers")) { ret.headnumbers = utob(uadv(source->keyword)); } else if (!ustricmp(source->keyword, L"man-mindepth")) { ret.mindepth = utoi(uadv(source->keyword)); } else if (!ustricmp(source->keyword, L"man-filename")) { sfree(ret.filename); ret.filename = dupstr(adv(source->origkeyword)); } } } return ret; } static void man_conf_cleanup(manconfig cf) { sfree(cf.th); sfree(cf.filename); } paragraph *man_config_filename(char *filename) { return cmdline_cfg_simple("man-filename", filename, NULL); } #define QUOTE_INITCTRL 1 /* quote initial . and ' on a line */ #define QUOTE_QUOTES 2 /* quote double quotes by doubling them */ void man_backend(paragraph *sourceform, keywordlist *keywords, indexdata *idx, void *unused) { paragraph *p; FILE *fp; manconfig conf; IGNORE(unused); IGNORE(keywords); IGNORE(idx); conf = man_configure(sourceform); /* * Open the output file. */ fp = fopen(conf.filename, "w"); if (!fp) { error(err_cantopenw, conf.filename); return; } /* Do the version ID */ for (p = sourceform; p; p = p->next) if (p->type == para_VersionID) { fprintf(fp, ".\\\" "); man_text(fp, p->words, TRUE, 0, conf.charset); } /* .TH name-of-program manual-section */ fprintf(fp, ".TH"); if (conf.th && *conf.th) { char *c; wchar_t *wp; for (wp = conf.th; *wp; wp = uadv(wp)) { fputs(" \"", fp); man_convert(wp, 0, &c, QUOTE_QUOTES, conf.charset, NULL); fputs(c, fp); sfree(c); fputc('"', fp); } } fputc('\n', fp); fprintf(fp, ".UC\n"); for (p = sourceform; p; p = p->next) switch (p->type) { /* * Things we ignore because we've already processed them or * aren't going to touch them in this pass. */ case para_IM: case para_BR: case para_Biblio: /* only touch BiblioCited */ case para_VersionID: case para_NoCite: case para_Title: break; /* * Headings. */ case para_Chapter: case para_Appendix: case para_UnnumberedChapter: case para_Heading: case para_Subsect: { int depth; if (p->type == para_Subsect) depth = p->aux + 2; else if (p->type == para_Heading) depth = 1; else depth = 0; if (depth >= conf.mindepth) { fprintf(fp, ".SH \""); if (conf.headnumbers && p->kwtext) { man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES, conf.charset); fprintf(fp, " "); } man_text(fp, p->words, FALSE, QUOTE_QUOTES, conf.charset); fprintf(fp, "\"\n"); } break; } /* * Code paragraphs. */ case para_Code: fprintf(fp, ".PP\n"); man_codepara(fp, p->words, conf.charset); break; /* * Normal paragraphs. */ case para_Normal: case para_Copyright: fprintf(fp, ".PP\n"); man_text(fp, p->words, TRUE, 0, conf.charset); break; /* * List paragraphs. */ case para_Description: case para_BiblioCited: case para_Bullet: case para_NumberedList: if (p->type == para_Bullet) { fprintf(fp, ".IP \"\\fBo\\fP\"\n"); /* FIXME: configurable? */ } else if (p->type == para_NumberedList) { fprintf(fp, ".IP \""); man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES, conf.charset); fprintf(fp, "\"\n"); } else if (p->type == para_Description) { /* * Do nothing; the .xP for this paragraph is the .IP * which has come before it in the DescribedThing. */ } else if (p->type == para_BiblioCited) { fprintf(fp, ".IP \""); man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES, conf.charset); fprintf(fp, "\"\n"); } man_text(fp, p->words, TRUE, 0, conf.charset); break; case para_DescribedThing: fprintf(fp, ".IP \""); man_text(fp, p->words, FALSE, QUOTE_QUOTES, conf.charset); fprintf(fp, "\"\n"); break; case para_Rule: /* * This isn't terribly good. Anyone who wants to do better * should feel free! */ fprintf(fp, ".PP\n----------------------------------------\n"); break; case para_LcontPush: case para_QuotePush: fprintf(fp, ".RS\n"); break; case para_LcontPop: case para_QuotePop: fprintf(fp, ".RE\n"); break; } /* * Tidy up. */ fclose(fp); man_conf_cleanup(conf); } /* * Convert a wide string into a string of chars; mallocs the * resulting string and stores a pointer to it in `*result'. * * If `state' is non-NULL, updates the charset state pointed to. If * `state' is NULL, this function uses its own state, initialises * it from scratch, and cleans it up when finished. If `state' is * non-NULL but _s_ is NULL, cleans up a provided state. * * Return is nonzero if all characters are OK. If not all * characters are OK but `result' is non-NULL, a result _will_ * still be generated! * * This function also does escaping of groff special characters. */ static int man_convert(wchar_t const *s, int maxlen, char **result, int quote_props, int charset, charset_state *state) { charset_state internal_state = CHARSET_INIT_STATE; int slen, err; char *p = NULL, *q; int plen = 0, psize = 0; rdstringc out = {0, 0, NULL}; if (!state) state = &internal_state; slen = (s ? ustrlen(s) : 0); if (slen > maxlen && maxlen > 0) slen = maxlen; psize = 384; plen = 0; p = mknewa(char, psize); err = 0; while (slen > 0) { int ret = charset_from_unicode(&s, &slen, p+plen, psize-plen, charset, state, (err ? NULL : &err)); if (ret > 0) { plen += ret; if (psize - plen < 256) { psize = plen + 256; p = resize(p, psize); } } } if (state == &internal_state || s == NULL) { int ret = charset_from_unicode(NULL, 0, p+plen, psize-plen, charset, state, NULL); if (ret > 0) plen += ret; } for (q = p; q < p+plen; q++) { if (q == p && (*q == '.' || *q == '\'') && (quote_props & QUOTE_INITCTRL)) { /* * Control character (. or ') at the start of a * line. Quote it by putting \& (troff zero-width * space) before it. */ rdaddc(&out, '\\'); rdaddc(&out, '&'); } else if (*q == '\\') { /* * Quote backslashes by doubling them, always. */ rdaddc(&out, '\\'); } else if (*q == '"' && (quote_props & QUOTE_QUOTES)) { /* * Double quote within double quotes. Quote it by * doubling. */ rdaddc(&out, '"'); } rdaddc(&out, *q); } sfree(p); if (out.text) *result = rdtrimc(&out); else *result = dupstr(""); return !err; } static void man_rdaddwc(rdstringc *rs, word *text, word *end, int quote_props, int charset, charset_state *state) { char *c; for (; text && text != end; text = text->next) switch (text->type) { case word_HyperLink: case word_HyperEnd: case word_UpperXref: case word_LowerXref: case word_XrefEnd: case word_IndexRef: break; case word_Normal: case word_Emph: case word_Code: case word_WeakCode: case word_WhiteSpace: case word_EmphSpace: case word_CodeSpace: case word_WkCodeSpace: case word_Quote: case word_EmphQuote: case word_CodeQuote: case word_WkCodeQuote: assert(text->type != word_CodeQuote && text->type != word_WkCodeQuote); if (towordstyle(text->type) == word_Emph && (attraux(text->aux) == attr_First || attraux(text->aux) == attr_Only)) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ man_convert(NULL, 0, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); *state = charset_init_state; rdaddsc(rs, "\\fI"); } else if ((towordstyle(text->type) == word_Code || towordstyle(text->type) == word_WeakCode) && (attraux(text->aux) == attr_First || attraux(text->aux) == attr_Only)) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ man_convert(NULL, 0, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); *state = charset_init_state; rdaddsc(rs, "\\fB"); } if (removeattr(text->type) == word_Normal) { charset_state s2 = *state; if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ if (man_convert(text->text, 0, &c, quote_props, charset, &s2) || !text->alt) { rdaddsc(rs, c); *state = s2; } else { man_rdaddwc(rs, text->alt, NULL, quote_props, charset, state); } sfree(c); } else if (removeattr(text->type) == word_WhiteSpace) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ man_convert(L" ", 1, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); } else if (removeattr(text->type) == word_Quote) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ man_convert(L"\"", 1, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); } if (towordstyle(text->type) != word_Normal && (attraux(text->aux) == attr_Last || attraux(text->aux) == attr_Only)) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ man_convert(NULL, 0, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); *state = charset_init_state; rdaddsc(rs, "\\fP"); } break; } man_convert(NULL, 0, &c, quote_props, charset, state); rdaddsc(rs, c); sfree(c); } static void man_text(FILE *fp, word *text, int newline, int quote_props, int charset) { rdstringc t = { 0, 0, NULL }; charset_state state = CHARSET_INIT_STATE; man_rdaddwc(&t, text, NULL, quote_props | QUOTE_INITCTRL, charset, &state); fprintf(fp, "%s", t.text); sfree(t.text); if (newline) fputc('\n', fp); } static void man_codepara(FILE *fp, word *text, int charset) { fprintf(fp, ".nf\n"); for (; text; text = text->next) if (text->type == word_WeakCode) { char *c; wchar_t *t, *e; int quote_props = QUOTE_INITCTRL; t = text->text; if (text->next && text->next->type == word_Emph) { e = text->next->text; text = text->next; } else e = NULL; while (e && *e && *t) { int n; int ec = *e; for (n = 0; t[n] && e[n] && e[n] == ec; n++); if (ec == 'i') fprintf(fp, "\\fI"); else if (ec == 'b') fprintf(fp, "\\fB"); man_convert(t, n, &c, quote_props, charset, NULL); quote_props &= ~QUOTE_INITCTRL; fprintf(fp, "%s", c); sfree(c); if (ec == 'i' || ec == 'b') fprintf(fp, "\\fP"); t += n; e += n; } man_convert(t, 0, &c, quote_props, charset, NULL); fprintf(fp, "%s\n", c); sfree(c); } fprintf(fp, ".fi\n"); }