/* * man page backend for Halibut */ #include #include #include #include "halibut.h" static void man_text(FILE *, word *, int newline, int quote_props); static void man_codepara(FILE *, word *); #define QUOTE_INITCTRL 1 /* quote initial . and ' on a line */ #define QUOTE_QUOTES 2 /* quote double quotes by doubling them */ void man_backend(paragraph *sourceform, keywordlist *keywords, indexdata *idx) { paragraph *p; FILE *fp; char const *sep; IGNORE(keywords); /* we don't happen to need this */ IGNORE(idx); /* or this */ /* * Determine the output file name, and open the output file * * FIXME: want configurable output file names here. For the * moment, we'll just call it `output.1'. */ fp = fopen("output.1", "w"); if (!fp) { error(err_cantopenw, "output.1"); return; } /* Do the version ID */ for (p = sourceform; p; p = p->next) if (p->type == para_VersionID) { fprintf(fp, ".\\\" "); man_text(fp, p->words, TRUE, 0); } /* FIXME: .TH name-of-program manual-section */ fprintf(fp, ".TH FIXME 1\n"); fprintf(fp, ".UC\n"); /* Do the preamble and copyright */ sep = ""; for (p = sourceform; p; p = p->next) if (p->type == para_Preamble) { fprintf(fp, "%s", sep); man_text(fp, p->words, TRUE, 0); sep = "\n"; } for (p = sourceform; p; p = p->next) if (p->type == para_Copyright) { fprintf(fp, "%s", sep); man_text(fp, p->words, TRUE, 0); sep = "\n"; } /* * FIXME: * * - figure out precisely what needs to be escaped. * * A dot or apostrophe at the start of a line wants to be * preceded by `\&', which is a zero-width space. * * Literal backslashes always want doubling. * * Within double quotes, a double quote needs doubling * too. * * - work out what to do about hyphens / minuses... */ for (p = sourceform; p; p = p->next) switch (p->type) { /* * Things we ignore because we've already processed them or * aren't going to touch them in this pass. */ case para_IM: case para_BR: case para_Biblio: /* only touch BiblioCited */ case para_VersionID: case para_Copyright: case para_Preamble: case para_NoCite: case para_Title: break; /* * Headings. */ case para_Chapter: case para_Appendix: case para_UnnumberedChapter: case para_Heading: case para_Subsect: fprintf(fp, ".SH \""); /* FIXME: disable this, at _least_ by default */ if (p->kwtext) man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES); fprintf(fp, " "); man_text(fp, p->words, FALSE, QUOTE_QUOTES); fprintf(fp, "\"\n"); break; /* * Code paragraphs. */ case para_Code: fprintf(fp, ".PP\n"); man_codepara(fp, p->words); break; /* * Normal paragraphs. */ case para_Normal: fprintf(fp, ".PP\n"); man_text(fp, p->words, TRUE, 0); break; /* * List paragraphs. */ case para_Description: case para_BiblioCited: case para_Bullet: case para_NumberedList: if (p->type == para_Bullet) { fprintf(fp, ".IP \"\\fBo\\fP\"\n"); /* FIXME: configurable? */ } else if (p->type == para_NumberedList) { fprintf(fp, ".IP \""); man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES); fprintf(fp, "\"\n"); } else if (p->type == para_Description) { /* * Do nothing; the .xP for this paragraph is the .IP * which has come before it in the DescribedThing. */ } else if (p->type == para_BiblioCited) { fprintf(fp, ".IP \""); man_text(fp, p->kwtext, FALSE, QUOTE_QUOTES); fprintf(fp, "\"\n"); } man_text(fp, p->words, TRUE, 0); break; case para_DescribedThing: fprintf(fp, ".IP \""); man_text(fp, p->words, FALSE, QUOTE_QUOTES); fprintf(fp, "\"\n"); break; case para_Rule: /* * FIXME. */ break; case para_LcontPush: fprintf(fp, ".RS\n"); break; case para_LcontPop: fprintf(fp, ".RE\n"); break; } /* * Tidy up. */ fclose(fp); } /* * Convert a wide string into a string of chars. If `result' is * non-NULL, mallocs the resulting string and stores a pointer to * it in `*result'. If `result' is NULL, merely checks whether all * characters in the string are feasible for the output character * set. * * Return is nonzero if all characters are OK. If not all * characters are OK but `result' is non-NULL, a result _will_ * still be generated! * * FIXME: Here is probably also a good place to do escaping sorts * of things. I know I at least need to escape backslash, and full * stops at the starts of words are probably trouble as well. */ static int man_convert(wchar_t *s, char **result, int quote_props) { /* * FIXME. Currently this is ISO8859-1 only. */ int doing = (result != 0); int ok = TRUE; char *p = NULL; int plen = 0, psize = 0; for (; *s; s++) { wchar_t c = *s; char outc; if ((c >= 32 && c <= 126) || (c >= 160 && c <= 255)) { /* Char is OK. */ outc = (char)c; } else { /* Char is not OK. */ ok = FALSE; outc = 0xBF; /* approximate the good old DEC `uh?' */ } if (doing) { if (plen+3 >= psize) { psize = plen + 256; p = resize(p, psize); } if (plen == 0 && (outc == '.' || outc == '\'') && (quote_props & QUOTE_INITCTRL)) { /* * Control character (. or ') at the start of a * line. Quote it by putting \& (troff zero-width * space) before it. */ p[plen++] = '\\'; p[plen++] = '&'; } else if (outc == '\\') { /* * Quote backslashes by doubling them, always. */ p[plen++] = '\\'; } else if (outc == '"' && (quote_props & QUOTE_QUOTES)) { /* * Double quote within double quotes. Quote it by * doubling. */ p[plen++] = '"'; } p[plen++] = outc; } } if (doing) { p = resize(p, plen+1); p[plen] = '\0'; *result = p; } return ok; } static void man_rdaddwc(rdstringc *rs, word *text, word *end, int quote_props) { char *c; for (; text && text != end; text = text->next) switch (text->type) { case word_HyperLink: case word_HyperEnd: case word_UpperXref: case word_LowerXref: case word_XrefEnd: case word_IndexRef: break; case word_Normal: case word_Emph: case word_Code: case word_WeakCode: case word_WhiteSpace: case word_EmphSpace: case word_CodeSpace: case word_WkCodeSpace: case word_Quote: case word_EmphQuote: case word_CodeQuote: case word_WkCodeQuote: assert(text->type != word_CodeQuote && text->type != word_WkCodeQuote); if (towordstyle(text->type) == word_Emph && (attraux(text->aux) == attr_First || attraux(text->aux) == attr_Only)) rdaddsc(rs, "\\fI"); else if (towordstyle(text->type) == word_Code && (attraux(text->aux) == attr_First || attraux(text->aux) == attr_Only)) rdaddsc(rs, "\\fB"); if (removeattr(text->type) == word_Normal) { if (rs->pos > 0) quote_props &= ~QUOTE_INITCTRL; /* not at start any more */ if (man_convert(text->text, &c, quote_props)) rdaddsc(rs, c); else man_rdaddwc(rs, text->alt, NULL, quote_props); sfree(c); } else if (removeattr(text->type) == word_WhiteSpace) { rdaddc(rs, ' '); } else if (removeattr(text->type) == word_Quote) { rdaddc(rs, quoteaux(text->aux) == quote_Open ? '`' : '\''); /* FIXME: configurability */ } if (towordstyle(text->type) == word_Emph && (attraux(text->aux) == attr_Last || attraux(text->aux) == attr_Only)) rdaddsc(rs, "\\fP"); else if (towordstyle(text->type) == word_Code && (attraux(text->aux) == attr_Last || attraux(text->aux) == attr_Only)) rdaddsc(rs, "\\fP"); break; } } static void man_text(FILE *fp, word *text, int newline, int quote_props) { rdstringc t = { 0, 0, NULL }; man_rdaddwc(&t, text, NULL, quote_props | QUOTE_INITCTRL); fprintf(fp, "%s", t.text); sfree(t.text); if (newline) fputc('\n', fp); } static void man_codepara(FILE *fp, word *text) { fprintf(fp, ".nf\n"); for (; text; text = text->next) if (text->type == word_WeakCode) { char *c; man_convert(text->text, &c, QUOTE_INITCTRL); fprintf(fp, "%s\n", c); sfree(c); } fprintf(fp, ".fi\n"); }