diff options
Diffstat (limited to 'nx-X11/extras/rman/rman.c')
-rw-r--r-- | nx-X11/extras/rman/rman.c | 4974 |
1 files changed, 0 insertions, 4974 deletions
diff --git a/nx-X11/extras/rman/rman.c b/nx-X11/extras/rman/rman.c deleted file mode 100644 index 1f0d540ba..000000000 --- a/nx-X11/extras/rman/rman.c +++ /dev/null @@ -1,4974 +0,0 @@ -#ifdef UNDEF -static char cvsid[] = "Header: /usr/build/rman/rman-031225/phelps/RCS/rman.c,v 1.154 2003/07/26 19:00:48 phelps Exp $"; -#endif - -/* - PolyglotMan by Thomas A. Phelps (phelps@ACM.org) - - accept man pages as formatted by (10) - Hewlett-Packard HP-UX, AT&T System V, SunOS, Sun Solaris, OSF/1, - DEC Ultrix, SGI IRIX, Linux, FreeBSD, SCO - - output as (9) - printable ASCII, section headers only, TkMan, [tn]roff, HTML, - LaTeX, LaTeX2e, RTF, Perl pod, MIME, DocBook XML - - written March 24, 1993 - bs2tk generalized into RosettaMan November 4-5, 1993 - source interpretation added September 24, 1996 - renamed PolyglotMan due to lawsuit by Rosetta, Inc. August 8, 1997 -*/ -/* $XFree86: xc/extras/rman/rman.c,v 1.18 2003/10/22 19:50:36 tsi Exp $ */ - -#include <unistd.h> -#include <stdio.h> -#include <string.h> -#include <ctype.h> -#include <stdlib.h> -#include <assert.h> -#include <sys/types.h> -#include <sys/stat.h> -#include <fcntl.h> - -#if defined(Lynx) || defined(__QNXNTO__) -extern int optind; -extern char *optarg; -#endif -#ifdef __CYGWIN__ -#include <getopt.h> -#endif - -/*** make #define's into consts? => can't because compilers not smart enough ***/ -/* maximum number of tags per line */ -#define MAXTAGS 50*100 -#define MAXBUF 2*5000 -#define MAXLINES 20000 -#define MAXTOC 500 -#define xputchar(c) (fcharout? putchar(c): (c)) -#define sputchar(c) (fcharout? plain[sI++]=(char)c: (char)(c)) -#define stagadd(tag) tagadd(tag,sI,0) -enum { c_dagger='\xa7', c_bullet='\xb7', c_plusminus='\xb1' }; - - -/*** tag management ***/ - -enum tagtype { NOTAG, TITLE, ITALICS, BOLD, SYMBOL, SMALLCAPS, BOLDITALICS, MONO, MANREF }; /* MANREF last */ -struct { enum tagtype type; int first; int last; } tags[MAXTAGS], tagtmp; -int tagc=0; -struct { char *text; int type; int line; } toc[MAXTOC]; -int tocc=0; - - -/* characters in this list automatically prefixed by a backslash (set in output format function */ -char *escchars=""; -char *vollist = VOLLIST; -const char *manvalid = "._-+:"; /* in addition to alphanumerics, valid characters to find in a man page name */ -char *manrefname; -char *manrefsect; - -enum command { - NOCOMMAND=-1, - - /*BEGINCHARTAGS,*/ - CHARTAB='\t', - CHARPERIOD='.', CHARLSQUOTE='`', CHARRSQUOTE='\'', CHARGT='>', CHARLT='<', - CHARAMP='&', CHARBACKSLASH='\\', CHARDASH='-', CHARHAT='^', CHARVBAR='|', - CHARNBSP=0xa0, CHARCENT=0xa2, CHARSECT=0xa7, CHARCOPYR=0xa9, CHARNOT=0xac, - CHARDAGGER=0xad, CHARREGTM=0xae, CHARDEG=0xb0, CHARPLUSMINUS=0xb1, - CHARACUTE=0xb4, CHARBULLET=0xb7, CHAR14=0xbc, CHAR12=0xbd, CHAR34=0xbe, - CHARMUL=0xd7, CHARDIV=0xf7, - CHANGEBAR=0x100, CHARLQUOTE, CHARRQUOTE, - /*ENDCHARTAGS,*/ - - /*BEGINFONTTAGS,*/ - BEGINBOLD, ENDBOLD, BEGINITALICS, ENDITALICS, BEGINBOLDITALICS, ENDBOLDITALICS, - BEGINSC, ENDSC, BEGINY, ENDY, BEGINCODE, ENDCODE, BEGINMANREF, ENDMANREF, - FONTSIZE, - /*ENDFONTTAGS*/ - - /*BEGINLAYOUTTAGS,*/ - ITAB, BEGINCENTER, ENDCENTER, HR, - /*ENDLAYOUTTAGS,*/ - - /*BEGINSTRUCTTAGS,*/ - BEGINDOC, ENDDOC, BEGINCOMMENT, ENDCOMMENT, COMMENTLINE, BEGINBODY, ENDBODY, - BEGINHEADER, ENDHEADER, BEGINFOOTER, ENDFOOTER, BEGINLINE, ENDLINE, SHORTLINE, - BEGINSECTION, ENDSECTION, BEGINSUBSECTION, ENDSUBSECTION, - BEGINSECTHEAD, ENDSECTHEAD, BEGINSUBSECTHEAD, ENDSUBSECTHEAD, - BEGINBULPAIR, ENDBULPAIR, BEGINBULLET, ENDBULLET, BEGINBULTXT, ENDBULTXT, - BEGINTABLE, ENDTABLE, BEGINTABLELINE, ENDTABLELINE, BEGINTABLEENTRY, ENDTABLEENTRY, - BEGININDENT, ENDINDENT, BEGINCODEBLOCK, ENDCODEBLOCK, - - BEGINDIFFA, ENDDIFFA, BEGINDIFFD, ENDDIFFD - /*,*//*ENDSTRUCTTAGS,*/ -}; - -const char *tcltkOP[] = { "Command-Line Name", "Database Name", "Database Class" }; - - -/* characters that need special handling in any output format, *more than just a backslash* */ -/* characters in this list need a corresponding case statement in each output format */ -/*char *trouble="\t.`'><&\\^|-\xa7\xb7\xb1";*/ -const unsigned char trouble[]= { CHARTAB, CHARPERIOD, CHARLSQUOTE, CHARRSQUOTE, - CHARGT, CHARLT, CHARAMP, CHARBACKSLASH, CHARDASH, CHARHAT, CHARVBAR, CHARCENT, - CHARSECT, CHARCOPYR, CHARNOT, CHARDAGGER, CHARREGTM, CHARDEG, CHARPLUSMINUS, - CHARACUTE, CHARBULLET, CHAR14, CHAR12, CHAR34, CHARMUL, CHARDIV, - 0 }; - - -enum command tagbeginend[][2] = { /* parallel to enum tagtype */ - { NOCOMMAND, NOCOMMAND }, - { NOCOMMAND, NOCOMMAND }, - { BEGINITALICS, ENDITALICS }, - { BEGINBOLD, ENDBOLD }, - { BEGINY, ENDY }, - { BEGINSC, ENDSC }, - { BEGINBOLDITALICS, ENDBOLDITALICS }, - { NOCOMMAND, NOCOMMAND }, - { BEGINMANREF, ENDMANREF } -}; - -void (*fn)(enum command) = NULL; -enum command prevcmd = BEGINDOC; - - -/*** globals ***/ - -int fSource=-1; /* -1 => not determined yet */ -int finlist=0; -int fDiff=0; -FILE *difffd; -char diffline[MAXBUF]; -char diffline2[MAXBUF]; -char *message = NULL; -int fontdelta=0; -int intArg; - -int fPara=0; /* line or paragraph groupings of text */ -int fSubsections=0; /* extract subsection titles too? */ -int fChangeleft=0; /* move change bars to left? (-1 => delete them) */ -int fReflow=0; -int fURL=0; /* scan for URLs too? */ -#if 0 -int fMan=1; /* invoke agressive man page filtering? */ -#endif -int fQS=0; /* squeeze out spaces (scnt and interword)? */ -int fIQS=0; /* squeeze out initial spaces (controlled separately from fQS) */ -int fILQS=0; /* squeeze out spaces for usual indent */ -int fHeadfoot=0; /* show canonical header and footer at bottom? */ -int falluc=0; -int itabcnt=0; -int fQuiet=0; -int fTclTk=0; - -/* patterns observed in section heads that don't conform to first-letter-uppercase-rest-lowercase pattern (stay all uc, or go all lc, or have subsequent uc) */ -int lcexceptionslen = -1; /* computed by system */ -char *lcexceptions[] = { -/* new rule: double/all consonants == UC? */ - /* articles, verbs, conjunctions, prepositions, pronouns */ - "a", "an", "the", - "am", "are", "is", "were", - "and", "or", - "by", "for", "from", "in", "into", "it", "of", "on", "to", "with", - "that", "this", - - /* terms */ - "API", "CD", "GUI", "UI", /*I/O=>I/O already*/ "ID", "IDs", "OO", - "IOCTLs", "IPC", "RPC", - - /* system names */ - "AWK", "cvs", "rcs", "GL", "vi", "PGP", "QuickTime", "DDD", "XPG/3", - "NFS", "NIS", "NIS+", "AFS", - "UNIX", "SysV", - "Xorg", "XOrg", "X.Org", "XFree86", "ICCCM", - "MH", "MIME", - "TeX", "LaTeX", "PicTeX", - "PostScript", "EPS", "EPSF", "EPSI", - "HTML", "URL", "WWW", - - /* institution names */ - "ANSI", "CERN", "GNU", "ISO", "NCSA", - - /* Sun-specific */ - "MT-Level", "SPARC", - - NULL -}; - - -int TabStops=8; -int hanging=0; /* location of hanging indent (if ==0, none) */ -enum { NAME, SYNOPSIS, DESCRIPTION, SEEALSO, FILES, AUTHOR, RANDOM/*last!*/ }; -char *sectheadname[] = { - "NAME:NOMBRE", "SYNOPSIS", "DESCRIPTION:INTRODUCTION", "SEE ALSO:RELATED INFORMATION", "FILES", "AUTHOR:AUTHORS", "RANDOM" -}; -int sectheadid = RANDOM; -int oldsectheadid = RANDOM; - -int fCodeline=0; -int fNOHY=0; /* re-linebreak so no words are hyphenated; not used by TkMan, but gotta keep for people converting formatted text */ -int fNORM=0; /* normalize? initial space => tabs, no changebars, exactly one blank line between sections */ -const char TABLEOFCONTENTS[] = "Table of Contents"; -const char HEADERANDFOOTER[] = "Header and Footer"; -char manName[80] = "man page"; -char manSect[10] = "1"; -const char PROVENANCE[] = - "manual page source format generated by PolyglotMan v" POLYGLOTMANVERSION; -const char HOME[] = "available at http://polyglotman.sourceforge.net/"; -const char horizontalrule[] = "------------------------------------------------------------"; - -const int LINEBREAK = 70; -int linelen = 0; /* length of result in plain[] */ -int spcsqz; /* number of spaces squeezed out */ -int ccnt = 0; /* # of changebars */ -int scnt, scnt2; /* counts of initial spaces in line */ -int s_sum, s_cnt; -int bs_sum, bs_cnt; -int ncnt=0, oncnt=0; /* count of interline newlines */ -int CurLine=1; -int AbsLine=1-1; /* absolute line number */ -int indent=0; /* global indentation */ -int lindent=0; /* usual local indent */ -int auxindent=0; /* aux indent */ -int I; /* index into line/paragraph */ -int fcharout=1; /* show text or not */ -char lookahead; -/*int tabgram[MAXBUF];*/ /* histogram of first character positions */ -char buf[MAXBUF]; -char plain[MAXBUF]; /* current text line with control characters stripped out */ -char hitxt[MAXBUF]; /* highlighted text (available at time of BEGIN<highlight> signal */ - -char header[MAXBUF]; /* complete line */ -char header2[MAXBUF]; /* SGIs have two lines of headers and footers */ -char header3[MAXBUF]; /* GNU and some others have a third! */ -char footer[MAXBUF]; -char footer2[MAXBUF]; -#define CRUFTS 5 -char *cruft[CRUFTS] = { header, header2, header3, footer, footer2 }; - -char *File, *in; /* File = pointer to full file contents, in = current file pointer */ -char *argv0; -int finTable=0; -char tableSep='\0'; /*\t';*/ -/*int fTable=0; -int fotable=0;*/ -char *tblcellformat; -int tblcellspan; -/*int tblspanmax;*/ -int listtype=-1; /* current list type bogus to begin with */ -enum listtypes { DL, OL, UL }; - -int fIP=0; - - - -/*** utility functions ***/ - - -/* case insensitive versions of strcmp and strncmp */ - -static int -stricmp(const char *s1, const char *s2) -{ - assert(s1!=NULL && s2!=NULL); - /*strincmp(s1, s2, strlen(s1)+1);*/ - - while (tolower(*s1)==tolower(*s2)) { - if (*s1=='\0' /*&& *s2=='\0'*/) return 0; - s1++; s2++; - } - - if (tolower(*s1)<tolower(*s2)) return -1; - else return 1; -} - -static int -lcexceptionscmp(const void *a, const void *b) -{ - return stricmp(*(char **)a, *(char **)b); -} - -static int -strincmp(const char *s1, const char *s2, size_t n) -{ - assert(s1!=NULL && s2!=NULL && n>0); - - while (n>0 && tolower(*s1)==tolower(*s2)) { - n--; s1++; s2++; - } - if (n==0) return 0; - else if (tolower(*s1)<tolower(*s2)) return -1; - else return 1; -} - -/* compare string and a colon-separated list of strings */ -static int -strcoloncmp2(char *candidate, int end, const char *list, int sen) -{ - const char *l = list; - char *c,c2; - - assert(candidate!=NULL && list!=NULL); - assert(end>=-1 && end<=255); - assert(sen==0 || sen==1); - - if (*l==':') l++; /* tolerate a leading colon */ - - /* invariant: c and v point to start of strings to compare */ - while (*l) { - assert(l==list || l[-1]==':'); - for (c=candidate; *c && *l; c++,l++) - if ((sen && *c!=*l) || (!sen && tolower(*c)!=tolower(*l))) - break; - - /* if candidate matches a valid one as far as valid goes, it's a keeper */ - if ((*l=='\0' || *l==':') && (*c==end || end==-1)) { - if (*c=='\b') { - c2 = c[-1]; - while (*c=='\b' && c[1]==c2) c+=2; - } - /* no volume qualifiers with digits */ - if (!isdigit(*c)) return 1; - } - - /* bump to start of next valid */ - while (*l && *l++!=':') /* nada */; - } - - return 0; -} - -static int -strcoloncmp(char *candidate, int end, const char *list) -{ - int sen=1; - const char *l = list; - - assert(candidate!=NULL && list!=NULL); - assert(end>=-1 && end<=255); - - if (*l=='=') l++; else end=-1; - if (*l=='i') { sen=0; l++; } - - return strcoloncmp2(candidate, end, l, sen); -} - -/* strdup not universally available */ -static char * -mystrdup(const char *p) -{ - char *q; - - if (p==NULL) return NULL; - - q = malloc(strlen(p)+1); /* +1 gives space for \0 that is not reported by strlen */ - if (q!=NULL) strcpy(q,p); - return q; -} - - -/* given line of text, return "casified" version in place: - if word in exceptions list, return exception conversion - else uc first letter, lc rest -*/ -static void -casify(char *p) -{ - char tmpch, *q, **exp; - int fuc; - - for (fuc=1; *p; p++) { - if (isspace(*p) || strchr("&/",*p)!=NULL) fuc=1; - else if (fuc) { - /* usually */ - if (p[1] && isupper(p[1]) /*&& p[2] && isupper(p[2])*/) fuc=0; - /* check for exceptions */ - for (q=p; *q && !isspace(*q); q++) /*nada*/; - tmpch = *q; *q='\0'; - exp = (char **)bsearch(&p, lcexceptions, lcexceptionslen, sizeof(char *), lcexceptionscmp); - *q = tmpch; - if (exp!=NULL) { - for (q=*exp; *q; q++) *p++=*q; - fuc = 1; - } - } else *p=tolower(*p); - } -} - - -/* add an attribute tag to a range of characters */ - -static void -tagadd(int /*enum tagtype--abused in source parsing*/ type, int first, int last) -{ - assert(type!=NOTAG); - - if (tagc<MAXTAGS) { - tags[tagc].type = (enum tagtype)type; - tags[tagc].first = first; - tags[tagc].last = last; - tagc++; - } -} - - -/* - collect all saves to string table one one place, so that - if decide to go with string table instead of multiple malloc, it's easy - (probably few enough malloc's that more sophistication is unnecessary) -*/ - -static void -tocadd(char *text, enum command type, int line) -{ - char *r; - - assert(text!=NULL && strlen(text)>0); - assert(type==BEGINSECTION || type==BEGINSUBSECTION); - - if (tocc<MAXTOC) { - r = malloc(strlen(text)+1); if (r==NULL) return; - strcpy(r,text); - toc[tocc].text = r; - toc[tocc].type = type; - toc[tocc].line = line; - tocc++; - } -} - - - -char *manTitle = MANTITLEPRINTF; -char *manRef = MANREFPRINTF; -char *href; -int fmanRef=1; /* make 'em links or just show 'em? */ - -static void -manrefextract(char *p) -{ - char *p0; - static char *nonhref = "\">'"; - static char *punct = ".,:;)]}?!"; - - while (*p==' ') p++; - if (strincmp(p,"http",4)==0) { - href="%s"; manrefname = p; - p+=4; - while (*p && !isspace(*p) && !strchr(nonhref,*p)) p++; - while (strchr(punct, *(p - 1))) p--; - } else { - href = manRef; - - manrefname = p; - while (*p && *p!=' ' && *p!='(') p++; *p++='\0'; - while (*p==' ' || *p=='(') p++; p0=p; -#if defined(XOrg) || defined(XFree86) - /* Don't allow a letter after the man section number */ - p++; -#else - while (*p && *p!=')') p++; -#endif - manrefsect = p0; - } - *p='\0'; -} - - - - -/* - * OUTPUT FORMATS - */ - -static void -formattedonly(void) -{ - fprintf(stderr, "The output formats for Tk and TkMan require nroff-formatted input\n"); - exit(1); -} - - -/* - * DefaultFormat -- in weak OO inheritance, top of hierarchy for everybody - */ -static void -DefaultFormat(enum command cmd) -{ - int i; - - switch (cmd) { - case ITAB: - for (i=0; i<itabcnt; i++) putchar('\t'); - break; - default: - /* nada */ - break; - } -} - - -/* - * DefaultLine -- in weak OO inheritance, top of hierarchy for line-based formats - * for output format to "inherit", have "default: DefaultLine(cmd)" and override case statement "methods" - */ - -static void -DefaultLine(enum command cmd) { - switch (cmd) { - default: - DefaultFormat(cmd); - } -} - - -/* - * DefaultPara -- top of hierarchy for output formats that are formatted by their viewers - */ - -static void -DefaultPara(enum command cmd) -{ - switch (cmd) { - default: - DefaultFormat(cmd); - } -} - - - -/* - * Tk -- just emit list of text-tags pairs - */ - -static void -Tk(enum command cmd) -{ - static int skip=0; /* skip==1 when line has no text */ - int i; - - if (fSource) formattedonly(); - - /* invariant: always ready to insert text */ - - switch (cmd) { - case BEGINDOC: - I=0; CurLine=1; - escchars = "\"[]$"; - printf(/*$t insert end */ "\""); - break; - case ENDDOC: - if (fHeadfoot) { -/* grr, should have +mark syntax for Tk text widget! -- maybe just just +sect#, +subsect# - printf("\\n\\n\" {} \"%s\\n\" {+headfoot h2}\n", HEADERANDFOOTER); -*/ - printf("\\n\\n\" {} \"%s\\n\" h2\n",HEADERANDFOOTER); - /*printf("$t mark set headfoot %d.0\n", CurLine);*/ - CurLine++; - - for (i=0; i<CRUFTS; i++) { - if (*cruft[i]) { - printf(/*$t insert end */"{%s} sc \\n\n", cruft[i]); - CurLine++; - } - } - } else printf("\"\n"); - break; - - case COMMENTLINE: printf("# "); break; - - case BEGINLINE: - /*I=0; -- need to do this at end of line so set for filterline() */ - /* nothing to do at start of line except catch up on newlines */ - for (i=0; i<ncnt; i++) printf("\\n"); - CurLine+=ncnt; - /*if (fSource) for (i=0; i<indent; i++) putchar('\t');*/ - break; - case ENDLINE: - /*if (!fSource) {*/ - if (!skip) /*if (ncnt)*/ printf("\\n"); /*else xputchar(' ');*/ - skip=0; - CurLine++; I=0; - /* - } else { - putchar(' '); I++; - } - */ - break; - - case ENDSECTHEAD: - printf("\\n\" h2 \""); - tagc=0; - skip=1; - break; - case ENDSUBSECTHEAD: - printf("\\n\" h3 \""); /* add h3? */ - tagc=0; - skip=1; - break; - case HR: /*printf("\\n%s\\n", horizontalrule); CurLine+=2; I=0;*/ break; - case BEGINTABLEENTRY: - /*if (fSource) putchar('\t');*/ - break; - case BEGINTABLELINE: - case ENDTABLEENTRY: - break; - case ENDTABLELINE: - printf("\" tt \""); - /*tagadd(MONO, 0, I);*/ - break; - - case CHANGEBAR: putchar('|'); I++; break; - case CHARLQUOTE: - case CHARRQUOTE: - putchar('\\'); putchar('"'); I++; - break; - case CHARLSQUOTE: - case CHARRSQUOTE: - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARLT: - case CHARGT: - case CHARHAT: - case CHARVBAR: - case CHARAMP: - case CHARPLUSMINUS: - case CHARNBSP: - case CHARCENT: - case CHARSECT: - case CHARCOPYR: - case CHARNOT: - case CHARREGTM: - case CHARDEG: - case CHARACUTE: - case CHAR14: - case CHAR12: - case CHAR34: - case CHARMUL: - case CHARDIV: - putchar(cmd); I++; break; - case CHARDAGGER: - putchar('+'); I++; break; - case CHARBACKSLASH: printf("\\\\"); I++; break; - case CHARBULLET: printf("\" {} %c symbol \"",c_bullet); I++; break; - - - case BEGINSECTHEAD: - case BEGINSUBSECTHEAD: - /*if (fSource && sectheadid!=NAME) { printf("\\n\\n"); CurLine+=2; I=0; }*/ - tagc=0; /* section and subsection formatting controlled descriptively */ - /* no break;*/ - - case BEGINBOLD: - case BEGINITALICS: - case BEGINBOLDITALICS: - case BEGINCODE: - case BEGINY: - case BEGINSC: - case BEGINMANREF: - /* end text, begin attributed text */ - printf("\" {} \""); - break; - - /* rely on the fact that no more than one tag per range of text */ - case ENDBOLD: printf("\" b \""); break; - case ENDITALICS: printf("\" i \""); break; - case ENDBOLDITALICS: printf("\" bi \""); break; - case ENDCODE: printf("\" tt \""); break; - case ENDY: printf("\" symbol \""); break; - case ENDSC: printf("\" sc \""); break; - case ENDMANREF: printf("\" manref \""); break; - /* presentation attributes dealt with at end of line */ - - case BEGINBODY: - /*if (fSource) { printf("\\n\\n"); CurLine+=2; I=0; }*/ - break; - case SHORTLINE: - /*if (fSource) { printf("\\n"); CurLine++; I=0; }*/ - break; - case ENDBODY: - case BEGINBULPAIR: case ENDBULPAIR: - /*if (fSource) { printf("\\n"); CurLine++; I=0; }*/ - break; - case BEGINBULTXT: - /*if (fSource) putchar('\t');*/ - break; - case BEGINBULLET: case ENDBULLET: - case ENDBULTXT: - case BEGINSECTION: case ENDSECTION: - case BEGINSUBSECTION: case ENDSUBSECTION: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case BEGINTABLE: case ENDTABLE: - case FONTSIZE: - case BEGININDENT: case ENDINDENT: - /* no action */ - break; - default: - DefaultLine(cmd); - } -} - - -/* - * TkMan -- Tk format wrapped with commands - */ - -int linetabcnt[MAXLINES]; /* don't want to bother with realloc */ -int clocnt=0, clo[MAXLINES]; -int paracnt=0, para[MAXLINES]; -int rebuscnt=0, rebus[MAXLINES]; -int rebuspatcnt=0, rebuspatlen[25]; -char *rebuspat[25]; - -static void -TkMan(enum command cmd) -{ - static int lastscnt=-1; - static int lastlinelen=-1; - static int lastsect=0; - /*static int coalese=0;*/ - static int finflow=0; - int i; - char c,*p; - - /* invariant: always ready to insert text */ - - switch (cmd) { - case BEGINDOC: - printf("$t insert end "); /* opening quote supplied in Tk() below */ - Tk(cmd); - break; - case ENDDOC: - Tk(ENDLINE); - - if (fHeadfoot) { -/* grr, should have +mark syntax for Tk text widget! - printf("\\n\\n\" {} \"%s\\n\" {+headfoot h2}\n", HEADERANDFOOTER); -*/ - printf("\\n\\n\" {} \"%s\\n\" h2\n", HEADERANDFOOTER); -/* printf("$t mark set headfoot end-2l\n");*/ - CurLine++; - - for (i=0; i<CRUFTS; i++) { - if (*cruft[i]) { - printf("$t insert end {%s} sc \\n\n", cruft[i]); - CurLine++; - } - } - } else printf("\"\n"); - -/* - printf("$t insert 1.0 {"); - for (i=0; i<MAXBUF; i++) if (tabgram[i]) printf("%d=%d, ", i, tabgram[i]); - printf("\\n\\n}\n"); -*/ - - printf("set manx(tabcnts) {"); for (i=1; i<CurLine; i++) printf("%d ", linetabcnt[i]); printf("}\n"); - printf("set manx(clo) {"); for (i=0; i<clocnt; i++) printf("%d ", clo[i]); printf("}\n"); - printf("set manx(para) {"); for (i=0; i<paracnt; i++) printf("%d ", para[i]); printf("}\n"); - printf("set manx(reb) {"); for (i=0; i<rebuscnt; i++) printf("%d ", rebus[i]); printf("}\n"); - - break; - - case BEGINCOMMENT: fcharout=0; break; - case ENDCOMMENT: fcharout=1; break; - case COMMENTLINE: break; - - case ENDSECTHEAD: - case ENDSUBSECTHEAD: - lastsect=1; - Tk(cmd); - break; - - case BEGINLINE: - Tk(cmd); - linetabcnt[CurLine] = itabcnt; - /* old pattern for command line options "^\\|*\[ \t\]+-\[^-\].*\[^ \t\]" */ - c = plain[0]; - if (linelen>=2 && ((c=='-' || c=='%' || c=='\\' || c=='$' /**/ /* not much talk of money in man pages so reasonable */) && (isalnum(plain[1]) /*<= plain[1]!='-'*//*no dash*/ || ncnt/*GNU long option*/) && plain[1]!=' ') ) clo[clocnt++] = CurLine; - /* - would like to require second letter to be a capital letter to cut down on number of matches, - but command names usually start with lowercase letter - maybe use a uppercase requirement as secondary strategy, but probably not - */ - if ((ncnt || lastsect) && linelen>0 && scnt>0 && scnt<=7/*used to be <=5 until groff spontaneously started putting in 7*/) para[paracnt++] = CurLine; - lastsect=0; - - - /* rebus too, instead of search through whole Tk widget */ - if (rebuspatcnt && scnt>=5 /* not sect or subsect heads */) { - for (p=plain; *p && *p!=' '; p++) /*empty*/; /* never first word */ - while (*p) { - for (i=0; i<rebuspatcnt; i++) { - if (tolower(*p) == tolower(*rebuspat[i]) && strincmp(p, rebuspat[i], rebuspatlen[i])==0) { - /* don't interfere with man page refs */ - for (; *p && !isspace(*p); p++) if (*p=='(') continue; - rebus[rebuscnt++] = CurLine; - p=""; /* break for outer */ - break; /* just locating any line with any rebus, not exact positions */ - } - } - /* just check start of words, though doesn't have to be full word (if did, could use strlen rather than strnlen) */ - while (*p && *p!=' ') p++; - while (*p && *p==' ') p++; - } - } - - - if (fReflow && !ncnt && (finflow || lastlinelen>50) && (abs(scnt-lastscnt)<=1 || abs(scnt-hanging)<=1)) { - finflow=1; - putchar(' '); - } else { - Tk(ENDLINE); - /*if ((CurLine&0x3f)==0x3f) printf("\"\nupdate idletasks\n$t insert end \""); blows up some Tk text buffer, apparently, on long lines*/ - if ((CurLine&0x1f)==0x1f) printf("\"\nupdate idletasks\n$t insert end \""); - finflow=0; - - /*if (fCodeline) printf("CODE");*/ - } - lastlinelen=linelen; lastscnt=scnt; - break; - - case ENDLINE: - /* don't call Tk(ENDLINE) */ - break; - - default: /* if not caught above, it's the same as Tk */ - Tk(cmd); - } -} - - - - -/* - * ASCII - */ - -static void -ASCII(enum command cmd) -{ - int i; - - switch (cmd) { - case ENDDOC: - if (fHeadfoot) { - printf("\n%s\n", HEADERANDFOOTER); - for (i=0; i<CRUFTS; i++) if (*cruft[i]) printf("%s\n", cruft[i]); - } - break; - case CHARRQUOTE: - case CHARLQUOTE: - putchar('"'); - break; - case CHARLSQUOTE: - putchar('`'); - break; - case CHARRSQUOTE: - case CHARACUTE: - putchar('\''); - break; - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARLT: - case CHARAMP: - case CHARBACKSLASH: - case CHARGT: - case CHARHAT: - case CHARVBAR: - case CHARNBSP: - putchar(cmd); break; - case CHARDAGGER: putchar('+'); break; - case CHARBULLET: putchar('*'); break; - case CHARPLUSMINUS: printf("+-"); break; - case CHANGEBAR: putchar('|'); break; - case CHARCENT: putchar('c'); break; - case CHARSECT: putchar('S'); break; - case CHARCOPYR: printf("(C)"); break; - case CHARNOT: putchar('~'); break; - case CHARREGTM: printf("(R)"); break; - case CHARDEG: putchar('o'); break; - case CHAR14: printf("1/4"); break; - case CHAR12: printf("1/2"); break; - case CHAR34: printf("3/4"); break; - case CHARMUL: putchar('X'); break; - case CHARDIV: putchar('/'); break; - case HR: printf("\n%s\n", horizontalrule); break; - - case BEGINLINE: - for (i=0; i<ncnt; i++) putchar('\n'); - break; - case BEGINBODY: - case SHORTLINE: - if (!fSource) break; - case ENDLINE: - putchar('\n'); - CurLine++; - break; - - case BEGINDOC: - case ENDBODY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case BEGINSECTION: case ENDSECTION: - case BEGINSECTHEAD: case ENDSECTHEAD: - case BEGINSUBSECTHEAD: case ENDSUBSECTHEAD: - case BEGINBULPAIR: case ENDBULPAIR: - case BEGINBULLET: case ENDBULLET: - case BEGINBULTXT: case ENDBULTXT: - case BEGINSUBSECTION: case ENDSUBSECTION: - - case BEGINTABLE: case ENDTABLE: - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - case BEGINBOLD: case ENDBOLD: - case BEGINCODE: case ENDCODE: - case BEGINITALICS: case ENDITALICS: - case BEGINMANREF: case ENDMANREF: - case BEGINBOLDITALICS: case ENDBOLDITALICS: - case BEGINY: case ENDY: - case BEGINSC: case ENDSC: - /* nothing */ - break; - default: - DefaultLine(cmd); - } -} - - - -/* - * Perl 5 pod ("plain old documentation") - */ - -static void -pod(enum command cmd) -{ - static int curindent=0; - int i; - - if (hanging==-1) { - if (curindent) hanging=curindent; else hanging=5; - } - - - if (cmd==BEGINBULPAIR) { - /* want to have multiply indented text */ - if (curindent && hanging!=curindent) printf("\n=back\n\n"); - if (hanging!=curindent) printf("\n=over %d\n\n",hanging); - curindent=hanging; - } else if (cmd==ENDBULPAIR) { - /* nothing--wait until next command */ - } else if (cmd==BEGINLINE && !scnt) { - if (curindent) printf("\n=back\n\n"); - curindent=0; - } else if (cmd==BEGINBODY) { - if (curindent) { - printf("\n=back\n\n"); - curindent=0; - auxindent=0; - } - } -/* - case BEGINBULPAIR: - printf("=over %d\n\n", hanging); - break; - case ENDBULPAIR: - printf("\n=back\n\n"); - break; -*/ - switch (cmd) { - case BEGINDOC: I=0; break; - - case BEGINCOMMENT: fcharout=0; break; - case ENDCOMMENT: fcharout=1; break; - case COMMENTLINE: break; - - case CHARRQUOTE: - case CHARLQUOTE: - putchar('"'); - break; - case CHARLSQUOTE: - putchar('`'); - break; - case CHARRSQUOTE: - case CHARACUTE: - putchar('\''); - break; - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARLT: - case CHARAMP: - case CHARBACKSLASH: - case CHARGT: - case CHARHAT: - case CHARVBAR: - case CHARNBSP: - putchar(cmd); break; - case CHARDAGGER: putchar('+'); break; - case CHARPLUSMINUS: printf("+-"); break; - case CHANGEBAR: putchar('|'); break; - case CHARCENT: putchar('c'); break; - case CHARSECT: putchar('S'); break; - case CHARCOPYR: printf("(C)"); break; - case CHARNOT: putchar('~'); break; - case CHARREGTM: printf("(R)"); break; - case CHARDEG: putchar('o'); break; - case CHAR14: printf("1/4"); break; - case CHAR12: printf("1/2"); break; - case CHAR34: printf("3/4"); break; - case CHARMUL: putchar('X'); break; - case CHARDIV: putchar('/'); break; - case HR: printf("\n%s\n", horizontalrule); break; - case CHARBULLET: putchar('*'); break; - - case BEGINLINE: - for (i=0; i<ncnt; i++) putchar('\n'); - CurLine+=ncnt; - break; - case ENDLINE: - putchar('\n'); - CurLine++; - I=0; - break; - - case BEGINSECTHEAD: printf("=head1 "); break; - case BEGINSUBSECTHEAD: printf("=head2 "); break; - - case ENDSECTHEAD: - case ENDSUBSECTHEAD: - printf("\n"); - break; - - case BEGINCODE: - case BEGINBOLD: printf("B<"); break; - case BEGINITALICS: printf("I<"); break; - case BEGINMANREF: printf("L<"); break; - - case ENDBOLD: - case ENDCODE: - case ENDITALICS: - case ENDMANREF: - printf(">"); - break; - - case BEGINBULLET: - printf("\n=item "); - break; - case ENDBULLET: - printf("\n\n"); - fcharout=0; - break; - case BEGINBULTXT: - fcharout=1; - auxindent=hanging; - break; - case ENDBULTXT: - auxindent=0; - break; - - - case ENDDOC: - case BEGINBODY: case ENDBODY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case BEGINSECTION: case ENDSECTION: - case BEGINSUBSECTION: case ENDSUBSECTION: - case BEGINBULPAIR: case ENDBULPAIR: - - case SHORTLINE: - case BEGINTABLE: case ENDTABLE: - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - case BEGINBOLDITALICS: case ENDBOLDITALICS: - case BEGINY: case ENDY: - case BEGINSC: case ENDSC: - /* nothing */ - break; - default: - DefaultLine(cmd); - } -} - - - -static void -Sections(enum command cmd) -{ - - switch (cmd) { - case ENDSECTHEAD: - case ENDSUBSECTHEAD: - putchar('\n'); - case BEGINDOC: - fcharout=0; - break; - - case BEGINCOMMENT: fcharout=0; break; - case ENDCOMMENT: fcharout=1; break; - case COMMENTLINE: break; - - case BEGINSUBSECTHEAD: - printf(" "); - /* no break */ - case BEGINSECTHEAD: - fcharout=1; - break; - case CHARRQUOTE: - case CHARLQUOTE: - xputchar('"'); - break; - case CHARLSQUOTE: - xputchar('`'); - break; - case CHARRSQUOTE: - case CHARACUTE: - xputchar('\''); - break; - case BEGINTABLE: case ENDTABLE: - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - break; - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARBACKSLASH: - case CHARLT: - case CHARGT: - case CHARHAT: - case CHARVBAR: - case CHARAMP: - case CHARNBSP: - xputchar(cmd); break; - case CHARDAGGER: xputchar('+'); break; - case CHARBULLET: xputchar('*'); break; - case CHARPLUSMINUS: xputchar('+'); xputchar('-'); break; - case CHARCENT: xputchar('c'); break; - case CHARSECT: xputchar('S'); break; - case CHARCOPYR: xputchar('('); xputchar('C'); xputchar(')'); break; - case CHARNOT: xputchar('~'); break; - case CHARREGTM: xputchar('('); xputchar('R'); xputchar(')'); break; - case CHARDEG: xputchar('o'); break; - case CHAR14: xputchar('1'); xputchar('/'); xputchar('4'); break; - case CHAR12: xputchar('1'); xputchar('/'); xputchar('2'); break; - case CHAR34: xputchar('3'); xputchar('/'); xputchar('4'); break; - case CHARMUL: xputchar('X'); break; - case CHARDIV: xputchar('/'); break; - case ITAB: DefaultLine(cmd); break; - - - default: - /* nothing */ - break; - } -} - - - -static void -Roff(enum command cmd) -{ - switch (cmd) { - case BEGINDOC: - I=1; - printf(".TH %s %s \"generated by PolyglotMan\" UCB\n", manName, manSect); - printf(".\\\" %s,\n", PROVENANCE); - printf(".\\\" %s\n", HOME); - CurLine=1; - break; - case BEGINBODY: printf(".LP\n"); break; - - case BEGINCOMMENT: - case ENDCOMMENT: - break; - case COMMENTLINE: printf("'\\\" "); break; - - case BEGINSECTHEAD: printf(".SH "); break; - case BEGINSUBSECTHEAD:printf(".SS "); break; - case BEGINBULPAIR: printf(".IP "); break; - case SHORTLINE: printf("\n.br"); break; - case BEGINBOLD: printf("\\fB"); break; /* \n.B -- grr! */ - case ENDCODE: - case ENDBOLD: printf("\\fR"); break; /* putchar('\n'); */ - case BEGINITALICS: printf("\\fI"); break; - case ENDITALICS: printf("\\fR"); break; - case BEGINCODE: - case BEGINBOLDITALICS:printf("\\f4"); break; - case ENDBOLDITALICS: printf("\\fR"); break; - - case CHARLQUOTE: printf("\\*(rq"); break; - case CHARRQUOTE: printf("\\*(lq"); break; - case CHARNBSP: printf("\\|"); break; - case CHARLSQUOTE: putchar('`'); break; - case CHARRSQUOTE: putchar('\''); break; - case CHARPERIOD: if (I==1) printf("\\&"); putchar('.'); I++; break; - case CHARDASH: printf("\\-"); break; - case CHARTAB: - case CHARLT: - case CHARGT: - case CHARHAT: - case CHARVBAR: - case CHARAMP: - putchar(cmd); break; - case CHARBULLET: printf("\\(bu"); break; - case CHARDAGGER: printf("\\(dg"); break; - case CHARPLUSMINUS: printf("\\(+-"); break; - case CHANGEBAR: putchar('|'); break; - case CHARCENT: printf("\\(ct"); break; - case CHARSECT: printf("\\(sc"); break; - case CHARCOPYR: printf("\\(co"); break; - case CHARNOT: printf("\\(no"); break; - case CHARREGTM: printf("\\(rg"); break; - case CHARDEG: printf("\\(de"); break; - case CHARACUTE: printf("\\(aa"); break; - case CHAR14: printf("\\(14"); break; - case CHAR12: printf("\\(12"); break; - case CHAR34: printf("\\(34"); break; - case CHARMUL: printf("\\(mu"); break; - case CHARDIV: printf("\\(di"); break; - case HR: /*printf("\n%s\n", horizontalrule);*/ break; - case CHARBACKSLASH: printf("\\\\"); break; /* correct? */ - - case BEGINLINE: - /*for (i=0; i<ncnt; i++) putchar('\n');*/ - break; - - case BEGINBULLET: putchar('"'); break; - case ENDBULLET: printf("\"\n"); break; - - case ENDLINE: - CurLine++; - I=1; - /* no break */ - case ENDSUBSECTHEAD: - case ENDSECTHEAD: - case ENDDOC: - putchar('\n'); - break; - - case BEGINCODEBLOCK: printf(".nf\n"); - case ENDCODEBLOCK: printf(".fi\n"); - - case ENDBODY: - case ENDBULPAIR: - case BEGINBULTXT: case ENDBULTXT: - case BEGINSECTION: case ENDSECTION: - case BEGINSUBSECTION: case ENDSUBSECTION: - case BEGINY: case ENDY: - case BEGINSC: case ENDSC: - case BEGINTABLE: case ENDTABLE: - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case BEGINMANREF: case ENDMANREF: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - - -/* - * HTML - */ - -static void -HTML(enum command cmd) -{ - static int pre=0; - int i; - int lasttoc; - - /* always respond to these signals */ - switch (cmd) { - case CHARNBSP: printf(" "); I++; break; - case CHARTAB: printf("<tt> </tt> <tt> </tt> "); break; -#if defined(XOrg) || defined(XFree86) - /* using named entities for ASCII quote characters is redundant */ - case CHARLQUOTE: - case CHARRQUOTE: - case CHARLSQUOTE: - case CHARRSQUOTE: - putchar(cmd); break; -#else - case CHARLQUOTE: printf("“"); break; - case CHARRQUOTE: printf("”"); break; - case CHARLSQUOTE: printf("‘"); break; - case CHARRSQUOTE: printf("’"); break; -#endif - case CHARPERIOD: - case CHARDASH: - case CHARBACKSLASH: - case CHARVBAR: /*printf("¦"); -- broken bar no good */ - case CHARHAT: - putchar(cmd); - break; - case CHARDAGGER: printf("†"); break; - case CHARBULLET: if (I>0 || !finlist) printf("·"/*"·"*//*§--middot hardly visible*/); - break; - case CHARPLUSMINUS: printf("±"); break; - case CHARGT: printf(">"); break; - case CHARLT: printf("<"); break; - case CHARAMP: printf("&"); break; - case CHARCENT: printf("¢"); break; - case CHARSECT: printf("§"); break; - case CHARCOPYR: printf("©"); break; - case CHARNOT: printf("¬"); break; - case CHARREGTM: printf("®"); break; - case CHARDEG: printf("°"); break; - case CHARACUTE: printf("´"); break; - case CHAR14: printf("¼"); break; - case CHAR12: printf("½"); break; - case CHAR34: printf("¾"); break; - case CHARMUL: printf("×"); break; - case CHARDIV: printf("÷"); break; - default: - break; - } - - /* while in pre mode... */ - if (pre) { - switch (cmd) { - case ENDLINE: I=0; CurLine++; if (!fPara && scnt) printf("<br>"); printf("\n"); break; - case ENDTABLE: - if (fSource) { - printf("</table>\n"); - } else { - printf("</pre><br>\n"); pre=0; fQS=fIQS=fPara=1; - } - break; - case ENDCODEBLOCK: printf("</pre>"); pre=0; break; - case SHORTLINE: - case ENDBODY: - printf("\n"); - break; - case BEGINBOLD: printf("<b>"); break; - case ENDBOLD: printf("</b>"); break; - case BEGINITALICS: printf("<i>"); break; - case ENDITALICS: printf("</i>"); break; - default: - /* nothing */ - break; - } - return; - } - - /* usual operation */ - switch (cmd) { - case BEGINDOC: - /* escchars = ... => HTML doesn't backslash-quote metacharacters */ - printf("<!-- %s, -->\n", PROVENANCE); - printf("<!-- %s -->\n\n", HOME); - printf("<html>\n<head>\n"); -/* printf("<isindex>\n");*/ - /* better title possible? */ - printf("<title>"); printf(manTitle, manName, manSect); printf("</title>\n"); -#if defined(XOrg) || defined(XFree86) - printf("</head>\n<body bgcolor='#efefef' text='black' " - "link='blue' vlink='#551A8B' alink='red'>\n"); -#else - printf("</head>\n<body bgcolor='white'>\n"); -#endif - printf("<a href='#toc'>%s</a><p>\n", TABLEOFCONTENTS); - I=0; - break; - case ENDDOC: - /* header and footer wanted? */ - printf("<p>\n"); - if (fHeadfoot) { - printf("<hr><h2>%s</h2>\n", HEADERANDFOOTER); - for (i=0; i<CRUFTS; i++) if (*cruft[i]) printf("%s<br>\n", cruft[i]); - } - - if (!tocc) { - /*printf("\n<h1>ERROR: Empty man page</h1>\n");*/ - } else { - printf("\n<hr><p>\n"); - printf("<a name='toc'><b>%s</b></a><p>\n", TABLEOFCONTENTS); - printf("<ul>\n"); - for (i=0, lasttoc=BEGINSECTION; i<tocc; lasttoc=toc[i].type, i++) { - if (lasttoc!=toc[i].type) { - if (toc[i].type==BEGINSUBSECTION) printf("<ul>\n"); - else printf("</ul>\n"); - } - printf("<li><a name='toc%d' href='#sect%d'>%s</a></li>\n", i, i, toc[i].text); - } - if (lasttoc==BEGINSUBSECTION) printf("</ul>"); - printf("</ul>\n"); - } - printf("</body>\n</html>\n"); - break; - case BEGINBODY: - printf("<p>\n"); - break; - case ENDBODY: break; - - case BEGINCOMMENT: printf("\n<!--\n"); break; - case ENDCOMMENT: printf("\n-->\n"); break; - case COMMENTLINE: printf(" "); break; - - case BEGINSECTHEAD: - printf("\n<h2><a name='sect%d' href='#toc%d'>", tocc, tocc); - break; - case ENDSECTHEAD: - printf("</a></h2>\n"); - /* useful extraction from FILES, ENVIRONMENT? */ - break; - case BEGINSUBSECTHEAD: - printf("\n<h3><a name='sect%d' href='#toc%d'>", tocc, tocc); - break; - case ENDSUBSECTHEAD: - printf("</a></h3>\n"); - break; - case BEGINSECTION: break; - case ENDSECTION: - if (sectheadid==NAME && message!=NULL) printf(message); - break; - case BEGINSUBSECTION: break; - case ENDSUBSECTION: break; - - case BEGINBULPAIR: - if (listtype==OL) printf("\n<ol>\n"); - else if (listtype==UL) printf("\n<ul>\n"); - else printf("\n<dl>\n"); - break; - case ENDBULPAIR: - if (listtype==OL) printf("\n</ol>\n"); - else if (listtype==UL) printf("\n</ul>\n"); - else printf("</dl>\n"); - break; - case BEGINBULLET: - if (listtype==OL || listtype==UL) fcharout=0; - else printf("\n<dt>"); - break; - case ENDBULLET: - if (listtype==OL || listtype==UL) fcharout=1; - else printf("</dt>"); - break; - case BEGINBULTXT: - if (listtype==OL || listtype==UL) printf("<li>"); - else printf("\n<dd>"); - break; - case ENDBULTXT: - if (listtype==OL || listtype==UL) printf("</li>"); - else printf("</dd>\n"); - break; - - case BEGINLINE: - /* if (ncnt) printf("<p>\n"); -- if haven't already generated structural tag */ - if (ncnt) printf("\n<p>"); - - /* trailing spaces already trimmed off, so look for eol now */ - if (fCodeline) { - printf("<code>"); - for (i=0; i<scnt-indent; i++) printf(" "/* */); /* ? */ - tagc=0; - - /* already have .tag=BOLDITALICS, .first=0 */ - /* would be more elegant, but can't print initial spaces before first tag - tags[0].last = linelen; - tagc=1; - fIQS=0; - */ - } - - break; - - case ENDLINE: - /*if (fCodeline) { fIQS=1; fCodeline=0; }*/ - if (fCodeline) { printf("</code><br>"); fCodeline=0; } - I=0; CurLine++; if (!fPara && scnt) printf("<br>"); printf("\n"); - break; - - case SHORTLINE: - if (fCodeline) { printf("</code>"); fCodeline=0; } - if (!fIP) printf("<br>\n"); - break; - - - case BEGINTABLE: - if (fSource) { - /*printf("<center><table border>\n");*/ - printf("<table border='0'>\n"); - } else { - printf("<br><pre>\n"); pre=1; fQS=fIQS=fPara=0; - } - break; - case ENDTABLE: - if (fSource) { - printf("</table>\n"); - } else { - printf("</pre><br>\n"); pre=0; fQS=fIQS=fPara=1; - } - break; - case BEGINTABLELINE: printf("<tr>"); break; - case ENDTABLELINE: printf("</tr>\n"); break; - case BEGINTABLEENTRY: - printf("<td align='"); - switch (tblcellformat[0]) { - case 'c': printf("center"); break; - case 'n': /*printf("decimal"); break; -- fall through to right for now */ - case 'r': printf("right"); break; - case 'l': - default: - printf("left"); - } - if (tblcellspan>1) printf(" colspan=%d", tblcellspan); - printf("'>"); - break; - case ENDTABLEENTRY: - printf("</td>"); - break; - - /* something better with CSS */ - case BEGININDENT: printf("<blockquote>"); break; - case ENDINDENT: printf("</blockquote>\n"); break; - - case FONTSIZE: - /* HTML font step sizes are bigger than troff's */ - if ((fontdelta+=intArg)!=0) printf("<font size='%c1'>", (intArg>0)?'+':'-'); else printf("</font>\n"); - break; - - case BEGINBOLD: printf("<b>"); break; - case ENDBOLD: printf("</b>"); break; - case BEGINITALICS: printf("<i>"); break; - case ENDITALICS: printf("</i>"); break; - case BEGINBOLDITALICS: - case BEGINCODE: printf("<code>"); break; - case ENDBOLDITALICS: - case ENDCODE: printf("</code>"); break; - case BEGINCODEBLOCK: printf("<pre>"); pre=1; break; /* wrong for two-column lists in kermit.1, pine.1, perl4.1 */ - case ENDCODEBLOCK: printf("</pre>"); pre=0; break; - case BEGINCENTER: printf("<center>"); break; - case ENDCENTER: printf("</center>"); break; - case BEGINMANREF: - manrefextract(hitxt); - if (fmanRef) { printf("<a href='"); printf(href, manrefname, manrefsect); printf("'>"); } - else printf("<i>"); - break; - case ENDMANREF: - if (fmanRef) printf("</a>\n"); else printf("</i>"); - break; - case HR: printf("\n<hr>\n"); break; - - /* U (was B, I), strike -- all temporary until HTML 4.0's INS and DEL widespread */ - case BEGINDIFFA: printf("<ins><u>"); break; - case ENDDIFFA: printf("</u></ins>"); break; - case BEGINDIFFD: printf("<del><strike>"); break; - case ENDDIFFD: printf("</strike></del>"); break; - - case BEGINSC: case ENDSC: - case BEGINY: case ENDY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case CHANGEBAR: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - - -/* - * DocBook XML - * improvements by Aaron Hawley applied 2003 June 5 - * - * N.B. The framework for XML is in place but not done. If you - * are familiar with the DocBook DTD, however, it shouldn't be - * too difficult to finish it. If you do so, please send your - * code to me so that I may share the wealth in the next release. - */ - -const char *DOCBOOKPATH = "http://www.oasis-open.org/docbook/xml/4.1.2/docbookx.dtd"; - -static void -XML(enum command cmd) -{ - static int pre=0; - int i; - char *p; - static int fRefEntry=0; - static int fRefPurpose=0; - /*static char *bads => XML doesn't backslash-quote metacharacters */ - -/* -*/ - - /* always respond to these signals */ - switch (cmd) { - case CHARLQUOTE: case CHARRQUOTE: printf("""); break; - case CHARBULLET: printf("•"); break; - case CHARDAGGER: printf("†"); break; - case CHARPLUSMINUS: printf("±"); break; - case CHARCOPYR: printf("©"); break; - case CHARNOT: printf("¬"); break; - case CHARMUL: printf("×"); break; - case CHARDIV: printf("÷"); break; - case CHARAMP: printf("&"); break; - case CHARDASH: - if (sectheadid==NAME && !fRefPurpose) { - printf("</refname><refpurpose>"); - fRefPurpose=1; - } else putchar('-'); - break; - case CHARBACKSLASH: putchar('\\'); break; - case CHARGT: printf(">"); break; - case CHARLT: printf("<"); break; - case CHARLSQUOTE: - case CHARRSQUOTE: - case CHARPERIOD: - case CHARTAB: - case CHARHAT: - case CHARVBAR: - case CHARNBSP: - case CHARCENT: - case CHARSECT: - case CHARREGTM: - case CHARDEG: - case CHARACUTE: - case CHAR14: - case CHAR12: - case CHAR34: - putchar(cmd); - break; - default: - break; - } - - /* while in pre mode... */ - if (pre) { - switch (cmd) { - case ENDLINE: I=0; CurLine++; if (!fPara && scnt) putchar(' '); break; - case ENDTABLE: - if (fSource) printf("</table>\n"); - else { printf("</literallayout>\n"); pre=0; fQS=fIQS=fPara=1; } - break; - default: - /* nothing */ - break; - } - return; - } - - /* usual operation */ - switch (cmd) { - case BEGINDOC: - printf("\n<!DOCTYPE refentry PUBLIC \"-//OASIS//DTD DocBook XML V4.1.2//EN\"\n"); - printf(" \"%s\">\n", DOCBOOKPATH); - - printf("<!--\n\n\tI am looking for help to finish DocBook XML.\n\n-->\n"); - - printf("<!-- %s\n", PROVENANCE); - printf(" %s -->\n\n",HOME); - /* better title possible? */ - for (p=manName; *p; p++) *p = tolower(*p); - printf("<refentry id='%s.%s'>\n", manName, manSect); - printf("<refmeta>\n<refentrytitle>%s</refentrytitle>\n", manName); - printf("<manvolnum>%s</manvolnum>\n</refmeta>\n\n", manSect); - - I=0; - break; - - case ENDDOC: - /* header and footer wanted? */ - if (fHeadfoot) { - printf("\n<refsect1>\n<title>%s</title>\n", HEADERANDFOOTER); - for (i=0; i<CRUFTS; i++) if (*cruft[i]) printf("<para>%s</para>\n", cruft[i]); - printf("\n</refsect1>"); - } - - /* table of contents, such as found in HTML, can be generated automatically by XML software */ - - printf("</refentry>\n"); - break; - case BEGINBODY: - if (fPara) printf("\n</para>"); - printf("<para>"); fPara = 1; - break; - case ENDBODY: - if (fRefPurpose) { printf("</refpurpose>"); fRefPurpose=0; } - else { printf("\n</para>"); fPara=0; } - break; - - case BEGINCOMMENT: printf("\n<!--\n"); break; - case ENDCOMMENT: printf("\n-->\n"); break; - case COMMENTLINE: break; - - case BEGINSECTHEAD: - case BEGINSUBSECTHEAD: - if (sectheadid != NAME && sectheadid != SYNOPSIS) printf("<title>"); - break; - case ENDSECTHEAD: - case ENDSUBSECTHEAD: - if (sectheadid == NAME) printf("<refname>"); - else if (sectheadid == SYNOPSIS) {} - else { printf("</title>\n<para>"); fPara=1; } - break; - - case BEGINSECTION: - if (sectheadid==NAME) printf("<refnamediv>\n"); - /*printf("<RefEntry>"); -- do lotsa parsing here for RefName, RefPurpose*/ - else if (sectheadid==SYNOPSIS) printf("<refsynopsisdiv>\n<cmdsynopsis>\n"); - else printf("\n<refsect1>\n"); - break; - case ENDSECTION: - if (sectheadid==NAME) { - if (fRefPurpose) { printf("</refpurpose>"); fRefPurpose=0; } - printf("\n</refnamediv>\n\n"); - } else if (sectheadid==SYNOPSIS) printf("\n</cmdsynopsis>\n</refsynopsisdiv>\n"); - else { - if (fPara) { printf("\n</para>"); fPara=0; } - printf("\n</refsect1>\n"); - } - break; - - case BEGINSUBSECTION: printf("\n<refsect2>"); break; - case ENDSUBSECTION: printf("\n</refsect2>"); break; - - /* need to update this for enumerated and plain lists */ - case BEGINBULPAIR: printf("<variablelist>\n"); break; - case ENDBULPAIR: printf("</variablelist>\n"); break; - case BEGINBULLET: printf("<term>"); break; - case ENDBULLET: printf("</term>\n"); break; - case BEGINBULTXT: printf("<listitem>\n<para>"); break; - case ENDBULTXT: printf("\n</para></listitem>\n"); break; - - case BEGINLINE: - /* remember, get BEGINBODY call at start of paragraph */ - if (fRefEntry) { - if (fRefPurpose) { - for (p=plain; *p!='-'; p++) { - /* nothing?! */ - } - } - } - - break; - - case ENDLINE: - /*if (fCodeline) { fIQS=1; fCodeline=0; }*/ - if (fCodeline) { printf("</code>"); fCodeline=0; } /* */ - I=0; CurLine++; if (!fPara && scnt) printf("<sbr/>"); else putchar(' '); - break; - - case SHORTLINE: - if (fCodeline) { printf("</code>"); fCodeline=0; } - if (!fIP && !fPara) printf("<sbr/>\n"); - break; - - case BEGINTABLE: - if (fSource) printf("<table>\n"); - else { printf("<literallayout>\n"); pre=1; fQS=fIQS=fPara=0; } - break; - case ENDTABLE: - if (fSource) printf("</table>\n"); - else { printf("</literallayout>\n"); pre=0; fQS=fIQS=fPara=1; } - break; - case BEGINTABLELINE: printf("<row>"); break; - case ENDTABLELINE: printf("</row>\n"); break; - case BEGINTABLEENTRY: printf("<entry>"); break; - case ENDTABLEENTRY: printf("</entry>"); break; - - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - break; - - /* have to make some guess about bold and italics */ - case BEGINBOLD: printf("<command>"); break; - case ENDBOLD: printf("</command>"); break; - case BEGINITALICS: printf("<emphasis>"); break; /* could be literal or arg */ - case ENDITALICS: printf("</emphasis>"); break; - case BEGINBOLDITALICS: case BEGINCODE: printf("<literal>"); break; - case ENDBOLDITALICS: case ENDCODE: printf("</literal>"); break; - case BEGINMANREF: - manrefextract(hitxt); - if (fmanRef) { printf("<link linkend='"); printf(href, manrefname, manrefsect); printf("'>"); } - break; - case ENDMANREF: - if (fmanRef) printf("</link>"); - break; - - case HR: - case BEGINSC: case ENDSC: - case BEGINY: case ENDY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case CHANGEBAR: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - - -/* generates MIME compliant to RFC 1563 */ - -static void -MIME(enum command cmd) -{ - static int pre=0; - int i; - - /* always respond to these signals */ - switch (cmd) { - case CHARDASH: - case CHARAMP: - case CHARPERIOD: - case CHARTAB: - putchar(cmd); break; - case CHARLSQUOTE: putchar('`'); break; - case CHARACUTE: - case CHARRSQUOTE: putchar('\''); break; - case CHARBULLET: putchar('*'); break; - case CHARDAGGER: putchar('|'); break; - case CHARPLUSMINUS: printf("+-"); break; - case CHARNBSP: putchar(' '); break; - case CHARCENT: putchar('c'); break; - case CHARSECT: putchar('S'); break; - case CHARCOPYR: printf("(C)"); break; - case CHARNOT: putchar('~'); break; - case CHARREGTM: printf("(R)"); break; - case CHARDEG: putchar('o'); break; - case CHAR14: printf("1/4"); break; - case CHAR12: printf("1/2"); break; - case CHAR34: printf("3/4"); break; - case CHARMUL: putchar('X'); break; - case CHARDIV: putchar('/'); break; - case CHARLQUOTE: - case CHARRQUOTE: - putchar('"'); - break; - case CHARBACKSLASH: /* these should be caught as escaped chars */ - case CHARGT: - case CHARLT: -#if 0 - assert(1); -#endif - break; - default: - break; - } - - /* while in pre mode... */ - if (pre) { - switch (cmd) { - case ENDLINE: I=0; CurLine++; if (!fPara && scnt) printf("\n\n"); break; - case ENDTABLE: printf("</fixed>\n\n"); pre=0; fQS=fIQS=fPara=1; break; - default: - /* nothing */ - break; - } - return; - } - - /* usual operation */ - switch (cmd) { - case BEGINDOC: - printf("Content-Type: text/enriched\n"); - printf("Text-Width: 60\n"); - escchars = "<>\\"; - - I=0; - break; - case ENDDOC: - /* header and footer wanted? */ - printf("\n\n"); - if (fHeadfoot) { - printf("\n"); - MIME(BEGINSECTHEAD); printf("%s",HEADERANDFOOTER); MIME(ENDSECTHEAD); - for (i=0; i<CRUFTS; i++) if (*cruft[i]) printf("\n%s\n", cruft[i]); - } - -/* - printf("\n<comment>\n"); - printf("%s\n%s\n", PROVENANCE, HOME); - printf("</comment>\n\n"); -*/ - -/* - printf("\n<HR><P>\n"); - printf("<A NAME=\"toc\"><B>%s</B></A><P>\n", TABLEOFCONTENTS); - printf("<UL>\n"); - for (i=0, lasttoc=BEGINSECTION; i<tocc; lasttoc=toc[i].type, i++) { - if (lasttoc!=toc[i].type) { - if (toc[i].type==BEGINSUBSECTION) printf("<UL>\n"); - else printf("</UL>\n"); - } - printf("<LI><A NAME=\"toc%d\" HREF=\"#sect%d\">%s</A></LI>\n", i, i, toc[i].text); - } - if (lasttoc==BEGINSUBSECTION) printf("</UL>"); - printf("</UL>\n"); - printf("</BODY></HTML>\n"); -*/ - break; - case BEGINBODY: - printf("\n\n"); - break; - case ENDBODY: break; - - case BEGINCOMMENT: fcharout=0; break; - case ENDCOMMENT: fcharout=1; break; - case COMMENTLINE: break; - - case BEGINSECTHEAD: - printf("\n<bigger><bigger><underline>"); - /*A NAME=\"sect%d\" HREF=\"#toc%d\"><H2>", tocc, tocc);*/ - break; - case ENDSECTHEAD: - printf("</underline></bigger></bigger>\n\n<indent>"); - /* useful extraction from files, environment? */ - break; - case BEGINSUBSECTHEAD: - printf("<bigger>"); - /*\n<A NAME=\"sect%d\" HREF=\"#toc%d\"><H3>", tocc, tocc);*/ - break; - case ENDSUBSECTHEAD: - printf("</bigger>\n\n</indent>"); - break; - case BEGINSECTION: - case BEGINSUBSECTION: - break; - case ENDSECTION: - case ENDSUBSECTION: - printf("</indent>\n"); - break; - - case BEGINBULPAIR: break; - case ENDBULPAIR: break; - case BEGINBULLET: printf("<bold>"); break; - case ENDBULLET: printf("</bold>\t"); break; - case BEGINBULTXT: - case BEGININDENT: - printf("<indent>"); - break; - case ENDBULTXT: - case ENDINDENT: - printf("</indent>\n"); - break; - - case FONTSIZE: - if ((fontdelta+=intArg)==0) { - if (intArg>0) printf("</smaller>"); else printf("</bigger>"); - } else { - if (intArg>0) printf("<bigger>"); else printf("<smaller>"); - } - break; - - case BEGINLINE: /*if (ncnt) printf("\n\n");*/ break; - case ENDLINE: I=0; CurLine++; printf("\n"); break; - case SHORTLINE: if (!fIP) printf("\n\n"); break; - case BEGINTABLE: printf("<nl><fixed>\n"); pre=1; fQS=fIQS=fPara=0; break; - case ENDTABLE: printf("</fixed><nl>\n"); pre=0; fQS=fIQS=fPara=1; break; - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - break; - /* could use a new list type */ - - case BEGINBOLD: printf("<bold>"); break; - case ENDBOLD: printf("</bold>"); break; - case BEGINITALICS: printf("<italics>"); break; - case ENDITALICS: printf("</italics>"); break; - case BEGINCODE: - case BEGINBOLDITALICS:printf("<bold><italics>"); break; - case ENDCODE: - case ENDBOLDITALICS: printf("</bold></italics>"); break; - case BEGINMANREF: - printf("<x-color><param>blue</param>"); -/* how to make this hypertext? - manrefextract(hitxt); - if (fmanRef) { printf("<A HREF=\""); printf(href, manrefname, manrefsect); printf("\">\n"); } - else printf("<I>"); - break; -*/ - break; - case ENDMANREF: - printf("</x-color>"); - break; - - case HR: printf("\n\n%s\n\n", horizontalrule); break; - - case BEGINSC: case ENDSC: - case BEGINY: case ENDY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case CHANGEBAR: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - - -/* - * LaTeX - */ - -static void -LaTeX(enum command cmd) -{ - - switch (cmd) { - case BEGINDOC: - escchars = "$&%#_{}"; /* and more to come? */ - printf("%% %s,\n", PROVENANCE); - printf("%% %s\n\n", HOME); - /* definitions */ - printf( - "\\documentstyle{article}\n" - "\\def\\thefootnote{\\fnsymbol{footnote}}\n" - "\\setlength{\\parindent}{0pt}\n" - "\\setlength{\\parskip}{0.5\\baselineskip plus 2pt minus 1pt}\n" - "\\begin{document}\n" - ); - I=0; - break; - case ENDDOC: - /* header and footer wanted? */ - printf("\n\\end{document}\n"); - - break; - case BEGINBODY: - printf("\n\n"); - break; - case ENDBODY: break; - - case BEGINCOMMENT: - case ENDCOMMENT: - break; - case COMMENTLINE: printf("%% "); break; - - - case BEGINSECTION: break; - case ENDSECTION: break; - case BEGINSECTHEAD: printf("\n\\section{"); tagc=0; break; - case ENDSECTHEAD: - printf("}"); -/* - if (CurLine==1) printf("\\footnote{" - "\\it conversion to \\LaTeX\ format by PolyglotMan " - "available via anonymous ftp from {\\tt ftp.berkeley.edu:/ucb/people/phelps/tcltk}}" - ); -*/ - /* useful extraction from files, environment? */ - printf("\n"); - break; - case BEGINSUBSECTHEAD:printf("\n\\subsection{"); break; - case ENDSUBSECTHEAD: - printf("}"); - break; - case BEGINSUBSECTION: break; - case ENDSUBSECTION: break; - case BEGINBULPAIR: printf("\\begin{itemize}\n"); break; - case ENDBULPAIR: printf("\\end{itemize}\n"); break; - case BEGINBULLET: printf("\\item ["); break; - case ENDBULLET: printf("] "); break; - case BEGINLINE: /*if (ncnt) printf("\n\n");*/ break; - case ENDLINE: I=0; putchar('\n'); CurLine++; break; - case BEGINTABLE: printf("\\begin{verbatim}\n"); break; - case ENDTABLE: printf("\\end{verbatim}\n"); break; - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - break; - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - break; - case SHORTLINE: if (!fIP) printf("\n\n"); break; - case BEGINBULTXT: break; - case ENDBULTXT: putchar('\n'); break; - - case CHARLQUOTE: printf("``"); break; - case CHARRQUOTE: printf("''"); break; - case CHARLSQUOTE: - case CHARRSQUOTE: - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARNBSP: - putchar(cmd); break; - case CHARBACKSLASH: printf("$\\backslash$"); break; - case CHARGT: printf("$>$"); break; - case CHARLT: printf("$<$"); break; - case CHARHAT: printf("$\\char94{}$"); break; - case CHARVBAR: printf("$|$"); break; - case CHARAMP: printf("\\&"); break; - case CHARBULLET: printf("$\\bullet$ "); break; - case CHARDAGGER: printf("\\dag "); break; - case CHARPLUSMINUS: printf("\\pm "); break; - case CHARCENT: printf("\\hbox{\\rm\\rlap/c}"); break; - case CHARSECT: printf("\\S "); break; - case CHARCOPYR: printf("\\copyright "); break; - case CHARNOT: printf("$\\neg$"); break; - case CHARREGTM: printf("(R)"); break; - case CHARDEG: printf("$^\\circ$"); break; - case CHARACUTE: putchar('\''); break; - case CHAR14: printf("$\\frac{1}{4}$"); break; - case CHAR12: printf("$\\frac{1}{2}$"); break; - case CHAR34: printf("$\\frac{3}{4}$"); break; - case CHARMUL: printf("\\times "); break; - case CHARDIV: printf("\\div "); break; - - case BEGINCODE: - case BEGINBOLD: printf("{\\bf "); break; /* } */ - case BEGINSC: printf("{\\sc "); break; /* } */ - case BEGINITALICS: printf("{\\it "); break; /* } */ - case BEGINBOLDITALICS:printf("{\\bf\\it "); break; /* } */ - case BEGINMANREF: printf("{\\sf "); break; /* } */ - case ENDCODE: - case ENDBOLD: - case ENDSC: - case ENDITALICS: - case ENDBOLDITALICS: - case ENDMANREF: /* { */ - putchar('}'); - break; - case HR: /*printf("\n%s\n", horizontalrule);*/ break; - - case BEGINY: case ENDY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case CHANGEBAR: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - -static void -LaTeX2e(enum command cmd) -{ - switch (cmd) { - /* replace selected commands ... */ - case BEGINDOC: - escchars = "$&%#_{}"; - printf("%% %s,\n", PROVENANCE); - printf("%% %s\n\n", HOME); - /* definitions */ - printf( - "\\documentclass{article}\n" - "\\def\\thefootnote{\\fnsymbol{footnote}}\n" - "\\setlength{\\parindent}{0pt}\n" - "\\setlength{\\parskip}{0.5\\baselineskip plus 2pt minus 1pt}\n" - "\\begin{document}\n" - ); - I=0; - break; - case BEGINCODE: - case BEGINBOLD: printf("\\textbf{"); break; /* } */ - case BEGINSC: printf("\\textsc{"); break; /* } */ - case BEGINITALICS: printf("\\textit{"); break; /* } */ - case BEGINBOLDITALICS:printf("\\textbf{\\textit{"); break; /* }} */ - case BEGINMANREF: printf("\\textsf{"); break; /* } {{ */ - case ENDBOLDITALICS: printf("}}"); break; - - /* ... rest same as old LaTeX */ - default: - LaTeX(cmd); - } -} - - - -/* - * Rich Text Format (RTF) - */ - -/* RTF could use more work */ - -static void -RTF(enum command cmd) -{ - - switch (cmd) { - case BEGINDOC: - escchars = "{}"; - /* definitions */ - printf( - /* fonts */ - "{\\rtf1\\deff2 {\\fonttbl" - "{\\f20\\froman Times;}{\\f150\\fnil I Times Italic;}" - "{\\f151\\fnil B Times Bold;}{\\f152\\fnil BI Times BoldItalic;}" - "{\\f22\\fmodern Courier;}{\\f23\\ftech Symbol;}" - "{\\f135\\fnil I Courier Oblique;}{\\f136\\fnil B Courier Bold;}{\\f137\\fnil BI Courier BoldOblique;}" - "{\\f138\\fnil I Helvetica Oblique;}{\\f139\\fnil B Helvetica Bold;}}" - "\n" - - /* style sheets */ - "{\\stylesheet{\\li720\\sa120 \\f20 \\sbasedon222\\snext0 Normal;}" - "{\\s2\\sb200\\sa120 \\b\\f3\\fs20 \\sbasedon0\\snext2 section head;}" - "{\\s3\\li180\\sa120 \\b\\f20 \\sbasedon0\\snext3 subsection head;}" - "{\\s4\\fi-1440\\li2160\\sa240\\tx2160 \\f20 \\sbasedon0\\snext4 detailed list;}}" - "\n" - -/* more header to come--do undefined values default to nice values? */ - ); - I=0; - break; - case ENDDOC: - /* header and footer wanted? */ - printf("\\par{\\f150 %s,\n%s}", PROVENANCE, HOME); - printf("}\n"); - break; - case BEGINBODY: - printf("\n\n"); - break; - case ENDBODY: - CurLine++; - printf("\\par\n"); - tagc=0; - break; - - case BEGINCOMMENT: fcharout=0; break; - case ENDCOMMENT: fcharout=1; break; - case COMMENTLINE: break; - - case BEGINSECTION: break; - case ENDSECTION: printf("\n\\par\n"); break; - case BEGINSECTHEAD: printf("{\\s2 "); tagc=0; break; - case ENDSECTHEAD: - printf("}\\par"); - /* useful extraction from files, environment? */ - printf("\n"); - break; - case BEGINSUBSECTHEAD:printf("{\\s3 "); break; - case ENDSUBSECTHEAD: - printf("}\\par\n"); - break; - case BEGINSUBSECTION: break; - case ENDSUBSECTION: break; - case BEGINLINE: /*if (ncnt) printf("\n\n");*/ break; - case ENDLINE: I=0; putchar(' '); /*putchar('\n'); CurLine++;*/ break; - case SHORTLINE: if (!fIP) printf("\\line\n"); break; - case BEGINBULPAIR: printf("{\\s4 "); break; - case ENDBULPAIR: printf("}\\par\n"); break; - case BEGINBULLET: break; - case ENDBULLET: printf("\\tab "); fcharout=0; break; - case BEGINBULTXT: fcharout=1; break; - case ENDBULTXT: break; - - case CHARLQUOTE: printf("``"); break; - case CHARRQUOTE: printf("''"); break; - case CHARLSQUOTE: - case CHARRSQUOTE: - case CHARPERIOD: - case CHARTAB: - case CHARDASH: - case CHARBACKSLASH: - case CHARGT: - case CHARLT: - case CHARHAT: - case CHARVBAR: - case CHARAMP: - case CHARNBSP: - case CHARCENT: - case CHARSECT: - case CHARCOPYR: - case CHARNOT: - case CHARREGTM: - case CHARDEG: - case CHARACUTE: - case CHAR14: - case CHAR12: - case CHAR34: - case CHARMUL: - case CHARDIV: - putchar(cmd); break; - case CHARBULLET: printf("\\bullet "); break; - case CHARDAGGER: printf("\\dag "); break; - case CHARPLUSMINUS: printf("\\pm "); break; - - case BEGINCODE: - case BEGINBOLD: printf("{\\b "); break; /* } */ - case BEGINSC: printf("{\\fs20 "); break; /* } */ - case BEGINITALICS: printf("{\\i "); break; /* } */ - case BEGINBOLDITALICS:printf("{\\b \\i "); break; /* } */ - case BEGINMANREF: printf("{\\f22 "); break; /* } */ - case ENDBOLD: - case ENDCODE: - case ENDSC: - case ENDITALICS: - case ENDBOLDITALICS: - case ENDMANREF: /* { */ - putchar('}'); - break; - case HR: printf("\n%s\n", horizontalrule); break; - - case BEGINY: case ENDY: - case BEGINHEADER: case ENDHEADER: - case BEGINFOOTER: case ENDFOOTER: - case BEGINTABLE: case ENDTABLE: - case BEGINTABLELINE: case ENDTABLELINE: case BEGINTABLEENTRY: case ENDTABLEENTRY: - case BEGININDENT: case ENDINDENT: - case FONTSIZE: - case CHANGEBAR: - /* nothing */ - break; - default: - DefaultPara(cmd); - } -} - - - -/* - * pointers to existing tools - */ - -static void -PostScript(enum command cmd) -{ - fprintf(stderr, "Use groff or psroff to generate PostScript.\n"); - exit(1); -} - - -static void -FrameMaker(enum command cmd) -{ - fprintf(stderr, "FrameMaker comes with filters that convert from roff to MIF.\n"); - exit(1); -} - - - - -/* - * Utilities common to both parses - */ - - -/* - level 0: DOC - need match - level 1: SECTION - need match - level 2: SUBSECTION | BODY | BULLETPAIR - level 3: BODY (within SUB) | BULLETPAIR (within SUB) | BULTXT (within BULLETPAIR) - level 4: BULTXT (within BULLETPAIR within SUBSECTION) - - never see: SECTHEAD, SUBSECTHEAD, BULLET -*/ - -int Psect=0, Psub=0, Pbp=0, Pbt=0, Pb=0, Pbul=0; - -static void -pop(enum command cmd) -{ - assert(cmd==ENDINDENT || cmd==BEGINBULLET || cmd==BEGINBULTXT || cmd==BEGINBULPAIR || cmd==BEGINBODY || cmd==BEGINSECTION || cmd==BEGINSUBSECTION || cmd==ENDDOC); -/* - int i; - int p; - int match; - - p=cmdp-1; - for (i=cmdp-1;i>=0; i--) - if (cmd==cmdstack[i]) { match=i; break; } -*/ - - /* if match, pop off all up to and including match */ - /* otherwise, pop off one level*/ - - if (Pbul) { - (*fn)(ENDBULLET); Pbul=0; - if (cmd==BEGINBULLET) return; - } /* else close off ENDBULTXT */ - - if (Pbt) { (*fn)(ENDBULTXT); Pbt=0; } - if (cmd==BEGINBULTXT || cmd==BEGINBULLET) return; - - if (Pb && cmd==BEGINBULPAIR) { (*fn)(ENDBODY); Pb=0; } /* special */ - if (Pbp) { (*fn)(ENDBULPAIR); Pbp=0; } - if (cmd==BEGINBULPAIR || cmd==ENDINDENT) return; - - if (Pb) { (*fn)(ENDBODY); Pb=0; } - if (cmd==BEGINBODY) return; - - if (Psub) { (*fn)(ENDSUBSECTION); Psub=0; } - if (cmd==BEGINSUBSECTION) return; - - if (Psect) { (*fn)(ENDSECTION); Psect=0; } - if (cmd==BEGINSECTION) return; -} - - -static void -poppush(enum command cmd) -{ - assert(cmd==ENDINDENT || cmd==BEGINBULLET || cmd==BEGINBULTXT || cmd==BEGINBULPAIR || cmd==BEGINBODY || cmd==BEGINSECTION || cmd==BEGINSUBSECTION); - - pop(cmd); - - switch (cmd) { - case BEGINBULLET: Pbul=1; break; - case BEGINBULTXT: Pbt=1; break; - case BEGINBULPAIR: Pbp=1; break; - case BEGINBODY: Pb=1; break; - case BEGINSECTION: Psect=1; break; - case BEGINSUBSECTION: Psub=1; break; - default: - if (!fQuiet) fprintf(stderr, "poppush: unrecognized code %d\n", cmd); - } - - (*fn)(cmd); - prevcmd = cmd; -} - - - -/* - * PREFORMATTED PAGES PARSING - */ - -/* wrapper for getchar() that expands tabs, and sends maximum of n=40 consecutive spaces */ - -static int -getchartab(void) -{ - static int tabexp = 0; - static int charinline = 0; - static int cspccnt = 0; - char c; - - c = lookahead; - if (tabexp) tabexp--; - else if (c=='\n') { - charinline=0; - cspccnt=0; - } else if (c=='\t') { - tabexp = TabStops-(charinline%TabStops); if (tabexp==TabStops) tabexp=0; - lookahead = c = ' '; - } else if (cspccnt>=40) { - if (*in==' ') { - while (*in==' '||*in=='\t') in++; - in--; - } - cspccnt=0; - } - - if (!tabexp && lookahead) lookahead = *in++; - if (c=='\b') charinline--; else charinline++; - if (c==' ') cspccnt++; - return c; -} - - -/* replace gets. handles hyphenation too */ -static char * -la_gets(char *buf) -{ - static char la_buf[MAXBUF]; /* can lookahead a full line, but nobody does now */ - static int fla=0, hy=0; - char *ret,*p; - int c,i; - - assert(buf!=NULL); - - if (fla) { - /* could avoid copying if callers used return value */ - strcpy(buf,la_buf); fla=0; - ret=buf; /* correct? */ - } else { - /*ret=gets(buf); -- gets is deprecated (since it can read too much?) */ - /* could do this... - ret=fgets(buf, MAXBUF, stdin); - buf[strlen(buf)-1]='\0'; - ... but don't want to have to rescan line with strlen, so... */ - - i=0; p=buf; - - /* recover spaces if re-linebreaking */ - for (; hy; hy--) { *p++=' '; i++; } - - while (lookahead && (c=getchartab())!='\n' && i<MAXBUF) { *p++=c; i++; } - assert(i<MAXBUF); - -#if 0 - lookahead=ungetc(getchar(), stdin); /* only looking ahead one character for now */ -#endif - - /* very special case: if in SEE ALSO section, re-linebreak so references aren't linebroken - (also do this if fNOHY flag is set) -- doesn't affect lookahead */ - /* 0xad is an en dash on Linux? */ - if ((fPara || sectheadid==SEEALSO || fNOHY) && p>buf && p[-1]=='-' && isspace(lookahead)) { - p--; /* zap hyphen */ - /* zap boldfaced hyphens, gr! */ - while (p[-1]=='\b' && p[-2]=='-') p-=2; - - /* start getting next line, spaces first ... */ - while (lookahead && isspace(lookahead) && lookahead!='\n') { getchartab(); hy++; } - - /* ... append next nonspace string to previous ... */ - while (lookahead && !isspace(lookahead) && i++<MAXBUF) *p++=getchartab(); - - /* gobble following spaces (until, perhaps including, end of line) */ - while (lookahead && isspace(lookahead) && lookahead!='\n') getchartab(); - if (lookahead=='\n') { getchartab(); hy=0; } - } - - *p='\0'; - ret=(lookahead)?buf:NULL; - } - - AbsLine++; - return ret; /* change this to line length? (-1==old NULL) */ -} - - -/*** Kong ***/ - -char phrase[MAXBUF]; /* first "phrase" (space of >=3 spaces) */ -int phraselen; - -static void -filterline(char *buf, char *plain) -{ - char *p,*q,*r; - char *ph; - int iq; - int i,j; - int hl=-1, hl2=-1; - int iscnt=0; /* interword space count */ - int tagci; - int I0; - int etype; - int efirst; - enum tagtype tag = NOTAG; - int esccode; - - assert(buf!=NULL && plain!=NULL); - - etype=NOTAG; - efirst=-1; - tagci=tagc; - ph=phrase; phraselen=0; - scnt=scnt2=0; - s_sum=s_cnt=0; - bs_sum=bs_cnt=0; - ccnt=0; - spcsqz=0; - - /* strip only certain \x1b's and only at very beginning of line */ - for (p=buf; *p=='\x1b' && (p[1]=='8'||p[1]=='9'); p+=2) - /* nop */; - - strcpy(plain,p); - q=&plain[strlen(p)]; - - /*** spaces and change bars ***/ - for (scnt=0,p=plain; *p==' '; p++) scnt++; /* initial space count */ - if (scnt>200) scnt=130-(q-p); - - assert(*q=='\0'); - q--; - if (fChangeleft) - for (; q-40>plain && *q=='|'; q--) { /* change bars */ - if (fChangeleft!=-1) ccnt++; - while (q-2>=plain && q[-1]=='\b' && q[-2]=='|') q-=2; /* boldface changebars! */ - } - - /*if (q!=&plain[scnt-1])*/ /* zap trailing spaces */ - for (; *q==' ' && q>plain; q--) /* nop */; - - /* second changebar way out east! HACK HACK HACK */ - if (q-plain>100 && *q=='|') { - while (*q=='|' && q>plain) { q--; if (fChangeleft!=-1) ccnt++; } - while ((*q==' ' || *q=='_' || *q=='-') && q>plain) q--; - } - - for (r=q; (*r&0xff)==CHARDAGGER; r--) *r='-'; /* convert daggers at end of line to hyphens */ - - if (q-plain < scnt) scnt = q-plain+1; - q[1]='\0'; - - /* set I for tags below */ - if (indent>=0 && scnt>=indent) scnt-=indent; - if (!fPara && !fIQS) { - if (fChangeleft) I+=(scnt>ccnt)?scnt:ccnt; - else I+=scnt; - } - I0=I; - - /*** tags and filler spaces ***/ - - iq=0; falluc=1; - for (q=plain; *p; p++) { - - iscnt=0; - if (*p==' ') { - for (r=p; *r==' '; r++) { iscnt++; spcsqz++; } - s_sum+=iscnt; s_cnt++; - if (iscnt>1 && !scnt2 && *p==' ') scnt2=iscnt; - if (iscnt>2) { bs_cnt++; bs_sum+=iscnt; } /* keep track of large gaps */ - iscnt--; /* leave last space for tail portion of loop */ - - /* write out spaces */ - if (fQS && iscnt<3) { p=r-1; iscnt=0; } /* reduce strings of <3 spaces to 1 */ - /* else if (fQS && iscnt>=3) { replace with tab? } */ - else { - for (i=0; i<iscnt; i++) { p++; *q++=' '; } - } - } /* need to go through if chain for closing off annotations */ - - /** backspace-related filtering **/ - - if (*p=='\b' && p[1]=='_' && q>plain && q[-1]=='+') { - /* bold plus/minus(!) */ - q[-1]=c_plusminus; - while (*p=='\b' && p[1]=='_') p+=2; - continue; - } else if ((*p=='_' && p[1]=='\b' && p[2]!='_' && p[3]!='\b') - || (*p=='\b' && p[1]=='_')) { - /* italics */ - if (tag!=ITALICS && hl>=0) { tagadd(tag, hl, I+iq); hl=-1; } - if (hl==-1) hl=I+iq; - tag=ITALICS; - p+=2; - } else if (*p=='_' && p[2]==p[4] && p[1]=='\b' && p[3]=='\b' && p[2]!='_') { - /* bold italics (for Solaris) */ - for (p+=2; *p==p[2] && p[1]=='\b';) p+=2; - if (tag!=BOLDITALICS && hl>=0) { tagadd(tag, hl, I+iq); hl=-1; } - if (hl==-1) hl=I+iq; - tag=BOLDITALICS; - } else if (*p==p[2] && p[1]=='\b') { - /* boldface */ - while (*p==p[2] && p[1]=='\b') p+=2; - if (tag!=BOLD && hl>=0) { tagadd(tag, hl, I+iq); hl=-1; } - if (hl==-1) hl=I+iq; - tag=BOLD; - } else if (p[1]=='\b' && - ((*p=='o' && p[2]=='+') || - (*p=='+' && p[2]=='o')) ) { - /* bullets */ - p+=2; - while (p[1]=='\b' && (*p=='o' || p[2]=='+') ) p+=2; /* bold bullets(!) */ - *q++=c_bullet; iq++; - continue; - } else if (*p=='\b' && p>plain && p[-1]=='o' && p[1]=='+') { - /* OSF bullets */ - while (*p=='\b' && p[1]=='+') p+=2; /* bold bullets(!) */ - q[-1]=c_bullet; p--; - continue; - } else if (p[1]=='\b' && *p=='+' && p[2]=='_') { - /* plus/minus */ - p+=2; - *q++=c_plusminus; iq++; - continue; - } else if (p[1]=='\b' && *p=='|' && p[2]=='-') { - /* dagger */ - *q++=c_dagger; iq++; - p+=2; continue; - } else if (*p=='\b') { - /* supress unattended backspaces */ - continue; - } else if (*p=='\x1b') { - p++; - if (*p=='[' && isdigit(p[1])) { /* 0/1/22/24/.../8/9/... */ - esccode=0; for (p++; isdigit(*p); p++) esccode = esccode * 10 + *p - '0'; - - if (efirst>=0 /*&& (esccode==0 || esccode==1 || esccode==4 || esccode==22 || esccode==24) **&& hl>=0 && hl2==-1 && tags[MAXTAGS].first<I+iq*/) { - /* doesn't catch tag if spans line -- just make tag and hl static? */ - /*tagadd(tags[MAXTAGS].type, tags[MAXTAGS].first, I+iq);*/ - if (hl==-1 && hl2==-1 && efirst!=-1/*<I+iq*/) - tagadd(etype, efirst, I+iq); - efirst=-1; - } - - if (esccode==1 /*&& hl==-1*/) { - /* stash attributes in "invalid" array element */ - efirst=I+iq; etype=BOLD; - /*hl=I+iq; tag=BOLD; -- faces immediate end of range */ - } else if (esccode==4 /*&& hl==-1*/) { - efirst=I+iq; etype=ITALICS; - - } /* else skip unrecognized escape codes like 8/9 */ - } - - /*assert(*p=='m'); OR if (*p == 'm') ? */ - /*p++; ** ending 'm' -- inc done in overarching for */ - continue; - - } else if ((isupper(*p) /*|| *p=='_' || *p=='&'*/) && - (hl>=0 || isupper(p[1]) || (p[1]=='_' && p[2]!='\b') || p[1]=='&')) { - if (hl==-1 && efirst==-1) { hl=I+iq; tag=SMALLCAPS; } - } else { - /* end of tag, one way or another */ - /* collect tags in this pass, interspersed later if need be */ - /* can't handle overlapping tags */ - if (hl>=0) { - if (hl2==-1) tagadd(tag, hl, I+iq); - hl=-1; - } - } - - /** non-backspace related filtering **/ - /* case statement here in place of if chain? */ -/* Tk 3.x's text widget tabs too crazy - if (*p==' ' && strncmp(" ",p,5)==0) { - xputchar('\t'); i+=5-1; ci++; continue; - } else -*/ -/* copyright symbol: too much work for so little - if (p[i]=='o' && (strncmp("opyright (C) 19",&p[i],15)==0 - || strncmp("opyright (c) 19",&p[i],15)==0)) { - printf("opyright \xd3 19"); - tagadd(SYMBOL, ci+9, ci+10); - i+=15-1; ci+=13; continue; - } else -*/ - if (*p=='(' && q>plain && (isalnum(q[-1])||strchr(manvalid/*"._-+"*/,q[-1])!=NULL) - && strcoloncmp(&p[1],')',vollist) - /* && p[1]!='s' && p[-1]!='`' && p[-1]!='\'' && p[-1]!='"'*/ ) { - hl2=I+iq; - for (r=q-1; r>=plain && (isalnum(*r)||strchr(manvalid/*"._-+:"*/,*r)!=NULL); r--) - hl2--; - /* else ref to a function? */ - /* maybe save position of opening paren so don't highlight it later */ - } else if (*p==')' && hl2!=-1) { - /* don't overlap tags on man page references */ - while (tagc>0 && tags[tagc-1].last>hl2) tagc--; - tagadd(MANREF, hl2, I+iq+1); - hl2=hl=-1; - } else if (hl2!=-1) { - /* section names are alphanumic or '+' for C++ */ - if (!isalnum(*p) && *p!='+') hl2=-1; - } - - - /*assert(*p!='\0');*/ - if (!*p) break; /* not just safety check -- check out sgmls.1 */ - - *q++=*p; -/* falluc = falluc && (isupper(*p) || isspace(*p) || isdigit(*p) || strchr("-+&_'/()?!.,;",*p)!=NULL);*/ - falluc = falluc && !islower(*p); - if (!scnt2) { *ph++=*p; phraselen++; } - iq+=iscnt+1; - } - if (hl>=0) tagadd(tag, hl, I+iq); - else if (efirst>=0) tagadd(etype, efirst, I+iq); - *q=*ph='\0'; - linelen=iq+ccnt; - - - /* special case for Solaris: - if line has ONLY <CODE> tags AND they SPAN line, convert to one tag */ - fCodeline=0; - if (tagc && tags[0].first==0 && tags[tagc-1].last==linelen) { - fCodeline=1; - j=0; - /* invariant: at start of a tag */ - for (i=0; fCodeline && i<tagc; i++) { - if (tags[i].type!=BOLDITALICS /*&& tags[i].type!=BOLD*/) fCodeline=0; - else if ((j=tags[i].last)<linelen) { - for (; j < tags[i+1].first ; j++) - if (!isspace(plain[j])) { fCodeline=0; break; } - } - } - } - - - /* verify tag lists -- in production, compiler should kill with dead code elimination */ - for (i=tagci; i<tagc; i++) { - /* verify valid ranges */ - assert(tags[i].type>NOTAG && tags[i].type<=MANREF); - assert(tags[i].first>=I0 && tags[i].last<=linelen+I0); - assert(tags[i].first<=tags[i].last); - - /* verify for no overlap with other tags */ - for (j=i+1; j<tagc; j++) { - assert(tags[i].last<=tags[j].first /*|| tags[i].first>=tags[j].last*/); - } - } -} - - -/* - buf[] == input text (read only) - plain[] == output (initial, trailing spaces stripped; tabs=>spaces; - underlines, overstrikes => tag array; spaces squeezed, if requested) - ccnt = count of changebars - scnt = count of initial spaces - linelen = length result in plain[] -*/ - -int fHead=0; -int fFoot=0; - -static void -preformatted_filter(void) -{ - const int MINRM=50; /* minimum column for right margin */ - const int MINMID=20; - const int HEADFOOTSKIP=20; - const int HEADFOOTMAX=25; - int curtag; - char *p,*r; - char head[MAXBUF]=""; /* first "word" */ - char foot[MAXBUF]=""; - int header_m=0, footer_m=0; - int headlen=0, footlen=0; -/* int line=1-1; */ - int i,j,k,l,off; - int sect=0,subsect=0,bulpair=0,osubsect=0; - int title=1; - int oscnt=-1; - int empty=0; - int fcont=0; - int Pnew=0,I0; - float s_avg=0.0; - int spaceout; - int skiplines=0; - int c; - - /* try to keep tabeginend[][] in parallel with enum tagtype */ - assert(tagbeginend[ITALICS][0]==BEGINITALICS); - assert(tagbeginend[MANREF][1]==ENDMANREF); - in++; /* lookahead = current character, in points to following */ - - /* for (i=0; i<MAXBUF; i++) tabgram[i]=0;*/ - - /*if (fMan) */indent=-1; - I=1; - CurLine=1; - (*fn)(BEGINDOC); I0=I; - - /* run through each line */ - while (la_gets(buf)!=NULL) { - if (title) I=I0; - /* strip out Ousterhout box: it's confusing the section line counts in TkMan outlining */ - if (fNORM && *buf=='_' - && strncmp(buf,"_________________________________________________________________",65)==0) { - fTclTk = 1; - if (fChangeleft==0) fChangeleft=1; - skiplines = 2; - } - if (skiplines) { skiplines--; AbsLine++; continue; } - filterline(buf,plain); /* ALL LINES ARE FILTERED */ - -#if 0 - /* dealing with tables in formatted pages is hopeless */ - finTable = fTable && - ((!ncnt && fotable) || - (ncnt && bs_cnt>=2 && bs_cnt<=5 && ((float) bs_sum / (float) bs_cnt)>3.0)); - if (finTable) { - if (!fotable) (*fn)(BEGINTABLE); - } else if (fotable) { - (*fn)(ENDTABLE); - I=I0; tagc=0; filterline(buf,plain); /* rescan first line out of table */ - } -#endif - - s_avg=(float) s_sum; - if (s_cnt>=2) { - /* don't count large second space gap */ - if (scnt2) s_avg= (float) (s_sum - scnt2) / (float) (s_cnt-1); - else s_avg= (float) (s_sum) / (float) (s_cnt); - } - - p=plain; /* points to current character in plain */ - - /*** determine header and global indentation ***/ - if (/*fMan && (*/!fHead || indent==-1/*)*/) { - if (!linelen) continue; - if (!*header) { - /* check for missing first header--but this doesn't catch subsequent pages */ - if (stricmp(p,"NAME")==0 || stricmp(p,"NOMBRE")==0) { /* works because line already filtered */ - indent=scnt; /*filterline(buf,plain);*/ scnt=0; I=I0; fHead=1; - } else { - fHead=1; - (*fn)(BEGINHEADER); - /* grab header and its first word */ - strcpy(header,p); - if ((header_m=HEADFOOTSKIP)>linelen) header_m=0; - strcpy(head,phrase); headlen=phraselen; - la_gets(buf); filterline(buf,plain); - if (linelen) { - strcpy(header2,plain); - if (strincmp(plain,"Digital",7)==0 || strincmp(plain,"OSF",3)==0) { - fFoot=1; - fSubsections=0; - } - } - (*fn)(ENDHEADER); tagc=0; - continue; - } - } else { - /* some idiot pages have a *third* header line, possibly after a null line */ - if (*header && scnt>MINMID) { strcpy(header3,p); ncnt=0; continue; } - /* indent of first line ("NAME") after header sets global indent */ - /* check '<' for Plan 9(?) */ - if (*p!='<') { - indent=scnt; I=I0; scnt=0; - } else continue; - } -/* if (indent==-1) continue;*/ - } - if (!lindent && scnt) lindent=scnt; -/*printf("lindent = %d, scnt=%d\n", lindent,scnt);*/ - - - /**** for each ordinary line... *****/ - - /*** skip over global indentation */ - empty=(linelen==0); - if (empty) {ncnt++; continue;} - - /*** strip out per-page titles ***/ - - if (/*fMan && (*/scnt==0 || scnt>MINMID/*)*/) { -/*printf("***ncnt = %d, fFoot = %d, line = %d***", ncnt,fFoot,AbsLine);*/ - if (!fFoot && !isspace(*p) && (scnt>5 || (*p!='-' && *p!='_')) && - /* don't add ncnt -- AbsLine gets absolute line number */ - (((ncnt>=2 && AbsLine/*+ncnt*/>=61/*was 58*/ && AbsLine/*+ncnt*/<70) - || (ncnt>=4 && AbsLine/*+ncnt*/>=59 && AbsLine/*+ncnt*/<74) - || (ncnt && AbsLine/*+ncnt*/>=61 && AbsLine/*+ncnt*/<=66)) - && (/*lookahead!=' ' ||*/ (s_cnt>=1 && s_avg>1.1) || !falluc) ) - ) { - (*fn)(BEGINFOOTER); - /* grab footer and its first word */ - strcpy(footer,p); -/* if ((footer_m=linelen-HEADFOOTSKIP)<0) footer_m=0;*/ - if ((footer_m=HEADFOOTSKIP)>linelen) footer_m=0; - /*grabphrase(p);*/ strcpy(foot,phrase); footlen=phraselen; - /* permit variations at end, as for SGI "Page N", but keep minimum length */ - if (footlen>3) footlen--; - la_gets(buf); filterline(buf,plain); if (linelen) strcpy(footer2,plain); - title=1; - (*fn)(ENDFOOTER); tagc=0; - - /* if no header on first page, try again after first footer */ - if (!fFoot && *header=='\0') fHead=0; /* this is dangerous */ - fFoot=1; - continue; - } else - /* a lot of work, but only for a few lines (about 4%) */ - if (fFoot && (scnt==0 || scnt+indent>MINMID) && - ( (headlen && strncmp(head,p,headlen)==0) - || strcmp(header2,p)==0 || strcmp(header3,p)==0 - || (footlen && strncmp(foot,p,footlen)==0) - || strcmp(footer2,p)==0 - /* try to recognize lines with dates and page numbers */ - /* skip into line */ - || (header_m && header_m<linelen && - strncmp(&header[header_m],&p[header_m],HEADFOOTMAX)==0) - || (footer_m && footer_m<linelen && - strncmp(&footer[footer_m],&p[footer_m],HEADFOOTMAX)==0) - /* skip into line allowing for off-by-one */ - || (header_m && header_m<linelen && - strncmp(&header[header_m],&p[header_m+1],HEADFOOTMAX)==0) - || (footer_m && footer_m<linelen && - strncmp(&footer[footer_m],&p[footer_m+1],HEADFOOTMAX)==0) - /* or two */ - || (header_m && header_m<linelen && - strncmp(&header[header_m],&p[header_m+2],HEADFOOTMAX)==0) - || (footer_m && footer_m<linelen && - strncmp(&footer[footer_m],&p[footer_m+2],HEADFOOTMAX)==0) - /* or with reflected odd and even pages */ - || (headlen && headlen<linelen && - strncmp(head,&p[linelen-headlen],headlen)==0) - || (footlen && footlen<linelen && - strncmp(foot,&p[linelen-footlen],footlen)==0) - )) { - tagc=0; title=1; continue; - } - - /* page numbers at end of line */ - for(i=0; p[i] && isdigit(p[i]); i++) - /* empty */; - if (&p[i]!=plain && !p[i]) {title=1; fFoot=1; continue;} - } - - /*** interline spacing ***/ - /* multiple \n: paragraph mode=>new paragraph, line mode=>blank lines */ - /* need to chop up lines for Roff */ - - /*tabgram[scnt]++;*/ - if (title) ncnt=(scnt!=oscnt || (/*scnt<4 &&*/ isupper(*p))); - itabcnt = scnt/5; - if (CurLine==1) {ncnt=0; tagc=0;} /* gobble all newlines before first text line */ - sect = (scnt==0 && isupper(*p)); - subsect = (fSubsections && (scnt==2||scnt==3)); - if ((sect || subsect) && ncnt>1) ncnt=1; /* single blank line between sections */ - (*fn)(BEGINLINE); - if (/*fPara &&*/ ncnt) Pnew=1; - title=0; /*ncnt=0;--moved down*/ - /*if (finTable) (*fn)(BEGINTABLELINE);*/ - oscnt=scnt; /*fotable=finTable;*/ - -/* let output modules decide what to do at the start of a paragraph - if (fPara && !Pnew && (prevcmd==BEGINBODY || prevcmd==BEGINBULTXT)) { - putchar(' '); I++; - } -*/ - - /*** identify structural sections and notify fn */ - - /*if (fMan) {*/ -/* bulpair = (scnt<7 && (*p==c_bullet || *p=='-'));*/ - /* decode the below */ - bulpair = ((!auxindent || scnt!=lindent+auxindent) /*!bulpair*/ - && ((scnt>=2 && scnt2>5) || scnt>=5 || (tagc>0 && tags[0].first==scnt) ) /* scnt>=2?? */ - && (((*p==c_bullet || strchr("-+.",*p)!=NULL || falluc) && (ncnt || scnt2>4)) || - (scnt2-s_avg>=2 && phrase[phraselen-1]!='.') || - (scnt2>3 && s_cnt==1) - )); - if (bulpair) { - if (tagc>0 && tags[0].first==scnt) { - k=tags[0].last; - for (l=1; l<tagc; l++) { - if (tags[l].first - k <=3) - k=tags[l].last; - else break; - } - phraselen=k-scnt; - for (k=phraselen; plain[k]==' ' && k<linelen; k++) /* nothing */; - if (k>=5 && k<linelen) hanging=k; else hanging=-1; - } else if (scnt2) hanging=phraselen+scnt2; - else hanging=5; - } else hanging=0; - -/* hanging = bulpair? phraselen+scnt2 : 0;*/ -/*if (bulpair) printf("hanging = %d\n", hanging);*/ - /* maybe, bulpair=0 would be best */ - /*end fMan}*/ - - /* certain sections (subsections too?) special, like SEE ALSO */ - /* to make canonical name as plain, all lowercase */ - if (sect /*||subsect -- no widespread subsection names*/) { - for (j=0; (sectheadid=j)<RANDOM; j++) if (strcoloncmp2(plain,'\0',sectheadname[j],0)) break; - } - - /* normalized section headers are put into mixed case */ - if (/*fNORM &&*/falluc && (sect || subsect)) casify(plain); - - if (sect) { - poppush(BEGINSECTION); (*fn)(BEGINSECTHEAD); - tocadd(plain, BEGINSECTION, CurLine); - } else if (subsect && !osubsect) { - poppush(BEGINSUBSECTION); (*fn)(BEGINSUBSECTHEAD); - tocadd(plain, BEGINSUBSECTION, CurLine); - } else if (bulpair) { - /* used to be just poppush(BEGINBULPAIR); */ - if (!Pbp) poppush(BEGINBULPAIR); - (poppush)(BEGINBULLET); - fIP=1; /*grabphrase(plain);*/ - } else if (Pnew) { - poppush(BEGINBODY); - } - Pnew=0; - oldsectheadid = sectheadid; - - - /* move change bars to left */ - if (fChangeleft && !fNORM) { - if (fPara) (*fn)(CHANGEBAR); - /* replace initial spaces with changebars */ - else for (i=0; i<ccnt; i++) { /*xputchar('|'); */ (*fn)(CHANGEBAR); } - } - - /* show initial spaces */ - if (!fIQS && fcharout) { - spaceout = (scnt>ccnt)?(scnt-ccnt):0; - if (fILQS) { if (spaceout>=lindent) spaceout-=lindent; else spaceout=0; } - if (auxindent) { if (spaceout>=auxindent) spaceout-=auxindent; else spaceout=0; } - if (fNORM) { - if (itabcnt>0) (*fn)(ITAB); - for (i=0; i<(scnt%5); i++) putchar(' '); - } else printf("%*s",spaceout,""); - } - - - /*** iterate over each character in line, ***/ - /*** handling underlining, tabbing, copyrights ***/ - - off=(!fIQS&&!fPara)?scnt:0; - for (i=0, p=plain, curtag=0, fcont=0; *p; p++,i++,fcont=0) { - /* interspersed presentation signals */ - /* start tags in reverse order of addition (so structural first) */ - if (curtag<tagc && i+I0+off==tags[curtag].first) { - for (r=hitxt, j=tags[curtag].last-tags[curtag].first, hitxt[j]='\0'; j; j--) - hitxt[j-1]=p[j-1]; - (*fn)(tagbeginend[tags[curtag].type][0]); - } - - /* special characters */ - switch(*p) { - case '"': - if (p==plain || isspace(p[-1])) { (*fn)(CHARLQUOTE); fcont=1; } - else if (isspace(p[1])) { (*fn)(CHARRQUOTE); fcont=1; } - break; - case '\'': - if (p==plain || isspace(p[-1])) { (*fn)(CHARLSQUOTE); fcont=1; } - else if (isspace(p[1])) { (*fn)(CHARRSQUOTE); fcont=1; } - break; - case '-': - /* check for -opt => \-opt */ - if (p==plain || (isspace(p[-1]) && !isspace(p[1]))) { - (*fn)(CHARDASH); fcont=1; - } - break; - } - - /* troublemaker characters */ - c = (*p)&0xff; - if (!fcont && fcharout) { - if (strchr(escchars,c)!=NULL) { - putchar('\\'); putchar(c); I++; - } else if (strchr((char *)trouble,c)!=NULL) { - (*fn)((enum command)c); fcont=1; - } else { - putchar(c); I++; - } - } - -/*default:*/ - if (curtag<tagc && i+I0+off+1==tags[curtag].last) { - (*fn)(tagbeginend[tags[curtag].type][1]); - curtag++; - } - - if (fIP && ((*p==' ' && i==phraselen) || *p=='\0')) { - p++; /* needed but why? */ - (*fn)(ENDBULLET); fIP=0; - if (*p!='\0') { - /*oscnt+=phraselen;*/ - oscnt+=i; - for (r=p; *r==' '; r++) { - oscnt++; -/* - i++; - if (fQS || !fcharout) p++; -*/ - } - } - p--; /* to counteract increment in loop */ - - poppush(BEGINBULTXT); - } - } - - - /*** end of line in buf[] ***/ - /*** deal with section titles, hyperlinks ***/ - - if (sect) { (*fn)(ENDSECTHEAD); Pnew=1; } - else if (subsect) { (*fn)(ENDSUBSECTHEAD); Pnew=1; } - else if (fIP) { (*fn)(ENDBULLET); fIP=0; poppush(BEGINBULTXT); } -/* oscnt not right here */ - else if (scnt+linelen+spcsqz<MINRM /*&& ncnt*/ && lookahead!='\n' - && prevcmd!=BEGINBULTXT && prevcmd!=ENDSUBSECTHEAD && prevcmd!=ENDSUBSECTHEAD) - (*fn)(SHORTLINE); - osubsect=subsect; - - /*if (finTable) (*fn)(ENDTABLELINE);*/ - /*if (!fPara)*/ (*fn)(ENDLINE); tagc=0; - ncnt=0; - I0=I; /* save I here in case skipping lines screws it up */ - } - - /* wrap up at end */ - pop(ENDDOC); /* clear up all tags on stack */ - (*fn)(ENDDOC); -} - - - -/* - * SOURCE CODE PARSING - * for better transcription short of full nroff interpreter - * - * Macros derived empirically, except for weird register ones that were looked up in groff - * - * buffer usage - * buf = incoming text from man page file - * plain = "second pass" buffer used to identify man page references - * - * test pages - * Solaris: fdisk.1m, fcntl.2, curs_getwch.3x, locale.5 (numbered lists), - * getservbyname.3n (font size changes) - */ - -/* macros */ -/* put as much in here, as opposed to in code, as possible. - less expensive and here they can be overridden by other macros */ -/*const int macromax=100; -- dumb compiler */ -#define MACROMAX 1000 -struct { char *key; char *subst; } macro[MACROMAX] = { - /* Solaris */ - {"NA", ".SH NAME"}, - {"SB", "\\s-2\\fB\\$1\\fR\\s0"}, - /* HP-UX */ -#if 0 - {"SM", "\\s-2\\$1\\s0"}, - {"C", "\\f3\\$1\\fR"}, - {"CR", "\\f3\\$1\\fR\\$2"}, - {"CI", "\\f3\\$1\\fI\\$2\\fR"}, - {"RC", "\\fR\\$1\\f3\\$2\\fR"}, -#endif - /* SGI -- doesn't ship man page source */ - - /* 4.4BSD - http://intergate.sonyinteractive.com/cgi-bin/manlink/7/mdoc */ - /* scads more, but for them definition in -mandoc is sufficient */ -#if 0 - {"Dt", ".TH \\$1 \\$2 \\$3"}, - {"Sh", ".SH \\$1 \\$2 \\$3 \\$4 \\$5 \\$6 \\$7 \\$8 \\$9"}, - {"Ss", ".SS \\$1 \\$2 \\$3 \\$4 \\$5 \\$6 \\$7 \\$8 \\$9"}, - {"Pp", ".P"}, - {"Nm", ".BR \\$1 \\$2 \\$3 \\$4 \\$5 \\$6 \\$7 \\$8 \\$9"}, /* name */ - {"Ar", ".IR \\$1 \\$2 \\$3 \\$4 \\$5 \\$6 \\$7 \\$8 \\$9"}, -#endif - { NULL, NULL } -}; -/* what all can be represented as a macro? */ -int macrocnt=-1; /* length of table counted at start */ - -char *macnotfound[MACROMAX]; -int macnotcnt=0; - -#define SUBSTMAX 1000 -/* "*" or "*(" prefixed */ -struct { char *key; char *subst; } subst[SUBSTMAX] = { - {"rq", "'"}, {"lq", "`"}, {"L\"", "``"}, {"R\"", "''"}, - {"L", "\\f3"}, {"E", "\\f2"}, {"V", "\\f4"}, {"O", "\\f1"} -}; -int substcnt=8; - -#define REGISTERMAX 1000 -struct { char *name; char *value; } reg[REGISTERMAX]; -int regcnt=0; - -/* special characters */ -const struct { char key[4]; unsigned char subst[4]; } spec[] = { - { "**", "*" }, - { "+-", { CHARPLUSMINUS, '\0' }}, - { "12", { CHAR12, '\0' }}, - { "14", { CHAR14, '\0' }}, - { "34", { CHAR34, '\0' }}, - { "aa", { CHARACUTE, '\0' }}, - { "ap", "~" }, - { "br", "|" }, - { "bu", { CHARBULLET, '\0' }}, - { "bv", "|" }, - { "ci", "O" }, - { "co", { CHARCOPYR, '\0' }}, - { "ct", { CHARCENT, '\0' }}, - { "de", { CHARDEG, '\0' }}, - { "dg", { CHARDAGGER, '\0' }}, - { "di", { CHARDIV, '\0' }}, - { "em", "--" }, - { "eq", "=" }, - { "hy", "-" }, - { "mi", "-" }, - { "mu", { CHARMUL, '\0' }}, - { "no", { CHARNOT, '\0' }}, - { "or", "|" }, - { "pl", "+" }, - { "rg", { CHARREGTM, '\0' }}, - { "ru", "_" }, - { "sc", { CHARSECT, '\0' }}, - { "sl", "/" }, - { "ua", "^" }, - { "ul", "_" } -}; -#define speccnt (sizeof spec / sizeof spec[0]) - -/* tbl line descriptions */ -char *tbl[20][20]; /* space enough for twenty description lines, twenty parts each */ -int tblc=0; -int tbli; - -int fsourceTab = 0, fosourceTab=0; -int supresseol=0; -int finitDoc=0; -int sublevel=0; - -static char * -source_gets(void) -{ - char *p,*q; - char *ret = (*in)?buf:NULL; - int i; - char *begin; - char tmpbuf[MAXBUF]; - char name[3]; - - if (!sublevel) AbsLine++; - - p = tmpbuf; - falluc = 1; - while (1) { - /* collect characters in line */ - while (*in && *in!='\n') { - if (p[0]=='\\' && p[1]=='\n') p+=2; /* \<newline> */ - falluc = falluc && !islower(*in); - *p++ = *in++; - } - if (*in) in++; - *p='\0'; - - /* normalize commands */ - p=tmpbuf; q=buf; /* copy from tmpbuf to buf */ - /* no spaces between command-initiating period and command letters */ - if (*p=='\'') { *p='.'; } /* what's the difference? */ - if (*p=='.') { *q++ = *p++; while (isspace(*p)) p++; } - - - /* convert lines with tabs to tables? */ - fsourceTab=0; - - /* if comment at start of line, OK */ - /* dynamically determine iff Tcl/Tk page by scanning comments */ - begin = p; - if (*p=='\\' && *(p+1)=='"') { - if (!fTclTk && strstr(p+1,"supplemental macros used in Tcl/Tk")!=NULL) fTclTk=1; - if (fTclTk) - p+=2; - } - - while (*p) { - if (*p=='\t') fsourceTab++; - if (*p=='\\') { - p++; - if (*p=='n') { - p++; - if (*p=='(') { - p++; name[0]=*p++; name[1]=*p++; name[2]='\0'; - } else { - name[0]=*p++; name[1]='\0'; - } - *q='0'; *(q+1)='\0'; /* defaults to 0, in case doesn't exist */ - for (i=0; i<regcnt; i++) { - if (strcmp(reg[i].name,name)==0) { - strcpy(q, reg[i].value); - break; - } - } - q+=strlen(q); - } else if (*p=='"' && (p != begin+1)) { /* comment in Digital UNIX, OK elsewhere? */ - *p='\0'; - q--; while (q>buf && isspace(*q)) q--; /* trim tailing whitespace */ - q++; *q='\0'; - } else { - /* verbatim character (often a backslash) */ - *q++ = '\\'; /* postpone interpretation (not the right thing but...) */ - *q++ = *p++; - } - } else *q++ = *p++; - } - - /* dumb Digital--later */ - /*if (q-3>plain && q[-1]=='{' && q[-2]=='\\' && q[-3]==' ') q[-3]='\n'; }*/ - - /* close off buf */ - *q='\0'; - -#if 0 - if (q>buf && q[-1]=='\\' && *in=='.') /* append next line * / else break;*/ -#endif - break; - } - - /*printf("*ret = |%s|\n", ret!=NULL?ret : "NULL");*/ - return ret; -} - - -/* dump characters from buffer, signalling right tags along the way */ -/* all this work to introduce an internal second pass to recognize man page references */ -/* now for HTTP references too */ - -int sI=0; -/* use int linelen from up top */ -int fFlush=1; - -static void -source_flush(void) -{ - int i,j; - char *p,*q,*r; - int c; - int manoff,posn; - - if (!sI) return; - plain[sI] = '\0'; - - /* flush called often enough that all man page references are at end of text to be flushed */ - /* find man page ref */ - if (sI>=4/*+1*/ && (plain[sI-(manoff=1)-1]==')' || plain[sI-(manoff=0)-1]==')')) { - for (q=&plain[sI-manoff-1-1]; q>plain && isalnum(*q) && *q!='('; q--) /* nada */; - if (*q=='(' && strcoloncmp(&q[1],')',vollist)) { - r=q-1; - if (*r==' ' && (sectheadid==SEEALSO || /*single letter volume */ *(q+2)==')' || *(q+3)==')')) r--; /* permitted single intervening space */ - for ( ; r>=plain && (isalnum(*r) || strchr(manvalid,*r)!=NULL); r--) /* nada */; - r++; - if (isalpha(*r) && r<q) { - /* got one: clear out tags and spaces to make normalized form */ - posn = r-plain; - /*while (tagc && tags[tagc-1].first >= posn) tagc--;*/ - - /* add MANREF tags */ - strcpy(hitxt,r); - tagadd(BEGINMANREF, posn, 0); - /* already generated other start tags, so move BEGINMANREF to start in order to be well nested (ugh) */ - tagtmp = tags[tagc-1]; for (j=tagc-1; j>0; j--) tags[j]=tags[j-1]; tags[0]=tagtmp; - tagadd(ENDMANREF, sI-manoff-1+1, 0); - } - } - - /* HTML hyperlinks */ - } else if (fURL && sI>=4 && (p=strstr(plain,"http"))!=NULL) { - i = p-plain; - tagadd(BEGINMANREF, i, 0); tagtmp = tags[tagc-1]; for (j=tagc-1; j>0; j--) tags[j]=tags[j-1]; tags[0]=tagtmp; - for (j=0; i<sI && !isspace(*p) && *p!='"' && *p!='>'; i++,j++) hitxt[j] = *p++; - hitxt[j]='\0'; - tagadd(ENDMANREF, i, 0); - } - - if (!fFlush) return; - - /* output text */ - for (i=0,j=0,p=plain; i<sI && *p; i++,p++) { - if (!linelen) (*fn)(BEGINLINE); /* issue BEGINLINE when know will be chars on line */ - - /* dump tags */ - /*for ( ; j<tagc && tags[j].first == i; j++) (*fn)(tags[j].type);*/ - for (j=0; j<tagc; j++) if (tags[j].first == i) (*fn)((enum command)tags[j].type); - - /* dump text */ - c = (*p)&0xff; /* just make c unsigned? */ - if (strchr(escchars,c)!=NULL) { - xputchar('\\'); xputchar(c); - if (fcharout) linelen++; - } else if (strchr((char *)trouble,c)!=NULL) { - (*fn)((enum command)c); - } else if (linelen>=LINEBREAK && c==' ') { (*fn)(ENDLINE); linelen=0; - } else { /* normal character */ - xputchar(c); - if (fcharout) linelen++; - } - - /*if (linelen>=LINEBREAK && c==' ') { (*fn)(ENDLINE); linelen=0; } -- leaves space at end of line*/ - } - /* dump tags at end */ - /*for ( ; j<tagc && tags[j].first == sI; j++) (*fn)(tags[j].type);*/ - for (j=0; j<tagc; j++) if (tags[j].first==sI) (*fn)((enum command)tags[j].type); - - sI=0; tagc=0; -} - - -/* source_out stuffs characters in a buffer */ -static char * -source_out0(const char *pin, char end) -{ - /* stack of character formattings */ - static enum tagtype styles[20]; - static int style=-1; - int funwind=0; - int i, j; - int len; - int sign; - char *p, *pstart; - - pstart = p = mystrdup(pin); - while (*p && *p!=end) { - if (*p=='\\') { /* escape character */ - switch (*++p) { - case '&': /* no space. used as a no-op sometimes */ - case '^': /* 1/12 em space */ - case '|': /* 1/6 em space */ - case '%': /* hyphenation indicator */ - /* just ignore it */ - p++; - break; - case '0': /* digit width space */ - p++; - sputchar(' '); - break; - case ' ': /* unpaddable space */ - stagadd(CHARNBSP); /* nonbreaking space */ - /*sputchar(' ');*/ - p++; - break; - case 's': /* font size change */ - p++; - sign=1; - if (*p=='-' || *p=='+') if (*p++=='-') sign=-1; - intArg = sign * ((*p++)-'0'); - if (intArg==0) intArg = -fontdelta; /* s0 returns to normal height */ - if (fontdelta || intArg) { source_flush(); (*fn)(FONTSIZE); } - break; - case 'v': /* vertical motion */ - case 'h': /* horizontal motion */ - case 'L': /* vertical line */ - case 'l': /* horizontal line */ - /* ignore */ - p++; - if (*p=='\'') { p++; while (*p++!='\''); } - break; - case '"': /* comment */ - *p='\0'; /* rest of line is comment */ - break; - case 'f': - p++; - switch (*p++) { - case '3': case 'B': /* boldface */ - styles[++style] = BOLD; - stagadd(BEGINBOLD); - break; - case '2': case 'I': /* italics */ - styles[++style] = ITALICS; - stagadd(BEGINITALICS); - break; - case '4': /* bolditalics mode => program code */ - styles[++style] = BOLDITALICS; - stagadd(BEGINBOLDITALICS); - break; - case '1': case '0': case 'R': case 'P': /* back to Roman */ - /*sputchar(' '); -- taken out; not needed, I hope */ - funwind=1; - break; - case '-': - p++; - break; - } - break; - case '(': /* multicharacter macros */ - p++; - for (i=0; (unsigned)i<speccnt; i++) { - if (p[0]==spec[i].key[0] && p[1]==spec[i].key[1]) { - p+=2; - for (j=0; spec[i].subst[j]; j++) sputchar(spec[i].subst[j]); - break; - } - } - break; - case '*': /* strings */ - p++; - if (*p!='(') { /* single character */ - for (i=0; i<substcnt; i++) { - if (*p==subst[i].key[0] && subst[i].key[1]=='\0') { - source_out0(subst[i].subst,'\0'); - break; - } - } - p++; - } else { /* multicharacter macros */ - p++; - for (i=0; i<substcnt; i++) { - len = strlen(subst[i].key); - if (strncmp(p,subst[i].key,len)==0) { - source_out0(subst[i].subst,'\0'); - p+=len; - break; - } - } - } - break; -#if 0 - case '|': - stagadd(CHARNBSP); /* nonbreaking space */ -#if 0 - sputchar(' '); -#endif - p++; -#endif - case 'e': /* escape */ - sputchar('\\'); - p++; - break; - case 'c': - /* supress following carriage return-induced space */ - /* handled in source_gets(); ignore within line => can't because next line might start with a command */ - supresseol=1; - p++; - break; - case '-': /* minus sign */ - sputchar(CHARDASH); - p++; - break; -#if 0 - case '^': - /* end stylings? (found in Solaris) */ - p++; -#endif - case 'N': - p++; - if (*p == '\'') { - char *tmp; - p++; - if ((tmp = strchr(p, '\'')) != NULL) { - sputchar(atoi(p)); - p = tmp + 1; - } - } - break; - case 0: - /* ignore */ - break; - default: /* unknown escaped character */ - sputchar(*p++); - } - - } else { /* normal character */ - if (*p) sputchar(*p++); - } - - - /* unwind character formatting stack */ - if (funwind) { - for ( ; style>=0; style--) { - if (styles[style]==BOLD) stagadd(ENDBOLD); - else if (styles[style]==ITALICS) stagadd(ENDITALICS); - else stagadd(ENDBOLDITALICS); - } /* else error */ - assert(style==-1); - - funwind=0; - } - - /* check for man page reference and flush buffer if safe */ - /* postpone check until after following character so catch closing tags */ - if ((sI>=4+1 && plain[sI-1-1]==')') || - /* (plain[sI-1]==' ' && (q=strchr(plain,' '))!=NULL && q<&plain[sI-1])) */ - (sI>=2 && plain[sI-1]==' ' && !isalnum(plain[sI-1-1]))) { - /* regardless, flush buffer */ - source_flush(); - } - } - - if (*p && *p!=' ') p++; /* skip over end character */ - free(pstart); - return (char *)pin + (p - pstart); - -} - -/* oh, for function overloading. inlined by compiler, probably */ -static char * -source_out(const char *p) -{ - return source_out0(p,'\0'); -} - - -static char * -source_out_word(const char *p) -{ - char end = ' '; - - while (*p && isspace(*p)) p++; - if (*p=='"' /* || *p=='`' ? */) { - end = *p; - p++; - } - p = source_out0(p,end); - /*while (*p && isspace(*p)) p++;*/ - return (char *)p; -} - - -static void -source_struct(enum command cmd) -{ - source_out("\\fR\\s0"); /* don't let run-on stylings run past structural units */ - source_flush(); - if (cmd==SHORTLINE) linelen=0; - (*fn)(cmd); -} - -#define checkcmd(str) strcmp(cmd,str)==0 - -int finnf=0; - -static void source_line(char *p); - -static void -source_subfile(char *newin) -{ - char *p; - char *oldin = in; - - sublevel++; - - in = newin; - while ((p=source_gets())!=NULL) { - source_line(p); - } - in = oldin; - - sublevel--; -} - -/* have to delay acquisition of list tag */ -static void -source_list(void) -{ - static int oldlisttype; /* OK to have just one because nested lists done with RS/RE */ - char *q; - int i; - - /* guard against empty bullet */ - for (i=0, q=plain; i<sI && isspace(*q); q++,i++) /* empty */; - if (i==sI) return; - - assert(finlist); - - fFlush=1; - - /* try to determine type of list: DL, OL, UL */ - q=plain; plain[sI]='\0'; - if (/*c==CHARBULLET || q=='-' -- command line opts! ||*/ *q=='.' || *q&0x80) { - listtype=UL; - q++; - } else { - if (strchr("[(",*q)) q++; - while (isdigit(*q)) { listtype=OL; q++; } /* I hope this gives the right number */ - if (*q=='.') q++; - if (strchr(")]",*q)) q++; - if (*q=='.') q++; - while (isspace(*q)) q++; - if (*q) listtype=DL; - } - oldlisttype = listtype; - - /* interpretation left to output formats based on listtype (HTML: DL, OL, UL) */ - i = sI; sI=0; - if (!Pbp || listtype!=oldlisttype) poppush(BEGINBULPAIR); - poppush(BEGINBULLET); - /*if (tphp) source_line(p); else source_out_word(p);*/ - /*if (listtype!=OL && listtype!=UL)*/ sI=i; - source_struct(ENDBULLET); Pbul=0; /* handled immediately below */ - poppush(BEGINBULTXT); - - finlist=0; -} - -static int inComment=0; -static int isComment=0; - -static void -source_command(char *p) -{ - static int lastif=1; - int mylastif; - char *cmd=p; - char *q; - int i,j,endch; - int fid; - struct stat fileinfo; - char *sobuf; - char *macroArg[9]; - char endig[10]; - int err=0; - char ch; - int tphp=0; - int ie=0; - int cond,invcond=0; - char delim,op; - char if0[MAXBUF], if1[MAXBUF]; - float nif0, nif1; - int insertat; - char macrobuf[MAXBUF]; /* local so can have nested macros */ - static char ft='\0'; - static int fTableCenter=0; - - /* should centralize command matching (binary search?), pointer bumping here - if for no other reason than to catch conflicts -- and allow overrides? */ - /* parse out command */ - while (*p && !isspace(*p)) p++; - if (*p) { *p='\0'; p++; } - /* should set up argv, argc for command arguments--it's regular enough that everyone doesn't have to do it itself */ - - isComment = (/*checkcmd("") ||*/ !strncmp(cmd, "\\\"", 2) || /*DEC triple dot*/checkcmd("..")); - if (inComment && !isComment) { source_struct(ENDCOMMENT); inComment=0; } /* special case to handle transition */ - - if (isComment) { - /* maybe have BEGINCOMMENT, ENDCOMMENT, COMMENTLINE */ - supresseol=0; - if (!inComment) { source_flush(); source_struct(BEGINCOMMENT); inComment=1; } - source_struct(COMMENTLINE); - printf("%s\n", p); /* could contain --> or other comment closer, but unlikely */ - - /* structural commands */ - } else if (checkcmd("TH")) { - /* sample: .TH CC 1 "Dec 1990" */ - /* overrides command line -- should fix this */ - if (!finitDoc) { - while (isspace(*p)) p++; - if (*p) { - /* name */ - q=strchr(p, ' '); if (q!=NULL) *q++='\0'; - strcpy(manName, p); - /* number */ - p = q; - if (p!=NULL) { - while (isspace(*p)) p++; - if (*p) { q=strchr(p,' '); if (q!=NULL) *q++='\0'; } - } - strcpy(manSect, p!=NULL? p: "?"); - } - sI=0; - finitDoc=1; - (*fn)(BEGINDOC); - /* emit information in .TH line? */ - } /* else complain about multiple definitions? */ - - } else if (checkcmd("SH") || checkcmd("Sh")) { /* section title */ - while (indent) { source_command("RE"); } - source_flush(); - - pop(BEGINSECTION); /* before reset sectheadid */ - - if (*p) { - if (*p=='"') { p++; q=p; while (*q && *q!='"') q++; *q='\0'; } - finnf=0; - for (j=0; (sectheadid=j)<RANDOM; j++) if (strcoloncmp2(p,'\0',sectheadname[j],0)) break; - if (!finitDoc) { - /* handle missing .TH */ - /* if secthead!=NAME -- insist on this? - fprintf(stderr, "Bogus man page: no .TH or \".SH NAME\" lines\n"); - exit(1); - */ - (*fn)(BEGINDOC); - finitDoc=1; - } - poppush(BEGINSECTION); source_struct(BEGINSECTHEAD); - fFlush=0; - if (falluc) casify(p); - source_out(p); /* people forget the quotes around multiple words */ - while (isspace(plain[--sI])) /*nada*/; - plain[++sI]='\0'; tocadd(plain, BEGINSECTION, CurLine); /* flushed with source_struct above */ - fFlush=1; - source_struct(ENDSECTHEAD); - } - } else if (checkcmd("SS")) { /* subsection title */ - while (indent) { source_command("RE"); } - source_flush(); - - if (*p) { - if (*p=='"') { p++; q=p; while (*q && *q!='"') q++; *q='\0'; } - finnf=0; - source_flush(); - poppush(BEGINSUBSECTION); source_struct(BEGINSUBSECTHEAD); - fFlush=0; - - if (falluc) casify(p); - source_out(p); /* people forget the quotes around multiple words */ - while (isspace(plain[--sI])) /*nada*/; - plain[++sI]='\0'; tocadd(plain, BEGINSUBSECTION, CurLine); - fFlush=1; - source_struct(ENDSUBSECTHEAD); - } - - } else if (checkcmd("P") || checkcmd("PP") || checkcmd("LP")) { /* new paragraph */ - source_flush(); - poppush(BEGINBODY); - - } else if ((tphp=checkcmd("TP")) || (tphp=checkcmd("HP")) || checkcmd("IP") || checkcmd("LI")) { - /* TP, HP: indented paragraph, tag on next line (DL list) */ - /* IP, LI: tag as argument */ - source_flush(); - fFlush=0; - finlist=1; - if (!tphp) { source_out_word(p); source_list(); } - /* lists terminated only at start of non-lists */ - } else if (checkcmd("RS")) { /* set indent */ - source_struct(BEGININDENT); - indent++; - } else if (checkcmd("RE")) { - if (indent) indent--; - pop(ENDINDENT); - source_struct(ENDINDENT); -#if 0 - } else if (checkcmd("Xr")) { - /* 4.4BSD man ref */ - supresseol=0; - p=source_out_word(p); - source_out("("); - p=source_out_word(p); - source_out(")"); -#endif - - } else if (checkcmd("nf")) { - source_struct(SHORTLINE); - finnf=1; - source_struct(BEGINCODEBLOCK); - } else if (checkcmd("fi")) { - source_struct(ENDCODEBLOCK); - finnf=0; - } else if (checkcmd("br")) { - source_struct(SHORTLINE); - } else if (checkcmd("sp") || checkcmd("SP")) { /* blank lines */ - /*if (!finTable) {*/ - if (finnf) source_struct(SHORTLINE); else source_struct(BEGINBODY); - /*}*/ - } else if (checkcmd("ta")) { /* set tab stop(s?) */ - /* argument is tab stop -- handle these as tables => leave to output format */ - /* HTML handles tables but not tabs, Tk's text tabs but not tables */ - /* does cause a linebreak */ - stagadd(BEGINBODY); - } else if (checkcmd("ce")) { - /* get line count, recursively filter for that many lines */ - if (sscanf(p, "%d", &i)) { - source_struct(BEGINCENTER); - for (; i>0 && (p=source_gets())!=NULL; i--) source_line(p); - source_struct(ENDCENTER); - } - - /* limited selection of control structures */ - } else if (checkcmd("if") || (checkcmd("ie"))) { /* if <test> cmd, if <test> command and else on next line */ - supresseol=1; - ie = checkcmd("ie"); - mylastif=lastif; - - if (*p=='!') { invcond=1; p++; } - - if (*p=='n') { cond=1; p++; } /* masquerading as nroff the right thing to do? */ - else if (*p=='t') { cond=0; p++; } - else if (*p=='(' || *p=='-' || *p=='+' || isdigit(*p)) { - if (*p=='(') p++; - nif0=atof(p); - if (*p=='-' || *p=='+') p++; while (isdigit(*p)) p++; - op = *p++; /* operator: =, >, < */ - if (op==' ') { - cond = (nif0!=0); - } else { - nif1=atoi(p); - while (isdigit(*p)) p++; - if (*p==')') p++; - if (op=='=') cond = (nif0==nif1); - else if (op=='<') cond = (nif0<nif1); - else /* op=='>' -- ignore >=, <= */ cond = (nif0>nif1); - } - } else if (!isalpha(*p)) { /* usually quote, ^G in Digital UNIX */ - /* gobble up comparators between delimiters */ - delim = *p++; - q = if0; - while (*p && *p!=delim) { - *q++=*p++; - } - *q='\0'; - p++; - q = if1; - while (*p && *p!=delim) { - *q++=*p++; - } - *q='\0'; - p++; - cond = (strcmp(if0,if1)==0); - } else cond=0; /* a guess, seems to be right bettern than half the time */ - if (invcond) cond=1-cond; - while (isspace(*p)) p++; - - lastif = cond; - if (strncmp(p,"\\{",2)==0) { /* rather than handle groups here, have turn on/off output flag? */ - p+=2; while (isspace(*p)) p++; /* {{ */ - while (strncmp(p,".\\}",3)!=0 || strncmp(p,"\\}",2)!=0 /*Solaris*/) { - if (cond) source_line(p); - if ((p=source_gets())==NULL) break; - } - } else if (cond) source_line(p); - - if (ie) source_line(source_gets()); /* do else part with prevailing lastif */ - - lastif=mylastif; - - } else if (checkcmd("el")) { - mylastif=lastif; - - /* should centralize gobbling of groups */ - cond = lastif = !lastif; - if (strncmp(p,"\\{",2)==0) { - p+=2; while (isspace(*p)) p++; - while (strncmp(p,".\\}",3)!=0 || strncmp(p,"\\}",2)!=0 /*Solaris*/) { - if (cond) source_line(p); - if ((p=source_gets())==NULL) break; - } - } else if (cond) source_line(p); - - lastif=mylastif; - - } else if (checkcmd("ig")) { /* "ignore group" */ - strcpy(endig,".."); if (*p) { endig[0]='.'; strcpy(&endig[1],p); } - while ((p=source_gets())!=NULL) { - if (strcmp(p,endig)==0) break; - if (!lastif) source_line(p); /* usually ignore line, except in one weird case */ - } - - - /* macros and substitutions */ - } else if (checkcmd("de")) { - /* grab key */ - q=p; while (*q && !isspace(*q)) q++; *q='\0'; - - /* if already have a macro of that name, override it */ - /* could use a good dictionary class */ - for (insertat=0; insertat<macrocnt; insertat++) { - if (strcmp(p,macro[insertat].key)==0) break; - } - if (insertat==macrocnt) macrocnt++; - - /* should replace one with same name, if one exists */ - macro[insertat].key = mystrdup(p); - - /* build up macro in plain[] ... */ - /* everything until ".." line part of macro */ - q=plain; i=0; - while ((p=source_gets())!=NULL) { - if (strcmp(p,"..")==0) break; - while (*p) { /* append string, interpreting quotes along the way--just double backslash to single now */ - if (*p=='\\' && p[1]=='\\') p++; - *q++=*p++; - } - *q++='\n'; - } - *q='\0'; - - /* ... then copy once have whole thing */ - macro[insertat].subst = mystrdup(plain); - /*fprintf(stderr, "defining macro %s as %s\n", macro[insertat].key, macro[insertat].subst);*/ - sI=0; - - } else if (checkcmd("rm")) { /* remove macro definition, can have multiple arguments */ - for (i=0; i<macrocnt; i++) { /* moot as new definitions replace old when conflicts */ - if (strcmp(p,macro[i].key)) { - macro[i] = macro[--macrocnt]; - break; - } - } - - } else if (checkcmd("ds")) { /* text substitutions (like macros) */ - /* /usr/sww/man/man1/CC.1 a good test of this */ - q = strchr(p,' '); - if (q!=NULL) { - *q='\0'; q++; -#if 0 - while (*++q) /*nada*/; -#endif - if (*q=='"') q++; - if (substcnt<SUBSTMAX) { - subst[substcnt].key = mystrdup(p); subst[substcnt].subst = mystrdup(q); substcnt++; - } - /*fprintf(stderr, "defining substitution: name=%s, body=%s\n", p, q);*/ - } - - } else if (checkcmd("so")) { - /* assuming in .../man like nroff, source in file and execute it as nested file, */ - /* so nested .so's OK */ - - err = 1; /* assume error unless successful */ - if (fTclTk) { - err=0; - } else if (stat(p, &fileinfo)==0) { - sobuf = malloc(fileinfo.st_size + 1); - if (sobuf!=NULL) { - /* suck in entire file */ - fid = open(p, O_RDONLY); - if (fid!=-1) { - if (read(fid, sobuf, fileinfo.st_size) == fileinfo.st_size) { - sobuf[fileinfo.st_size]='\0'; - /* dumb Digital puts \\} closers on same line */ - /* {{ */ - for (q=sobuf; (q=strstr(q," \\}"))!=NULL; q+=3) *q='\n'; - source_subfile(sobuf); - err = 0; - } - close(fid); - } - free(sobuf); - } - } - - if (err) { - fprintf(stderr, "%s: couldn't read in referenced file %s.\n", argv0, p); - if (strchr(p,'/')==NULL) { - fprintf(stderr, "\tTry cd'ing into same directory of man page first.\n"); - } else if (strchr(p,'/')==strrchr(p,'.')) { - fprintf(stderr, "\tTry cd'ing into parent directory of man page first.\n"); - } else { - fprintf(stderr, "\tTry cd'ing into ancestor directory that makes relative path valid first.\n"); - } - exit(1); - } - - - /* character formatting */ - /* reencode m/any as macro definitions? would like to but the below don't have "words" */ - } else if (checkcmd("ft")) { /* change font, next char is R,I,B. P=previous not supported */ - if (ft=='B') stagadd(ENDBOLD); else if (ft=='I') stagadd(ENDITALICS); - ft = *p++; - if (ft=='B') stagadd(BEGINBOLD); else if (ft=='I') stagadd(BEGINITALICS); - } else if (checkcmd("B")) { - supresseol=0; - stagadd(BEGINBOLD); p = source_out_word(p); source_out(p); stagadd(ENDBOLD); - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("I")) { - supresseol=0; - stagadd(BEGINITALICS); p = source_out_word(p); stagadd(ENDITALICS); - source_out(p); - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("BI")) { - supresseol=0; - while (*p) { - stagadd(BEGINBOLD); p = source_out_word(p); stagadd(ENDBOLD); - if (*p) { stagadd(BEGINITALICS); p = source_out_word(p); stagadd(ENDITALICS); } - } - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("IB")) { - supresseol=0; - while (*p) { - stagadd(BEGINITALICS); p = source_out_word(p); stagadd(ENDITALICS); - if (*p) { stagadd(BEGINBOLD); p = source_out_word(p); stagadd(ENDBOLD); } - } - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("RB")) { - supresseol=0; - while (*p) { - p = source_out_word(p); - if (*p) { stagadd(BEGINBOLD); p = source_out_word(p); stagadd(ENDBOLD); } - } - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("BR")) { - supresseol=0; - while (*p) { - stagadd(BEGINBOLD); p = source_out_word(p); stagadd(ENDBOLD); - p = source_out_word(p); - } - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("IR")) { - supresseol=0; - while (*p) { - stagadd(BEGINITALICS); p=source_out_word(p); stagadd(ENDITALICS); - p=source_out_word(p); - } - if (finnf) source_struct(SHORTLINE); - } else if (checkcmd("RI")) { - supresseol=0; - while (*p) { - p=source_out_word(p); - stagadd(BEGINITALICS); p=source_out_word(p); stagadd(ENDITALICS); - } - if (finnf) source_struct(SHORTLINE); - - - /* HP-UX */ - } else if (checkcmd("SM")) { - supresseol=0; source_out("\\s-1"); while (*p) p=source_out(p); source_out("\\s0"); - } else if (checkcmd("C")) { - supresseol=0; - stagadd(BEGINCODE); while (*p) p=source_out_word(p); stagadd(ENDCODE); - } else if (checkcmd("CR")) { - supresseol=0; - while (*p) { - stagadd(BEGINCODE); p=source_out_word(p); stagadd(ENDCODE); - if (*p) p=source_out_word(p); - } - } else if (checkcmd("RC")) { - supresseol=0; - while (*p) { - p=source_out_word(p); - if (*p) { stagadd(BEGINCODE); p=source_out_word(p); stagadd(ENDCODE); } - } - } else if (checkcmd("CI")) { - supresseol=0; - while (*p) { - stagadd(BEGINCODE); p=source_out_word(p); stagadd(ENDCODE); - if (*p) { stagadd(BEGINITALICS); p=source_out_word(p); stagadd(ENDITALICS); } - } - - - /* tables */ - } else if (checkcmd("TS")) { - tblc=0; /*tblspanmax=0;*/ tableSep='\0'; /* need to reset each time because tabbed lines (.ta) made into tables too */ - while ((p = source_gets())!=NULL) { - if ((q=strstr(p,"tab"))!=NULL) { /* "tab(" or "tab (". table entry separator */ - p=(q+3); while (isspace(*p)) p++; - p++; /* jump over '(' */ - tableSep=*p; - continue; - } - if (strincmp(p,"center",strlen("center"))==0) { /* center entire table; should look for "left" and "right", probably */ - fTableCenter=1; source_struct(BEGINCENTER); - p+=strlen("center"); while (isspace(*p)) p++; - continue; - } - if (p[strlen(p)-1]==';') { tblc=0; continue; } /* HP has a prequel terminated by ';' */ - - for (i=0; *p; i++,p=q) { - if (*p=='.') break; - if (*p=='f') p+=2; /* DEC sets font here */ - q=p+1; - if (strchr("lrcn",*q)==NULL) { /* dumb DEC doesn't put spaces between them */ - while (*q && *q!='.' && !isspace(*q)) q++; - } - ch=*q; *q='\0'; - tbl[tblc][i] = mystrdup(p); - tbl[tblc][i+1] = ""; /* mark end */ - *q=ch; - while (*q && isspace(*q)) q++; - } - /*if (i>tblspanmax) tblspanmax=i;*/ - tbl[tblc++][i]=""; /* mark end */ - if (*p=='.') break; - } - tbli=0; - source_struct(BEGINTABLE); - - while ((p=source_gets())!=NULL) { - if (strncmp(p,".TE",3)==0) break; - if (*p=='.') { source_line(p); continue; } - - /* count number of entries on line. if >1, can use to set tableSep */ - insertat=0; for (j=0; *tbl[tbli][j]; j++) if (*tbl[tbli][j]!='s') insertat++; - if (!tableSep && insertat>1) { if (fsourceTab) tableSep='\t'; else tableSep='@'; } - source_struct(BEGINTABLELINE); - if (strcmp(p,"_")==0 || /* double line */ strcmp(p,"=")==0) { - source_out(" "); - /*stagadd(HR);*/ /* empty row -- need ROWSPAN for HTML */ - continue; - } - - for (i=0; *tbl[tbli][i] && *p; i++) { - tblcellspan=1; - tblcellformat = tbl[tbli][i]; - if (*tblcellformat=='^') { /* vertical span => blank entry */ - tblcellformat="l"; - } else if (*tblcellformat=='|') { - /* stagadd(VBAR); */ - continue; - } else if (strchr("lrcn", *tblcellformat)==NULL) { - tblcellformat="l"; - /*continue;*/ - } - - while (strncmp(tbl[tbli][i+1],"s",1)==0) { tblcellspan++; i++; } - - source_struct(BEGINTABLEENTRY); - if (toupper(tblcellformat[1])=='B') stagadd(BEGINBOLD); - else if (toupper(tblcellformat[1])=='I') stagadd(BEGINITALICS); - /* not supporting DEC's w(<num><unit>) */ - - if (strcmp(p,"T{")==0) { /* DEC, HP */ - while (strncmp(p=source_gets(),"T}",2)!=0) source_line(p); - p+=2; if (*p) p++; - } else { - p = source_out0(p, tableSep); - } - if (toupper(tblcellformat[1])=='B') stagadd(ENDBOLD); - else if (toupper(tblcellformat[1])=='I') stagadd(ENDITALICS); - source_struct(ENDTABLEENTRY); - } - if (tbli+1<tblc) tbli++; - source_struct(ENDTABLELINE); - } - source_struct(ENDTABLE); - if (fTableCenter) { source_struct(ENDCENTER); fTableCenter=0; } - - - } else if (checkcmd("nr")) { - q=p; while (*q && !isspace(*q)) q++; *q='\0'; q++; - - for (insertat=0; insertat<regcnt; insertat++) { - if (strcmp(reg[insertat].name,p)==0) break; - } - if (insertat==regcnt) { regcnt++; reg[insertat].name = mystrdup(p); } /* else use same name */ - p=q; - if (*q=='+' || *q=='-') q++; /* accept signed, floating point numbers */ - if (*q=='.') q++; - if (!*q || isspace(*q)) { *q++='0'; *q++='\0'; } - while (isdigit(*q)) { q++; } *q='\0'; /* ignore units */ - reg[insertat].value = mystrdup(p); - - } else if (checkcmd("EQ")) { /* eqn not supported */ - source_out("\\s-1\\fBeqn not supported\\fR\\s0"); - while ((p=source_gets())!=NULL) { - if (strncmp(p,".EN",3)==0) break; - } - - - - /* Tcl/Tk macros */ - } else if (fTclTk && (checkcmd("VS") || checkcmd("VE"))) { - /* nothing for sidebars */ - } else if (fTclTk && checkcmd("OP")) { - source_struct(BEGINBODY); - for (i=0; i<3; i++) { - if (fcharout) { source_out(tcltkOP[i]); source_out(": "); } - stagadd(BEGINBOLD); p=source_out_word(p); stagadd(ENDBOLD); - source_struct(SHORTLINE); - } - source_struct(BEGINBODY); - - } else if (fTclTk && checkcmd("BS")) { /* box */ - /*source_struct(HR); -- ugh, no Ouster box */ - } else if (fTclTk && checkcmd("BE")) { - /*source_struct(HR);*/ - - } else if (fTclTk && (checkcmd("CS")||checkcmd("DS"))) { /* code excerpt */ - /* respect line ends, set in teletype */ - /* source_struct(SHORTLINE); -- done as part of CS's ENDLINE */ - finnf=1; - source_struct(SHORTLINE); - if (checkcmd("DS")) source_line(".P"); - stagadd(BEGINCODE); - } else if (fTclTk && (checkcmd("CE")||checkcmd("DE"))) { - stagadd(ENDCODE); - finnf=0; - - } else if (fTclTk && checkcmd("SO")) { - source_struct(BEGINSECTION); - source_struct(BEGINSECTHEAD); source_out("STANDARD OPTIONS"); source_struct(ENDSECTHEAD); - tblc=1; tbl[0][0]=tbl[0][1]=tbl[0][2]="l"; tbl[0][3]=""; - source_struct(BEGINTABLE); - while (1) { - p = source_gets(); - if ((strncmp(p,".SE",3))==0) break; - tblcellformat = "l"; - source_struct(BEGINTABLELINE); - if (*p=='.') { - source_command(p); - } else { - while (*p) { - source_struct(BEGINTABLEENTRY); - p = source_out0(p, '\t'); - source_struct(ENDTABLEENTRY); - } - } - source_struct(ENDTABLELINE); - } - source_struct(ENDTABLE); - source_struct(ENDSECTION); - - } else if (fTclTk && checkcmd("AP")) { /* arguments */ - source_struct(BEGINBODY); - p = source_out_word(p); source_out(" "); - stagadd(BEGINITALICS); p = source_out_word(p); stagadd(ENDITALICS); source_out("\t"); - source_out("("); p = source_out_word(p); source_out(")"); - source_struct(SHORTLINE); - source_out("\t"); - } else if (fTclTk && checkcmd("AS")) { /* arguments */ - -#if 0 -/* let these be defined as macros. if they're not, they're just caught as unrecognized macros */ - } else if (checkcmd("ll") || checkcmd("IX") || - checkcmd("nh")||checkcmd("hy")||checkcmd("hc")||checkcmd("hw") /* hyphenation */ - ) { /* unsupported macros -- usually roff specific */ - - fprintf(stderr, "macro \"%s\" not supported -- ignoring\n", cmd); -#endif - - } else { /* could be a macro definition */ - supresseol=0; - - for (i=0; i<macrocnt; i++) { - if (macro[i].key == NULL) continue; /* !!! how does this happen? */ - if (checkcmd(macro[i].key)) { - - /* it is, collect arguments */ - for (j=0; j<9; j++) macroArg[j]=""; - for (j=0; p!=NULL && *p && j<9; j++, p=q) { - endch=' '; if (*p=='"') { endch='"'; p++; } - q = strchr(p,endch); - if (q!=NULL) { - *q++='\0'; - if (*q && endch!=' ') q++; - } - macroArg[j] = p; - } - - /* instantiate that text, substituting \\[1-9]'s */ - p = macro[i].subst; - q = macrobuf; /* allocated on stack */ - while (*p) { - if (*p=='\\') { - p++; - if (*p=='t') { - *q++ = '\t'; - p++; - } else if (*p=='$' && isdigit(p[1])) { - j = p[1]-'0'-1; /* convert to ASCII and align with macroArg array */ - p+=2; - /* *q++='"'; -- no */ - strcpy(q, macroArg[j]); q += strlen(q); - /* *q++='"'; -- no */ - - } else { - *q++ = '\\'; - } - } else { - *q++ = *p++; - } - } - *q='\0'; - - /* execute that text */ - /*fprintf(stderr, "for macro %s, substituted text is \n%s\n", macro[i].key, macrobuf);*/ - source_subfile(macrobuf); - - break; - } - } - - /* macro not found */ - if (i==macrocnt) { - /* report missing macros only once */ - for (j=0; j<macnotcnt; j++) if (strcmp(macnotfound[j],cmd)==0) break; - if (j==macnotcnt) { - if (!fQuiet) fprintf(stderr, "macro \"%s\" not recognized -- ignoring\n", cmd); - q = malloc(strlen(cmd)+1); strcpy(q,cmd); - macnotfound[macnotcnt++] = q; - } - } - } /* else command is unrecognized -- ignore it: we're not a complete [tn]roff implementation */ - - /* popular but meaningless commands: .ne (need <n> lines--on infinite scroll */ -} - - -static void -source_line(char *p) -{ - /*stagadd(BEGINLINE);*/ - char *cmd=p; - if (p==NULL) return; /* bug somewhere else, but where? */ - -#if 0 - if (*p!='.' && *p!='\'' && !finlist) { - if (fsourceTab && !fosourceTab) { - tblc=1; tbli=0; tableSep='\t'; - tbl[0][0]=tbl[0][1]=tbl[0][2]=tbl[0][3]=tbl[0][4]=tbl[0][5]=tbl[0][6]=tbl[0][7]=tbl[0][8]="l"; - source_struct(BEGINTABLE); finTable=1; - } else if (!fsourceTab && fosourceTab) { - source_struct(ENDTABLE); finTable=0; - } - fosourceTab=fsourceTab; - } -#endif - - if (*p=='.' /*|| *p=='\'' -- normalized */) { /* command == starts with "." */ - p++; - supresseol=1; - source_command(p); - - } else if (!*p) { /* blank line */ - /*source_command("P");*/ - ncnt=1; source_struct(BEGINLINE); ncnt=0; /* empty line => paragraph break */ - -#if 0 - } else if (fsourceTab && !finlist /* && pmode */) { /* can't handle tabs, so try tables */ - source_struct(BEGINTABLE); - tblcellformat = "l"; - do { - source_struct(BEGINTABLELINE); - while (*p) { - source_struct(BEGINTABLEENTRY); - p = source_out0(p, '\t'); - source_struct(ENDTABLEENTRY); - } - source_struct(ENDTABLELINE); - } while ((p=source_gets())!=NULL && fsourceTab); - source_struct(ENDTABLE); - source_line(p); -#endif - - } else { /* otherwise normal text */ - source_out(p); - if (finnf || isspace(*cmd)) source_struct(SHORTLINE); - } - - if (!supresseol && !finnf) { source_out(" "); if (finlist) source_list(); } - supresseol=0; - /*stagadd(ENDLINE);*/ -} - - -static void -source_filter(void) -{ - char *p = in, *q; - char *oldv,*newv,*shiftp,*shiftq,*endq; - int lenp,lenq; - int i,on1,on2,nn1,nn2,first; - int insertcnt=0, deletecnt=0, insertcnt0; - int nextDiffLine=-1; - char diffcmd, tmpc, tmpendq; - - AbsLine=0; - - /* just count length of macro table! */ - for (i=0; macro[i].key!=NULL; i++) /*empty*/; - macrocnt = i; - - /* {{ dumb Digital puts \\} closers on same line */ - for (p=in; (p=strstr(p," \\}"))!=NULL; p+=3) *p='\n'; - - sI=0; - /* (*fn)(BEGINDOC); -- done at .TH or first .SH */ - - - /* was: source_subfile(in); */ - while (fDiff && fgets(diffline, MAXBUF, difffd)!=NULL) { - /* requirements: no context lines, no errors in files, ... - change-command: 8a12,15 or 5,7c8,10 or 5,7d3 - < from-file-line - < from-file-line... - -- - > to-file-line - > to-file-line... - */ - for (q=diffline; ; q++) { diffcmd=*q; if (diffcmd=='a'||diffcmd=='c'||diffcmd=='d') break; } - if (sscanf(diffline, "%d,%d", &on1,&on2)==1) on2=on1-1+(diffcmd=='d'||diffcmd=='c'); - if (sscanf(++q, "%d,%d", &nn1,&nn2)==1) nn2=nn1-1+(diffcmd=='a'||diffcmd=='c'); - - deletecnt = on2-on1+1; - insertcnt = nn2-nn1+1; - - nextDiffLine = nn1; - /*assert(nextDiffLine>=AbsLine); -- can happen if inside a macro? */ - if (nextDiffLine<AbsLine) continue; - - while (AbsLine<nextDiffLine && (p=source_gets())!=NULL) { - source_line(p); - } - - insertcnt0=insertcnt+1; /* eat duplicate insert lines and '---' too */ - diffline2[0] = '\0'; - while (insertcnt && deletecnt) { - if (ungetc(fgetc(difffd),difffd)=='<') { fgetc(difffd); fgetc(difffd); } /* skip '<' */ - /* fill buffer with old line -- but replace if command */ - /* stay away from commands -- too careful if .B <word> */ - do { - p = oldv = fgets(diffline, MAXBUF, difffd); - p[strlen(p)-1]='\0'; /* fgets's \n ending => \0 */ - deletecnt--; - } while (deletecnt && *p=='.'); /* throw out commands in old version */ - - q = newv = source_gets(); - insertcnt--; - while (insertcnt && *q=='.') { - source_line(q); - insertcnt--; - } - - if (*p=='.' || *q=='.') break; - - - /* make larger chunk for better diff -- but still keep away from commands */ - lenp=strlen(p); lenq=strlen(q); - while (deletecnt && MAXBUF-lenq>80*2) { - fgetc(difffd); fgetc(difffd); /* skip '<' */ - if (ungetc(fgetc(difffd),difffd)=='.') break; - p=&diffline[lenp]; *p++=' '; lenp++; - fgets(p, MAXBUF-lenp, difffd); p[strlen(p)-1]='\0'; lenp+=strlen(p); - deletecnt--; - } - - while (insertcnt && *in!='.' && MAXBUF-lenq>80*2) { - if (newv!=diffline2) { strcpy(diffline2,q); newv=diffline2; } - q=source_gets(); diffline2[lenq]=' '; lenq++; - strcpy(&diffline2[lenq],q); lenq+=strlen(q); - insertcnt--; - } - - /* common endings */ - p = &p[strlen(oldv)]; q=&q[strlen(newv)]; - while (p>oldv && q>newv && p[-1]==q[-1]) { p--; q--; } - if ((p>oldv && p[-1]=='\\') || (q>newv && q[-1]=='\\')) - while (*p && *q && !isspace(*p)) { p++; q++; } /* steer clear of escapes */ - tmpendq=*q; *p=*q='\0'; endq=q; - - p=oldv; q=newv; - while (*p && *q) { - /* common starts */ - newv=q; while (*p && *q && *p==*q) { p++; q++; } - if (q>newv) { - tmpc=*q; *q='\0'; source_line(newv); *q=tmpc; - } - - /* too hard to read */ - /* difference: try to find hunk of p in remainder of q */ - if (strlen(p)<15 || (shiftp=strchr(&p[15],' ') /*|| shiftp-p>30*/)==NULL) break; - shiftp++; /* include the space */ - tmpc=*shiftp; *shiftp='\0'; shiftq=strstr(q,p); *shiftp=tmpc; /* includes space */ - if (shiftq!=NULL) { - /* call that part of q inserted */ - tmpc=*shiftq; *shiftq='\0'; - stagadd(BEGINDIFFA); source_line(q); stagadd(ENDDIFFA); source_line(" "); - *shiftq=tmpc; q=shiftq; - } else { - /* call that part of p deleted */ - shiftp--; *shiftp='\0'; /* squash the trailing space */ - stagadd(BEGINDIFFD); source_line(p); stagadd(ENDDIFFD); source_line(" "); - p=shiftp+1; - } -/*#endif*/ - } - - if (*p) { stagadd(BEGINDIFFD); source_line(p); stagadd(ENDDIFFD); } - if (*q) { stagadd(BEGINDIFFA); source_line(q); stagadd(ENDDIFFA); } - if (tmpendq!='\0') { *endq=tmpendq; source_line(endq); } - source_line(" "); - } - - /* even if diffcmd=='c', could still have remaining old version lines */ - first=1; - while (deletecnt--) { - fgets(diffline, MAXBUF, difffd); - if (diffline[2]!='.') { - if (first) { stagadd(BEGINDIFFD); first=0; } - source_line(&diffline[2]); /* don't do commands; skip initial '<' */ - } - } - if (!first) { stagadd(ENDDIFFD); source_line(" "); } - - /* skip over duplicated from old */ - if (diffcmd=='c') while (insertcnt0--) fgets(diffline, MAXBUF, difffd); - - /* even if diffcmd=='c', could still have remaining new version lines */ - first=1; - nextDiffLine = AbsLine + insertcnt; - while (insertcnt--) fgets(diffline, MAXBUF, difffd); /* eat duplicate text of above */ - while (/*insertcnt--*/AbsLine<nextDiffLine && (p=source_gets())!=NULL) { - if (first && *p!='.') { stagadd(BEGINDIFFA); first=0; } - source_line(p); - } - if (!first) { stagadd(ENDDIFFA); source_line(" "); } - } - /* finish up remainder (identical to both) */ - while ((p=source_gets())!=NULL) { - source_line(p); - } - - source_flush(); - pop(ENDDOC); (*fn)(ENDDOC); -} - - - -/* - * STARTUP - */ - -static int -setFilterDefaults(char *outputformat) -{ - static struct { - void (*fn)(enum command); - int fPara; int fQS; int fIQS; int fNOHY; int fChangeleft; int fURL; char *names; - /* (could set parameters at BEGINDOC call...) */ - } format[] = { - /*{default 0par 0qs 0iqs 0hy 0cl 0url "name"},*/ - { ASCII, 0, 0, 0, 0, 0, 0, "ASCII" }, - { TkMan, 0, 0, 0, 0, 0, 0, "TkMan" }, - { Tk, 0, 0, 0, 0, 0, 0, "Tk:Tcl" }, - { Sections, 0, 0, 0, 0, 0, 0, "sections" }, - { Roff, 0, 1, 1, 1, -1, 0, "roff:troff:nroff" }, - { HTML, 1, 1, 1, 1, 1, 1, "HTML:WWW:htm" }, - { XML, 1, 1, 1, 1, 1, 1, "XML:docbook:DocBook" }, - { MIME, 1, 1, 1, 1, 1, 0, "MIME:Emacs:enriched" }, - { LaTeX, 1, 1, 1, 1, 1, 0, "LaTeX:LaTeX209:209:TeX" }, - { LaTeX2e, 1, 1, 1, 1, 1, 0, "LaTeX2e:2e" }, - { RTF, 1, 1, 1, 1, 1, 0, "RTF" }, - { pod, 0, 0, 1, 0, -1, 0, "pod:Perl" }, - - { PostScript, 0, 0, 0, 0, 0, 0, "PostScript:ps" }, - { FrameMaker, 0, 0, 0, 0, 0, 0, "FrameMaker:Frame:Maker:MIF" }, - - { NULL, 0, 0, 0, 0, 0, 0, NULL } - }; - - int i, found=0; - for (i=0; format[i].fn!=NULL; i++) { - if (strcoloncmp2(outputformat,'\0',format[i].names,0)) { - fn = format[i].fn; - fPara = format[i].fPara; - fQS = format[i].fQS; - fIQS = format[i].fIQS; - fNOHY = format[i].fNOHY; - fChangeleft = format[i].fChangeleft; - fURL = format[i].fURL; - found=1; - break; - } - } - - return (found==0); -} - - -/* read in whole file. caller responsible for freeing memory */ -static char * -filesuck(FILE *in) -{ - const int inc=1024*100; /* what's 100K these days? */ - int len=0,cnt; - char *file = malloc(1); /*NULL -- relloc on NULL not reducing to malloc on some machines? */ - - do { - file = realloc(file, len+inc+1); /* what's the ANSI way to find the file size? */ - cnt = fread(&file[len], 1, inc, in); - len+=cnt; - } while (cnt==inc); - file[len]='\0'; - - return file; -} - -int -main(int argc, char *argv[]) -{ - int c; - int i,j; - char *p,*oldp; - int fname=0; - const int helpbreak=75; - const int helpispace=4; - int helplen=0; - int desclen; - char **argvch; /* remapped argv */ -/* FILE *macros; -- interpret -man macros? */ - - char strgetopt[80]; - /* options with an arg must have a '<' in the description */ - static struct { char letter; int arg; char *longnames; char *desc; } option[] = { - { 'f', 1, "filter", " <ASCII|roff|TkMan|Tk|Sections|HTML|XML|MIME|LaTeX|LaTeX2e|RTF|pod>" }, - { 'S', 0, "source", "(ource of man page passed in)" }, /* autodetected */ - { 'F', 0, "formatted:format", "(ormatted man page passed in)" }, /* autodetected */ - - { 'r', 1, "reference:manref:ref", " <man reference printf string>" }, - { 'l', 1, "title", " <title printf string>" }, - { 'V', 1, "volumes:vol", "(olume) <colon-separated list>" }, - { 'U', 0, "url:urls", "(RLs as hyperlinks)" }, - - /* following options apply to formatted pages only */ - { 'b', 0, "subsections:sub", " (show subsections)" }, - { 'k', 0, "keep:head:foot:header:footer", "(eep head/foot)" }, - { 'n', 1, "name", "(ame of man page) <string>" }, - { 's', 1, "section:sect", "(ection) <string>" }, - { 'p', 0, "paragraph:para", "(aragraph mode toggle)" }, - { 't', 1, "tabstop:tabstops", "(abstops spacing) <number>" }, - { 'N', 0, "normalize:normal", "(ormalize spacing, changebars)" }, - { 'y', 0, "zap:nohyphens", " (zap hyphens toggle)" }, - { 'K', 0, "nobreak", " (declare that page has no breaks)" }, /* autodetected */ - { 'd', 1, "diff", "(iff) <file> (diff of old page source to incorporate)" }, - { 'M', 1, "message", "(essage) <text> (included verbatim at end of Name section)" }, - /*{ 'l', 0, "number lines", "... can number lines in a pipe" } */ - /*{ 'T', 0, "tables", "(able agressive parsing ON)" },*/ -/* { 'c', 0, "changeleft:changebar", "(hangebarstoleft toggle)" }, -- default is perfect */ - /*{ 'R', 0, "reflow", "(eflow text lines)" },*/ - { 'R', 1, "rebus", "(ebus words for TkMan)" }, - { 'C', 0, "TclTk", " (enable Tcl/Tk formatting)" }, /* autodetected */ - - /*{ 'D', 0, "debug", "(ebugging mode)" }, -- dump unrecognized macros, e.g.*/ - { 'o', 0, "noop", " (no op)" }, - { 'O', 0, "noop", " <arg> (no op with arg)" }, - { 'q', 0, "quiet", "(uiet--don't report warnings)" }, - { 'h', 0, "help", "(elp)" }, - /*{ '?', 0, "help", " (help)" }, -- getopt returns '?' as error flag */ - { 'v', 0, "version", "(ersion)" }, - { '\0', 0, "", NULL } - }; - - /* calculate strgetopt from options list */ - for (i=0,p=strgetopt; option[i].letter!='\0'; i++) { - *p++ = option[i].letter; - /* check for duplicate option letters */ - assert(strchr(strgetopt,option[i].letter)==&p[-1]); - if (option[i].arg) *p++=':'; - } - *p='\0'; - - /* spot check construction of strgetopt */ - assert(p<strgetopt+80); - assert(strlen(strgetopt)>10); - assert(strchr(strgetopt,'f')!=NULL); - assert(strchr(strgetopt,'v')!=NULL); - assert(strchr(strgetopt,':')!=NULL); - - /* count, sort exception strings */ - for (lcexceptionslen=0; (p=lcexceptions[lcexceptionslen])!=NULL; lcexceptionslen++) /*empty*/; - qsort(lcexceptions, lcexceptionslen, sizeof(char*), lcexceptionscmp); - - /* map long option names to single letters for switching */ - /* (GNU probably has a reusable function to do this...) */ - /* deep six getopt in favor of integrated long names + letters? */ - argvch = malloc(argc * sizeof(char*)); - p = malloc(argc*3 * sizeof(char)); /* either -<char>'\0' or no space used */ - for (i=0; i<argc; i++) argvch[i]=argv[i]; /* need argvch[0] for getopt? */ - argv0 = mystrdup(argv[0]); - for (i=1; i<argc; i++) { - if (argv[i][0]=='-' && argv[i][1]=='-') { - if (argv[i][2]=='\0') break; /* end of options */ - for (j=0; option[j].letter!='\0'; j++) { - if (strcoloncmp2(&argv[i][2],'\0',option[j].longnames,0)) { - argvch[i] = p; - *p++ = '-'; *p++ = option[j].letter; *p++ = '\0'; - if (option[j].arg) i++; /* skip arguments of options */ - break; - } - } - if (option[j].letter=='\0') fprintf(stderr, "%s: unknown option %s\n", argv[0], argv[i]); - } - } - - - - /* pass through options to set defaults for chosen format */ - setFilterDefaults("ASCII"); /* default to ASCII (used by TkMan's Glimpse indexing */ - - /* initialize header/footer buffers (save room in binary) */ - for (i=0; i<CRUFTS; i++) { *cruft[i] = '\0'; } /* automatically done, guaranteed? */ - /*for (i=0; i<MAXLINES; i++) { linetabcnt[i] = 0; } */ - - while ((c=getopt(argc,argvch,strgetopt))!=-1) { - - switch (c) { - case 'k': fHeadfoot=1; break; - case 'b': fSubsections=1; break; -/* case 'c': fChangeleft=1; break; -- obsolete */ - /* case 'R': fReflow=1; break;*/ - case 'n': strcpy(manName,optarg); fname=1; break; /* name & section for when using stdin */ - case 's': strcpy(manSect,optarg); break; - /*case 'D': docbookpath = optarg; break;*/ - case 'V': vollist = optarg; break; - case 'l': manTitle = optarg; break; - case 'r': manRef = optarg; - if (strlen(manRef)==0 || strcmp(manRef,"-")==0 || strcmp(manRef,"off")==0) fmanRef=0; - break; - case 't': TabStops=atoi(optarg); break; - /*case 'T': fTable=1; break; -- if preformatted doesn't work, if source automatic */ - case 'p': fPara=!fPara; break; - case 'K': fFoot=1; break; - case 'y': fNOHY=1; break; - case 'N': fNORM=1; break; - - case 'f': /* set format */ - if (setFilterDefaults(optarg)) { - fprintf(stderr, "%s: unknown format: %s\n", argv0, optarg); - exit(1); - } - break; - case 'F': fSource=0; break; - case 'S': fSource=1; break; - - case 'd': - difffd = fopen(optarg, "r"); - if (difffd==NULL) { fprintf(stderr, "%s: can't open %s\n", argv0, optarg); exit(1); } -/* read in a line at a time - diff = filesuck(fd); - fclose(fd); -*/ - fDiff=1; - break; - - case 'M': message = optarg; break; - - case 'C': fTclTk=1; break; - case 'R': - p = malloc(strlen(optarg)+1); - strcpy(p, optarg); /* string may not be in writable address space */ - oldp = ""; - for (; *p; oldp=p, p++) { - if (*oldp=='\0') rebuspat[rebuspatcnt++] = p; - if (*p=='|') *p='\0'; - } - for (i=0; i<rebuspatcnt; i++) rebuspatlen[i] = strlen(rebuspat[i]); /* for strnlen() */ - break; - - case 'q': fQuiet=1; break; - case 'o': /*no op*/ break; - case 'O': /* no op with arg */ break; - case 'h': - printf("rman"); helplen=strlen("rman"); - - /* linebreak options */ - assert(helplen>0); - for (i=0; option[i].letter!='\0'; i++) { - desclen = strlen(option[i].desc); - if (helplen+desclen+5 > helpbreak) { printf("\n%*s",helpispace,""); helplen=helpispace; } - printf(" [-%c%s]", option[i].letter, option[i].desc); - helplen += desclen+5; - } - if (helplen>helpispace) printf("\n"); - printf("%*s [<filename>]\n",helpispace,""); - exit(0); - - case 'v': /*case '?':*/ - printf("PolyglotMan v" POLYGLOTMANVERSION "\n"); - exit(0); - - default: - fprintf(stderr, "%s: unidentified option -%c (-h for help)\n",argvch[0],c); - exit(2); - } - } - - - - /* read from given file name(s) */ - if (optind<argc) { - if (!fname) { /* if no name given, create from file name */ - /* take name from tail of path */ - if ((p=strrchr(argvch[optind],'/'))!=NULL) p++; else p=argvch[optind]; - strcpy(manName,p); - - /* search backward from end for final dot. split there */ - if ((p=strrchr(manName,'.'))!=NULL) { - strcpy(manSect,p+1); - *p='\0'; - } - } - - strcpy(plain,argvch[optind]); - - if (freopen(argvch[optind], "r", stdin)==NULL) { - fprintf(stderr, "%s: can't open %s\n", argvch[0], argvch[optind]); - exit(1); - } - } - - /* need to read macros, ok if fail; from /usr/lib/tmac/an => needs to be set in Makefile, maybe a searchpath */ - /* - if ((macros=fopen("/usr/lib/tmac/an", "r"))!=NULL) { - in = File = filesuck(macros); - lookahead = File[0]; - source_filter(); - free(File); - } - */ - - /* suck in whole file and just operate on pointers */ - in = File = filesuck(stdin); - - - /* minimal check for roff source: first character dot command or apostrophe comment */ - /* MUST initialize lookahead here, BEFORE first call to la_gets */ - if (fSource==-1) { - lookahead = File[0]; - fSource = (lookahead=='.' || lookahead=='\'' || /*dumb HP*/lookahead=='/' - /* HP needs this too but causes problems || isalpha(lookahead)--use --source flag*/); - } - - if (fDiff && (!fSource || fn!=HTML)) { - fprintf(stderr, "diff incorporation supported for man page source, generating HTML\n"); - exit(1); - } - - if (fSource) source_filter(); else preformatted_filter(); - if (fDiff) fclose(difffd); - /*free(File); -- let system clean up, perhaps more efficiently */ - - return 0; -} |