#!/usr/bin/awk # # Copyright (c) 2003 Peter Stuge <stuge-mdoc2man@cdy.org> # # Permission to use, copy, modify, and distribute this software for any # purpose with or without fee is hereby granted, provided that the above # copyright notice and this permission notice appear in all copies. # # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. # Dramatically overhauled by Tim Kientzle. This version almost # handles library-style pages with Fn, Ft, etc commands. Still # a lot of problems... BEGIN { displaylines = 0 listdepth = 0 trailer = "" out = "" sep = "" nextsep = " " spaces = " " } # Add a word with appropriate preceding whitespace # Maintain a short queue of the expected upcoming word separators. function add(str) { out=out sep str sep = nextsep nextsep = " " } # Add a word with no following whitespace # Use for opening punctuation such as '(' function addopen(str) { add(str) sep = "" } # Add a word with no preceding whitespace # Use for closing punctuation such as ')' or '.' function addclose(str) { sep = "" add(str) } # Add a word with no space before or after # Use for separating punctuation such as '=' function addpunct(str) { sep = "" add(str) sep = "" } # Emit the current line so far function endline() { addclose(trailer) trailer = "" if(length(out) > 0) { print out out="" } if(displaylines > 0) { displaylines = displaylines - 1 if (displaylines == 0) dispend() } # First word on next line has no preceding whitespace sep = "" } function linecmd(cmd) { endline() add(cmd) endline() } function breakline() { linecmd("<br>") } # Start an indented display function dispstart() { linecmd("{{{") } # End an indented display function dispend() { linecmd("}}}") } # Collect rest of input line function wtail() { retval="" while(w<nwords) { if(length(retval)) retval=retval " " retval=retval words[++w] } return retval } function splitwords(l, dest, n, o, w) { n = 1 delete dest while (length(l) > 0) { sub("^[ \t]*", "", l) if (match(l, "^\"")) { l = substr(l, 2) o = index(l, "\"") if (o > 0) { w = substr(l, 1, o-1) l = substr(l, o+1) dest[n++] = w } else { dest[n++] = l l = "" } } else { o = match(l, "[ \t]") if (o > 0) { w = substr(l, 1, o-1) l = substr(l, o+1) dest[n++] = w } else { dest[n++] = l l = "" } } } return n-1 } ! /^\./ { out = $0 endline() next } /^\.\\"/ { next } { sub("^\\.","") nwords=splitwords($0, words) # TODO: Instead of iterating 'w' over the array, have a separate # function that returns 'next word' and use that. This will allow # proper handling of double-quoted arguments as well. for(w=1;w<=nwords;w++) { if(match(words[w],"^Li$")) { # Literal; rest of line is unformatted dispstart() displaylines = 1 } else if(match(words[w],"^Dl$")) { # Display literal dispstart() displaylines = 1 } else if(match(words[w],"^Bd$")) { # Begin display if(match(words[w+1],"-literal")) { dispstart() displaylines=10000 w=nwords } } else if(match(words[w],"^Ed$")) { # End display displaylines = 0 dispend() } else if(match(words[w],"^Ns$")) { # Suppress space before next word sep="" } else if(match(words[w],"^No$")) { # Normal text add(words[++w]) } else if(match(words[w],"^Dq$")) { # Quote addopen("\"") add(words[++w]) while(w<nwords&&!match(words[w+1],"^[\\.,]")) add(words[++w]) addclose("\"") } else if(match(words[w],"^Do$")) { addopen("\"") } else if(match(words[w],"^Dc$")) { addclose("\"") } else if(match(words[w],"^Oo$")) { addopen("`[`") } else if(match(words[w],"^Oc$")) { addclose("`]`") } else if(match(words[w],"^Ao$")) { addopen("`<`") } else if(match(words[w],"^Ac$")) { addclose("`>`") } else if(match(words[w],"^Dd$")) { date=wtail() next } else if(match(words[w],"^Dt$")) { id=wtail() next } else if(match(words[w],"^Ox$")) { add("OpenBSD") } else if(match(words[w],"^Fx$")) { add("FreeBSD") } else if(match(words[w],"^Bx$")) { add("BSD") } else if(match(words[w],"^Nx$")) { add("NetBSD") } else if(match(words[w],"^St$")) { if (match(words[w+1], "^-p1003.1$")) { w++ add("IEEE Std 1003.1 (``POSIX.1'')") } else if(match(words[w+1], "^-p1003.1-96$")) { w++ add("ISO/IEC 9945-1:1996 (``POSIX.1'')") } else if(match(words[w+1], "^-p1003.1-88$")) { w++ add("IEEE Std 1003.1-1988 (``POSIX.1'')") } else if(match(words[w+1], "^-p1003.1-2001$")) { w++ add("IEEE Std 1003.1-2001 (``POSIX.1'')") } else if(match(words[w+1], "^-susv2$")) { w++ add("Version 2 of the Single UNIX Specification (``SUSv2'')") } } else if(match(words[w],"^Ex$")) { if (match(words[w+1], "^-std$")) { w++ add("The *" name "* utility exits 0 on success, and >0 if an error occurs.") } } else if(match(words[w],"^Os$")) { add("#summary " id " manual page") } else if(match(words[w],"^Sh$")) { section=wtail() linecmd("== " section " ==") } else if(match(words[w],"^Xr$")) { add("*" words[++w] "*(" words[++w] ")" words[++w]) } else if(match(words[w],"^Nm$")) { if(match(section,"SYNOPSIS")) breakline() if(w >= nwords) n=name else if (match(words[w+1], "^[A-Z][a-z]$")) n=name else if (match(words[w+1], "^[.,;:]$")) n=name else { n=words[++w] if(!length(name)) name=n } if(!length(n)) n=name if (displaylines == 0) add("*" n "*") else add(n) } else if(match(words[w],"^Nd$")) { add("- " wtail()) } else if(match(words[w],"^Fl$")) { if (displaylines == 0) add("*-" words[++w] "*") else add("-" words[++w]) } else if(match(words[w],"^Ar$")) { if(w==nwords) add("_file ..._") else { ++w gsub("<", "`<`", words[w]) add("_" words[w] "_") } } else if(match(words[w],"^Cm$")) { ++w if (displaylines == 0) { gsub("^_", "`_`", words[w]) gsub("\\*$", "`*`", words[w]) add("*" words[w] "*") } else add(words[w]) } else if(match(words[w],"^Op$")) { addopen("`[`") option=1 trailer="`]`" trailer } else if(match(words[w],"^Pp$")) { ++w endline() print "" } else if(match(words[w],"^An$")) { if (match(words[w+1],"-nosplit")) ++w endline() } else if(match(words[w],"^Ss$")) { add("===") trailer="===" } else if(match(words[w],"^Ft$")) { if (match(section, "SYNOPSIS")) { breakline() } l = wtail() gsub("\\*", "`*`", l) add("*" l "*") if (match(section, "SYNOPSIS")) { breakline() } } else if(match(words[w],"^Fn$")) { ++w F = "*" words[w] "*(" Fsep = "" while(w<nwords) { ++w if (match(words[w], "^[.,:]$")) { --w break } gsub("\\*", "`*`", words[w]) F = F Fsep "_" words[w] "_" Fsep = ", " } add(F ")") if (match(section, "SYNOPSIS")) { addclose(";") } } else if(match(words[w],"^Fo$")) { w++ F = "*" words[w] "*(" Fsep = "" } else if(match(words[w],"^Fa$")) { w++ gsub("\\*", "`*`", words[w]) F = F Fsep "_" words[w] "_" Fsep = ", " } else if(match(words[w],"^Fc$")) { add(F ")") if (match(section, "SYNOPSIS")) { addclose(";") } } else if(match(words[w],"^Va$")) { w++ add("_" words[w] "_") } else if(match(words[w],"^In$")) { w++ add("*#include <" words[w] ">*") } else if(match(words[w],"^Pa$")) { w++ # if(match(words[w],"^\\.")) # add("\\&") if (displaylines == 0) add("_" words[w] "_") else add(words[w]) } else if(match(words[w],"^Dv$")) { linecmd() } else if(match(words[w],"^Em|Ev$")) { add(".IR") } else if(match(words[w],"^Pq$")) { addopen("(") trailer=")" trailer } else if(match(words[w],"^Aq$")) { addopen(" <") trailer=">" trailer } else if(match(words[w],"^Brq$")) { addopen("{") trailer="}" trailer } else if(match(words[w],"^S[xy]$")) { add(".B " wtail()) } else if(match(words[w],"^Tn$")) { n=wtail() gsub("\\*$", "`*`", n) add("*" n "*") } else if(match(words[w],"^Ic$")) { add("\\fB") trailer="\\fP" trailer } else if(match(words[w],"^Bl$")) { ++listdepth listnext[listdepth]="" if(match(words[w+1],"-bullet")) { optlist[listdepth]=1 addopen("<ul>") listclose[listdepth]="</ul>" } else if(match(words[w+1],"-enum")) { optlist[listdepth]=2 enum=0 addopen("<ol>") listclose[listdepth]="</ol>" } else if(match(words[w+1],"-tag")) { optlist[listdepth]=3 addopen("<dl>") listclose[listdepth]="</dl>" } else if(match(words[w+1],"-item")) { optlist[listdepth]=4 addopen("<ul>") listclose[listdepth]="</ul>" } w=nwords } else if(match(words[w],"^El$")) { addclose(listnext[listdepth]) addclose(listclose[listdepth]) listclose[listdepth]="" listdepth-- } else if(match(words[w],"^It$")) { addclose(listnext[listdepth]) if(optlist[listdepth]==1) { addpunct("<li>") listnext[listdepth] = "</li>" } else if(optlist[listdepth]==2) { addpunct("<li>") listnext[listdepth] = "</li>" } else if(optlist[listdepth]==3) { addpunct("<dt>") listnext[listdepth] = "</dt>" if(match(words[w+1],"^Xo$")) { # Suppress trailer w++ } else if(match(words[w+1],"^Pa$|^Ev$")) { addopen("*") w++ add(words[++w] "*") } else { trailer = listnext[listdepth] "<dd>" trailer listnext[listdepth] = "</dd>" } } else if(optlist[listdepth]==4) { addpunct("<li>") listnext[listdepth] = "</li>" } } else if(match(words[w],"^Xo$")) { # TODO: Figure out how to handle this } else if(match(words[w],"^Xc$")) { # TODO: Figure out how to handle this if (optlist[listdepth] == 3) { addclose(listnext[listdepth]) addopen("<dd>") listnext[listdepth] = "</dd>" } } else if(match(words[w],"^[=]$")) { addpunct(words[w]) } else if(match(words[w],"^[\[{(]$")) { addopen(words[w]) } else if(match(words[w],"^[\\\])}.,;:]$")) { addclose(words[w]) } else { sub("\\\\&", "", words[w]) add(words[w]) } } if(match(out,"^\\.[^a-zA-Z]")) sub("^\\.","",out) endline() }