) ** * Some manpages rely on the fact that troff/nroff is used to convert ** them and use features which are not descripted in the man manpages. ** (definitions, calculations, conditionals, requests). I can't guarantee ** that all these features work on all manpages. (I didn't have the ** time to look through all the available manpages.) */ #ifdef SIMPLE_MAN2HTML // We suppose that we run on a standard Linux # define HAVE_STRING_H 1 # define HAVE_UNISTD_H 1 #else # include #endif #include #ifdef HAVE_UNISTD_H # include #endif #ifdef HAVE_STRING_H # include #endif #include #include #include #include #include #include #ifdef SIMPLE_MAN2HTML # include # include # include # include # define kdDebug(x) cerr # define kdWarning(x) cerr << "WARNING " #else # include # include # include #endif #include "man2html.h" using namespace std; #define NULL_TERMINATED(n) ((n) + 1) #define HUGE_STR_MAX 10000 #define LARGE_STR_MAX 2000 #define MED_STR_MAX 500 #define SMALL_STR_MAX 100 #define TINY_STR_MAX 10 #if 1 // The output is current too horrible to be called HTML 4.01 #define DOCTYPE "" #else #define DOCTYPE "\n" #endif /* mdoc(7) Bl/El lists to HTML list types */ #define BL_DESC_LIST 1 #define BL_BULLET_LIST 2 #define BL_ENUM_LIST 4 /* mdoc(7) Bd/Ed example(?) blocks */ #define BD_LITERAL 1 #define BD_INDENT 2 static int s_nroff = 1; // NROFF mode by default static int mandoc_name_count = 0; /* Don't break on the first Nm */ static char *stralloc(int len) { /* allocate enough for len + NULL */ char *news = new char [len+1]; #ifdef SIMPLE_MAN2HTML if (!news) { cerr << "man2html: out of memory" << endl; exit(EXIT_FAILURE); } #else // modern compilers do not return a NULL pointer for a new #endif return news; } static char *strlimitcpy(char *to, char *from, int n, int limit) { /* Assumes space for limit plus a null */ const int len = n > limit ? limit : n; tqstrncpy(to, from, len + 1); to[len] = '\0'; return to; } /* below this you should not change anything unless you know a lot ** about this program or about troff. */ /// Structure for character definitions struct CSTRDEF { int nr, slen; const char *st; }; const char NEWLINE[2]="\n"; /** * Class for defining strings and macros */ class StringDefinition { public: StringDefinition( void ) : m_length(0) {} StringDefinition( int len, const char* cstr ) : m_length( len ), m_output( cstr ) {} public: int m_length; ///< Length of output text TQCString m_output; ///< Defined string }; /** * Class for defining number registers * \note Not for internal read-only registers */ class NumberDefinition { public: NumberDefinition( void ) : m_value(0), m_increment(0) {} NumberDefinition( int value ) : m_value( value ), m_increment(0) {} NumberDefinition( int value, int incr) : m_value( value ), m_increment( incr ) {} public: int m_value; ///< value of number register int m_increment; ///< Increment of number register // ### TODO: display form (.af) }; /** * Map of character definitions */ static TQMap s_characterDefinitionMap; /** * Map of string variable and macro definitions * \note String variables and macros are the same thing! */ static TQMap s_stringDefinitionMap; /** * Map of number registers * \note Intern number registers (starting with a dot are not handled here) */ static TQMap s_numberDefinitionMap; static void fill_old_character_definitions( void ); /** * Initialize character variables */ static void InitCharacterDefinitions( void ) { fill_old_character_definitions(); // ### HACK: as we are converting to HTML too early, define characters with HTML references s_characterDefinitionMap.insert( "<-", StringDefinition( 1, "←" ) ); // <- s_characterDefinitionMap.insert( "->", StringDefinition( 1, "→" ) ); // -> s_characterDefinitionMap.insert( "<>", StringDefinition( 1, "↔" ) ); // <> s_characterDefinitionMap.insert( "<=", StringDefinition( 1, "≤" ) ); // <= s_characterDefinitionMap.insert( ">=", StringDefinition( 1, "≥" ) ); // >= // End HACK } /** * Initialize string variables */ static void InitStringDefinitions( void ) { // mdoc-only, see mdoc.samples(7) s_stringDefinitionMap.insert( "<=", StringDefinition( 1, "≤" ) ); s_stringDefinitionMap.insert( ">=", StringDefinition( 1, "≥" ) ); s_stringDefinitionMap.insert( "Rq", StringDefinition( 1, "”" ) ); s_stringDefinitionMap.insert( "Lq", StringDefinition( 1, "“" ) ); s_stringDefinitionMap.insert( "ua", StringDefinition( 1, "&circ" ) ); // Note this is different from \(ua s_stringDefinitionMap.insert( "aa", StringDefinition( 1, "´" ) ); s_stringDefinitionMap.insert( "ga", StringDefinition( 1, "`" ) ); s_stringDefinitionMap.insert( "q", StringDefinition( 1, """ ) ); s_stringDefinitionMap.insert( "Pi", StringDefinition( 1, "π" ) ); s_stringDefinitionMap.insert( "Ne", StringDefinition( 1, "≠" ) ); s_stringDefinitionMap.insert( "Le", StringDefinition( 1, "≤" ) ); s_stringDefinitionMap.insert( "Ge", StringDefinition( 1, "≥" ) ); s_stringDefinitionMap.insert( "Lt", StringDefinition( 1, "<" ) ); s_stringDefinitionMap.insert( "Gt", StringDefinition( 1, ">" ) ); s_stringDefinitionMap.insert( "Pm", StringDefinition( 1, "±" ) ); s_stringDefinitionMap.insert( "If", StringDefinition( 1, "∞" ) ); s_stringDefinitionMap.insert( "Na", StringDefinition( 3, "NaN" ) ); s_stringDefinitionMap.insert( "Ba", StringDefinition( 1, "|" ) ); // end mdoc-only // man(7) s_stringDefinitionMap.insert( "Tm", StringDefinition( 1, "™" ) ); // \*(TM s_stringDefinitionMap.insert( "R", StringDefinition( 1, "®" ) ); // \*R // end man(7) // Missing characters from man(7): // \*S "Change to default font size" #ifndef SIMPLE_MAN2HTML // Special KDE TDEIO man: const TQCString tdeversion(TDE_VERSION_STRING); s_stringDefinitionMap.insert( ".TDE_VERSION_STRING", StringDefinition( tdeversion.length(), tdeversion ) ); #endif } /** * Initialize number registers * \note Internal read-only registers are not handled here */ static void InitNumberDefinitions( void ) { // As the date number registers are more for end-users, better choose local time. // Groff seems to support Gregorian dates only TQDate today( TQDate::currentDate( TQt::LocalTime ) ); s_numberDefinitionMap.insert( "year", today.year() ); // Y2K-correct year s_numberDefinitionMap.insert( "yr", today.year() - 1900 ); // Y2K-incorrect year s_numberDefinitionMap.insert( "mo", today.month() ); s_numberDefinitionMap.insert( "dy", today.day() ); s_numberDefinitionMap.insert( "dw", today.dayOfWeek() ); } #define V(A,B) ((A)*256+(B)) //used in expand_char, e.g. for "\(bu" // see groff_char(7) for list static CSTRDEF standardchar[] = { { V('*','*'), 1, "*" }, { V('*','A'), 1, "Α" }, { V('*','B'), 1, "Β" }, { V('*','C'), 1, "Ξ" }, { V('*','D'), 1, "Δ" }, { V('*','E'), 1, "Ε" }, { V('*','F'), 1, "Φ" }, { V('*','G'), 1, "Γ" }, { V('*','H'), 1, "Θ" }, { V('*','I'), 1, "Ι" }, { V('*','K'), 1, "Κ" }, { V('*','L'), 1, "Λ" }, { V('*','M'), 1, "&Mu:" }, { V('*','N'), 1, "Ν" }, { V('*','O'), 1, "Ο" }, { V('*','P'), 1, "Π" }, { V('*','Q'), 1, "Ψ" }, { V('*','R'), 1, "Ρ" }, { V('*','S'), 1, "Σ" }, { V('*','T'), 1, "Τ" }, { V('*','U'), 1, "Υ" }, { V('*','W'), 1, "Ω" }, { V('*','X'), 1, "Χ" }, { V('*','Y'), 1, "Η" }, { V('*','Z'), 1, "Ζ" }, { V('*','a'), 1, "α"}, { V('*','b'), 1, "β"}, { V('*','c'), 1, "ξ"}, { V('*','d'), 1, "δ"}, { V('*','e'), 1, "ε"}, { V('*','f'), 1, "φ"}, { V('*','g'), 1, "γ"}, { V('*','h'), 1, "θ"}, { V('*','i'), 1, "ι"}, { V('*','k'), 1, "κ"}, { V('*','l'), 1, "λ"}, { V('*','m'), 1, "μ" }, { V('*','n'), 1, "ν"}, { V('*','o'), 1, "ο"}, { V('*','p'), 1, "π"}, { V('*','q'), 1, "ψ"}, { V('*','r'), 1, "ρ"}, { V('*','s'), 1, "σ"}, { V('*','t'), 1, "τ"}, { V('*','u'), 1, "υ"}, { V('*','w'), 1, "ω"}, { V('*','x'), 1, "χ"}, { V('*','y'), 1, "η"}, { V('*','z'), 1, "ζ"}, { V('+','-'), 1, "±" }, // not in groff_char(7) { V('+','f'), 1, "φ"}, // phi1, we use the standard phi { V('+','h'), 1, "θ"}, // theta1, we use the standard theta { V('+','p'), 1, "ω"}, // omega1, we use the standard omega { V('1','2'), 1, "½" }, { V('1','4'), 1, "¼" }, { V('3','4'), 1, "¾" }, { V('F','i'), 1, "ﬃ" }, // ffi ligature { V('F','l'), 1, "ﬄ" }, // ffl ligature { V('a','p'), 1, "~" }, { V('b','r'), 1, "|" }, { V('b','u'), 1, "•" }, { V('b','v'), 1, "|" }, { V('c','i'), 1, "○" }, // circle ### TODO verify { V('c','o'), 1, "©" }, { V('c','t'), 1, "¢" }, { V('d','e'), 1, "°" }, { V('d','g'), 1, "†" }, { V('d','i'), 1, "÷" }, { V('e','m'), 1, "&emdash;" }, { V('e','n'), 1, "&endash;"}, { V('e','q'), 1, "=" }, { V('e','s'), 1, "∅" }, { V('f','f'), 1, "�xFB00;" }, // ff ligature { V('f','i'), 1, "�xFB01;" }, // fi ligature { V('f','l'), 1, "�xFB02;" }, // fl ligature { V('f','m'), 1, "′" }, { V('g','a'), 1, "`" }, { V('h','y'), 1, "-" }, { V('l','c'), 2, "|¯" }, // ### TODO: not in groff_char(7) { V('l','f'), 2, "|_" }, // ### TODO: not in groff_char(7) { V('l','k'), 1, "{" }, // ### TODO: not in groff_char(7) { V('m','i'), 1, "-" }, // ### TODO: not in groff_char(7) { V('m','u'), 1, "×" }, { V('n','o'), 1, "¬" }, { V('o','r'), 1, "|" }, { V('p','l'), 1, "+" }, { V('r','c'), 2, "¯|" }, // ### TODO: not in groff_char(7) { V('r','f'), 2, "_|" }, // ### TODO: not in groff_char(7) { V('r','g'), 1, "®" }, { V('r','k'), 1, "}" }, // ### TODO: not in groff_char(7) { V('r','n'), 1, "‾" }, { V('r','u'), 1, "_" }, { V('s','c'), 1, "§" }, { V('s','l'), 1, "/" }, { V('s','q'), 2, "□" }, // WHITE SQUARE { V('t','s'), 1, "ς" }, // FINAL SIGMA { V('u','l'), 1, "_" }, { V('-','D'), 1, "Ð" }, { V('S','d'), 1, "ð" }, { V('T','P'), 1, "Þ" }, { V('T','p'), 1, "þ" }, { V('A','E'), 1, "Æ" }, { V('a','e'), 1, "æ" }, { V('O','E'), 1, "Œ" }, { V('o','e'), 1, "œ" }, { V('s','s'), 1, "ß" }, { V('\'','A'), 1, "Á" }, { V('\'','E'), 1, "É" }, { V('\'','I'), 1, "Í" }, { V('\'','O'), 1, "Ó" }, { V('\'','U'), 1, "Ú" }, { V('\'','Y'), 1, "Ý" }, { V('\'','a'), 1, "á" }, { V('\'','e'), 1, "é" }, { V('\'','i'), 1, "í" }, { V('\'','o'), 1, "ó" }, { V('\'','u'), 1, "ú" }, { V('\'','y'), 1, "ý" }, { V(':','A'), 1, "Ä" }, { V(':','E'), 1, "Ë" }, { V(':','I'), 1, "Ï" }, { V(':','O'), 1, "Ö" }, { V(':','U'), 1, "Ü" }, { V(':','a'), 1, "ä" }, { V(':','e'), 1, "ë" }, { V(':','i'), 1, "ï" }, { V(':','o'), 1, "ö" }, { V(':','u'), 1, "ü" }, { V(':','y'), 1, "ÿ" }, { V('^','A'), 1, "Â" }, { V('^','E'), 1, "Ê" }, { V('^','I'), 1, "Î" }, { V('^','O'), 1, "Ô" }, { V('^','U'), 1, "Û" }, { V('^','a'), 1, "â" }, { V('^','e'), 1, "ê" }, { V('^','i'), 1, "î" }, { V('^','o'), 1, "ô" }, { V('^','u'), 1, "û" }, { V('`','A'), 1, "À" }, { V('`','E'), 1, "È" }, { V('`','I'), 1, "Ì" }, { V('`','O'), 1, "Ò" }, { V('`','U'), 1, "Ù" }, { V('`','a'), 1, "à" }, { V('`','e'), 1, "è" }, { V('`','i'), 1, "ì" }, { V('`','o'), 1, "ò" }, { V('`','u'), 1, "ù" }, { V('~','A'), 1, "Ã" }, { V('~','N'), 1, "Ñ" }, { V('~','O'), 1, "Õ" }, { V('~','a'), 1, "ã" }, { V('~','n'), 1, "&ntidle;" }, { V('~','o'), 1, "&otidle;" }, { V(',','C'), 1, "Ç" }, { V(',','c'), 1, "ç" }, { V('/','L'), 1, "Ł" }, { V('/','l'), 1, "ł" }, { V('/','O'), 1, "Ø" }, { V('/','o'), 1, "ø" }, { V('o','A'), 1, "Å" }, { V('o','a'), 1, "å" }, { V('a','"'), 1, "\"" }, { V('a','-'), 1, "¯" }, { V('a','.'), 1, "." }, { V('a','^'), 1, "ˆ" }, { V('a','a'), 1, "´" }, { V('a','b'), 1, "`" }, { V('a','c'), 1, "¸" }, { V('a','d'), 1, "¨" }, { V('a','h'), 1, "˂" }, // caron { V('a','o'), 1, "˚" }, // ring { V('a','~'), 1, "˜" }, { V('h','o'), 1, "˛" }, // ogonek { V('.','i'), 1, "ı" }, // dot less i { V('C','s'), 1, "¤" }, { V('D','o'), 1, "$" }, { V('P','o'), 1, "£" }, { V('Y','e'), 1, "¥" }, { V('F','n'), 1, "ƒ" }, { V('F','o'), 1, "«" }, { V('F','c'), 1, "»" }, { V('f','o'), 1, "‹" }, // single left guillemet { V('f','c'), 1, "›" }, // single right guillemet { V('r','!'), 1, "&iecl;" }, { V('r','?'), 1, "¿" }, { V('O','f'), 1, "ª" }, { V('O','m'), 1, "º" }, { V('p','c'), 1, "·" }, { V('S','1'), 1, "¹" }, { V('S','2'), 1, "²" }, { V('S','3'), 1, "³" }, { V('<','-'), 1, "←" }, { V('-','>'), 1, "→" }, { V('<','>'), 1, "↔" }, { V('d','a'), 1, "↓" }, { V('u','a'), 1, "↑" }, { V('l','A'), 1, "⇐" }, { V('r','A'), 1, "⇒" }, { V('h','A'), 1, "⇔" }, { V('d','A'), 1, "⇓" }, { V('u','A'), 1, "⇑" }, { V('b','a'), 1, "|" }, { V('b','b'), 1, "¦" }, { V('t','m'), 1, "™" }, { V('d','d'), 1, "‡" }, { V('p','s'), 1, "¶" }, { V('%','0'), 1, "‰" }, { V('f','/'), 1, "⁄" }, // Fraction slash { V('s','d'), 1, "″" }, { V('h','a'), 1, "^" }, { V('t','i'), 1, "&tidle;" }, { V('l','B'), 1, "[" }, { V('r','B'), 1, "]" }, { V('l','C'), 1, "{" }, { V('r','C'), 1, "}" }, { V('l','a'), 1, "<" }, { V('r','a'), 1, ">" }, { V('l','h'), 1, "≤" }, { V('r','h'), 1, "≥" }, { V('B','q'), 1, "„" }, { V('b','q'), 1, "‚" }, { V('l','q'), 1, "“" }, { V('r','q'), 1, "”" }, { V('o','q'), 1, "‘" }, { V('c','q'), 1, "’" }, { V('a','q'), 1, "'" }, { V('d','q'), 1, "\"" }, { V('a','t'), 1, "@" }, { V('s','h'), 1, "#" }, { V('r','s'), 1, "\\" }, { V('t','f'), 1, "∴" }, { V('~','~'), 1, "≅" }, { V('~','='), 1, "≈" }, { V('!','='), 1, "≠" }, { V('<','='), 1, "≤" }, { V('=','='), 1, "≡" }, { V('=','~'), 1, "≅" }, // ### TODO: verify { V('>','='), 1, "≥" }, { V('A','N'), 1, "∧" }, { V('O','R'), 1, "∨" }, { V('t','e'), 1, "∃" }, { V('f','a'), 1, "∀" }, { V('A','h'), 1, "ℵ" }, { V('I','m'), 1, "ℑ" }, { V('R','e'), 1, "ℜ" }, { V('i','f'), 1, "∞" }, { V('m','d'), 1, "⋅" }, { V('m','o'), 1, "∆" }, // element ### TODO verify { V('n','m'), 1, "∉" }, { V('p','t'), 1, "∝" }, { V('p','p'), 1, "⊥" }, { V('s','b'), 1, "⊂" }, { V('s','p'), 1, "⊃" }, { V('i','b'), 1, "⊆" }, { V('i','p'), 1, "⊇" }, { V('i','s'), 1, "∫" }, { V('s','r'), 1, "√" }, { V('p','d'), 1, "∂" }, { V('c','*'), 1, "⊗" }, { V('c','+'), 1, "⊕" }, { V('c','a'), 1, "∩" }, { V('c','u'), 1, "∪" }, { V('g','r'), 1, "V" }, // gradient ### TODO Where in Unicode? { V('C','R'), 1, "↵" }, { V('s','t'), 2, "-)" }, // "such that" ### TODO Where in Unicode? { V('/','_'), 1, "∠" }, { V('w','p'), 1, "℘" }, { V('l','z'), 1, "◊" }, { V('a','n'), 1, "-" }, // "horizontal arrow extension" ### TODO Where in Unicode? }; /* default: print code */ /* static char eqndelimopen=0, eqndelimclose=0; */ static char escapesym='\\', nobreaksym='\'', controlsym='.', fieldsym=0, padsym=0; static char *buffer=NULL; static int buffpos=0, buffmax=0; static bool scaninbuff=false; static int itemdepth=0; static int section=0; static int dl_set[20]= { 0 }; static bool still_dd=0; static int tabstops[20] = { 8, 16, 24, 32, 40, 48, 56, 64, 72, 80, 88, 96 }; static int maxtstop=12; static int curpos=0; static char *scan_troff(char *c, bool san, char **result); static char *scan_troff_mandoc(char *c, bool san, char **result); static TQValueList s_argumentList; static TQCString htmlPath, cssPath; static TQCString s_dollarZero; // Value of $0 void setResourcePath(const TQCString& _htmlPath, const TQCString& _cssPath) { htmlPath=_htmlPath; cssPath=_cssPath; } static void fill_old_character_definitions( void ) { for (size_t i = 0; i < sizeof(standardchar)/sizeof(CSTRDEF); i++) { const int nr = standardchar[i].nr; const char temp[3] = { (char)(nr / 256), (char)(nr % 256), 0 }; TQCString name( temp ); s_characterDefinitionMap.insert( name, StringDefinition( standardchar[i].slen, standardchar[i].st ) ); } } static char outbuffer[NULL_TERMINATED(HUGE_STR_MAX)]; static int no_newline_output=0; static int newline_for_fun=0; static bool output_possible=false; static const char *includedirs[] = { "/usr/include", "/usr/include/sys", "/usr/local/include", "/opt/local/include", "/usr/ccs", "/usr/X11R6/include", "/usr/openwin/include", "/usr/include/g++", 0 }; static bool ignore_links=false; static void add_links(char *c) { /* ** Add the links to the output. ** At the moment the following are recognized: ** ** name(*) -> ../man?/name.* ** method://string -> method://string ** www.host.name -> http://www.host.name ** ftp.host.name -> ftp://ftp.host.name ** name@host -> mailto:name@host ** -> file:/usr/include/name.h (guess) ** ** Other possible links to add in the future: ** ** /dir/dir/file -> file:/dir/dir/file */ if (ignore_links) { output_real(c); return; } int i,j,nr; char *f, *h; char *g; const int numtests=6; // Nmber of tests char *idtest[numtests]; // url, mailto, www, ftp, manpage, C header file bool ok; /* search for (section) */ nr=0; idtest[0]=strstr(c+1,"://"); idtest[1]=strchr(c+1,'@'); idtest[2]=strstr(c,"www."); idtest[3]=strstr(c,"ftp."); idtest[4]=strchr(c+1,'('); idtest[5]=strstr(c+1,".h>"); for (i=0; i */ f=idtest[5]; h=f+2; g=f; while (g>c && g[-1]!=';') g--; bool wrote_include = false; if (g!=c) { TQCString dir; TQCString file(g, h - g + 1); file = file.stripWhiteSpace(); for (int index = 0; includedirs[index]; index++) { TQCString str = TQCString(includedirs[index]) + "/" + file; if (!access(str, R_OK)) { dir = includedirs[index]; break; } } if (!dir.isEmpty()) { char t; t=*g; *g=0; output_real(c); *g=t;*h=0; TQCString str; str.sprintf("%s>", dir.data(), file.data(), file.data()); output_real(str.data()); c=f+6; wrote_include = true; } } if (!wrote_include) { f[5]=0; output_real(c); f[5]=';'; c=f+5; } } break; case 4: /* manpage */ f=idtest[j]; /* check section */ g=strchr(f,')'); // The character before f must alphanumeric, the end of a HTML tag or the end of a if (g!=NULL && f>c && (g-f)<12 && (isalnum(f[-1]) || f[-1]=='>' || ( f[-1] == ';' ) ) && isdigit(f[1]) && f[1]!='0' && ((g-f)<=2 || isalpha(f[2]))) { ok = TRUE; h = f+2; while (h c + 5 ) && ( ! memcmp( h-5, " ", 6 ) ) ) { h -= 6; kdDebug(7107) << "Skip " << endl; } else if ( *h == ';' ) { // Not a non-breaking space, so probably not ok ok = false; } } if (ok) { /* this might be a link */ /* skip html makeup */ while (h>c && *h=='>') { while (h!=c && *h!='<') h--; if (h!=c) h--; } if (isalnum(*h)) { char t,sec, *e; TQString subsec; // ### TODO avoid using TQString, as we do not know the encoding TQString fstr(f); // ### TODO avoid using TQString, as we do not know the encoding e=h+1; sec=f[1]; subsec=f[2]; int index = fstr.find(')', 2); if (index != -1) subsec = fstr.mid(2, index - 2); else // No closing ')' found, take first character as subsection. subsec = fstr.mid(2, 1); while (h>c && (isalnum(h[-1]) || h[-1]=='_' || h[-1]==':' || h[-1]=='-' || h[-1]=='.')) h--; t=*h; *h='\0'; output_real(c); *h=t; t=*e; *e='\0'; TQCString str; if (subsec.isEmpty()) str.sprintf("%s", h, sec, h); else str.sprintf("%s", h, sec, subsec.lower().latin1(), h); output_real(str.data()); *e=t; c=e; } } *f='\0'; output_real(c); *f='('; idtest[4]=f-1; c=f; break; /* manpage */ case 3: /* ftp */ case 2: /* www */ g=f=idtest[j]; while (*g && (isalnum(*g) || *g=='_' || *g=='-' || *g=='+' || *g=='.' || *g=='/')) g++; if (g[-1]=='.') g--; if (g-f>4) { char t; t=*f; *f='\0'; output_real(c); *f=t; t=*g;*g='\0'; TQCString str; str.sprintf("%s", ((j==3)?"ftp":"http"), f, f); output_real(str.data()); *g=t; c=g; } else { f[3]='\0'; output_real(c); c=f+3; f[3]='.'; } break; case 1: /* mailto */ g=f=idtest[1]; while (g>c && (isalnum(g[-1]) || g[-1]=='_' || g[-1]=='-' || g[-1]=='+' || g[-1]=='.' || g[-1]=='%')) g--; if (g-7>=c && g[-1]==':') { // We have perhaps an email address starting with mailto: if (!tqstrncmp("mailto:",g-7,7)) g-=7; } h=f+1; while (*h && (isalnum(*h) || *h=='_' || *h=='-' || *h=='+' || *h=='.')) h++; if (*h=='.') h--; if (h-f>4 && f-g>1) { char t; t=*g; *g='\0'; output_real(c); *g=t;t=*h;*h='\0'; TQCString str; str.sprintf("%s", g, g); output_real(str.data()); *h=t; c=h; } else { *f='\0'; output_real(c); *f='@'; idtest[1]=c; c=f; } break; case 0: /* url */ g=f=idtest[0]; while (g>c && isalpha(g[-1]) && islower(g[-1])) g--; h=f+3; while (*h && !isspace(*h) && *h!='<' && *h!='>' && *h!='"' && *h!='&') h++; if (f-g>2 && f-g<7 && h-f>3) { char t; t=*g; *g='\0'; output_real(c); *g=t; t=*h; *h='\0'; TQCString str; str.sprintf("%s", g, g); output_real(str.data()); *h=t; c=h; } else { f[1]='\0'; output_real(c); f[1]='/'; c=f+1; } break; default: break; } nr=0; if (idtest[0] && idtest[0]<=c) idtest[0]=strstr(c+1,"://"); if (idtest[1] && idtest[1]<=c) idtest[1]=strchr(c+1,'@'); if (idtest[2] && idtest[2]=buffmax) { char *h = new char[buffmax*2]; #ifdef SIMPLE_MAN2HTML if (!h) { cerr << "Memory full, cannot output!" << endl; exit(1); } #else // modern compiler do not return a NULL for a new #endif memcpy(h, buffer, buffmax); delete [] buffer; buffer=h; buffmax=buffmax*2; } buffer[buffpos++]=*c2++; } } else if (output_possible) { while (*c2) { outbuffer[obp++]=*c2; if (*c=='\n' || obp >= HUGE_STR_MAX) { outbuffer[obp]='\0'; add_links(outbuffer); obp=0; } c2++; } } delete [] c3; } static TQCString set_font( const TQCString& name ) { // Every font but R (Regular) creates elements TQCString markup; if ( current_font != "R" && !current_font.isEmpty() ) markup += ""; const uint len = name.length(); bool fontok = true; if ( len == 1 ) { const char lead = name[0]; switch (lead) { case 'P': // Palatino? case 'R': break; // regular, do nothing case 'I': markup += ""; break; case 'B': markup += ""; break; case 'L': markup += ""; break; // ### What's L? default: fontok = false; } } else if ( len == 2 ) { if ( name == "BI" ) markup += ""; // Courier else if ( name == "CR" ) markup += ""; else if ( name == "CW" ) // CW is used by pod2man(1) (alias PerlDoc) markup += ""; else if ( name == "CI" ) markup += ""; else if ( name == "CB" ) markup += ""; // Times else if ( name == "TR" ) markup += ""; else if ( name == "TI" ) markup += ""; else if ( name == "TB" ) markup += ""; // Helvetica else if ( name == "HR" ) markup += ""; else if ( name == "HI" ) markup += ""; else if ( name == "HB" ) markup += ""; else fontok = false; } else if ( len == 3 ) { if ( name == "CBI" ) markup += ""; else if ( name == "TBI" ) markup += ""; else if ( name == "HBI" ) markup += ""; } if (fontok) current_font = name; else current_font = "R"; // Still nothing, then it is 'R' (Regular) return markup; } /// \deprecated static TQCString set_font( const char ch ) #ifndef SIMPLE_MAN2HTML TDE_DEPRECATED; static TQCString set_font( const char ch ) #endif { const TQCString name = &ch; return set_font( name ); } static TQCString change_to_size(int nr) { switch (nr) { case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': nr=nr-'0'; break; case '\0': break; default: nr=current_size+nr; if (nr>9) nr=9; if (nr< -9) nr=-9; break; } if ( nr == current_size ) return ""; const TQCString font ( current_font ); TQCString markup; markup = set_font("R"); if (current_size) markup += ""; current_size=nr; if (nr) { markup += "0) markup += '+'; else { markup += '-'; nr=-nr; } markup += char( nr + '0' ); markup += "\">"; } markup += set_font( font ); return markup; } /* static int asint=0; */ static int intresult=0; #define SKIPEOL while (*c && *c++!='\n') static bool skip_escape=false; static bool single_escape=false; static char *scan_escape_direct( char *c, TQCString& cstr ); /** * scan a named character * param c position */ static TQCString scan_named_character( char*& c ) { TQCString name; if ( *c == '(' ) { // \*(ab Name of two characters if ( c[1] == escapesym ) { TQCString cstr; c = scan_escape_direct( c+2, cstr ); // ### HACK: as we convert characters too early to HTML, we need to support more than 2 characters here and assume that all characters passed by the variable are to be used. name = cstr; } else { name+=c[1]; name+=c[2]; c+=3; } } else if ( *c == '[' ) { // \*[long_name] Long name // Named character groff(7) // We must find the ] to get a name c++; while ( *c && *c != ']' && *c != '\n' ) { if ( *c == escapesym ) { TQCString cstr; c = scan_escape_direct( c+1, cstr ); const int result = cstr.find(']'); if ( result == -1 ) name += cstr; else { // Note: we drop the characters after the ] name += cstr.left( result ); } } else { name+=*c; c++; } } if ( !*c || *c == '\n' ) { kdDebug(7107) << "Found linefeed! Could not parse character name: " << name << endl; return ""; } c++; } else if ( *c =='C' || c[1]== '\'' ) { // \C'name' c+=2; while ( *c && *c != '\'' && *c != '\n' ) { if ( *c == escapesym ) { TQCString cstr; c = scan_escape_direct( c+1, cstr ); const int result = cstr.find('\''); if ( result == -1 ) name += cstr; else { // Note: we drop the characters after the ] name += cstr.left( result ); } } else { name+=*c; c++; } } if ( !*c || *c == '\n' ) { kdDebug(7107) << "Found linefeed! Could not parse (\\C mode) character name: " << name << endl; return ""; } c++; } // Note: characters with a one character length name doe not exist, as they would collide with other escapes // Now we have the name, let us find it between the string names TQMap::iterator it=s_characterDefinitionMap.find(name); if (it==s_characterDefinitionMap.end()) { kdDebug(7107) << "EXCEPTION: cannot find character with name: " << name << endl; // No output, as an undefined string is empty by default return ""; } else { kdDebug(7107) << "Character with name: \"" << name << "\" => " << (*it).m_output << endl; return (*it).m_output; } } static TQCString scan_named_string(char*& c) { TQCString name; if ( *c == '(' ) { // \*(ab Name of two characters if ( c[1] == escapesym ) { TQCString cstr; c = scan_escape_direct( c+2, cstr ); kdDebug(7107) << "\\(" << cstr << endl; // ### HACK: as we convert characters too early to HTML, we need to support more than 2 characters here and assume that all characters passed by the variable are to be used. name = cstr; } else { name+=c[1]; name+=c[2]; c+=3; } } else if ( *c == '[' ) { // \*[long_name] Long name // Named character groff(7) // We must find the ] to get a name c++; while ( *c && *c != ']' && *c != '\n' ) { if ( *c == escapesym ) { TQCString cstr; c = scan_escape_direct( c+1, cstr ); const int result = cstr.find(']'); if ( result == -1 ) name += cstr; else { // Note: we drop the characters after the ] name += cstr.left( result ); } } else { name+=*c; c++; } } if ( !*c || *c == '\n' ) { kdDebug(7107) << "Found linefeed! Could not parse string name: " << name << endl; return ""; } c++; } else { // \*a Name of one character name+=*c; c++; } // Now we have the name, let us find it between the string names TQMap::iterator it=s_stringDefinitionMap.find(name); if (it==s_stringDefinitionMap.end()) { kdDebug(7107) << "EXCEPTION: cannot find string with name: " << name << endl; // No output, as an undefined string is empty by default return ""; } else { kdDebug(7107) << "String with name: \"" << name << "\" => " << (*it).m_output << endl; return (*it).m_output; } } static TQCString scan_dollar_parameter(char*& c) { unsigned int argno = 0; // No dollar argument number yet! if ( *c == '0' ) { //kdDebug(7107) << "$0" << endl; c++; return s_dollarZero; } else if ( *c >= '1' && *c <= '9' ) { //kdDebug(7107) << "$ direct" << endl; argno = ( *c - '0' ); c++; } else if ( *c == '(' ) { //kdDebug(7107) << "$(" << endl; if ( c[1] && c[2] && c[1] >= '0' && c[1] <= '9' && c[2] >= '0' && c[2] <= '9' ) { argno = ( c[1] - '0' ) * 10 + ( c[2] - '0' ); c += 3; } else { if ( !c[1] ) c++; else if ( !c[2] ) c+=2; else c += 3; return ""; } } else if ( *c == '[' ) { //kdDebug(7107) << "$[" << endl; argno = 0; c++; while ( *c && *c>='0' && *c<='9' && *c!=']' ) { argno *= 10; argno += ( *c - '0' ); c++; } if ( *c != ']' ) { return ""; } c++; } else if ( ( *c == '*' ) || ( *c == '@' ) ) { const bool quote = ( *c == '@' ); TQValueList::const_iterator it = s_argumentList.begin(); TQCString param; bool space = false; for ( ; it != s_argumentList.end(); ++it ) { if (space) param += " "; if (quote) param += '\"'; // Not as HTML, as it could be used by macros ! param += (*it); if (quote) param += '\"'; // Not as HTML, as it could be used by macros! space = true; } c++; return param; } else { kdDebug(7107) << "EXCEPTION: unknown parameter $" << *c << endl; return ""; } //kdDebug(7107) << "ARG $" << argno << endl; if ( !s_argumentList.isEmpty() && argno > 0 ) { //kdDebug(7107) << "ARG $" << argno << " OK!" << endl; argno--; if ( argno >= s_argumentList.size() ) { kdDebug(7107) << "EXCEPTION: cannot find parameter $" << (argno+1) << endl; return ""; } return s_argumentList[argno]; } return ""; } /// return the value of read-only number registers static int read_only_number_register( const TQCString& name ) { // Internal read-only variables if ( name == ".$" ) { kdDebug(7107) << "\\n[.$] == " << s_argumentList.size() << endl; return s_argumentList.size(); } else if ( name == ".g" ) return 0; // We are not groff(1) else if ( name == ".s" ) return current_size; #if 0 // ### TODO: map the fonts to a number else if ( name == ".f" ) return current_font; #endif else if ( name == ".P" ) return 0; // We are not printing else if ( name == ".A" ) return s_nroff; #ifndef SIMPLE_MAN2HTML // Special KDE TDEIO man: else if ( name == ".TDE_VERSION_MAJOR" ) return TDE_VERSION_MAJOR; else if ( name == ".TDE_VERSION_MINOR" ) return TDE_VERSION_MINOR; else if ( name == ".TDE_VERSION_RELEASE" ) return TDE_VERSION_RELEASE; else if ( name == ".TDE_VERSION" ) return TDE_VERSION; #endif // ### TODO: should .T be set to "html"? But we are not the HTML post-processor. :-( // ### TODO: groff defines much more read-only number registers #ifndef SIMPLE_MAN2HTML kdDebug(7107) << "EXCEPTION: unknown read-only number register: " << name << endl; #endif return 0; // Undefined variable } /// get the value of a number register and auto-increment if asked static int scan_number_register( char*& c) { int sign = 0; // Sign for auto-increment (if any) switch (*c) { case '+': sign = 1; c++; break; case '-': sign = -1; c++; break; default: break; } TQCString name; if ( *c == '[' ) { c++; if ( *c == '+' ) { sign = 1; c++; } else if ( *c == '-' ) { sign = -1; c++; } while ( *c && *c != ']' && *c != '\n' ) { // ### TODO: a \*[string] could be inside and should be processed name+=*c; c++; } if ( !*c || *c == '\n' ) { kdDebug(7107) << "Found linefeed! Could not parse number register name: " << name << endl; return 0; } c++; } else if ( *c == '(' ) { c++; if ( *c == '+' ) { sign = 1; c++; } else if ( *c == '-' ) { sign = -1; c++; } name+=c[0]; name+=c[1]; c+=2; } else { name += *c; c++; } if ( name[0] == '.' ) { return read_only_number_register( name ); } else { TQMap< TQCString, NumberDefinition >::iterator it = s_numberDefinitionMap.find( name ); if ( it == s_numberDefinitionMap.end() ) { return 0; // Undefined variable } else { (*it).m_value += sign * (*it).m_increment; return (*it).m_value; } } } /// get and set font static TQCString scan_named_font( char*& c ) { TQCString name; if ( *c == '(' ) { // \f(ab Name of two characters if ( c[1] == escapesym ) { TQCString cstr; c = scan_escape_direct( c+2, cstr ); kdDebug(7107) << "\\(" << cstr << endl; // ### HACK: as we convert characters too early to HTML, we need to support more than 2 characters here and assume that all characters passed by the variable are to be used. name = cstr; } else { name+=c[1]; name+=c[2]; c+=3; } } else if ( *c == '[' ) { // \f[long_name] Long name // We must find the ] to get a name c++; while ( *c && *c != ']' && *c != '\n' ) { if ( *c == escapesym ) { TQCString cstr; c = scan_escape_direct( c+1, cstr ); const int result = cstr.find(']'); if ( result == -1 ) name += cstr; else { // Note: we drop the characters after the ] name += cstr.left( result ); } } else { name+=*c; c++; } } if ( !*c || *c == '\n' ) { kdDebug(7107) << "Found linefeed! Could not parse font name: " << name << endl; return ""; } c++; } else { // \fa Font name with one character or one digit // ### HACK do *not* use: name = *c; or name would be empty name += *c; c++; } //kdDebug(7107) << "FONT NAME: " << name << endl; // Now we have the name, let us find the font bool ok = false; const unsigned int number = name.toUInt( &ok ); if ( ok ) { if ( number < 5 ) { const char* fonts[] = { "R", "I", "B", "BI", "CR" }; // Regular, Italic, Bold, Bold Italic, Courier regular name = fonts[ number ]; } else { kdDebug(7107) << "EXCEPTION: font has too big number: " << name << " => " << number << endl; name = "R"; // Let assume Regular } } else if ( name.isEmpty() ) { kdDebug(7107) << "EXCEPTION: font has no name: " << name << endl; name = "R"; // Let assume Regular } if ( !skip_escape ) return set_font( name ); else return ""; } static TQCString scan_number_code( char*& c ) { TQCString number; if ( *c != '\'' ) return ""; while ( *c && ( *c != '\n' ) && ( *c != '\'' ) ) { number += *c; c++; } bool ok = false; unsigned int result = number.toUInt( &ok ); if ( ( result < ' ' ) || ( result > 65535 ) ) return ""; else if ( result == '\t' ) { curpos += 8; curpos &= 0xfff8; return "\t"; } number.setNum( result ); number.prepend( "&#" ); number.append( ";" ); curpos ++; return number; } // ### TODO known missing escapes from groff(7): // ### TODO \& \! \) \: \R static char *scan_escape_direct( char *c, TQCString& cstr ) { bool exoutputp; bool exskipescape; int i,j; bool cplusplus = true; // Should the c++ be done at the end of the function cstr = ""; intresult=0; switch (*c) { case 'e': cstr = "\\"; curpos++;break; // ### FIXME: it should be the current escape symbol case '0': // ### TODO Where in Unicode? (space of digit width) case '~': // non-breakable-space (resizeable!) case ' ': case '|': // half-non-breakable-space case '^': // quarter-non-breakable-space cstr = " "; curpos++; break; case '"': SKIPEOL; c--; break; // ### TODO \# like \" but does not ignore the end of line (groff(7)) case '$': { c++; cstr = scan_dollar_parameter( c ); cplusplus = false; break; } case 'z': { c++; if (*c=='\\') { c=scan_escape_direct( c+1, cstr ); c--; } else cstr = TQCString( c, 1 ); break; } case 'k': c++; if (*c=='(') c+=2; // ### FIXME \k[REG] exists too case '!': case '%': case 'a': case 'd': case 'r': case 'u': case '\n': case '&': cstr = ""; break; case '(': case '[': case 'C': { // Do not go forward as scan_named_character needs the leading symbol cstr = scan_named_character( c ); cplusplus = false; break; } case '*': { c++; cstr = scan_named_string( c ); cplusplus = false; break; } case 'f': { c++; cstr = scan_named_font( c ); cplusplus = false; break; } case 's': // ### FIXME: many forms are missing c++; j=0;i=0; if (*c=='-') {j= -1; c++;} else if (*c=='+') {j=1; c++;} if (*c=='0') c++; else if (*c=='\\') { c++; c=scan_escape_direct( c, cstr ); i=intresult; if (!j) j=1; } else while (isdigit(*c) && (!i || (!j && i<4))) i=i*10+(*c++)-'0'; if (!j) { j=1; if (i) i=i-10; } if (!skip_escape) cstr=change_to_size(i*j); c--; break; case 'n': { c++; intresult = scan_number_register( c ); cplusplus = false; break; } case 'w': c++; i=*c; c++; exoutputp=output_possible; exskipescape=skip_escape; output_possible=false; skip_escape=true; j=0; while (*c!=i) { j++; if ( *c == escapesym ) c = scan_escape_direct( c+1, cstr); else c++; } output_possible=exoutputp; skip_escape=exskipescape; intresult=j; break; case 'l': cstr = "

"; curpos=0; case 'b': case 'v': case 'x': case 'o': case 'L': case 'h': c++; i=*c; c++; exoutputp=output_possible; exskipescape=skip_escape; output_possible=0; skip_escape=true; while (*c != i) if (*c==escapesym) c=scan_escape_direct( c+1, cstr ); else c++; output_possible=exoutputp; skip_escape=exskipescape; break; case 'c': no_newline_output=1; break; case '{': newline_for_fun++; break; // Start conditional block case '}': if (newline_for_fun) newline_for_fun--; break; // End conditional block case 'p': cstr = "
\n";curpos=0; break; case 't': cstr = "\t";curpos=(curpos+8)&0xfff8; break; case '<': cstr = "<";curpos++; break; case '>': cstr = ">";curpos++; break; case '\\': { if (single_escape) c--; else cstr="\\"; break; } case 'N': { c++; cstr = scan_number_code( c ); cplusplus = false; break; } #if 0 { if (*++c) c++; // c += 2 if (sscanf(c, "%d", &i) != 1) // (### FIXME ugly!) break; TQCString temp; temp.sprintf( "%d", i ); // Skip over number (### FIXME ugly!) c += temp.length(); switch(i) { case 8: cstr = "\t"; curpos=(curpos+8)&0xfff8; break; case 34: cstr = """; curpos++; break; default: cstr = char( i ); curpos++; break; } break; } #endif case '\'': cstr = "´";curpos++; break; // groff(7) ### TODO verify case '`': cstr = "`";curpos++; break; // groff(7) case '-': cstr = "-";curpos++; break; // groff(7) case '.': cstr = ".";curpos++; break; // groff(7) default: cstr = *c; curpos++; break; } if (cplusplus) c++; return c; } static char *scan_escape(char *c) { TQCString cstr; char* result = scan_escape_direct( c, cstr ); if ( !skip_escape ) out_html(cstr); return result; } class TABLEROW; class TABLEITEM { public: TABLEITEM(TABLEROW *row); ~TABLEITEM() { delete [] contents; } void setContents(const char *_contents) { delete [] contents; contents = tqstrdup(_contents); } const char *getContents() const { return contents; } void init() { delete [] contents; contents = 0; size = 0; align = 0; valign = 0; colspan = 1; rowspan = 1; font = 0; vleft = 0; vright = 0; space = 0; width = 0; } void copyLayout(const TABLEITEM *orig) { size = orig->size; align = orig->align; valign = orig->valign; colspan = orig->colspan; rowspan = orig->rowspan; font = orig->font; vleft = orig->vleft; vright = orig->vright; space = orig->space; width = orig->width; } public: int size,align,valign,colspan,rowspan,font,vleft,vright,space,width; private: char *contents; TABLEROW *_parent; }; class TABLEROW { char *test; public: TABLEROW() { test = new char; items.setAutoDelete(true); prev = 0; next = 0; } ~TABLEROW() { delete test; } int length() const { return items.count(); } bool has(int index) { return (index >= 0) && (index < (int)items.count()); } TABLEITEM &at(int index) { return *items.at(index); } TABLEROW *copyLayout() const; void addItem(TABLEITEM *item) { items.append(item); } TABLEROW *prev, *next; private: TQPtrList items; }; TABLEITEM::TABLEITEM(TABLEROW *row) : contents(0), _parent(row) { init(); _parent->addItem(this); } TABLEROW *TABLEROW::copyLayout() const { TABLEROW *newrow = new TABLEROW(); TQPtrListIterator it(items); for ( ; it.current(); ++it) { TABLEITEM *newitem = new TABLEITEM(newrow); newitem->copyLayout(it.current()); } return newrow; } static const char *tableopt[]= { "center", "expand", "box", "allbox", "doublebox", "tab", "linesize", "delim", NULL }; static int tableoptl[] = { 6,6,3,6,9,3,8,5,0}; static void clear_table(TABLEROW *table) { TABLEROW *tr1,*tr2; tr1=table; while (tr1->prev) tr1=tr1->prev; while (tr1) { tr2=tr1; tr1=tr1->next; delete tr2; } } static char *scan_expression(char *c, int *result); static char *scan_format(char *c, TABLEROW **result, int *maxcol) { TABLEROW *layout, *currow; TABLEITEM *curfield; int i,j; if (*result) { clear_table(*result); } layout= currow=new TABLEROW(); curfield=new TABLEITEM(currow); while (*c && *c!='.') { switch (*c) { case 'C': case 'c': case 'N': case 'n': case 'R': case 'r': case 'A': case 'a': case 'L': case 'l': case 'S': case 's': case '^': case '_': if (curfield->align) curfield=new TABLEITEM(currow); curfield->align=toupper(*c); c++; break; case 'i': case 'I': case 'B': case 'b': curfield->font = toupper(*c); c++; break; case 'f': case 'F': c++; curfield->font = toupper(*c); c++; if (!isspace(*c) && *c!='.') c++; break; case 't': case 'T': curfield->valign='t'; c++; break; case 'p': case 'P': c++; i=j=0; if (*c=='+') { j=1; c++; } if (*c=='-') { j=-1; c++; } while (isdigit(*c)) i=i*10+(*c++)-'0'; if (j) curfield->size= i*j; else curfield->size=j-10; break; case 'v': case 'V': case 'w': case 'W': c=scan_expression(c+2,&curfield->width); break; case '|': if (curfield->align) curfield->vleft++; else curfield->vright++; c++; break; case 'e': case 'E': c++; break; case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': i=0; while (isdigit(*c)) i=i*10+(*c++)-'0'; curfield->space=i; break; case ',': case '\n': currow->next=new TABLEROW(); currow->next->prev=currow; currow=currow->next; currow->next=NULL; curfield=new TABLEITEM(currow); c++; break; default: c++; break; } } if (*c=='.') while (*c++!='\n'); *maxcol=0; currow=layout; while (currow) { i=currow->length(); if (i>*maxcol) *maxcol=i; currow=currow->next; } *result=layout; return c; } static TABLEROW *next_row(TABLEROW *tr) { if (tr->next) { tr=tr->next; if (!tr->next) return next_row(tr); return tr; } else { tr->next = tr->copyLayout(); tr->next->prev = tr; return tr->next; } } static char itemreset[20]="\\fR\\s0"; #define FORWARDCUR do { curfield++; } while (currow->has(curfield) && currow->at(curfield).align=='S'); static char *scan_table(char *c) { char *h; char *g; int center=0, expand=0, box=0, border=0, linesize=1; int i,j,maxcol=0, finished=0; TQCString oldfont; int oldsize,oldfillout; char itemsep='\t'; TABLEROW *layout=NULL, *currow; int curfield = -1; while (*c++!='\n'); h=c; if (*h=='.') return c-1; oldfont=current_font; oldsize=current_size; oldfillout=fillout; out_html(set_font("R")); out_html(change_to_size(0)); if (!fillout) { fillout=1; out_html("

"); fillout=oldfillout; out_html(change_to_size(oldsize)); out_html(set_font(oldfont)); return c; } static char *scan_expression( char *c, int *result, const unsigned int numLoop ) { int value=0,value2,sign=1,opex=0; char oper='c'; if (*c=='!') { c=scan_expression(c+1, &value); value= (!value); } else if (*c=='n') { c++; value=s_nroff; } else if (*c=='t') { c++; value=1-s_nroff; } else if (*c=='\'' || *c=='"' || *c<' ' || (*c=='\\' && c[1]=='(')) { /* ?string1?string2? ** test if string1 equals string2. */ char *st1=NULL, *st2=NULL, *h; char *tcmp=NULL; char sep; sep=*c; if (sep=='\\') { tcmp=c; c=c+3; } c++; h=c; while (*c!= sep && (!tcmp || tqstrncmp(c,tcmp,4))) c++; *c='\n'; scan_troff(h, 1, &st1); *c=sep; if (tcmp) c=c+3; c++; h=c; while (*c!=sep && (!tcmp || tqstrncmp(c,tcmp,4))) c++; *c='\n'; scan_troff(h,1,&st2); *c=sep; if (!st1 && !st2) value=1; else if (!st1 || !st2) value=0; else value=(!qstrcmp(st1, st2)); delete [] st1; delete [] st2; if (tcmp) c=c+3; c++; } else { while (*c && ( !isspace(*c) || ( numLoop > 0 ) ) && *c!=')' && opex >= 0) { opex=0; switch (*c) { case '(': c = scan_expression( c + 1, &value2, numLoop + 1 ); value2=sign*value2; opex=1; break; case '.': case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': { int num=0,denum=1; value2=0; while (isdigit(*c)) value2=value2*10+((*c++)-'0'); if (*c=='.' && isdigit(c[1])) { c++; while (isdigit(*c)) { num=num*10+((*c++)-'0'); denum=denum*10; } } if (isalpha(*c)) { /* scale indicator */ switch (*c) { case 'i': /* inch -> 10pt */ value2=value2*10+(num*10+denum/2)/denum; num=0; break; default: break; } c++; } value2=value2+(num+denum/2)/denum; value2=sign*value2; opex=1; if (*c=='.') opex = -1; } break; case '\\': c=scan_escape(c+1); value2=intresult*sign; if (isalpha(*c)) c++; /* scale indicator */ opex=1; break; case '-': if (oper) { sign=-1; c++; break; } case '>': case '<': case '+': case '/': case '*': case '%': case '&': case '=': case ':': if (c[1]=='=') oper=(*c++) +16; else oper=*c; c++; break; default: c++; break; } if (opex > 0) { sign=1; switch (oper) { case 'c': value=value2; break; case '-': value=value-value2; break; case '+': value=value+value2; break; case '*': value=value*value2; break; case '/': if (value2) value=value/value2; break; case '%': if (value2) value=value%value2; break; case '<': value=(value': value=(value>value2); break; case '>'+16: value=(value>=value2); break; case '<'+16: value=(value<=value2); break; case '=': case '='+16: value=(value==value2); break; case '&': value = (value && value2); break; case ':': value = (value || value2); break; default: { kdDebug(7107) << "Unknown operator " << char(oper) << endl; } } oper=0; } } if (*c==')') c++; } *result=value; return c; } static char *scan_expression(char *c, int *result) { return scan_expression( c, result, 0 ); } static void trans_char(char *c, char s, char t) { char *sl=c; int slash=0; while (*sl!='\n' || slash) { if (!slash) { if (*sl==escapesym) slash=1; else if (*sl==s) *sl=t; } else slash=0; sl++; } } // 2004-10-19, patched by Waldo Bastian : // Fix handling of lines like: // .TH FIND 1L \" -*- nroff -*- // Where \" indicates the start of comment. // // The problem is the \" handling in fill_words(), the return value // indicates the end of the word as well as the end of the line, which makes it // basically impossible to express that the end of the last word is not the end of // the line. // // I have corrected that by adding an extra parameter 'next_line' that returns a // pointer to the next line, while the function itself returns a pointer to the end // of the last word. static char *fill_words(char *c, char *words[], int *n, bool newline, char **next_line) { char *sl=c; int slash=0; int skipspace=0; *n=0; words[*n]=sl; while (*sl && (*sl!='\n' || slash)) { if (!slash) { if (*sl=='"') { if (skipspace && (*(sl+1)=='"')) *sl++ = '\a'; else { *sl='\a'; skipspace=!skipspace; } } else if (*sl==escapesym) { slash=1; if (sl[1]=='\n') *sl='\a'; } else if ((*sl==' ' || *sl=='\t') && !skipspace) { if (newline) *sl='\n'; if (words[*n]!=sl) (*n)++; words[*n]=sl+1; } } else { if (*sl=='"') { sl--; if (newline) *sl='\n'; if (words[*n]!=sl) (*n)++; if (next_line) { char *eow = sl; sl++; while (*sl && *sl !='\n') sl++; *next_line = sl; return eow; } return sl; } slash=0; } sl++; } if (sl!=words[*n]) (*n)++; if (next_line) *next_line = sl+1; return sl; } static const char *abbrev_list[] = { "GSBG", "Getting Started ", "SUBG", "Customizing SunOS", "SHBG", "Basic Troubleshooting", "SVBG", "SunView User's Guide", "MMBG", "Mail and Messages", "DMBG", "Doing More with SunOS", "UNBG", "Using the Network", "GDBG", "Games, Demos & Other Pursuits", "CHANGE", "SunOS 4.1 Release Manual", "INSTALL", "Installing SunOS 4.1", "ADMIN", "System and Network Administration", "SECUR", "Security Features Guide", "PROM", "PROM User's Manual", "DIAG", "Sun System Diagnostics", "SUNDIAG", "Sundiag User's Guide", "MANPAGES", "SunOS Reference Manual", "REFMAN", "SunOS Reference Manual", "SSI", "Sun System Introduction", "SSO", "System Services Overview", "TEXT", "Editing Text Files", "DOCS", "Formatting Documents", "TROFF", "Using nroff and troff", "INDEX", "Global Index", "CPG", "C Programmer's Guide", "CREF", "C Reference Manual", "ASSY", "Assembly Language Reference", "PUL", "Programming Utilities and Libraries", "DEBUG", "Debugging Tools", "NETP", "Network Programming", "DRIVER", "Writing Device Drivers", "STREAMS", "STREAMS Programming", "SBDK", "SBus Developer's Kit", "WDDS", "Writing Device Drivers for the SBus", "FPOINT", "Floating-Point Programmer's Guide", "SVPG", "SunView 1 Programmer's Guide", "SVSPG", "SunView 1 System Programmer's Guide", "PIXRCT", "Pixrect Reference Manual", "CGI", "SunCGI Reference Manual", "CORE", "SunCore Reference Manual", "4ASSY", "Sun-4 Assembly Language Reference", "SARCH", "SPARC Architecture Manual", "KR", "The C Programming Language", NULL, NULL }; static const char *lookup_abbrev(char *c) { int i=0; if (!c) return ""; while (abbrev_list[i] && qstrcmp(c,abbrev_list[i])) i=i+2; if (abbrev_list[i]) return abbrev_list[i+1]; else return c; } static const char *section_list[] = { #ifdef Q_OS_SOLARIS // for Solaris "1", "User Commands", "1B", "SunOS/BSD Compatibility Package Commands", "1b", "SunOS/BSD Compatibility Package Commands", "1C", "Communication Commands ", "1c", "Communication Commands", "1F", "FMLI Commands ", "1f", "FMLI Commands", "1G", "Graphics and CAD Commands ", "1g", "Graphics and CAD Commands ", "1M", "Maintenance Commands", "1m", "Maintenance Commands", "1S", "SunOS Specific Commands", "1s", "SunOS Specific Commands", "2", "System Calls", "3", "C Library Functions", "3B", "SunOS/BSD Compatibility Library Functions", "3b", "SunOS/BSD Compatibility Library Functions", "3C", "C Library Functions", "3c", "C Library Functions", "3E", "C Library Functions", "3e", "C Library Functions", "3F", "Fortran Library Routines", "3f", "Fortran Library Routines", "3G", "C Library Functions", "3g", "C Library Functions", "3I", "Wide Character Functions", "3i", "Wide Character Functions", "3K", "Kernel VM Library Functions", "3k", "Kernel VM Library Functions", "3L", "Lightweight Processes Library", "3l", "Lightweight Processes Library", "3M", "Mathematical Library", "3m", "Mathematical Library", "3N", "Network Functions", "3n", "Network Functions", "3R", "Realtime Library", "3r", "Realtime Library", "3S", "Standard I/O Functions", "3s", "Standard I/O Functions", "3T", "Threads Library", "3t", "Threads Library", "3W", "C Library Functions", "3w", "C Library Functions", "3X", "Miscellaneous Library Functions", "3x", "Miscellaneous Library Functions", "4", "File Formats", "4B", "SunOS/BSD Compatibility Package File Formats", "4b", "SunOS/BSD Compatibility Package File Formats", "5", "Headers, Tables, and Macros", "6", "Games and Demos", "7", "Special Files", "7B", "SunOS/BSD Compatibility Special Files", "7b", "SunOS/BSD Compatibility Special Files", "8", "Maintenance Procedures", "8C", "Maintenance Procedures", "8c", "Maintenance Procedures", "8S", "Maintenance Procedures", "8s", "Maintenance Procedures", "9", "DDI and DKI", "9E", "DDI and DKI Driver Entry Points", "9e", "DDI and DKI Driver Entry Points", "9F", "DDI and DKI Kernel Functions", "9f", "DDI and DKI Kernel Functions", "9S", "DDI and DKI Data Structures", "9s", "DDI and DKI Data Structures", "L", "Local Commands", #elif defined(__NetBSD__) || defined(__OpenBSD__) || defined(__FreeBSD__) || defined(__DragonFly__) "1", "General Commands", "2", "System Calls", "3", "Library Functions", "4", "Kernel Interfaces", "5", "File Formats", "6", "Games", "7", "Miscellaneous Information", "8", "System Manager's Manuals", "9", "Kernel Developer's Manuals", #else // Other OS "1", "User Commands ", "1C", "User Commands", "1G", "User Commands", "1S", "User Commands", "1V", "User Commands ", "2", "System Calls", "2V", "System Calls", "3", "C Library Functions", "3C", "Compatibility Functions", "3F", "Fortran Library Routines", "3K", "Kernel VM Library Functions", "3L", "Lightweight Processes Library", "3M", "Mathematical Library", "3N", "Network Functions", "3p", "Perl Functions", "3R", "RPC Services Library", "3S", "Standard I/O Functions", "3V", "C Library Functions", "3X", "Miscellaneous Library Functions", "4", "Devices and Network Interfaces", "4F", "Protocol Families", "4I", "Devices and Network Interfaces", "4M", "Devices and Network Interfaces", "4N", "Devices and Network Interfaces", "4P", "Protocols", "4S", "Devices and Network Interfaces", "4V", "Devices and Network Interfaces", "5", "File Formats", "5V", "File Formats", "6", "Games and Demos", "7", "Environments, Tables, and Troff Macros", "7V", "Environments, Tables, and Troff Macros", "8", "Maintenance Commands", "8C", "Maintenance Commands", "8S", "Maintenance Commands", "8V", "Maintenance Commands", "L", "Local Commands", #endif // The defaults NULL, "Misc. Reference Manual Pages", NULL, NULL }; static const char *section_name(char *c) { int i=0; if (!c) return ""; while (section_list[i] && qstrcmp(c,section_list[i])) i=i+2; if (section_list[i+1]) return section_list[i+1]; else return c; } static char *skip_till_newline(char *c) { int lvl=0; while (*c && (*c!='\n' || lvl>0)) { if (*c=='\\') { c++; if (*c=='}') lvl--; else if (*c=='{') lvl++; } c++; } if (*c) c++; if (lvl<0 && newline_for_fun) { newline_for_fun = newline_for_fun+lvl; if (newline_for_fun<0) newline_for_fun=0; } return c; } static bool s_whileloop = false; /// Processing the .while request static void request_while( char*& c, int j, bool mdoc ) { // ### TODO: .break and .continue kdDebug(7107) << "Entering .while" << endl; c += j; char* newline = skip_till_newline( c ); const char oldchar = *newline; *newline = 0; // We store the full .while stuff into a TQCString as if it would be a macro const TQCString macro = c ; kdDebug(7107) << "'Macro' of .while" << endl << macro << endl; // Prepare for continuing after .while loop end *newline = oldchar; c = newline; // Process -while loop const bool oldwhileloop = s_whileloop; s_whileloop = true; int result = true; // It must be an int due to the call to scan_expression while ( result ) { // Unlike for a normal macro, we have the condition at start, so we do not need to prepend extra bytes char* liveloop = tqstrdup( macro.data() ); kdDebug(7107) << "Scanning .while condition" << endl; kdDebug(7101) << "Loop macro " << liveloop << endl; char* end_expression = scan_expression( liveloop, &result ); kdDebug(7101) << "After " << end_expression << endl; if ( result ) { kdDebug(7107) << "New .while iteration" << endl; // The condition is true, so call the .while's content char* help = end_expression + 1; while ( *help && ( *help == ' ' || *help == '\t' ) ) ++help; if ( ! *help ) { // We have a problem, so stop .while result = false; break; } if ( mdoc ) scan_troff_mandoc( help, false, 0 ); else scan_troff( help, false, 0 ); } delete[] liveloop; } // s_whileloop = oldwhileloop; kdDebug(7107) << "Ending .while" << endl; } const int max_wordlist = 100; /// Processing mixed fonts reqiests like .BI static void request_mixed_fonts( char*& c, int j, const char* font1, const char* font2, const bool mode, const bool inFMode ) { c += j; if (*c=='\n') c++; int words; char *wordlist[max_wordlist]; fill_words(c, wordlist, &words, true, &c); for (int i=0; i s_ifelseval; // Process a (mdoc) request involving quotes static char* process_quote(char* c, int j, const char* open, const char* close) { trans_char(c,'"','\a'); c+=j; if (*c=='\n') c++; // ### TODO: why? Quote requests cannot be empty! out_html(open); c=scan_troff_mandoc(c,1,0); out_html(close); out_html(NEWLINE); if (fillout) curpos++; else curpos=0; return c; } /** * Is the char \p ch a puntuaction in sence of mdoc(7) */ static bool is_mdoc_punctuation( const char ch ) { if ( ( ch >= '0' && ch <= '9' ) || ( ch >='A' && ch <='Z' ) || ( ch >= 'a' && ch <= 'z' ) ) return false; else if ( ch == '.' || ch == ',' || ch == ';' || ch == ':' || ch == '(' || ch == ')' || ch == '[' || ch == ']' ) return true; else return false; } /** * Can the char \p c be part of an identifier * \note For groff, an identifier can consist of nearly all ASCII printable non-white-space characters * See info:/groff/Identifiers */ static bool is_identifier_char( const char c ) { if ( c >= '!' && c <= '[' ) // Include digits and upper case return true; else if ( c >= ']' && c <= '~' ) // Include lower case return true; else if ( c== '\\' ) return false; // ### TODO: it should be treated as escape instead! return false; } static TQCString scan_identifier( char*& c ) { char* h = c; // help pointer // ### TODO Groff seems to eat nearly everything as identifier name (info:/groff/Identifiers) while ( *h && *h != '\a' && *h != '\n' && is_identifier_char( *h ) ) ++h; const char tempchar = *h; *h = 0; const TQCString name = c; *h = tempchar; if ( name.isEmpty() ) { kdDebug(7107) << "EXCEPTION: identifier empty!" << endl; } c = h; return name; } static char *scan_request(char *c) { // mdoc(7) stuff static bool mandoc_synopsis=false; /* True if we are in the synopsis section */ static bool mandoc_command=false; /* True if this is mdoc(7) page */ static int mandoc_bd_options; /* Only copes with non-nested Bd's */ static int function_argument=0; // Number of function argument (.Fo, .Fa, .Fc) // man(7) stuff static bool ur_ignore=false; // Has .UR a parameter : (for .UE to know if or not to write ) int i=0; bool mode=false; char *h=0; char *wordlist[max_wordlist]; int words; char *sl; while (*c==' ' || *c=='\t') c++; // Spaces or tabs allowed between control character and request if (c[0]=='\n') return c+1; if (c[0]==escapesym) { /* some pages use .\" .\$1 .\} */ /* .\$1 is too difficult/stuppid */ if (c[1]=='$') { kdDebug(7107) << "Found .\\$" << endl; c=skip_till_newline(c); // ### TODO } else c = scan_escape(c+1); } else { int nlen = 0; TQCString macroName; while (c[nlen] && (c[nlen] != ' ') && (c[nlen] != '\t') && (c[nlen] != '\n') && (c[nlen] != escapesym)) { macroName+=c[nlen]; nlen++; } int j = nlen; while (c[j] && c[j]==' ' || c[j]=='\t') j++; /* search macro database of self-defined macros */ TQMap::iterator it=s_stringDefinitionMap.find(macroName); if (it!=s_stringDefinitionMap.end()) { kdDebug(7107) << "CALLING MACRO: " << macroName << endl; const TQCString oldDollarZero = s_dollarZero; // Previous value of $0 s_dollarZero = macroName; sl=fill_words(c+j, wordlist, &words, true, &c); *sl='\0'; for (i=1;i oldArgumentList( s_argumentList ); s_argumentList.clear(); for ( i = 0 ; i < max_wordlist; i++ ) { if (!wordlist[i]) break; s_argumentList.push_back( wordlist[i] ); } const int onff=newline_for_fun; if (mandoc_command) scan_troff_mandoc( work + 1, 0, NULL ); else scan_troff( work + 1, 0, NULL); delete[] work; newline_for_fun=onff; s_argumentList = oldArgumentList; } for (i=0; i::iterator it=s_stringDefinitionMap.find(name); if (it==s_stringDefinitionMap.end()) { StringDefinition def; def.m_length=0; def.m_output=result; s_stringDefinitionMap.insert(name,def); } else { (*it).m_length=0; (*it).m_output=result; } delete[] result; if (*c) *c='.'; c=skip_till_newline(c); kdDebug(7107) << "end .di" << endl; break; } case REQ_ds: // groff(7) "Define String variable" mode=true; case REQ_as: // groff (7) "Append String variable" { kdDebug(7107) << "start .ds/.as" << endl; int oldcurpos=curpos; c+=j; const TQCString name( scan_identifier( c) ); if ( name.isEmpty() ) break; while (*c && isspace(*c)) c++; if (*c && *c=='"') c++; single_escape=true; curpos=0; char* result=0; c=scan_troff(c,1,&result); TQMap::iterator it=s_stringDefinitionMap.find(name); if (it==s_stringDefinitionMap.end()) { StringDefinition def; def.m_length=curpos; def.m_output=result; s_stringDefinitionMap.insert(name,def); } else { if (mode) { // .ds Defining String (*it).m_length=curpos; (*it).m_output=result; } else { // .as Appending String (*it).m_length+=curpos; (*it).m_output+=result; } } delete[] result; single_escape=false; curpos=oldcurpos; kdDebug(7107) << "end .ds/.as" << endl; break; } case REQ_br: // groff(7) "line BReak" { if (still_dd) out_html("

"); // ### VERIFY (does not look like generating good HTML) else out_html("
\n"); curpos=0; c=c+j; if (c[0]==escapesym) c=scan_escape(c+1); c=skip_till_newline(c); break; } case REQ_c2: // groff(7) "reset non-break Control character" (2 means non-break) { c=c+j; if (*c!='\n') nobreaksym=*c; else nobreaksym='\''; c=skip_till_newline(c); break; } case REQ_cc: // groff(7) "reset Control Character" { c=c+j; if (*c!='\n') controlsym=*c; else controlsym='.'; c=skip_till_newline(c); break; } case REQ_ce: // groff (7) "CEnter" { c=c+j; if (*c=='\n') i=1; else { i=0; while ('0'<=*c && *c<='9') { i=i*10+*c-'0'; c++; } } c=skip_till_newline(c); /* center next i lines */ if (i>0) { out_html("\n"); while (i && *c) { char *line=NULL; c=scan_troff(c,1, &line); if (line && tqstrncmp(line, "
", 4)) { out_html(line); out_html("
\n"); delete [] line; // ### FIXME: memory leak! i--; } } out_html("\n"); curpos=0; } break; } case REQ_ec: // groff(7) "reset Escape Character" { c=c+j; if (*c!='\n') escapesym=*c; else escapesym='\\'; break; c=skip_till_newline(c); } case REQ_eo: // groff(7) "turn Escape character Off" { escapesym='\0'; c=skip_till_newline(c); break; } case REQ_ex: // groff(7) "EXit" { return 0; break; } case REQ_fc: // groff(7) "set Field and pad Character" { c=c+j; if (*c=='\n') fieldsym=padsym='\0'; else { fieldsym=c[0]; padsym=c[1]; } c=skip_till_newline(c); break; } case REQ_fi: // groff(7) "FIll" { if (!fillout) { out_html(set_font("R")); out_html(change_to_size('0')); out_html("

\n"); } curpos=0; fillout=0; c=skip_till_newline(c); break; } case REQ_ps: // groff(7) "previous Point Size" { c=c+j; if (*c=='\n') out_html(change_to_size('0')); else { j=0; i=0; if (*c=='-') { j= -1; c++; } else if (*c=='+') j=1;c++; c=scan_expression(c, &i); if (!j) { j=1; if (i>5) i=i-10; } out_html(change_to_size(i*j)); } c=skip_till_newline(c); break; } case REQ_sp: // groff(7) "SKip one line" { c=c+j; if (fillout) out_html("

"); else { out_html(NEWLINE); } curpos=0; c=skip_till_newline(c); break; } case REQ_so: // groff(7) "Include SOurce file" { char *buf; char *name=NULL; curpos=0; c=c+j; if (*c=='/') h=c; else { h=c-3; h[0]='.'; h[1]='.'; h[2]='/'; } while (*c!='\n') c++; *c='\0'; scan_troff(h,1, &name); if (name[3]=='/') h=name+3; else h=name; /* this works alright, except for section 3 */ buf=read_man_page(h); if (!buf) { kdDebug(7107) << "Unable to open or read file: .so " << (h) << endl; out_html("

" "man2html: unable to open or read file.\n"); out_html(h); out_html("

\n"); } else scan_troff(buf+1,0,NULL); delete [] buf; delete [] name; *c++='\n'; break; } case REQ_ta: // gorff(7) "set TAbulators" { c=c+j; j=0; while (*c!='\n') { sl=scan_expression(c, &tabstops[j]); if (j>0 && (*c=='-' || *c=='+')) tabstops[j]+=tabstops[j-1]; c=sl; while (*c==' ' || *c=='\t') c++; j++; } maxtstop=j; curpos=0; break; } case REQ_ti: // groff(7) "Temporary Indent" { /*while (itemdepth || dl_set[itemdepth]) { out_html("\n"); if (dl_set[itemdepth]) dl_set[itemdepth]=0; else itemdepth--; }*/ out_html("
\n"); c=c+j; c=scan_expression(c, &j); for (i=0; i"); }; out_html(set_font("R")); out_html(NEWLINE); if (!fillout) curpos=0; else curpos++; break; } case REQ_Fn: // mdoc(7) for "Function calls" { // brackets and commas have to be inserted automatically c+=j; if (*c=='\n') c++; sl=fill_words(c, wordlist, &words, true, &c); if ( words ) { for (i=0; i"); out_html(NEWLINE); if (!fillout) curpos=0; else curpos++; break; } case REQ_Fo: // mdoc(7) "Function definition Opening" { const char* font[2] = { "B", "R" }; c+=j; if (*c=='\n') c++; char *eol=strchr(c,'\n'); char *semicolon=strchr(c,';'); if ((semicolon!=0) && (semicolon 0 out_html(set_font("R")); out_html(NEWLINE); if (!fillout) curpos=0; else curpos++; break; } case REQ_Fc:// mdoc(7) "Function definition Close" { // .Fc has no parameter c+=j; c=skip_till_newline(c); const char* font[2] = { "B", "R" }; out_html(set_font(font[i&1])); out_html(")"); out_html(set_font("R")); if (mandoc_synopsis) out_html("
"); out_html(NEWLINE); if (!fillout) curpos=0; else curpos++; function_argument=0; // Reset the count variable break; } case REQ_Fa: // mdoc(7) "Function definition argument" { const char* font[2] = { "B", "R" }; c+=j; if (*c=='\n') c++; sl=fill_words(c, wordlist, &words, true, &c); out_html(set_font(font[i&1])); // function_argument==0 means that we had no .Fo before, e.g. in mdoc.samples(7) if (function_argument > 1) { out_html(", "); curpos+=2; function_argument++; } else if (function_argument==1) { // We are only at the first parameter function_argument++; } for (i=0; ia b ] */ mode=true; out_html(set_font("R")); out_html("["); curpos++; request_mixed_fonts( c, j, "B", "I", true, false ); break; // Do not break! } case REQ_Ft: //perhaps "Function return type" { request_mixed_fonts( c, j, "B", "I", false, true ); break; } case REQ_BR: { request_mixed_fonts( c, j, "B", "R", false, false ); break; } case REQ_BI: { request_mixed_fonts( c, j, "B", "I", false, false ); break; } case REQ_IB: { request_mixed_fonts( c, j, "I", "B", false, false ); break; } case REQ_IR: { request_mixed_fonts( c, j, "I", "R", false, false ); break; } case REQ_RB: { request_mixed_fonts( c, j, "R", "B", false, false ); break; } case REQ_RI: { request_mixed_fonts( c, j, "R", "I", false, false ); break; } case REQ_DT: // man(7) "Default Tabulators" { for (j=0;j<20; j++) tabstops[j]=(j+1)*8; maxtstop=20; c=skip_till_newline(c); break; } case REQ_IP: // man(7) "Ident Paragraph" { sl=fill_words(c+j, wordlist, &words, true, &c); if (!dl_set[itemdepth]) { out_html("

"); if (words) scan_troff(wordlist[0], 1,NULL); out_html("

"); curpos=0; break; } case REQ_TP: // man(7) "hanging Tag Paragraph" { if (!dl_set[itemdepth]) { out_html("

"); c=skip_till_newline(c); /* somewhere a definition ends with '.TP' */ if (!*c) still_dd=true; else { // HACK for proc(5) while (c[0]=='.' && c[1]=='\\' && c[2]=='\"') { // We have a comment, so skip the line c=skip_till_newline(c); } c=scan_troff(c,1,NULL); out_html(": "); } curpos=0; break; } case REQ_IX: // "INdex" ### TODO: where is it defined? { /* general index */ c=skip_till_newline(c); break; } case REQ_P: // man(7) "Paragraph" case REQ_LP:// man(7) "Paragraph" case REQ_PP:// man(7) "Paragraph; reset Prevailing indent" { if (dl_set[itemdepth]) { out_html("

\n"); dl_set[itemdepth]=0; } if (fillout) out_html("

\n"); else { out_html(NEWLINE); } curpos=0; c=skip_till_newline(c); break; } case REQ_HP: // man(7) "Hanging indent Paragraph" { if (!dl_set[itemdepth]) { out_html("

\n"); still_dd=true; c=skip_till_newline(c); curpos=0; break; } case REQ_PD: // man(7) "Paragraph Distance" { c=skip_till_newline(c); break; } case REQ_Rs: // mdoc(7) "Relative margin Start" case REQ_RS: // man(7) "Relative margin Start" { sl=fill_words(c+j, wordlist, &words, true, 0); j=1; if (words>0) scan_expression(wordlist[0], &j); if (j>=0) { itemdepth++; dl_set[itemdepth]=0; out_html(" "); c=skip_till_newline(c); curpos=0; break; } } case REQ_Re: // mdoc(7) "Relative margin End" case REQ_RE: // man(7) "Relative margin End" { if (itemdepth > 0) { if (dl_set[itemdepth]) out_html(" "); out_html("

\n"); itemdepth--; } c=skip_till_newline(c); curpos=0; break; } case REQ_SB: // man(7) "Small; Bold" { out_html(set_font("B")); out_html(""); trans_char(c,'"','\a'); // ### VERIFY c=scan_troff(c+j, 1, NULL); out_html(""); out_html(set_font("R")); break; } case REQ_SM: // man(7) "SMall" { c=c+j; if (*c=='\n') c++; out_html(""); trans_char(c,'"','\a'); // ### VERIFY c=scan_troff(c,1,NULL); out_html(""); break; } case REQ_Ss: // mdoc(7) "Sub Section" mandoc_command = 1; case REQ_SS: // mdoc(7) "Sub Section" mode=true; case REQ_Sh: // mdoc(7) "Sub Header" /* hack for fallthru from above */ mandoc_command = !mode || mandoc_command; case REQ_SH: // man(7) "Sub Header" { c=c+j; if (*c=='\n') c++; while (itemdepth || dl_set[itemdepth]) { out_html("

\n"); if (dl_set[itemdepth]) dl_set[itemdepth]=0; else if (itemdepth > 0) itemdepth--; } out_html(set_font("R")); out_html(change_to_size(0)); if (!fillout) { fillout=1; out_html("

"); mandoc_synopsis = tqstrncmp(c, "SYNOPSIS", 8) == 0; c = mandoc_command ? scan_troff_mandoc(c,1,NULL) : scan_troff(c,1,NULL); if (mode) out_html("

\n"); section=1; curpos=0; break; } case REQ_Sx: // mdoc(7) { // reference to a section header out_html(set_font("B")); trans_char(c,'"','\a'); c=c+j; if (*c=='\n') c++; c=scan_troff(c, 1, NULL); out_html(set_font("R")); out_html(NEWLINE); if (fillout) curpos++; else curpos=0; break; } case REQ_TS: // ### TODO where is it defined? (tbl?) { c=scan_table(c); break; } case REQ_Dt: /* mdoc(7) */ mandoc_command = true; case REQ_TH: // man(7) "Title Header" { if (!output_possible) { sl = fill_words(c+j, wordlist, &words, true, &c); // ### TODO: the page should be displayed even if it is "anonymous" (words==0) if (words>=1) { for (i=1; i\n\n"); #ifdef SIMPLE_MAN2HTML // Most English man pages are in ISO-8859-1 out_html("\n"); #else // tdeio_man transforms from local to UTF-8 out_html("\n"); #endif out_html(""); out_html(scan_troff(wordlist[0], 0, NULL)); out_html( " Manpage\n"); out_html( "\n" ); out_html( "\n"); out_html( "\n\n" ); out_html("\n\n" ); out_html("

\n" ); out_html("

\n"); out_html(" $\"Top$ \n"); out_html("

\n"); out_html("

\n"); out_html(" $\"Top$ \n"); out_html("

\n"); out_html("

\n"); out_html( scan_troff(wordlist[0], 0, NULL ) ); out_html("

\n"); out_html("

" ); out_html( scan_troff(wordlist[0], 0, NULL ) ); out_html( "

\n" ); if (words>1) { out_html("Section: " ); if (!mandoc_command && words>4) out_html(scan_troff(wordlist[4], 0, NULL) ); else out_html(section_name(wordlist[1])); out_html(" ("); out_html(scan_troff(wordlist[1], 0, NULL)); out_html(")\n"); } else { out_html("Section not specified"); } *sl='\n'; } } else { kdWarning(7107) << ".TH found but output not possible" << endl; c=skip_till_newline(c); } curpos=0; break; } case REQ_TX: // mdoc(7) { sl=fill_words(c+j, wordlist, &words, true, &c); *sl='\0'; out_html(set_font("I")); if (words>1) wordlist[1][-1]='\0'; const char *c2=lookup_abbrev(wordlist[0]); curpos+=tqstrlen(c2); out_html(c2); out_html(set_font("R")); if (words>1) out_html(wordlist[1]); *sl='\n'; break; } case REQ_rm: // groff(7) "ReMove" /* .rm xx : Remove request, macro or string */ mode=true; case REQ_rn: // groff(7) "ReName" /* .rn xx yy : Rename request, macro or string xx to yy */ { kdDebug(7107) << "start .rm/.rn" << endl; c+=j; const TQCString name( scan_identifier( c ) ); if ( name.isEmpty() ) { kdDebug(7107) << "EXCEPTION: empty origin string to remove/rename: " << endl; break; } TQCString name2; if ( !mode ) { while (*c && isspace(*c) && *c!='\n') ++c; name2 = scan_identifier( c ); if ( name2.isEmpty() ) { kdDebug(7107) << "EXCEPTION: empty destination string to rename: " << endl; break; } } c=skip_till_newline(c); TQMap::iterator it=s_stringDefinitionMap.find(name); if (it==s_stringDefinitionMap.end()) { kdDebug(7107) << "EXCEPTION: cannot find string to rename or remove: " << name << endl; } else { if (mode) { // .rm ReMove s_stringDefinitionMap.remove(name); } else { // .rn ReName StringDefinition def=(*it); s_stringDefinitionMap.remove(name); s_stringDefinitionMap.insert(name2,def); } } kdDebug(7107) << "end .rm/.rn" << endl; break; } case REQ_nx: // ### TODO in man(7) it is "No filling", not "next file" /* .nx filename : next file. */ case REQ_in: // groff(7) "INdent" { /* .in +-N : Indent */ c=skip_till_newline(c); break; } case REQ_nr: // groff(7) "Number Register" { kdDebug(7107) << "start .nr" << endl; c += j; const TQCString name( scan_identifier( c ) ); if ( name.isEmpty() ) { kdDebug(7107) << "EXCEPTION: empty name for register variable" << endl; break; } while ( *c && ( *c==' ' || *c=='\t' ) ) c++; int sign = 0; if ( *c && ( *c == '+' || *c == '-' ) ) { if ( *c == '+' ) sign = 1; else if ( *c == '-' ) sign = -1; } int value = 0; int increment = 0; c=scan_expression( c, &value ); if ( *c && *c!='\n') { while ( *c && ( *c==' ' || *c=='\t' ) ) c++; c=scan_expression( c, &increment ); } c = skip_till_newline( c ); TQMap ::iterator it = s_numberDefinitionMap.find( name ); if ( it == s_numberDefinitionMap.end() ) { if ( sign < 1 ) value = -value; NumberDefinition def( value, increment ); s_numberDefinitionMap.insert( name, def ); } else { if ( sign > 0 ) (*it).m_value += value; else if ( sign < 0 ) (*it).m_value += - value; else (*it).m_value = value; (*it).m_increment = increment; } kdDebug(7107) << "end .nr" << endl; break; } case REQ_am: // groff(7) "Append Macro" /* .am xx yy : append to a macro. */ /* define or handle as .ig yy */ mode=true; case REQ_de: // groff(7) "DEfine macro" /* .de xx yy : define or redefine macro xx; end at .yy (..) */ /* define or handle as .ig yy */ { kdDebug(7107) << "Start .am/.de" << endl; c+=j; char *next_line; sl = fill_words(c, wordlist, &words, true, &next_line); char *nameStart = wordlist[0]; c = nameStart; while (*c && (*c != ' ') && (*c != '\n')) c++; *c = '\0'; const TQCString name(nameStart); TQCString endmacro; if (words == 1) { endmacro=".."; } else { endmacro='.'; c = wordlist[1]; while (*c && (*c != ' ') && (*c != '\n')) endmacro+=*c++; } c = next_line; sl=c; const int length=tqstrlen(endmacro); while (*c && tqstrncmp(c,endmacro,length)) c=skip_till_newline(c); TQCString macro; while (sl!=c) { if (sl[0]=='\\' && sl[1]=='\\') { macro+='\\'; sl++; } else macro+=*sl; sl++; } TQMap::iterator it=s_stringDefinitionMap.find(name); if (it==s_stringDefinitionMap.end()) { StringDefinition def; def.m_length=0; def.m_output=macro; s_stringDefinitionMap.insert(name,def); } else if (mode) { // .am Append Macro (*it).m_length=0; // It could be formerly a string // if ((*it).m_output.right(1)!='\n') if (*((*it).m_output.right(1).data())!='\n') (*it).m_output+='\n'; (*it).m_output+=macro; } else { // .de DEfine macro (*it).m_length=0; // It could be formerly a string (*it).m_output=macro; } c=skip_till_newline(c); kdDebug(7107) << "End .am/.de" << endl; break; } case REQ_Bl: // mdoc(7) "Begin List" { char list_options[NULL_TERMINATED(MED_STR_MAX)]; char *nl = strchr(c,'\n'); c=c+j; if (dl_set[itemdepth]) /* These things can nest. */ itemdepth++; if (nl) { /* Parse list options */ strlimitcpy(list_options, c, nl - c, MED_STR_MAX); } if (strstr(list_options, "-bullet")) { /* HTML Unnumbered List */ dl_set[itemdepth] = BL_BULLET_LIST; out_html("

\n"); } if (fillout) out_html("

\n"); else { out_html(NEWLINE); } curpos=0; c=skip_till_newline(c); break; } case REQ_El: // mdoc(7) "End List" { c=c+j; if (dl_set[itemdepth] & BL_DESC_LIST) out_html("

\n"); else if (dl_set[itemdepth] & BL_ENUM_LIST) out_html("\n"); dl_set[itemdepth]=0; if (itemdepth > 0) itemdepth--; if (fillout) out_html("

\n"); else { out_html(NEWLINE); } curpos=0; c=skip_till_newline(c); break; } case REQ_It: // mdoc(7) "list ITem" { c=c+j; if (tqstrncmp(c, "Xo", 2) == 0 && isspace(*(c+2))) c = skip_till_newline(c); if (dl_set[itemdepth] & BL_DESC_LIST) { out_html("

"); out_html(set_font("B")); if (*c=='\n') { /* Don't allow embedded comms after a newline */ c++; c=scan_troff(c,1,NULL); } else { /* Do allow embedded comms on the same line. */ c=scan_troff_mandoc(c,1,NULL); } out_html(set_font("R")); out_html(NEWLINE); out_html("

"); } else if (dl_set[itemdepth] & (BL_BULLET_LIST | BL_ENUM_LIST)) { out_html("

"); c=scan_troff_mandoc(c,1,NULL); out_html(NEWLINE); } if (fillout) curpos++; else curpos=0; break; } case REQ_Bk: /* mdoc(7) */ case REQ_Ek: /* mdoc(7) */ case REQ_Dd: /* mdoc(7) */ case REQ_Os: // mdoc(7) "Operating System" { trans_char(c,'"','\a'); c=c+j; if (*c=='\n') c++; c=scan_troff_mandoc(c, 1, NULL); out_html(NEWLINE); if (fillout) curpos++; else curpos=0; break; } case REQ_Bt: // mdoc(7) "Beta Test" { trans_char(c,'"','\a'); c=c+j; out_html(" is currently in beta test."); if (fillout) curpos++; else curpos=0; break; } case REQ_At: /* mdoc(7) */ case REQ_Fx: /* mdoc(7) */ case REQ_Nx: /* mdoc(7) */ case REQ_Ox: /* mdoc(7) */ case REQ_Bx: /* mdoc(7) */ case REQ_Ux: /* mdoc(7) */ case REQ_Dx: /* mdoc(7) */ { bool parsable=true; trans_char(c,'"','\a'); c=c+j; if (*c=='\n') c++; if (request==REQ_At) { out_html("AT&T UNIX "); parsable=false; } else if (request==REQ_Fx) { out_html("FreeBSD "); parsable=false; } else if (request==REQ_Nx) out_html("NetBSD "); else if (request==REQ_Ox) out_html("OpenBSD "); else if (request==REQ_Bx) out_html("BSD "); else if (request==REQ_Ux) out_html("UNIX "); else if (request==REQ_Dx) out_html("DragonFly "); if (parsable) c=scan_troff_mandoc(c,1,0); else c=scan_troff(c,1,0); if (fillout) curpos++; else curpos=0; break; } case REQ_Dl: /* mdoc(7) */ { c=c+j; out_html(NEWLINE); out_html("

"); if (*c=='\n') c++; c=scan_troff_mandoc(c, 1, NULL); out_html("

"); if (fillout) curpos++; else curpos=0; break; } case REQ_Bd: /* mdoc(7) */ { /* Seems like a kind of example/literal mode */ char bd_options[NULL_TERMINATED(MED_STR_MAX)]; char *nl = strchr(c,'\n'); c=c+j; if (nl) strlimitcpy(bd_options, c, nl - c, MED_STR_MAX); out_html(NEWLINE); mandoc_bd_options = 0; /* Remember options for terminating Bl */ if (strstr(bd_options, "-offset indent")) { mandoc_bd_options |= BD_INDENT; out_html("

\n"); } if ( strstr(bd_options, "-literal") || strstr(bd_options, "-unfilled")) { if (fillout) { mandoc_bd_options |= BD_LITERAL; out_html(set_font("R")); out_html(change_to_size('0')); out_html("
\n");
                        }
                        curpos=0;
                        fillout=0;
                    }
                    c=skip_till_newline(c);
                    break;
                }
                case REQ_Ed:	/* mdoc(7) */
                {
                    if (mandoc_bd_options & BD_LITERAL)
                    {
                        if (!fillout)
                        {
                            out_html(set_font("R"));
                            out_html(change_to_size('0'));
                            out_html("
\n"); } } if (mandoc_bd_options & BD_INDENT) out_html("

"); curpos=0; still_dd=false; } switch (*h) { case '&': intbuff[ibp++]='&'; intbuff[ibp++]='a'; intbuff[ibp++]='m'; intbuff[ibp++]='p'; intbuff[ibp++]=';'; curpos++; break; case '<': intbuff[ibp++]='&'; intbuff[ibp++]='l'; intbuff[ibp++]='t'; intbuff[ibp++]=';'; curpos++; break; case '>': intbuff[ibp++]='&'; intbuff[ibp++]='g'; intbuff[ibp++]='t'; intbuff[ibp++]=';'; curpos++; break; case '"': intbuff[ibp++]='&'; intbuff[ibp++]='q'; intbuff[ibp++]='u'; intbuff[ibp++]='o'; intbuff[ibp++]='t'; intbuff[ibp++]=';'; curpos++; break; case '\n': if (h != c && h[-1]=='\n' && fillout) { intbuff[ibp++]='<'; intbuff[ibp++]='P'; intbuff[ibp++]='>'; } if (contained_tab && fillout) { intbuff[ibp++]='<'; intbuff[ibp++]='B'; intbuff[ibp++]='R'; intbuff[ibp++]='>'; } contained_tab=0; curpos=0; usenbsp=0; intbuff[ibp++]='\n'; break; case '\t': { int curtab=0; contained_tab=1; FLUSHIBP; /* like a typewriter, not like TeX */ tabstops[19]=curpos+1; while (curtab480) { FLUSHIBP; } curpos++; } } else { out_html(""); while (curpos"); } } } break; default: if (*h==' ' && (h[-1]=='\n' || usenbsp)) { FLUSHIBP; if (!usenbsp && fillout) { out_html(" "); curpos=0; } usenbsp=fillout; if (usenbsp) out_html(" "); else intbuff[ibp++]=' '; } else if (*h>31 && *h<127) intbuff[ibp++]=*h; else if (((unsigned char)(*h))>127) { intbuff[ibp++]=*h; } curpos++; break; } if (ibp > (MED_STR_MAX - 20)) FLUSHIBP; h++; } } FLUSHIBP; if (buffer) buffer[buffpos]='\0'; if (san && h && *h) h++; newline_for_fun=exnewline_for_fun; if (result) { *result = buffer; buffer=exbuffer; buffpos=exbuffpos; buffmax=exbuffmax; scaninbuff=exscaninbuff; } return h; } static char *scan_troff_mandoc(char *c, bool san, char **result) { char *ret; char *end = c; bool oldval = mandoc_line; mandoc_line = true; while (*end && *end != '\n') { end++; } if (end >= c + 2 && ispunct(*(end - 1)) && isspace(*(end - 2)) && *(end - 2) != '\n') { /* Don't format lonely punctuation E.g. in "xyz ," format * the xyz and then append the comma removing the space. */ *(end - 2) = 0; (void)scan_troff(c, 0, result); ret = end-2; *(end-2)=*(end-1); *(end-1)=' '; } else { ret = scan_troff(c, san, result); } mandoc_line = oldval; return ret; } // Entry point void scan_man_page(const char *man_page) { if (!man_page) return; kdDebug(7107) << "Start scanning man page" << endl; // ## Do more init // Unlike man2html, we actually call this several times, hence the need to // properly cleanup all those static vars s_ifelseval.clear(); s_characterDefinitionMap.clear(); InitCharacterDefinitions(); s_stringDefinitionMap.clear(); InitStringDefinitions(); s_numberDefinitionMap.clear(); InitNumberDefinitions(); s_argumentList.clear(); section = 0; s_dollarZero = ""; // No macro called yet! output_possible = false; int strLength = tqstrlen(man_page); char *buf = new char[strLength + 2]; qstrcpy(buf+1, man_page); buf[0] = '\n'; kdDebug(7107) << "Parse man page" << endl; scan_troff(buf+1,0,NULL); kdDebug(7107) << "Man page parsed!" << endl; while (itemdepth || dl_set[itemdepth]) { out_html("\n"); if (dl_set[itemdepth]) dl_set[itemdepth]=0; else if (itemdepth > 0) itemdepth--; } out_html(set_font("R")); out_html(change_to_size(0)); if (!fillout) { fillout=1; out_html(""); } out_html(NEWLINE); if (section) { output_real("\n"); section = 0; } if (output_possible) { output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n"); output_real("\n\n"); } delete [] buf; // Release memory s_characterDefinitionMap.clear(); s_stringDefinitionMap.clear(); s_numberDefinitionMap.clear(); s_argumentList.clear(); // reinit static variables for reuse delete [] buffer; buffer = 0; escapesym='\\'; nobreaksym='\''; controlsym='.'; fieldsym=0; padsym=0; buffpos=0; buffmax=0; scaninbuff=false; itemdepth=0; for (int i = 0; i < 20; i++) dl_set[i] = 0; still_dd=false; for (int i = 0; i < 12; i++) tabstops[i] = (i+1)*8; maxtstop=12; curpos=0; mandoc_name_count = 0; } #ifdef SIMPLE_MAN2HTML void output_real(const char *insert) { cout << insert; } char *read_man_page(const char *filename) { int man_pipe = 0; char *man_buf = NULL; FILE *man_stream = NULL; struct stat stbuf; size_t buf_size; if (stat(filename, &stbuf) == -1) { std::cerr << "read_man_page: can't find " << filename << endl; return NULL; } if (!S_ISREG(stbuf.st_mode)) { std::cerr << "read_man_page: no file " << filename << endl; return NULL; } buf_size = stbuf.st_size; man_buf = stralloc(buf_size+5); man_pipe = 0; man_stream = fopen(filename, "r"); if (man_stream) { man_buf[0] = '\n'; if (fread(man_buf+1, 1, buf_size, man_stream) == buf_size) { man_buf[buf_size] = '\n'; man_buf[buf_size + 1] = man_buf[buf_size + 2] = '\0'; } else { man_buf = NULL; } fclose(man_stream); } return man_buf; } int main(int argc, char **argv) { htmlPath = "."; cssPath = "."; if (argc < 2) { std::cerr << "call: " << argv[0] << " \n"; return 1; } if (chdir(argv[1])) { char *buf = read_man_page(argv[1]); if (buf) { scan_man_page(buf); delete [] buf; } } else { DIR *dir = opendir("."); struct dirent *ent; while ((ent = readdir(dir)) != NULL) { cerr << "converting " << ent->d_name << endl; char *buf = read_man_page(ent->d_name); if (buf) { scan_man_page(buf); delete [] buf; } } closedir(dir); } return 0; } #endif

"); else out_html("\n

"); mandoc_synopsis = tqstrncmp(c, "SYNOPSIS", 8) == 0; c = mandoc_command ? scan_troff_mandoc(c,1,NULL) : scan_troff(c,1,NULL); if (mode) out_html("

" ); out_html( scan_troff(wordlist[0], 0, NULL ) ); out_html( "