comparison src/org/nwoca/ssdt/tools/html2wiki/Html2Wiki.java @ 15:494ca5643e1a

Adjust the h2 transformer to handle headings with attributes, and add a transformer that removes the empty contents table left over from the conversion of the manuals.
author ferrall@nwoca.org
date Mon, 07 Feb 2011 11:44:10 -0500
parents c8442e0eff84
children 001e43423d5d
comparison
equal deleted inserted replaced
14:c8442e0eff84 15:494ca5643e1a
40 transformers.add(new DeleteTransformer("(?m)<br>$")); 40 transformers.add(new DeleteTransformer("(?m)<br>$"));
41 transformers.add(new DeleteTransformer("<caption>.*</caption>")); // remove SDML captions (used for TOC) 41 transformers.add(new DeleteTransformer("<caption>.*</caption>")); // remove SDML captions (used for TOC)
42 transformers.add(new DeleteTransformer("<font .*?>|</font>")); 42 transformers.add(new DeleteTransformer("<font .*?>|</font>"));
43 transformers.add(new CloseTagTransformer("<li>","(\n|\r)*(<li>|</ul>|</ol>|<ul>|<ol>)","</li>")); 43 transformers.add(new CloseTagTransformer("<li>","(\n|\r)*(<li>|</ul>|</ol>|<ul>|<ol>)","</li>"));
44 transformers.add(new BadTableDataTransformer()); 44 transformers.add(new BadTableDataTransformer());
45 transformers.add(new BadTableRowTransformer()); 45 transformers.add(new BadTableRowTransformer());
46 transformers.add(new ReflowTransformer()); 46 transformers.add(new ReflowTransformer());
47 transformers.add(new DeleteTransformer("<p>")); 47 transformers.add(new DeleteTransformer("<p>"));
48 transformers.add(new ReplaceTransformer("\\{","\\{")); // Escape braces 48 transformers.add(new ReplaceTransformer("\\{","\\{")); // Escape braces
49 transformers.add(new ReplaceTransformer("\\}","\\}")); 49 transformers.add(new ReplaceTransformer("\\}","\\}"));
50 50
51 transformers.add(new ReplaceTransformer("\\[","\\[")); // Escape brackets 51 transformers.add(new ReplaceTransformer("\\[","\\[")); // Escape brackets
52 transformers.add(new ReplaceTransformer("\\]","\\]")); 52 transformers.add(new ReplaceTransformer("\\]","\\]"));
73 transformers.add(new TagTransformer("<em>(.*?)</em>", "*","*")); 73 transformers.add(new TagTransformer("<em>(.*?)</em>", "*","*"));
74 transformers.add(new TagTransformer("<strong>(.*?)</strong>", true, "*","*")); 74 transformers.add(new TagTransformer("<strong>(.*?)</strong>", true, "*","*"));
75 transformers.add(new TagTransformer("<u>(.*?)</u>" , "+","+")); 75 transformers.add(new TagTransformer("<u>(.*?)</u>" , "+","+"));
76 transformers.add(new TagTransformer("(?s)<kbd>(.*?)</kbd>", "{{", "}}")); 76 transformers.add(new TagTransformer("(?s)<kbd>(.*?)</kbd>", "{{", "}}"));
77 transformers.add(new TagTransformer("<h1>(.*)</h1>", "h1. ", "")); 77 transformers.add(new TagTransformer("<h1>(.*)</h1>", "h1. ", ""));
78 transformers.add(new TagTransformer("<h2>(.*)</h2>", "h2. ", "")); 78 transformers.add(new TagTransformer("<h2.*>(.*)</h2>", "h2. ", ""));
79 transformers.add(new TagTransformer("<h3>(accessing the program|sample run|sample screens?|sample reports?)</[h|H]3>","h3.", "")); 79 transformers.add(new TagTransformer("<h3>(accessing the program|sample run|sample screens?|sample reports?)</[h|H]3>","h3.", ""));
80 transformers.add(new TagTransformer("<h3>(.*)</H3>", "h3. ", "")); 80 transformers.add(new TagTransformer("<h3>(.*)</H3>", "h3. ", ""));
81 transformers.add(new TagTransformer("<h3>(.*)</h3>", "h3. ", "")); 81 transformers.add(new TagTransformer("<h3>(.*)</h3>", "h3. ", ""));
82 transformers.add(new TagTransformer("<h4>(.*)</h4>", "h4. ", "")); 82 transformers.add(new TagTransformer("<h4>(.*)</h4>", "h4. ", ""));
83 transformers.add(new TagTransformer("<h5>(.*)</h5>", "h5. ", "")); 83 transformers.add(new TagTransformer("<h5>(.*)</h5>", "h5. ", ""));
107 transformers.add(new ReplaceTransformer("&gt;",">")); 107 transformers.add(new ReplaceTransformer("&gt;",">"));
108 transformers.add(new ReplaceTransformer("&quot;","\"")); 108 transformers.add(new ReplaceTransformer("&quot;","\""));
109 transformers.add(new ReplaceTransformer("&amp;","&")); 109 transformers.add(new ReplaceTransformer("&amp;","&"));
110 transformers.add(new ReplaceTransformer(":\\)",": )")); // No smilies... 110 transformers.add(new ReplaceTransformer(":\\)",": )")); // No smilies...
111 transformers.add(new ReplaceTransformer("(\\w)(--)(\\w)"," -- ",2)); // avoid strikeout 111 transformers.add(new ReplaceTransformer("(\\w)(--)(\\w)"," -- ",2)); // avoid strikeout
112 transformers.add(new ReplaceTransformer("\\{table(.*?)\\}\\n\\s{2}\\{tr\\}\\n\\s{4}\\{td\\}Contents\\{td\\}\\n\\s{2}\\{tr\\}\\n\\{table\\}","")); // remove "contents" table
112 113
113 } 114 }
114 115
115 /** 116 /**
116 * @param args the command line arguments 117 * @param args the command line arguments