/**
* Main class of Stand-alone version of WebHelpIndexer
*
- * User: Kasun Gajasinghe, University of Moratuwa, http://kasunbg.blogspot.com
+ * User: Kasun Gajasinghe, University of Moratuwa, http://kasunbg.org
* Date: Feb 10, 2011
*
- * @author Kasun Gajasinghe
+ * @author Kasun Gajasinghe, University of Moratuwa, http://kasunbg.org
*/
public class IndexerMain {
private String outputDir = null;
private String projectDir = null;
- // ANT parameters
+ // two of the input parameters
public String htmlDir = null;
public String indexerLanguage = "en";
setHtmlDir(htmlDir);
setIndexerLanguage(indexerLanguage);
}
-
+
/**
* The content language defaults to English "en"
*
System.getProperty("tocFile")
);
} else {
- throw new RuntimeException("Specify at least the the directory containing html files (htmlDir)\n " +
+ throw new RuntimeException("Specify at least the directory containing html files (htmlDir)\n " +
"ex: java -jar webhelpindexer.jar -DhtmlDir=docs/content -DindexerLanguage=en \n" +
"The program will exit now."
);
}
/**
- * Implementation of the execute function (Task interface)
+ * The main execution happens here.
*/
public void execute() {
+
+/*
+ //These system properties are set via command-line/ant-script now. See xsl/webhelp/build.xml#index target for
+ details.
try {
+ //TagSoup SAX HTML Parser which supports parsing even the bad non-xml-conformed HTML
+ System.setProperty("org.xml.sax.driver", "org.ccil.cowan.tagsoup.Parser");
+ //org.ccil.cowan.tagsoup.jaxp.SAXParserImpl
+ System.setProperty("javax.xml.parsers.SAXParserFactory", "org.ccil.cowan.tagsoup.jaxp.SAXFactoryImpl");
+
//Use Xerces as the parser. Does not support Saxon6.5.5 parser
- System.setProperty("org.xml.sax.driver", "org.apache.xerces.parsers.SAXParser");
- System.setProperty("javax.xml.parsers.SAXParserFactory", "org.apache.xerces.jaxp.SAXParserFactoryImpl");
+// System.setProperty("org.xml.sax.driver", "org.apache.xerces.parsers.SAXParser");
+// System.setProperty("javax.xml.parsers.SAXParserFactory", "org.apache.xerces.jaxp.SAXParserFactoryImpl");
+
+ //saxon
// System.setProperty("org.xml.sax.driver", "com.icl.saxon.aelfred.SAXDriver");
// System.setProperty("javax.xml.parsers.SAXParserFactory", "com.icl.saxon.aelfred.SAXParserFactoryImpl");
} catch (SecurityException se) {
System.out.println("[WARNING] Default parser is not set to Xerces. Make sure Saxon6.5.5 " +
"is not in your CLASSPATH");
}
+ */
ArrayList<DocFileInfo> filesDescription = null; // list of information about the topic files
ArrayList<File> htmlFiles = null; // topic files listed in the given directory
javax.xml.parsers.SAXParser sp = spf.newSAXParser();\r
// deactivate the validation\r
sp.getXMLReader().setFeature("http://xml.org/sax/features/external-general-entities", false);\r
- sp.getXMLReader().setFeature("http://apache.org/xml/features/nonvalidating/load-external-dtd", false);\r
+// sp.getXMLReader().setFeature("http://apache.org/xml/features/nonvalidating/load-external-dtd", false);\r
+// this feature isn't supported in TagSoup \r
\r
//parse the file and also register this class for call backs\r
//System.out.println("Parsing: " + file);\r
package com.nexwave.nquindexer;
-import java.io.BufferedOutputStream;
-import java.io.File;
-import java.io.FileOutputStream;
-import java.io.IOException;
-import java.io.OutputStream;
-import java.io.OutputStreamWriter;
-import java.io.UnsupportedEncodingException;
+import java.io.*;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.Map;
private static String txt_indices_location = "The created index files are located in ";
/**
- * Create a javascript array listing the html files with their paths relative to the project root
+ * Create a JavaScript array listing the html files with their paths relative to the project root
*
* @param fileO path and name of the file in which to output the list of html files
* @param list of the html files, relative to the doc root directory
}
/**
- * Create javascript index files alphabetically.
+ * Create JavaScript index files alphabetically.
*
* @param fileOutStr contains the path and the suffix of the index files to create.
* The first letter of the key is added to the given suffix. For example: e.g. a.js, b.js etc...
The value is the numbers of the files in which the word exists.
Example: w["key"]="file1,file2,file3";*/
int count = 0;
- if (i == 1)
+ if (i == 1) {
out.write("var indexerLanguage=\"" + indexerLanguage + "\";\n");
- out.write("//Auto generated index for searching.\n");
+ }
+ out.write("//Auto generated index for searching by xsl-webhelpindexer for DocBook Webhelp." +
+ "# Kasun Gajasinghe, University of Moratuwa\n");
while (keyIt.hasNext()) { //&& (tempLetter == tstr.charAt(0))
out.write("w[\"" + tstr + "\"]" + "=\"" + indexMap.get(tstr) + "\";\n");
tstr = (String) keyIt.next();