/*
 * Test driver for the xpclucene HTML filter.
 *
 * Walks every regular file directly inside HTML_DIR, parses it into a DOM
 * document, passes that document to nsILuceneFactory.filterHTMLDocument(),
 * and prints the returned value prefixed with "**** ".
 *
 * Any exception raised while processing a file still propagates and stops
 * the run, but the file's input stream is always closed first.
 */

// Directory holding the documents fed to the filter (machine-specific path).
var HTML_DIR = "/home/steve/dev/mozilla/extensions/xpclucene/test/htmldocs";

// XPCOM components used by the script.
var service = Components.classes["@skrul.com/xpclucene;1"]
    .getService(Components.interfaces.nsILuceneFactory);
var parser = Components.classes["@mozilla.org/xmlextras/domparser;1"]
    .createInstance(Components.interfaces.nsIDOMParser);
var file = Components.classes["@mozilla.org/file/local;1"]
    .createInstance(Components.interfaces.nsILocalFile);

file.initWithPath(HTML_DIR);

var entries = file.directoryEntries;
while (entries.hasMoreElements()) {
  // getNext() hands back a generic object; QueryInterface exposes the
  // nsIFile methods on it.
  var entry = entries.getNext();
  entry.QueryInterface(Components.interfaces.nsIFile);

  // Subdirectories and other non-regular entries cannot be read as a
  // document stream, so skip them instead of failing the whole run.
  if (!entry.isFile()) {
    continue;
  }

  var fileStream = Components.classes["@mozilla.org/network/file-input-stream;1"]
      .createInstance(Components.interfaces.nsIFileInputStream);

  // Arguments: file, ioFlags (1 = read-only), perm (0), behaviorFlags (0).
  fileStream.init(entry, 1, 0, 0);

  try {
    // NOTE(review): the documents are parsed with the "text/xml" content
    // type, so they presumably need to be well-formed XML/XHTML — confirm
    // against the files in HTML_DIR.
    var doc = parser.parseFromStream(fileStream, "UTF-8", fileStream.available(), "text/xml");
    var s = service.filterHTMLDocument(doc);
    print("**** " + s);
  } finally {
    // Release the stream even when parsing or filtering throws.
    fileStream.close();
  }
}