Revision 2376 tmp/org.txm.groovy.core/src/groovy/org/txm/macro/misc/EuroPress2XMLMacro.groovy

EuroPress2XMLMacro.groovy (revision 2376)
7 7
import java.text.DecimalFormat
8 8
import org.txm.utils.xml.DomUtils;
9 9
import org.txm.importer.ValidateXml;
10
import org.w3c.tidy.Tidy
11 10
import groovy.util.XmlParser
12 11
import org.kohsuke.args4j.*
13 12
import groovy.transform.Field
......
99 98

  
100 99
	File xhtmlFile = new File(outDir, name+".xhtml")
101 100

  
102
//	Tidy tidy = new Tidy(); // obtain a new Tidy instance
103
//	tidy.setXHTML(true); // set desired config options using tidy setters
104
//	tidy.setInputEncoding("UTF-8")
105
//	tidy.setOutputEncoding("UTF-8")
106
//	tidy.setShowErrors(0)
107
//	tidy.setShowWarnings(false)
108 101
	xhtmlFile.withWriter("UTF-8") { out ->
109 102
		def doc = org.jsoup.Jsoup.connect(tmpHTML.toURI().toURL().toString());
110 103
		println "current charset: "+doc.charset()

Also available in: Unified diff