📄 html3xml.java
字号:
import java.io.BufferedInputStream;
import java.io.FileOutputStream;
import java.io.FileWriter;
import java.io.IOException;
import java.io.PrintWriter;
import java.net.URL;
import org.w3c.tidy.Tidy;
/**
 * Converts an HTML document, read from a URL, into XML using JTidy.
 *
 * <p>The converted document is written to one file and Tidy's diagnostic
 * output is written to a second file.
 */
public class HTML2XML {
    /** Location of the HTML document to convert. */
    private final String url;
    /** Path of the file that receives the XML output. */
    private final String outFileName;
    /** Path of the file that receives Tidy's error/diagnostic output. */
    private final String errOutFileName;

    /**
     * Creates a converter for a single HTML source.
     *
     * @param url            URL of the HTML document to read
     * @param outFileName    path of the XML file to write
     * @param errOutFileName path of the file that receives Tidy's error output
     */
    public HTML2XML(String url, String outFileName, String errOutFileName) {
        this.url = url;
        this.outFileName = outFileName;
        this.errOutFileName = errOutFileName;
    }

    /**
     * Reads the HTML document from {@code url}, converts it with Tidy and
     * writes the XML to {@code outFileName}.
     *
     * <p>An {@link IOException} raised while opening the streams or while
     * closing them is not propagated; it is reported on standard error.
     * Every stream opened here is closed whether or not the conversion
     * succeeds.
     */
    public void convert() {
        Tidy tidy = new Tidy();
        // Tell Tidy to emit XML instead of HTML.
        tidy.setXmlOut(true);

        // Resources are opened in the same order as before (error log, input,
        // output) and are closed automatically in reverse order, also when an
        // exception is thrown part-way through.
        try (PrintWriter errOut = new PrintWriter(new FileWriter(errOutFileName), true);
             BufferedInputStream in = new BufferedInputStream(new URL(url).openStream());
             FileOutputStream out = new FileOutputStream(outFileName)) {
            // Send Tidy's error messages to the error file.
            tidy.setErrout(errOut);
            // Run the conversion.
            tidy.parse(in, out);
        } catch (IOException e) {
            System.err.println(this.toString() + ": " + e.toString());
        }
    }

    /**
     * Demo entry point: converts a fixed local test page into XML.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        // Arguments: URL of the HTML file, output file name, error file name.
        System.out.println("程序开始运行......");
        HTML2XML t = new HTML2XML(
                "http://localhost/servlet-study/testmail.jsp",
                "d:\\temp\\html2xml.xml", "d:\\temp\\error.txt");
        t.convert();
        System.out.println("程序运行结束......");
    }
}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -