0
点赞
收藏
分享

微信扫一扫

Jsoup解析xml文档快速入门

编程练习生J 2022-01-09 阅读 44

jsoup解析xml文件的三种方法
demojsoup1.java
package Jsoup;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import java.io.File;
import java.io.IOException;

public class demojsoup1 {
public static void main(String[] args) throws IOException {
//获取xml文件路径
String path = demojsoup1.class.getClassLoader().getResource(“student.xml”).getPath();
//加载xml路径,设置编码格式
Document document = Jsoup.parse(new File(path), “UTF-8”);
//获取name属性
Elements elements = document.getElementsByTag(“name”);
System.out.println(elements.size());
Element element = elements.get(1);
//获取文本内容
String name = element.text();
System.out.println(name);
}
}
demojsoup2.java
package Jsoup;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;

import java.net.MalformedURLException;
import java.net.URL;

public class demojsoup2 {
public static void main(String[] args) throws Exception {
String path = demojsoup2.class.getClassLoader().getResource(“student.xml”).getPath();
// String str= “<?Jsoup version=\"1.0\" endcoding=\"UTF-8\" ?>\n” +
// “\n” +
// “\n” +
// " <student number=“heima_0001”>\n" +
// " tom\n" +
// " 18\n" +
// " male\n" +
// " \n" +
// " <student number=“heima_0002”>\n" +
// " zhangsan\n" +
// " 18\n" +
// " male\n" +
// " \n" +
// “”;
// Document document = Jsoup.parse(str);
// System.out.println(document);
//第三种方法
URL url = new URL(“https://www.ruiwen.com/wenxue/qingshi/378406.html”);
Document document = Jsoup.parse(url, 10000);
System.out.println(document);
}

}
demojsoup3.java
package Jsoup;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import java.io.File;

public class demojsoup3 {
public static void main(String[] args) throws Exception{
String path=demojsoup3.class.getClassLoader().getResource(“student.xml”).getPath();
Document document = Jsoup.parse(new File(path), “UTF-8”);
Element element = document.getElementsByTag(“student”).get(1);
Elements name = element.getElementsByTag(“name”);
System.out.println(element.text());
System.out.println("--------------------------");
String number = element.attr(“number”);
System.out.println(number);
System.out.println("--------------------------");
String text = name.text();
String html = name.html();
System.out.println(text);
System.out.println(html);

}

}
demojsoup4.java
package Jsoup;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import java.io.File;

public class demojsoup4 {
public static void main(String[] args) throws Exception{
String path= demojsoup4.class.getClassLoader().getResource(“student.xml”).getPath();
Document document = Jsoup.parse(new File(path), “UTF-8”);
Elements student = document.select(“student”);
System.out.println(student);
System.out.println("--------------------");
Elements name = document.select(“name”);
System.out.println(name);
System.out.println("--------------------");
Elements select = document.select(“student[number=“heima_0001”]>age”);
System.out.println(select);
}
}

举报

相关推荐

0 条评论