Jsoup是一款比较好用的Java版HTML解析器，可直接解析某个URL地址或HTML文本内容，并可通过DOM、CSS以及类似于jQuery的操作方法来取出和操作数据。
<!-- jsoup: library used to parse HTML documents --> <dependency> <groupId>org.jsoup</groupId> <artifactId>jsoup</artifactId> <version>1.10.2</version> </dependency>
/**
 * Fetches the page at {@code url} with an HTTP GET and parses it into a jsoup document.
 *
 * @param url address of the page to download
 * @return the parsed document, or {@code null} if the request fails with an
 *         {@link IOException}
 */
public static Document getDocument(String url) {
    try {
        return Jsoup.connect(url).get();
    } catch (IOException e) {
        // Best-effort fetch: report which URL failed and let the caller deal with null.
        System.err.println("Failed to fetch " + url + ": " + e);
        return null;
    }
}

/**
 * Returns the value of {@code attributeName} on the first element matching
 * {@code cssQuery}, or an empty string when no element matches.
 */
private static String firstAttr(Document document, String cssQuery, String attributeName) {
    // Fully qualified so the snippet does not depend on an extra import.
    org.jsoup.nodes.Element first = document.select(cssQuery).first();
    return first == null ? "" : first.attr(attributeName);
}

/**
 * Prints the first image source, the title, and the keywords/description meta
 * contents of a page.
 *
 * @param args optional; {@code args[0]} overrides the default demo URL
 */
public static void main(String[] args) {
    String url = args != null && args.length > 0
            ? args[0]
            : "https://item.wuage.com/543589592257.html?psa=W26.a190.a137.1";

    Document document = getDocument(url);
    if (document == null) {
        // getDocument already reported the cause; avoid a NullPointerException below.
        System.err.println("No document available for " + url);
        return;
    }

    System.out.println(firstAttr(document, "img", "src"));
    // Document.title() yields "" instead of failing when the page has no <title>.
    System.out.println(document.title());
    System.out.println(firstAttr(document, "meta[name='keywords']", "content"));
    System.out.println(firstAttr(document, "meta[name='description']", "content"));
}