Jsoup 是一款比較好的 Java 版 HTML 解析器，可直接解析某個 URL 地址或 HTML 文本內容，並可通過 DOM、CSS 以及類似於 jQuery 的操作方法來取出和操作數據。
<!-- Maven dependency: jsoup, the library used here to parse HTML documents --> <dependency> <groupId>org.jsoup</groupId> <artifactId>jsoup</artifactId> <version>1.10.2</version> </dependency>
/**
 * Fetches the page at {@code url} over HTTP and parses it into a jsoup {@link Document}.
 *
 * <p>An {@link IOException} raised while fetching is reported on standard error together
 * with the URL and is not propagated; callers must check the result for {@code null}.
 *
 * @param url the address of the page to download and parse
 * @return the parsed document, or {@code null} if fetching failed with an {@link IOException}
 */
public static Document getDocument(String url) {
    try {
        return Jsoup.connect(url).get();
    } catch (IOException e) {
        // Best-effort contract kept from the original: report and return null.
        // The URL is included so the failure can be traced to a specific request.
        System.err.println("Failed to fetch " + url);
        e.printStackTrace();
        return null;
    }
}

/**
 * Returns the value of {@code attributeName} on the first element matching {@code cssQuery}.
 *
 * @param document      the parsed page to search
 * @param cssQuery      the CSS selector passed to {@code Document.select}
 * @param attributeName the attribute to read from the first match
 * @return the attribute value, or an empty string when no element matches the selector
 */
private static String attrOfFirstMatch(Document document, String cssQuery, String attributeName) {
    // Fully qualified so this snippet needs no additional import line.
    org.jsoup.nodes.Element match = document.select(cssQuery).first();
    // first() yields null when the selection is empty; guard before dereferencing.
    return match == null ? "" : match.attr(attributeName);
}

/**
 * Demo entry point: downloads a sample product page and prints the {@code src} of its
 * first image, its title text, and the contents of its keywords and description meta tags.
 * Each item that is missing from the page is printed as an empty line.
 *
 * @param args unused
 */
public static void main(String[] args) {
    Document document = getDocument("https://item.wuage.com/543589592257.html?psa=W26.a190.a137.1");
    if (document == null) {
        // getDocument already reported the cause; there is nothing to extract.
        System.err.println("Page could not be loaded; nothing to extract.");
        return;
    }

    System.out.println(attrOfFirstMatch(document, "img", "src"));

    org.jsoup.nodes.Element title = document.getElementsByTag("title").first();
    System.out.println(title == null ? "" : title.text());

    System.out.println(attrOfFirstMatch(document, "meta[name='keywords']", "content"));
    System.out.println(attrOfFirstMatch(document, "meta[name='description']", "content"));
}