Java HTML / XML How to - JSoup select from HTML by tag name








Question

We would like to know how to use jsoup to select elements from an HTML document by tag name.

Answer

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;
import java.io.IOException;
/* from www.java2s.com */
/**
 * Fetches an HTML page with jsoup and prints every element matched by a
 * tag-name selector.
 *
 * <p>The selector {@code "div"} is a bare tag name, so it matches every
 * {@code <div>} element in the parsed document.
 */
public class Main {
  /** Placeholder base URL; replace with a real host. A host name must not contain whitespace. */
  private static final String BASE_URL = "http://www.yourserver.com/";

  /** Document id appended to {@link #BASE_URL} when no URL is supplied on the command line. */
  private static final String DEFAULT_DOC_ID = "1";

  /**
   * Downloads the page, selects all {@code <div>} elements and prints them.
   *
   * @param args optional; if present, {@code args[0]} is used as the full URL to fetch
   *     instead of the built-in placeholder URL
   * @throws IOException if the page cannot be fetched
   */
  public static void main (String[] args) throws IOException {
    // With no arguments this fetches the placeholder URL for document "1".
    String url = args.length > 0 ? args[0] : BASE_URL + DEFAULT_DOC_ID;

    Document doc = Jsoup.connect(url).timeout(60000).userAgent("Mozilla/25.0").get();

    // Select by tag name: every <div> in the document.
    Elements divs = doc.select("div");

    // The "authors" labels are kept unchanged so the printed output format stays the same.
    System.out.println("authors=" + divs);
    System.out.println("authors.length=" + divs.size());

    for (Element div : divs) {
      System.out.println("  author: " + div);
    }
  }
}