Selection Example2
Jsoup is an open-source Java library for parsing and manipulating HTML with ease.
Get the latest binaries from http://jsoup.org/ .
This requires the library jsoup-1.6.1.jar to be on the classpath.
The following example shows div and anchor selection.
03 <title>BE THE CODER</title>
04 <script type="text/javascript" src="jQuery.js"></script>
07 <script type="text/javascript" src="Tooltip.js"></script>
10 <div id="notify-container">Notify Content</div>
11 <div id="overlay-header">Overlay Header Content</div>
12 <div id="custom-header">Custom Header Content</div>
14 <div class="container">
15 Container Data Content <a id="nav-cont" href="/content">AAA</a> BBB CCC DDDD
18 <div class="nav mainnavs">
20 <li class="youarehere"><a id="nav-questions" href="/questions">Questions</a></li>
21 <li><a id="nav-tags" href="/tags">Tags</a></li>
22 <li><a id="nav-users" href="/users">Users</a></li>
25 <div id="footer-one">Custom Footer Content1</div>
26 <div id="footer-two">Custom Footer Content2</div>
package com.bethecoder.tutorials.jsoup.tests;
import java.io.IOException;
import java.io.InputStream;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
/**
 * Demonstrates jsoup CSS-selector queries (div and anchor selection) against the
 * {@code Simple.html} resource loaded from the classpath.
 */
public class SelectTest2 {

  /** Name of the classpath resource that is parsed by {@link #main(String[])}. */
  private static final String RESOURCE_NAME = "Simple.html";

  /**
   * Parses {@code Simple.html} and prints the results of four selector queries to standard
   * output: the first {@code div}, the {@code ul} children of {@code div.mainnavs}, the anchors
   * nested under those lists, and the first of those anchors.
   *
   * @param args command-line arguments; not used
   * @throws IOException if the resource is not found on the classpath or cannot be read
   */
  public static void main(String[] args) throws IOException {
    // try-with-resources guarantees the stream is closed even when parsing fails.
    try (InputStream ins =
        SelectTest2.class.getClassLoader().getResourceAsStream(RESOURCE_NAME)) {
      // getResourceAsStream signals "not found" by returning null; fail with a clear message
      // instead of handing null to the parser.
      if (ins == null) {
        throw new IOException("Resource not found on classpath: " + RESOURCE_NAME);
      }

      Document doc = Jsoup.parse(ins, "UTF-8", "btc.com");

      // First div. println(Object) prints "null" when nothing matches, whereas an explicit
      // toString() call on the result would throw a NullPointerException.
      System.out.println(doc.select("div").first());

      // ul under a div having 'mainnavs' as class
      System.out.println(doc.select("div.mainnavs > ul"));

      // anchors under li under ul under a div having 'mainnavs' as class
      System.out.println(doc.select("div.mainnavs > ul > li > a"));

      // first anchor under li under ul under a div having 'mainnavs' as class
      System.out.println(doc.select("div.mainnavs > ul > li > a").first());
    }
  }
}
It produces the following output:
01 <div id="notify-container">
07 <li class="youarehere"><a id="nav-questions" href="/questions">Questions</a></li>
08 <li><a id="nav-tags" href="/tags">Tags</a></li>
09 <li><a id="nav-users" href="/users">Users</a></li>
13 <a id="nav-questions" href="/questions">Questions</a>
14 <a id="nav-tags" href="/tags">Tags</a>
15 <a id="nav-users" href="/users">Users</a>
18 <a id="nav-questions" href="/questions">Questions</a>