HTMLDocument: Document Iterator Example

   
import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.URLConnection;

import javax.swing.text.AttributeSet;
import javax.swing.text.html.HTML;
import javax.swing.text.html.HTMLDocument;
import javax.swing.text.html.HTMLEditorKit;
import javax.swing.text.html.parser.ParserDelegator;

public class DocumentIteratorExample {

  public static void main(String args[]) throws Exception {
    URL url = new URL("http://www.java2s.com");
    URLConnection connection = url.openConnection();
    InputStream is = connection.getInputStream();
    InputStreamReader isr = new InputStreamReader(is);
    BufferedReader br = new BufferedReader(isr);

    HTMLEditorKit htmlKit = new HTMLEditorKit();
    HTMLDocument htmlDoc = (HTMLDocument) htmlKit.createDefaultDocument();
    HTMLEditorKit.Parser parser = new ParserDelegator();
    HTMLEditorKit.ParserCallback callback = htmlDoc.getReader(0);
    parser.parse(br, callback, true);

    for (HTMLDocument.Iterator iterator = htmlDoc.getIterator(HTML.Tag.A); iterator
        .isValid(); iterator.next()) {

      AttributeSet attributes = iterator.getAttributes();
      String srcString = (String) attributes
          .getAttribute(HTML.Attribute.HREF);
      System.out.print(srcString);
      int startOffset = iterator.getStartOffset();
      int endOffset = iterator.getEndOffset();
      int length = endOffset - startOffset;
      String text = htmlDoc.getText(startOffset, length);
      System.out.println(" - " + text);
    }
    System.exit(0);
  }
}

Related examples in the same category

1.	DocumentFilter that maps lowercase letters to uppercase
2.	An extension of PlainDocument that restricts the length of its content
3.	Document Event Demo
4.	React to the document update insert changed event
5.	DocumentListener Demo
6.	extends PlainDocument to create a float value type text field
7.	extends PlainDocument to create alpha and numeric value based field field
8.	Implement a document cleaner that maps lowercase letters to uppercase
9.	Document ElementIterator Demo
10.	Format JTextField's text to uppercase
11.	Overriding a Few Default Typed Key Bindings in a JTextComponent
12.	Overriding - key
13.	Override $ key
14.	Overriding space key
15.	Disable a character so that no action is invoked.
16.	Bind a keystroke to shift-space
17.	Prevent the space from being inserted when shift-space is pressed.
18.	Subclass InputVerifier
19.	extends PlainDocument
20.	This Document restricts the size of the contained plain text to the given number of characters.
21.	A frame with three text fields to set the background color.

HTMLDocument: Document Iterator Example : Document Event « Swing JFC « Java

Related examples in the same category