public class HtmlScrubber extends HtmlVisitor
Modifier and Type | Field and Description |
---|---|
static int |
ATTR_DOWNCASE |
static int |
ATTR_UPCASE |
static int |
DEFAULT_OPTIONS |
protected int |
flags |
protected boolean |
inPreBlock |
protected HtmlDocument.HtmlElement |
previousElement |
static int |
STRIP_QUOTES |
static int |
TAGS_DOWNCASE |
static int |
TAGS_UPCASE |
static int |
TRIM_SPACES |
Constructor and Description |
---|
HtmlScrubber()
Create an HtmlScrubber with the default options (downcase tags and
tag attributes, strip out unnecessary quotes).
|
HtmlScrubber(int flags)
Create an HtmlScrubber with the desired set of options.
|
Modifier and Type | Method and Description |
---|---|
void |
start() |
void |
visit(HtmlDocument.Annotation a) |
void |
visit(HtmlDocument.Comment c) |
void |
visit(HtmlDocument.EndTag t) |
void |
visit(HtmlDocument.Newline n) |
void |
visit(HtmlDocument.Tag t) |
void |
visit(HtmlDocument.TagBlock bl) |
void |
visit(HtmlDocument.Text t) |
Methods inherited from class HtmlVisitor: finish, visit, visit, visit
public static final int TAGS_UPCASE
public static final int TAGS_DOWNCASE
public static final int ATTR_UPCASE
public static final int ATTR_DOWNCASE
public static final int STRIP_QUOTES
public static final int TRIM_SPACES
public static final int DEFAULT_OPTIONS
protected int flags
protected HtmlDocument.HtmlElement previousElement
protected boolean inPreBlock
public HtmlScrubber()
public HtmlScrubber(int flags)
flags
- A bitmask representing the desired scrubbing options
public void start()
start
in class HtmlVisitor
public void visit(HtmlDocument.Tag t)
visit
in class HtmlVisitor
public void visit(HtmlDocument.EndTag t)
visit
in class HtmlVisitor
public void visit(HtmlDocument.Text t)
visit
in class HtmlVisitor
public void visit(HtmlDocument.Comment c)
visit
in class HtmlVisitor
public void visit(HtmlDocument.Newline n)
visit
in class HtmlVisitor
public void visit(HtmlDocument.Annotation a)
visit
in class HtmlVisitor
public void visit(HtmlDocument.TagBlock bl)
visit
in class HtmlVisitor