|
||||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||||
java.lang.Object
  edu.iastate.utils.string.HTMLHandler
| Constructor Summary | |
HTMLHandler()
|
|
| Method Summary | |
static java.lang.String |
escapeHTMLTags(java.lang.String in)
This method takes a string which may contain HTML tags (e.g. <b>, <table>, etc.) and converts the '<' and '>' characters to their HTML escape sequences. |
static java.lang.String[] |
getLinksInHTML(java.lang.String uriStr)
Gets the links in an HTML document. This method takes a URI, which can be either a filename (e.g. file://c:/dir/file.html) or a URL (e.g. http://host.com/page.html), and returns all HREF links in the document. |
static java.util.Vector |
getNestdBlock(java.lang.String tag,
java.lang.CharSequence input,
boolean greedy)
Returns all tags that begin with 'tag'. No repeated nesting is detected, like ... |
static java.util.Vector |
getNestdBlock(java.lang.String head,
java.lang.String tail,
java.lang.CharSequence input,
boolean greedy)
Gets all blocks with the given head and tail; the head and tail themselves are not included. |
static java.util.Vector |
getTopNestdBlock(java.lang.CharSequence inputStr)
return the content of the highest |
static java.lang.String |
Html2Txt(java.io.InputStream stream)
|
static java.lang.String |
Html2Txt(java.lang.String HTMLstr)
|
static java.lang.String |
Html2Txt(java.net.URI uri)
Gets the text in an HTML document. To read from a URI [ a filename (e.g. file://c:/dir/file.html) or a URL (e.g. http://host.com/page.html) ]: URL url = new URI( uriStr ).toURL() ; URLConnection conn = url.openConnection() ; Html2Txt( conn.getInputStream() ) ; For a String strHTML: InputStream stream = new StringBufferInputStream(strHTML); Html2Txt(stream); |
static boolean |
isEmailValid(java.lang.String inputString)
|
static boolean |
isUrlValid(java.lang.String url)
protected boolean isUrlValid(String url) ---------------------------------------- Checks whether the URL is valid; the check is really basic for now. |
static java.lang.String |
TagRemover(java.lang.String strHTML)
Removes the tags, i.e. everything between "<" and ">". |
| Methods inherited from class java.lang.Object |
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Constructor Detail |
public HTMLHandler()
| Method Detail |
public static java.util.Vector getTopNestdBlock(java.lang.CharSequence inputStr)
inputStr -
public static java.util.Vector getNestdBlock(java.lang.String tag,
java.lang.CharSequence input,
boolean greedy)
tag - input -
public static java.util.Vector getNestdBlock(java.lang.String head,
java.lang.String tail,
java.lang.CharSequence input,
boolean greedy)
head - tail - input - greedy -
public static java.lang.String Html2Txt(java.net.URI uri)
public static java.lang.String Html2Txt(java.lang.String HTMLstr)
public static java.lang.String Html2Txt(java.io.InputStream stream)
public static java.lang.String TagRemover(java.lang.String strHTML)
strHTML - String
public static boolean isEmailValid(java.lang.String inputString)
public static java.lang.String[] getLinksInHTML(java.lang.String uriStr)
uriStr -
public static boolean isUrlValid(java.lang.String url)
public static final java.lang.String escapeHTMLTags(java.lang.String in)
in - the text to be converted.
|
||||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||||