public final class HtmlParsingUtils extends Object
Modifier and Type | Method and Description |
---|---|
static Document |
createEmptyDoc() |
static HTTPSamplerBase |
createUrlFromAnchor(String parsedUrlString,
URL context)
Create a new Sampler based on an HREF string plus a contextual URL
object.
|
static List<HTTPSamplerBase> |
createURLFromForm(Node doc,
URL context) |
static void |
extractStyleURLs(URL baseUrl,
URLCollection urls,
String styleTagStr) |
static Node |
getDOM(String text)
Returns a node representing a whole xml given an xml document.
|
static org.w3c.tidy.Tidy |
getParser()
Returns tidy as an HTML parser. |
static boolean |
isAnchorMatched(HTTPSamplerBase newLink,
HTTPSamplerBase config)
Check if anchor matches by checking against:
- protocol
- domain
- path
- parameter names
|
static boolean |
isArgumentMatched(Argument arg,
Argument patternArg)
Arguments match if the input name matches the corresponding pattern name
and the input value matches the pattern value, where the matching is done
first using String equals, and then Regular Expression matching if the equals test fails.
|
static boolean |
isEqualOrMatches(String arg,
String pat)
Match the input argument against the pattern using String.equals() or pattern matching if that fails.
|
static boolean |
isEqualOrMatches(String arg,
String pat,
org.apache.oro.text.regex.Perl5Matcher matcher,
org.apache.oro.text.PatternCacheLRU cache)
Match the input argument against the pattern using String.equals() or pattern matching if that fails.
|
static boolean |
isEqualOrMatchesCaseBlind(String arg,
String pat)
Match the input argument against the pattern using String.equals() or pattern matching if that fails
using case-insensitive matching.
|
static boolean |
isEqualOrMatchesCaseBlind(String arg,
String pat,
org.apache.oro.text.regex.Perl5Matcher matcher,
org.apache.oro.text.PatternCacheLRU cache)
Match the input argument against the pattern using String.equals() or pattern matching if that fails
using case-insensitive matching.
|
public static boolean isAnchorMatched(HTTPSamplerBase newLink, HTTPSamplerBase config)
newLink - target to match
config - pattern to match against
public static boolean isArgumentMatched(Argument arg, Argument patternArg)
arg - input Argument
patternArg - pattern to match against
public static boolean isEqualOrMatches(String arg, String pat, org.apache.oro.text.regex.Perl5Matcher matcher, org.apache.oro.text.PatternCacheLRU cache)
arg - input string
pat - pattern string
matcher - Perl5Matcher
cache - PatternCache
public static boolean isEqualOrMatchesCaseBlind(String arg, String pat, org.apache.oro.text.regex.Perl5Matcher matcher, org.apache.oro.text.PatternCacheLRU cache)
arg - input string
pat - pattern string
matcher - Perl5Matcher
cache - PatternCache
public static boolean isEqualOrMatches(String arg, String pat)
arg - input string
pat - pattern string
public static boolean isEqualOrMatchesCaseBlind(String arg, String pat)
arg - input string
pat - pattern string
public static org.w3c.tidy.Tidy getParser()
Returns tidy as an HTML parser.
Returns: a tidy HTML parser
public static Node getDOM(String text)
text - an xml document
public static Document createEmptyDoc()
public static HTTPSamplerBase createUrlFromAnchor(String parsedUrlString, URL context) throws MalformedURLException
parsedUrlString - the url from the href
context - the context in which the href was found. This is used to extract url information that might be missing in parsedUrlString
MalformedURLException - when the given url (parsedUrlString plus context) is malformed
public static List<HTTPSamplerBase> createURLFromForm(Node doc, URL context)
public static void extractStyleURLs(URL baseUrl, URLCollection urls, String styleTagStr)
Copyright © 1998-2019 Apache Software Foundation. All Rights Reserved.