org.jsoup.parser.ParseErrorList java code examples

void error(String errorMsg) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), errorMsg));
}

  public static ParseErrorList tracking(int maxSize) {
    return new ParseErrorList(INITIAL_CAPACITY, maxSize);
  }
}

public Document parseInput(String html, String baseUri) {
  errors = isTrackErrors() ? ParseErrorList.tracking(maxErrors) : ParseErrorList.noTracking();
  return treeBuilder.parse(new StringReader(html), baseUri, errors, settings);
}

Document parse(Reader input, String baseUri) {
  return parse(input, baseUri, ParseErrorList.noTracking(), ParseSettings.preserveCase);
}

public boolean isValidBodyHtml(String bodyHtml) {
  Document clean = Document.createShell("");
  Document dirty = Document.createShell("");
  ParseErrorList errorList = ParseErrorList.tracking(1);
  List<Node> nodes = Parser.parseFragment(bodyHtml, dirty.body(), "", errorList);
  dirty.body().insertChildren(0, nodes);
  int numDiscarded = copySafeNodes(dirty.body(), clean.body());
  return numDiscarded == 0 && errorList.size() == 0;
}

boolean canAddError() {
  return size() < maxSize;
}

Document parse(String input, String baseUri) {
  return parse(new StringReader(input), baseUri, ParseErrorList.noTracking(), ParseSettings.preserveCase);
}

void eofError(TokeniserState state) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), "Unexpectedly reached end of file (EOF) in input state [%s]", state));
}

public Document parseInput(Reader inputHtml, String baseUri) {
  errors = isTrackErrors() ? ParseErrorList.tracking(maxErrors) : ParseErrorList.noTracking();
  return treeBuilder.parse(inputHtml, baseUri, errors, settings);
}

/**
 * Parse HTML into a Document.
 *
 * @param html HTML to parse
 * @param baseUri base URI of document (i.e. original fetch location), for resolving relative URLs.
 *
 * @return parsed Document
 */
public static Document parse(String html, String baseUri) {
  TreeBuilder treeBuilder = new HtmlTreeBuilder();
  return treeBuilder.parse(new StringReader(html), baseUri, ParseErrorList.noTracking(), treeBuilder.defaultSettings());
}

public static ParseErrorList noTracking() {
  return new ParseErrorList(0, 0);
}

private void characterReferenceError(String message) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), "Invalid character reference: %s", message));
}

/**
 * Parse a fragment of XML into a list of nodes.
 *
 * @param fragmentXml the fragment of XML to parse
 * @param baseUri base URI of document (i.e. original fetch location), for resolving relative URLs.
 * @return list of nodes parsed from the input XML.
 */
public static List<Node> parseXmlFragment(String fragmentXml, String baseUri) {
  XmlTreeBuilder treeBuilder = new XmlTreeBuilder();
  return treeBuilder.parseFragment(fragmentXml, baseUri, ParseErrorList.noTracking(), treeBuilder.defaultSettings());
}

void error(HtmlTreeBuilderState state) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), "Unexpected token [%s] when in state [%s]", currentToken.tokenType(), state));
}

/**
 * Parse a fragment of HTML into a list of nodes. The context element, if supplied, supplies parsing context.
 *
 * @param fragmentHtml the fragment of HTML to parse
 * @param context (optional) the element that this HTML fragment is being parsed for (i.e. for inner HTML). This
 * provides stack context (for implicit element creation).
 * @param baseUri base URI of document (i.e. original fetch location), for resolving relative URLs.
 *
 * @return list of nodes parsed from the input HTML. Note that the context element, if supplied, is not modified.
 */
public static List<Node> parseFragment(String fragmentHtml, Element context, String baseUri) {
  HtmlTreeBuilder treeBuilder = new HtmlTreeBuilder();
  return treeBuilder.parseFragment(fragmentHtml, context, baseUri, ParseErrorList.noTracking(), treeBuilder.defaultSettings());
}

void error(TokeniserState state) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), "Unexpected character '%s' in input state [%s]", reader.current(), state));
}

/**
 * Utility method to unescape HTML entities from a string
 * @param string HTML escaped string
 * @param inAttribute if the string is to be escaped in strict mode (as attributes are)
 * @return an unescaped string
 */
public static String unescapeEntities(String string, boolean inAttribute) {
  Tokeniser tokeniser = new Tokeniser(new CharacterReader(string), ParseErrorList.noTracking());
  return tokeniser.unescapeEntities(inAttribute);
}

void error(Asta4DTagSupportHtmlTreeBuilderState state) {
  if (errors.canAddError())
    errors.add(new ParseError(reader.pos(), "Unexpected token [%s] when in state [%s]", currentToken.tokenType(), state));
}

Javadoc

A container for ParseErrors.

Most used methods

Popular in Java

Reactive rest calls using spring rest template
getSupportFragmentManager (FragmentActivity)
getSystemService (Context)
setScale (BigDecimal)
ConnectException (java.net)
A ConnectException is thrown if a connection cannot be established to a remote host on a specific po
HttpURLConnection (java.net)
An URLConnection for HTTP (RFC 2616 [http://tools.ietf.org/html/rfc2616]) used to send and receive d
NumberFormat (java.text)
The abstract base class for all number formats. This class provides the interface for formatting and
ConcurrentHashMap (java.util.concurrent)
A plug-in replacement for JDK1.5 java.util.concurrent.ConcurrentHashMap. This version is based on or
ExecutorService (java.util.concurrent)
An Executor that provides methods to manage termination and methods that can produce a Future for tr
Semaphore (java.util.concurrent)
A counting semaphore. Conceptually, a semaphore maintains a set of permits. Each #acquire blocks if
Top 12 Jupyter Notebook extensions

How to useParseErrorList in org.jsoup.parser

Best Java code snippets using org.jsoup.parser.ParseErrorList (Showing top 18 results out of 315)

How to use
ParseErrorList
in
org.jsoup.parser