/**
 * Applies each configured selector to the given text, in iteration order,
 * and stops at the first one that yields a non-null result.
 *
 * @param text the text handed to every selector
 * @return the first non-null selection, or {@code null} when every selector
 *         returned {@code null} (or there are no selectors)
 */
@Override
public String select(String text) {
    String found = null;
    for (Selector candidate : selectors) {
        found = candidate.select(text);
        if (found != null) {
            // First hit wins; later selectors are not consulted.
            break;
        }
    }
    return found;
}
/**
 * Runs every configured selector against the same text and concatenates
 * their list results in selector order.
 *
 * @param text the text handed to every selector
 * @return a new list holding all results; empty when nothing was selected
 */
@Override
public List<String> selectList(String text) {
    List<String> merged = new ArrayList<String>();
    for (Selector each : selectors) {
        merged.addAll(each.selectList(text));
    }
    return merged;
}
}
/**
 * Extracts an object (or a list of objects) from the page when its URL
 * matches at least one of the target URL patterns.
 *
 * @param page the page to process
 * @return {@code null} when no target pattern matches the page URL;
 *         otherwise the result of {@code processSingle}: a single object
 *         (possibly {@code null}), or a list of the non-null objects when
 *         the object extractor is flagged as multi
 */
public Object process(Page page) {
    boolean matched = false;
    for (Pattern targetPattern : targetUrlPatterns) {
        // Non-short-circuit OR: every pattern is still evaluated.
        matched |= targetPattern.matcher(page.getUrl().toString()).matches();
    }
    if (!matched) {
        return null;
    }

    // No object-level extractor: the whole page is treated as one object.
    if (objectExtractor == null) {
        return processSingle(page, null, true);
    }

    if (!objectExtractor.multi) {
        String fragment = objectExtractor.getSelector().select(page.getRawText());
        return processSingle(page, fragment, false);
    }

    List<Object> extracted = new ArrayList<Object>();
    List<String> fragments = objectExtractor.getSelector().selectList(page.getRawText());
    for (String fragment : fragments) {
        Object item = processSingle(page, fragment, false);
        if (item == null) {
            continue;
        }
        extracted.add(item);
    }
    return extracted;
}
value = page.getHtml().selectDocumentForList(fieldExtractor.getSelector()); } else { value = fieldExtractor.getSelector().selectList(html); value = fieldExtractor.getSelector().selectList(page.getUrl().toString()); break; case RawText: value = fieldExtractor.getSelector().selectList(page.getRawText()); break; default: value = fieldExtractor.getSelector().selectList(html); value = page.getHtml().selectDocument(fieldExtractor.getSelector()); } else { value = fieldExtractor.getSelector().select(html); value = fieldExtractor.getSelector().select(page.getUrl().toString()); break; case RawText: value = fieldExtractor.getSelector().select(page.getRawText()); break; default: value = fieldExtractor.getSelector().select(html);
/**
 * Applies the selector's list selection to every input string and wraps
 * the concatenated results in a {@code PlainText}.
 *
 * @param selector the selector to apply
 * @param strings  the input strings, processed in order
 * @return a {@code PlainText} built from all selected values
 */
protected Selectable selectList(Selector selector, List<String> strings) {
    List<String> collected = new ArrayList<String>();
    for (String source : strings) {
        collected.addAll(selector.selectList(source));
    }
    return new PlainText(collected);
}
/**
 * Chains the configured selectors: each selector receives the output of
 * the previous one, starting from the given text.
 *
 * @param text the initial text
 * @return the output of the last selector, or {@code null} as soon as the
 *         running value becomes {@code null} (including a {@code null} input
 *         when at least one selector is configured)
 */
@Override
public String select(String text) {
    String current = text;
    for (Selector step : selectors) {
        if (current == null) {
            // Nothing left to feed into the remaining selectors.
            break;
        }
        current = step.select(current);
    }
    return current;
}
/**
 * Chains the configured selectors in list mode: the first selector is
 * applied to the given text, and every following selector is applied to
 * each result of the previous stage, with the outputs concatenated.
 *
 * <p>The chain stops as soon as a stage produces a {@code null} or empty
 * list. The null/empty check runs after every stage, including the first,
 * so a {@code null} list from the first selector is returned as-is instead
 * of causing a {@link NullPointerException} in the next stage.
 *
 * @param text the initial text
 * @return the results of the last executed stage; an empty list when no
 *         selectors are configured; {@code null} only if the first selector
 *         itself returned {@code null}
 */
@Override
public List<String> selectList(String text) {
    List<String> results = new ArrayList<String>();
    boolean first = true;
    for (Selector selector : selectors) {
        if (first) {
            results = selector.selectList(text);
            first = false;
        } else {
            List<String> resultsTemp = new ArrayList<String>();
            for (String result : results) {
                List<String> partial = selector.selectList(result);
                // A null list from a selector is treated as "no matches".
                if (partial != null) {
                    resultsTemp.addAll(partial);
                }
            }
            results = resultsTemp;
        }
        // Checked after every stage: later selectors have nothing to work on.
        if (results == null || results.isEmpty()) {
            return results;
        }
    }
    return results;
}
}
/**
 * Applies the selector to every input string and wraps the non-null
 * results in a {@code PlainText}.
 *
 * @param selector the selector to apply
 * @param strings  the input strings, processed in order
 * @return a {@code PlainText} built from the non-null selections
 */
protected Selectable select(Selector selector, List<String> strings) {
    List<String> hits = new ArrayList<String>();
    for (String source : strings) {
        String hit = selector.select(source);
        if (hit == null) {
            // Inputs with no selection contribute nothing.
            continue;
        }
        hits.add(hit);
    }
    return new PlainText(hits);
}
/**
 * Selects a list of values using the given selector.
 *
 * <p>An {@code ElementSelector} is applied to the value of
 * {@code getDocument()}; any other selector is applied to the value of
 * {@code getFirstSourceText()}.
 *
 * @param selector the selector to apply
 * @return the selected values
 */
public List<String> selectDocumentForList(Selector selector) {
    if (!(selector instanceof ElementSelector)) {
        return selector.selectList(getFirstSourceText());
    }
    return ((ElementSelector) selector).selectList(getDocument());
}
/**
 * Selects a single value using the given selector.
 *
 * <p>An {@code ElementSelector} is applied to the value of
 * {@code getDocument()}; any other selector is applied to the value of
 * {@code getFirstSourceText()}.
 *
 * @param selector the selector to apply
 * @return the selected value, as returned by the selector
 */
public String selectDocument(Selector selector) {
    if (!(selector instanceof ElementSelector)) {
        return selector.select(getFirstSourceText());
    }
    return ((ElementSelector) selector).select(getDocument());
}
/**
 * Runs every configured selector against the same text and concatenates
 * their list results in selector order.
 *
 * @param text the text handed to every selector
 * @return a new list holding all results; empty when nothing was selected
 */
@Override
public List<String> selectList(String text) {
    List<String> merged = new ArrayList<String>();
    for (Selector each : selectors) {
        merged.addAll(each.selectList(text));
    }
    return merged;
}
}
/**
 * Chains the configured selectors: each selector receives the output of
 * the previous one, starting from the given text.
 *
 * @param text the initial text
 * @return the output of the last selector, or {@code null} as soon as the
 *         running value becomes {@code null} (including a {@code null} input
 *         when at least one selector is configured)
 */
@Override
public String select(String text) {
    String current = text;
    for (Selector step : selectors) {
        if (current == null) {
            // Nothing left to feed into the remaining selectors.
            break;
        }
        current = step.select(current);
    }
    return current;
}
/**
 * Applies the selector's list selection to every input string and wraps
 * the concatenated results in a {@code PlainText}.
 *
 * @param selector the selector to apply
 * @param strings  the input strings, processed in order
 * @return a {@code PlainText} built from all selected values
 */
protected Selectable selectList(Selector selector, List<String> strings) {
    List<String> collected = new ArrayList<String>();
    for (String source : strings) {
        collected.addAll(selector.selectList(source));
    }
    return new PlainText(collected);
}
/**
 * Applies each configured selector to the given text, in iteration order,
 * and stops at the first one that yields a non-null result.
 *
 * @param text the text handed to every selector
 * @return the first non-null selection, or {@code null} when every selector
 *         returned {@code null} (or there are no selectors)
 */
@Override
public String select(String text) {
    String found = null;
    for (Selector candidate : selectors) {
        found = candidate.select(text);
        if (found != null) {
            // First hit wins; later selectors are not consulted.
            break;
        }
    }
    return found;
}
/**
 * Chains the configured selectors in list mode: the first selector is
 * applied to the given text, and every following selector is applied to
 * each result of the previous stage, with the outputs concatenated.
 *
 * <p>The chain stops as soon as a stage produces a {@code null} or empty
 * list. The null/empty check runs after every stage, including the first,
 * so a {@code null} list from the first selector is returned as-is instead
 * of causing a {@link NullPointerException} in the next stage.
 *
 * @param text the initial text
 * @return the results of the last executed stage; an empty list when no
 *         selectors are configured; {@code null} only if the first selector
 *         itself returned {@code null}
 */
@Override
public List<String> selectList(String text) {
    List<String> results = new ArrayList<String>();
    boolean first = true;
    for (Selector selector : selectors) {
        if (first) {
            results = selector.selectList(text);
            first = false;
        } else {
            List<String> resultsTemp = new ArrayList<String>();
            for (String result : results) {
                List<String> partial = selector.selectList(result);
                // A null list from a selector is treated as "no matches".
                if (partial != null) {
                    resultsTemp.addAll(partial);
                }
            }
            results = resultsTemp;
        }
        // Checked after every stage: later selectors have nothing to work on.
        if (results == null || results.isEmpty()) {
            return results;
        }
    }
    return results;
}
}
/**
 * Applies the selector to every input string and wraps the non-null
 * results in a {@code PlainText}.
 *
 * @param selector the selector to apply
 * @param strings  the input strings, processed in order
 * @return a {@code PlainText} built from the non-null selections
 */
protected Selectable select(Selector selector, List<String> strings) {
    List<String> hits = new ArrayList<String>();
    for (String source : strings) {
        String hit = selector.select(source);
        if (hit == null) {
            // Inputs with no selection contribute nothing.
            continue;
        }
        hits.add(hit);
    }
    return new PlainText(hits);
}
/**
 * Selects a list of values using the given selector.
 *
 * <p>An {@code ElementSelector} is applied to the value of
 * {@code getDocument()}; any other selector is applied to the value of
 * {@code getFirstSourceText()}.
 *
 * @param selector the selector to apply
 * @return the selected values
 */
public List<String> selectDocumentForList(Selector selector) {
    if (!(selector instanceof ElementSelector)) {
        return selector.selectList(getFirstSourceText());
    }
    return ((ElementSelector) selector).selectList(getDocument());
}
/**
 * Selects a single value using the given selector.
 *
 * <p>An {@code ElementSelector} is applied to the value of
 * {@code getDocument()}; any other selector is applied to the value of
 * {@code getFirstSourceText()}.
 *
 * @param selector the selector to apply
 * @return the selected value, as returned by the selector
 */
public String selectDocument(Selector selector) {
    if (!(selector instanceof ElementSelector)) {
        return selector.select(getFirstSourceText());
    }
    return ((ElementSelector) selector).select(getDocument());
}