Package org.jsoup.select

Examples of org.jsoup.select.Elements.first()


                    blockingId);
            Elements parentSnippetSearch = doc.select(parentSelector);
            if (parentSnippetSearch.isEmpty()) {
                isBlocked = false;
            } else {
                Element parentSnippet = parentSnippetSearch.first();
                if (parentSnippet.attr(ExtNodeConstants.SNIPPET_NODE_ATTR_STATUS)
                        .equals(ExtNodeConstants.SNIPPET_NODE_ATTR_STATUS_FINISHED)) {
                    isBlocked = false;
                } else {
                    isBlocked = true;
View Full Code Here


      el = ((ElementWrapper) docOrElement).el;
    }
    final Elements elements = el.select(selectStatement);

    if (elements.size() == 1)
      return ParseResult.success(tokens.replaceWithTokens(templatePos, templatePos+template.size(), new ElementWrapper(elements.first())));
    else {
      final List<Object> elementList = Lists.newArrayListWithCapacity(elements.size());
      for (final Element e : elements) {
        elementList.add(new ElementWrapper(e));
      }
View Full Code Here

  }

  @Override
  public String getTitle() {
    Elements elements = jsoupDocument.getElementsByTag("title");
    Element titleElement = elements.first();
    if(titleElement == null)
      return null;
    else
      return titleElement.text();
  }
View Full Code Here

  }

  @Override
  public HTMLElement getBody() {
    Elements elements = jsoupDocument.getElementsByTag("body");
    Element bodyElement = elements.first();
    if(bodyElement == null)
      return null;
    else
      return new HTMLElementImpl(bodyElement, this);
  }
View Full Code Here

        Document doc = Http.url(url).get();
        Elements videos = doc.select("source#mp4source");
        if (videos.size() == 0) {
            throw new IOException("Could not find source#mp4source at " + url);
        }
        String vidUrl = videos.first().attr("src");
        if (vidUrl.startsWith("//")) {
            vidUrl = "http:" + vidUrl;
        }
        return vidUrl;
    }
View Full Code Here

        Document doc = Http.url(this.url).get();
        Elements videos = doc.select("meta[name=twitter:player:stream]");
        if (videos.size() == 0) {
            throw new IOException("Could not find twitter:player:stream at " + url);
        }
        String vidUrl = videos.first().attr("content");
        vidUrl = vidUrl.replaceAll("&amp;", "&");
        addURLToDownload(new URL(vidUrl), HOST + "_" + getGID(this.url));
        waitForThreads();
    }
}
View Full Code Here

    }

    /**
     * Reads the comma-separated {@code value} attribute of the
     * {@code #ContentPlaceHolder1_thumbs} element and processes each non-blank
     * entry (presumably into image URLs; the rest of the loop is not visible
     * in this excerpt).
     *
     * @param doc the parsed page to inspect
     */
    private static List<String> getURLsFromPageStatic(Document doc) {
        List<String> imageURLs = new ArrayList<String>();
        Elements els = doc.select("#ContentPlaceHolder1_thumbs");
        // NOTE(review): Elements.first() returns null for an empty selection, so this
        // line throws NullPointerException when the element is missing; confirm
        // whether callers guarantee it is present.
        String thumbs = els.first().attr("value");
        for (String thumb : thumbs.split(",")) {
            // Skip blank entries (e.g. produced by consecutive commas).
            if (thumb.trim().equals("")) {
                continue;
            }
            // Remove every underscore followed by 3-5 ASCII letters from the entry.
            thumb = thumb.replaceAll("_[a-zA-Z]{3,5}", "");
View Full Code Here

        Document doc = Http.url(url).get();
        Elements videos = doc.select("video");
        if (videos.size() == 0) {
            throw new IOException("Could not find Embed code at " + url);
        }
        String vidUrl = videos.first().attr("file");
        addURLToDownload(new URL(vidUrl), HOST + "_" + getGID(this.url));
        waitForThreads();
    }
}
View Full Code Here

                Elements images = doc.select("a > img");
                if (images.size() == 0) {
                    logger.warn("Image not found at " + this.url);
                    return;
                }
                Element image = images.first();
                String imgsrc = image.attr("src");
                imgsrc = "http://" + this.url.getHost() + "/" + imgsrc;
                // Provide prefix and let the AbstractRipper "guess" the filename
                String prefix = "";
                if (Utils.getConfigBoolean("download.save_order", true)) {
View Full Code Here

    @Override
    public Document getNextPage(Document doc) throws IOException {
        // Find next page
        Elements nextPageUrl = doc.select("td[align=right] form");
        String nextUrl = urlBase+nextPageUrl.first().attr("action");
        if (nextPageUrl.size() == 0) {
            throw new IOException("No more pages");
        }
        sleep(500);
        Document nextPage = Http.url(nextUrl).cookies(cookies).get();
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.