Package org.apache.nutch.parse.rss.structs

Examples of org.apache.nutch.parse.rss.structs.RSSItem


                }

                // now get the descriptions of all the underlying RSS Items and
                // then index them too
                for (int j = 0; j < r.getItems().size(); j++) {
                    RSSItem theRSSItem = (RSSItem) r.getItems().get(j);
                    indexText.append(theRSSItem.getDescription());
                    indexText.append(" ");

                    String whichLink = null;

                    if (theRSSItem.getPermalink() != null)
                        whichLink = theRSSItem.getPermalink();
                    else
                        whichLink = theRSSItem.getLink();

                    if (whichLink != null) {
                        try {
          if (theRSSItem.getDescription()!=null) {
        theOutlinks.add(new Outlink(whichLink, theRSSItem.getDescription(), getConf()));
          } else {
        theOutlinks.add(new Outlink(whichLink, "", getConf()));
          }
                        } catch (MalformedURLException e) {
                            if (LOG.isWarnEnabled()) {
View Full Code Here


            String description, String permalink) throws FeedParserException {

        //System.out.println("Found a new published article: " + permalink);
        if (fCurrentChannel != null) { //should never be null
            fCurrentChannel.getItems().add(
                    new RSSItem(title, link, description, permalink));
        }

    }
View Full Code Here

                }

                // now get the descriptions of all the underlying RSS Items and
                // then index them too
                for (int j = 0; j < r.getItems().size(); j++) {
                    RSSItem theRSSItem = (RSSItem) r.getItems().get(j);
                    indexText.append(theRSSItem.getDescription());
                    indexText.append(" ");

                    String whichLink = null;

                    if (theRSSItem.getPermalink() != null)
                        whichLink = theRSSItem.getPermalink();
                    else
                        whichLink = theRSSItem.getLink();

                    if (whichLink != null) {
                        try {
          if (theRSSItem.getDescription()!=null) {
        theOutlinks.add(new Outlink(whichLink, theRSSItem.getDescription()));
          } else {
        theOutlinks.add(new Outlink(whichLink, ""));
          }
                        } catch (MalformedURLException e) {
                            if (LOG.isWarnEnabled()) {
View Full Code Here

            String description, String permalink) throws FeedParserException {

        //System.out.println("Found a new published article: " + permalink);
        if (fCurrentChannel != null) { //should never be null
            fCurrentChannel.getItems().add(
                    new RSSItem(title, link, description, permalink));
        }

    }
View Full Code Here

                }

                // now get the descriptions of all the underlying RSS Items and
                // then index them too
                for (int j = 0; j < r.getItems().size(); j++) {
                    RSSItem theRSSItem = (RSSItem) r.getItems().get(j);
                    indexText.append(theRSSItem.getDescription());
                    indexText.append(" ");

                    String whichLink = null;

                    if (theRSSItem.getPermalink() != null)
                        whichLink = theRSSItem.getPermalink();
                    else
                        whichLink = theRSSItem.getLink();

                    if (whichLink != null) {
                        try {
          if (theRSSItem.getDescription()!=null) {
        theOutlinks.add(new Outlink(whichLink, theRSSItem.getDescription()));
          } else {
        theOutlinks.add(new Outlink(whichLink, ""));
          }
                        } catch (MalformedURLException e) {
                            LOG.info("nutch:parse-rss:RSSParser Exception: MalformedURL: "
View Full Code Here

                }

                // now get the descriptions of all the underlying RSS Items and
                // then index them too
                for (int j = 0; j < r.getItems().size(); j++) {
                    RSSItem theRSSItem = (RSSItem) r.getItems().get(j);
                    indexText.append(theRSSItem.getDescription());
                    indexText.append(" ");

                    String whichLink = null;

                    if (theRSSItem.getPermalink() != null)
                        whichLink = theRSSItem.getPermalink();
                    else
                        whichLink = theRSSItem.getLink();

                    if (whichLink != null) {
                        try {
                            theOutlinks.add(new Outlink(whichLink, theRSSItem
                                    .getDescription()));

                        } catch (MalformedURLException e) {
                            LOG
                                    .info("nutch:parse-rss:RSSParser Exception: MalformedURL: "
View Full Code Here

                }

                // now get the descriptions of all the underlying RSS Items and
                // then index them too
                for (int j = 0; j < r.getItems().size(); j++) {
                    RSSItem theRSSItem = (RSSItem) r.getItems().get(j);
                    indexText.append(theRSSItem.getDescription());
                    indexText.append(" ");

                    String whichLink = null;

                    if (theRSSItem.getPermalink() != null)
                        whichLink = theRSSItem.getPermalink();
                    else
                        whichLink = theRSSItem.getLink();

                    if (whichLink != null) {
                        try {
          if (theRSSItem.getDescription()!=null) {
        theOutlinks.add(new Outlink(whichLink, theRSSItem.getDescription(), getConf()));
          } else {
        theOutlinks.add(new Outlink(whichLink, "", getConf()));
          }
                        } catch (MalformedURLException e) {
                            if (LOG.isWarnEnabled()) {
View Full Code Here

            String description, String permalink) throws FeedParserException {

        //System.out.println("Found a new published article: " + permalink);
        if (fCurrentChannel != null) { //should never be null
            fCurrentChannel.getItems().add(
                    new RSSItem(title, link, description, permalink));
        }

    }
View Full Code Here

TOP

Related Classes of org.apache.nutch.parse.rss.structs.RSSItem

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc., and is owned by Oracle Inc. Contact coftware#gmail.com.