View Javadoc

1   /**
2    * This file Copyright (c) 2008-2010 Magnolia International
3    * Ltd.  (http://www.magnolia-cms.com). All rights reserved.
4    *
5    *
6    * This file is dual-licensed under both the Magnolia
7    * Network Agreement and the GNU General Public License.
8    * You may elect to use one or the other of these licenses.
9    *
10   * This file is distributed in the hope that it will be
11   * useful, but AS-IS and WITHOUT ANY WARRANTY; without even the
12   * implied warranty of MERCHANTABILITY or FITNESS FOR A
13   * PARTICULAR PURPOSE, TITLE, or NONINFRINGEMENT.
14   * Redistribution, except as permitted by whichever of the GPL
15   * or MNA you select, is prohibited.
16   *
17   * 1. For the GPL license (GPL), you can redistribute and/or
18   * modify this file under the terms of the GNU General
19   * Public License, Version 3, as published by the Free Software
20   * Foundation.  You should have received a copy of the GNU
21   * General Public License, Version 3 along with this program;
22   * if not, write to the Free Software Foundation, Inc., 51
23   * Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
24   *
25   * 2. For the Magnolia Network Agreement (MNA), this file
26   * and the accompanying materials are made available under the
27   * terms of the MNA which accompanies this distribution, and
28   * is available at http://www.magnolia-cms.com/mna.html
29   *
30   * Any modifications to this file must keep this entire header
31   * intact.
32   *
33   */
34  package info.magnolia.module.rssaggregator.importhandler;
35  
36  import com.sun.syndication.feed.synd.SyndFeed;
37  import com.sun.syndication.fetcher.FeedFetcher;
38  import com.sun.syndication.fetcher.impl.FeedFetcherCache;
39  import com.sun.syndication.fetcher.impl.HashMapFeedInfoCache;
40  import com.sun.syndication.fetcher.impl.HttpURLFeedFetcher;
41  import org.slf4j.Logger;
42  import org.slf4j.LoggerFactory;
43  
44  import java.net.URL;
45  import java.util.Set;
46  
47  /**
48   * A simple single threaded {@link RSSFeedFetcher} for feed retrieval <code>http</code> that follows redirects and
49   * supports conditional gets. <p/> Will attempt to fetch all {@link FeedChannel feed channels} defined in the provided
50   * {@link AggregateFeed aggregate feeds}. Failures to fetch a feed result for a given feed channel are logged at ERROR
51   * level. <p/> Because of the single threaded nature of this implementation, it is suited for situations where the
52   * number feed channels to retrieve is small and the time window between update checks is large enough. <p/> For more
53   * demanding situations, use a more performant RSSFeedFetcher implementation.
54   *
55   * @author Rob van der Linden Vooren
56   * @see RSSFeedFetcher
57   */
58  public class SimpleRSSFeedFetcher implements RSSFeedFetcher {
59  
60      private final FeedFetcherCache feedInfoCache;
61  
62      private static final Logger log = LoggerFactory.getLogger(SimpleRSSFeedFetcher.class);
63  
64      public SimpleRSSFeedFetcher() {
65          this.feedInfoCache = HashMapFeedInfoCache.getInstance();
66      }
67  
68      public Set<AggregateFeed> fetchAggregateFeeds(Set<AggregateFeed> aggregateFeeds) {
69          for (AggregateFeed aggregateFeed : aggregateFeeds) {
70              for (FeedChannel channel : aggregateFeed.getChannels()) {
71                  log.debug("Fetching feed channel '{}' for aggregateFeed '{}'", channel.getUrl(), aggregateFeed.getName());
72                  SyndFeed feed = fetchFeedChannel(channel);
73                  if (feed == null) {
74                      continue;
75                  }
76                  channel.setFeed(feed);
77              }
78          }
79          return aggregateFeeds;
80      }
81  
82      //  Helper methods
83  
84      /**
85       * Fetch the given feed channel. A failed fetch results in a <code>null</code> {@link FeedChannel#feed feed}
86       * property set.
87       *
88       * @param channel the feed channel to fetch
89       * @return the feed channel with its {@link FeedChannel#feed feed} property set to the result of the fetch
90       */
91      protected SyndFeed fetchFeedChannel(FeedChannel channel) {
92          try {
93              final FeedFetcher fetcher = new HttpURLFeedFetcher(feedInfoCache);
94              return fetcher.retrieveFeed(new URL(channel.getUrl()));
95          } catch (Exception e) {
96              log.error("Failed to store fetch result for channel '{}': {}", new Object[] {channel, e});
97              return null;
98          }
99      }
100 }