import java.net.URL;
import java.nio.charset.StandardCharsets;
import java.nio.file.Files;
+import java.security.KeyManagementException;
+import java.security.NoSuchAlgorithmException;
+import java.security.cert.X509Certificate;
import java.util.ArrayList;
import java.util.Comparator;
+import java.util.Date;
+import java.util.HashMap;
+import java.util.HashSet;
import java.util.List;
+import java.util.Map;
+import java.util.Set;
+import java.util.logging.Logger;
+
+import javax.net.ssl.SSLContext;
+import javax.net.ssl.TrustManager;
+import javax.net.ssl.X509TrustManager;
+
+import org.jsoup.Jsoup;
import com.rometools.rome.feed.synd.SyndEnclosure;
import com.rometools.rome.feed.synd.SyndEntry;
import com.rometools.rome.io.FeedException;
import com.rometools.rome.io.SyndFeedInput;
import com.rometools.rome.io.XmlReader;
-import com.sun.xml.internal.ws.policy.privateutil.PolicyUtils.Collections;
-
-import org.jsoup.*;
public class Main {
+ private static final Logger LOG = Logger.getLogger(Main.class.getName());
+
+ static {
+ TrustManager[] mgrs;
+ SSLContext sc;
+
+ mgrs = new TrustManager[]{
+ new X509TrustManager() {
+ public java.security.cert.X509Certificate[] getAcceptedIssuers() {
+ return null;
+ }
+
+ public void checkClientTrusted(X509Certificate[] certs, String authType) {
+ }
+
+ public void checkServerTrusted(X509Certificate[] certs, String authType) {
+ }
+ }
+ };
+
+ try {
+ sc = SSLContext.getInstance("SSL");
+ sc.init(null, mgrs, new java.security.SecureRandom());
+ SSLContext.setDefault(sc);
+ } catch (NoSuchAlgorithmException | KeyManagementException e) {
+ e.printStackTrace();
+ }
+ }
+
private static void addArticles(Category cat, SyndFeed feed, List<Article> articles) {
String thumbnail;
String desc;
+ Date date;
for (SyndEntry entry: feed.getEntries()) {
thumbnail = null;
thumbnail = e.getUrl();
break;
}
-
-
+
+ if (entry.getDescription() != null) {
+ desc = Jsoup.parse(entry.getDescription().getValue()).text();
+ } else {
+ desc = null;
+ LOG.severe("No description for " + feed.getTitle() + " - " + entry.getTitle());
+ }
- desc = Jsoup.parse(entry.getDescription().getValue()).text();
+ date = entry.getPublishedDate();
+ if (date == null)
+ date = entry.getUpdatedDate();
articles.add(new Article(entry.getLink(),
cat,
entry.getTitle(),
desc,
thumbnail,
- entry.getPublishedDate(),
+ date,
feed.getTitle()));
}
}
}
}
+ private static Map<Category, String[]> getFeeds() {
+ Map<Category, String[]> result;
+
+ result = new HashMap<>();
+
+ result.put(Category.TOP,
+ new String[] {
+ "http://www.francetvinfo.fr/titres.rss",
+ "http://www.france24.com/fr/actualites/rss",
+ "https://www.franceinter.fr/rss/a-la-une.xml",
+ "http://www.rfi.fr/general/rss",
+ "http://www.cnews.fr/rss/une",
+ "http://www.bfmtv.com/rss/info/flux-rss/flux-toutes-les-actualites/"
+ });
+
+ result.put(Category.SPORT,
+ new String[] { "http://www.france24.com/fr/sports/rss" });
+
+ result.put(Category.FRANCE,
+ new String[] { "http://www.france24.com/fr/france/rss",
+ "http://www.rfi.fr/france/rss"});
+
+ result.put(Category.EUROPE,
+ new String[] { "http://www.france24.com/fr/europe/rss" });
+
+ result.put(Category.ECO,
+ new String[] { "http://www.france24.com/fr/economie/rss",
+ "http://www.rfi.fr/economie/rss" });
+
+ result.put(Category.ESSONNE,
+ new String[] { "https://www.essonneinfo.fr/feed/" });
+
+ result.put(Category.TECHNOLOGIE,
+ new String[] { "http://feeds.feedburner.com/lesnumeriques/news",
+ "http://www.zdnet.fr/feeds/rss/actualites/"});
+
+ return result;
+ }
+
private static List<Article> getArticles(Category cat) throws IllegalArgumentException, MalformedURLException, FeedException, IOException {
List<Article> articles;
+ String[] feeds;
+ Set<String> links;
articles = new ArrayList<>();
- switch (cat) {
- case TOP:
- addArticles(cat, getSyndFeed("http://www.france24.com/fr/actualites/rss"), articles);
- addArticles(cat, getSyndFeed("http://www.bfmtv.com/rss/info/flux-rss/flux-toutes-les-actualites/"), articles);
- break;
- case SPORT:
- addArticles(cat, getSyndFeed("http://www.france24.com/fr/sports/rss"), articles);
- break;
- case FRANCE:
- addArticles(cat, getSyndFeed("http://www.france24.com/fr/france/rss"), articles);
- break;
- case EUROPE:
- addArticles(cat, getSyndFeed("http://www.france24.com/fr/europe/rss"), articles);
- break;
- case ECO:
- addArticles(cat, getSyndFeed("http://www.france24.com/fr/economie/rss"), articles);
- break;
- default:
- throw new IllegalArgumentException();
+ feeds = getFeeds().get(cat);
+
+ if (feeds != null)
+ for (String str: feeds)
+ addArticles(cat, getSyndFeed(str), articles);
+ else
+ LOG.severe("No feed for category " + cat);
+
+ links = new HashSet<>(articles.size());
+ for (Article a: articles) {
+ if (links.contains(a.link))
+ LOG.severe(a.link + "is not uniq");
+ else
+ links.add(a.link);
}
articles.sort(new Comparator<Article> () {
articles = getArticles(cat);
- html = HTML.toHTML(articles);
+ html = HTML.toHTML(articles, cat);
f = new File(cat.getId() + ".html");