import be.nikiroo.gofetch.data.Comment;
import be.nikiroo.gofetch.data.Story;
+/**
+ * Supports <a href="http://www.lemonde.fr/">http://www.lemonde.fr/</a>.
+ *
+ * @author niki
+ */
public class LeMonde extends BasicSupport {
@Override
public String getDescription() {
for (String topic : new String[] { "international", "politique",
"societe", "sciences" }) {
URL url = new URL("http://www.lemonde.fr/" + topic + "/1.html");
- InputStream in = open(url);
+ InputStream in = downloader.open(url);
Document doc = DataUtil.load(in, "UTF-8", url.toString());
Elements articles = doc.getElementsByTag("article");
for (Element article : articles) {
&& contentElements.size() > 0) {
String id = times.get(0).attr("datetime").replace(":", "_")
.replace("+", "_");
- String title = "[" + topic + "] "
- + titleElements.get(0).text();
+ String title = titleElements.get(0).text();
+ String date = date(titleElements.get(0).text());
String content = contentElements.get(0).text();
String intUrl = "";
String extUrl = "";
+ String author = "";
String details = "";
Elements detailsElements = article
.getElementsByClass("signature");
if (detailsElements.size() > 0) {
- details = detailsElements.get(0).text();
+ author = detailsElements.get(0).text();
}
Elements links = titleElements.get(0).getElementsByTag("a");
if (links.size() > 0) {
intUrl = links.get(0).absUrl("href");
- list.add(new Story(getType(), id, title, details,
- intUrl, extUrl, content));
+ list.add(new Story(getType(), id, title, author, date,
+ topic, details, intUrl, extUrl, content));
}
}
}
// some javascript, I need to check...)
URL url = new URL(story.getUrlInternal());
- InputStream in = open(url);
+ InputStream in = downloader.open(url);
Document doc = DataUtil.load(in, "UTF-8", url.toString());
Element article = doc.getElementById("articleBody");
if (article != null) {
- for (String line : toLines(article, new QuoteProcessor() {
- @Override
- public String processText(String text) {
- return text;
- }
-
+ for (String line : toLines(article, new BasicElementProcessor() {
@Override
public boolean ignoreNode(Node node) {
if (node instanceof Element) {
return false;
}
- @Override
- public boolean detectQuote(Node node) {
- return false;
- }
-
@Override
public String manualProcessing(Node node) {
if (node instanceof Element) {