Version 1.1.0
[fanfix.git] / src / be / nikiroo / fanfix / supported / E621.java
CommitLineData
08fe2e33
NR
1package be.nikiroo.fanfix.supported;
2
595dfa7a 3import java.awt.image.BufferedImage;
08fe2e33
NR
4import java.io.IOException;
5import java.io.InputStream;
6import java.net.URL;
7import java.util.ArrayList;
8import java.util.List;
9import java.util.Map.Entry;
10import java.util.Scanner;
11
12import be.nikiroo.fanfix.Instance;
13import be.nikiroo.fanfix.data.Chapter;
68686a37 14import be.nikiroo.fanfix.data.MetaData;
08fe2e33
NR
15import be.nikiroo.fanfix.data.Story;
16import be.nikiroo.utils.StringUtils;
92fb0719 17import be.nikiroo.utils.ui.Progress;
08fe2e33
NR
18
19/**
20 * Support class for <a href="http://e621.net/">e621.net</a> and <a
21 * href="http://e926.net/">e926.net</a>, a Furry website supporting comics,
22 * including some of MLP.
23 * <p>
24 * <a href="http://e926.net/">e926.net</a> only shows the "clean" images and
25 * comics, but it can be difficult to browse.
26 *
27 * @author niki
28 */
29class E621 extends BasicSupport {
30 @Override
31 public String getSourceName() {
32 return "e621.net";
33 }
34
35 @Override
68686a37
NR
36 protected MetaData getMeta(URL source, InputStream in) throws IOException {
37 MetaData meta = new MetaData();
38
39 meta.setTitle(getTitle(reset(in)));
40 meta.setAuthor(getAuthor(source, reset(in)));
41 meta.setDate("");
42 meta.setTags(new ArrayList<String>()); // TODDO ???
43 meta.setSource(getSourceName());
2206ef66 44 meta.setUrl(source.toString());
68686a37
NR
45 meta.setPublisher(getSourceName());
46 meta.setUuid(source.toString());
47 meta.setLuid("");
48 meta.setLang("EN");
49 meta.setSubject("");
50 meta.setType(getType().toString());
51 meta.setImageDocument(true);
595dfa7a 52 meta.setCover(getCover(source));
68686a37
NR
53
54 return meta;
08fe2e33
NR
55 }
56
57 @Override
92fb0719 58 public Story process(URL url, Progress pg) throws IOException {
08fe2e33 59 // There is no chapters on e621, just pagination...
92fb0719 60 Story story = super.process(url, pg);
08fe2e33
NR
61
62 Chapter only = new Chapter(1, null);
63 for (Chapter chap : story) {
64 only.getParagraphs().addAll(chap.getParagraphs());
65 }
66
67 story.getChapters().clear();
68 story.getChapters().add(only);
69
70 return story;
71 }
72
73 @Override
74 protected boolean supports(URL url) {
75 String host = url.getHost();
76 if (host.startsWith("www.")) {
77 host = host.substring("www.".length());
78 }
79
80 return ("e621.net".equals(host) || "e926.net".equals(host))
81 && url.getPath().startsWith("/pool/");
82 }
83
84 @Override
85 protected boolean isHtml() {
86 return true;
87 }
88
595dfa7a
NR
89 private BufferedImage getCover(URL source) throws IOException {
90 InputStream in = Instance.getCache().open(source, this, true);
91 String images = getChapterContent(new URL(source.toString() + "?page="
92 + 1), in, 1);
93 if (!images.isEmpty()) {
94 int pos = images.indexOf('\n');
95 if (pos >= 0) {
96 images = images.substring(1, pos - 1);
97 return getImage(this, null, images);
98 }
99 }
100
101 return null;
102 }
103
68686a37 104 private String getAuthor(URL source, InputStream in) throws IOException {
08fe2e33
NR
105 String author = getLine(in, "href=\"/post/show/", 0);
106 if (author != null) {
107 String key = "href=\"";
108 int pos = author.indexOf(key);
109 if (pos >= 0) {
110 author = author.substring(pos + key.length());
111 pos = author.indexOf("\"");
112 if (pos >= 0) {
113 author = author.substring(0, pos - 1);
114 String page = source.getProtocol() + "://"
115 + source.getHost() + author;
08fe2e33 116 try {
7d0d2be6
NR
117 InputStream pageIn = Instance.getCache().open(
118 new URL(page), this, false);
119 try {
120 key = "class=\"tag-type-artist\"";
121 author = getLine(pageIn, key, 0);
122 if (author != null) {
123 pos = author.indexOf("<a href=\"");
08fe2e33 124 if (pos >= 0) {
7d0d2be6
NR
125 author = author.substring(pos);
126 pos = author.indexOf("</a>");
127 if (pos >= 0) {
128 author = author.substring(0, pos);
129 return StringUtils.unhtml(author);
130 }
08fe2e33
NR
131 }
132 }
7d0d2be6
NR
133 } finally {
134 pageIn.close();
08fe2e33 135 }
7d0d2be6
NR
136 } catch (Exception e) {
137 // No author found
08fe2e33
NR
138 }
139 }
140 }
141 }
142
143 return null;
144 }
145
68686a37 146 private String getTitle(InputStream in) throws IOException {
08fe2e33
NR
147 String title = getLine(in, "<title>", 0);
148 if (title != null) {
149 int pos = title.indexOf('>');
150 if (pos >= 0) {
151 title = title.substring(pos + 1);
152 pos = title.indexOf('<');
153 if (pos >= 0) {
154 title = title.substring(0, pos);
155 }
156 }
157
158 if (title.startsWith("Pool:")) {
159 title = title.substring("Pool:".length());
160 }
161
68686a37 162 title = StringUtils.unhtml(title).trim();
08fe2e33
NR
163 }
164
165 return title;
166 }
167
168 @Override
169 protected String getDesc(URL source, InputStream in) throws IOException {
170 String desc = getLine(in, "margin-bottom: 2em;", 0);
171
172 if (desc != null) {
173 StringBuilder builder = new StringBuilder();
174
175 boolean inTags = false;
176 for (char car : desc.toCharArray()) {
177 if ((inTags && car == '>') || (!inTags && car == '<')) {
178 inTags = !inTags;
179 }
180
181 if (inTags) {
182 builder.append(car);
183 }
184 }
185
186 return builder.toString().trim();
187 }
188
189 return null;
190 }
191
192 @Override
193 protected List<Entry<String, URL>> getChapters(URL source, InputStream in)
194 throws IOException {
195 List<Entry<String, URL>> urls = new ArrayList<Entry<String, URL>>();
196 int last = 1; // no pool/show when only one page
197
198 @SuppressWarnings("resource")
199 Scanner scan = new Scanner(in, "UTF-8");
200 scan.useDelimiter("\\n");
201 while (scan.hasNext()) {
202 String line = scan.next();
203 for (int pos = line.indexOf(source.getPath()); pos >= 0; pos = line
204 .indexOf(source.getPath(), pos + source.getPath().length())) {
205 int equalPos = line.indexOf("=", pos);
206 int quotePos = line.indexOf("\"", pos);
207 if (equalPos >= 0 && quotePos > equalPos) {
208 String snum = line.substring(equalPos + 1, quotePos);
209 try {
210 int num = Integer.parseInt(snum);
211 if (num > last) {
212 last = num;
213 }
214 } catch (NumberFormatException e) {
215 }
216 }
217 }
218 }
219
220 for (int i = 1; i <= last; i++) {
221 final String key = Integer.toString(i);
222 final URL value = new URL(source.toString() + "?page=" + i);
223 urls.add(new Entry<String, URL>() {
224 public URL setValue(URL value) {
225 return null;
226 }
227
228 public URL getValue() {
229 return value;
230 }
231
232 public String getKey() {
233 return key;
234 }
235 });
236 }
237
238 return urls;
239 }
240
241 @Override
242 protected String getChapterContent(URL source, InputStream in, int number)
243 throws IOException {
244 StringBuilder builder = new StringBuilder();
245 String staticSite = "https://static1.e621.net";
246 if (source.getHost().contains("e926")) {
247 staticSite = staticSite.replace("e621", "e926");
248 }
249
250 String key = staticSite + "/data/preview/";
251
252 @SuppressWarnings("resource")
253 Scanner scan = new Scanner(in, "UTF-8");
254 scan.useDelimiter("\\n");
255 while (scan.hasNext()) {
256 String line = scan.next();
d98a2900 257 if (line.contains("class=\"preview")) {
08fe2e33
NR
258 for (int pos = line.indexOf(key); pos >= 0; pos = line.indexOf(
259 key, pos + key.length())) {
260 int endPos = line.indexOf("\"", pos);
261 if (endPos >= 0) {
262 String id = line.substring(pos + key.length(), endPos);
263 id = staticSite + "/data/" + id;
264
265 int dotPos = id.lastIndexOf(".");
266 if (dotPos >= 0) {
267 id = id.substring(0, dotPos);
268 builder.append("[");
269 builder.append(id);
270 builder.append("]\n");
271 }
272 }
273 }
274 }
275 }
276
277 return builder.toString();
278 }
279}