1 package be
.nikiroo
.fanfix
.supported
;
3 import java
.io
.IOException
;
4 import java
.io
.InputStream
;
5 import java
.net
.MalformedURLException
;
7 import java
.text
.SimpleDateFormat
;
8 import java
.util
.AbstractMap
;
9 import java
.util
.ArrayList
;
10 import java
.util
.Date
;
11 import java
.util
.List
;
12 import java
.util
.Map
.Entry
;
13 import java
.util
.Scanner
;
15 import be
.nikiroo
.fanfix
.Instance
;
16 import be
.nikiroo
.fanfix
.bundles
.Config
;
17 import be
.nikiroo
.fanfix
.data
.MetaData
;
18 import be
.nikiroo
.utils
.Image
;
19 import be
.nikiroo
.utils
.Progress
;
20 import be
.nikiroo
.utils
.StringUtils
;
23 * Support class for <a href="http://www.fanfiction.net/">Faniction.net</a>
24 * stories, a website dedicated to fanfictions of many, many different
25 * universes, from TV shows to novels to games.
29 class Fanfiction
extends BasicSupport_Deprecated
{
31 protected boolean isHtml() {
36 protected MetaData
getMeta(URL source
, InputStream in
) throws IOException
{
37 MetaData meta
= new MetaData();
39 meta
.setTitle(getTitle(reset(in
)));
40 meta
.setAuthor(getAuthor(reset(in
)));
41 meta
.setDate(getDate(reset(in
)));
42 meta
.setTags(getTags(reset(in
)));
43 meta
.setSource(getType().getSourceName());
44 meta
.setUrl(source
.toString());
45 meta
.setPublisher(getType().getSourceName());
46 meta
.setUuid(source
.toString());
48 meta
.setLang("en"); // TODO!
49 meta
.setSubject(getSubject(reset(in
)));
50 meta
.setType(getType().toString());
51 meta
.setImageDocument(false);
52 meta
.setCover(getCover(source
, reset(in
)));
57 private String
getSubject(InputStream in
) {
58 String line
= getLine(in
, "id=pre_story_links", 0);
60 int pos
= line
.lastIndexOf('"');
62 line
= line
.substring(pos
+ 1);
63 pos
= line
.indexOf('<');
65 return StringUtils
.unhtml(line
.substring(0, pos
)).trim();
73 private List
<String
> getTags(InputStream in
) {
74 List
<String
> tags
= new ArrayList
<String
>();
76 String key
= "title=\"Send Private Message\"";
77 String line
= getLine(in
, key
, 2);
80 int pos
= line
.indexOf(key
);
82 line
= line
.substring(pos
+ key
.length());
84 pos
= line
.indexOf(key
);
86 line
= line
.substring(0, pos
);
87 line
= StringUtils
.unhtml(line
).trim();
88 if (line
.endsWith("-")) {
89 line
= line
.substring(0, line
.length() - 1);
92 for (String tag
: line
.split("-")) {
93 tags
.add(StringUtils
.unhtml(tag
).trim());
102 private String
getTitle(InputStream in
) {
104 @SuppressWarnings("resource")
105 Scanner scan
= new Scanner(in
, "UTF-8");
106 scan
.useDelimiter("\\n");
107 while (scan
.hasNext()) {
108 String line
= scan
.next();
109 if (line
.contains("xcontrast_txt")) {
111 line
= StringUtils
.unhtml(line
).trim();
112 if (line
.startsWith("Follow/Fav")) {
113 line
= line
.substring("Follow/Fav".length()).trim();
116 return StringUtils
.unhtml(line
).trim();
124 private String
getAuthor(InputStream in
) {
125 String author
= null;
128 @SuppressWarnings("resource")
129 Scanner scan
= new Scanner(in
, "UTF-8");
130 scan
.useDelimiter("\\n");
131 while (scan
.hasNext()) {
132 String line
= scan
.next();
133 if (line
.contains("xcontrast_txt")) {
135 author
= StringUtils
.unhtml(line
).trim();
141 return bsHelper
.fixAuthor(author
);
144 private String
getDate(InputStream in
) {
145 String key
= "Published: <span data-xutime='";
146 String line
= getLine(in
, key
, 0);
148 int pos
= line
.indexOf(key
);
150 line
= line
.substring(pos
+ key
.length());
151 pos
= line
.indexOf('\'');
153 line
= line
.substring(0, pos
).trim();
155 SimpleDateFormat sdf
= new SimpleDateFormat(
158 .format(new Date(1000 * Long
.parseLong(line
)));
159 } catch (NumberFormatException e
) {
160 Instance
.getTraceHandler().error(
162 "Cannot convert publication date: "
173 protected String
getDesc(URL source
, InputStream in
) {
174 return getLine(in
, "title=\"Send Private Message\"", 1);
177 private Image
getCover(URL url
, InputStream in
) {
178 String key
= "class='cimage";
179 String line
= getLine(in
, key
, 0);
181 int pos
= line
.indexOf(key
);
183 line
= line
.substring(pos
+ key
.length());
185 pos
= line
.indexOf(key
);
187 line
= line
.substring(pos
+ key
.length());
188 pos
= line
.indexOf('\'');
190 line
= line
.substring(0, pos
);
191 if (line
.startsWith("//")) {
192 line
= url
.getProtocol() + "://"
194 } else if (line
.startsWith("//")) {
195 line
= url
.getProtocol() + "://" + url
.getHost()
196 + "/" + line
.substring(1);
198 line
= url
.getProtocol() + "://" + url
.getHost()
199 + "/" + url
.getPath() + "/" + line
;
202 return getImage(this, null, line
);
212 protected List
<Entry
<String
, URL
>> getChapters(URL source
, InputStream in
,
214 List
<Entry
<String
, URL
>> urls
= new ArrayList
<Entry
<String
, URL
>>();
216 String base
= source
.toString();
217 int pos
= base
.lastIndexOf('/');
218 String suffix
= base
.substring(pos
); // including '/' at start
219 base
= base
.substring(0, pos
);
220 if (base
.endsWith("/1")) {
221 base
= base
.substring(0, base
.length() - 1); // including '/' at end
224 String line
= getLine(in
, "id=chap_select", 0);
225 String key
= "<option value=";
229 for (pos
= line
.indexOf(key
); pos
>= 0; pos
= line
230 .indexOf(key
, pos
), i
++) {
231 pos
= line
.indexOf('>', pos
);
233 int endOfName
= line
.indexOf('<', pos
);
234 if (endOfName
>= 0) {
235 String name
= line
.substring(pos
+ 1, endOfName
);
236 String chapNum
= i
+ ".";
237 if (name
.startsWith(chapNum
)) {
238 name
= name
.substring(chapNum
.length(),
243 urls
.add(new AbstractMap
.SimpleEntry
<String
, URL
>(
244 name
.trim(), new URL(base
+ i
+ suffix
)));
245 } catch (MalformedURLException e
) {
246 Instance
.getTraceHandler()
247 .error(new IOException(
248 "Cannot parse chapter " + i
250 + (base
+ i
+ suffix
), e
));
257 final String chapName
= getTitle(reset(in
));
258 final URL chapURL
= source
;
259 urls
.add(new Entry
<String
, URL
>() {
261 public URL
setValue(URL value
) {
266 public URL
getValue() {
271 public String
getKey() {
281 protected String
getChapterContent(URL source
, InputStream in
, int number
,
283 StringBuilder builder
= new StringBuilder();
284 String startAt
= "class='storytext ";
285 String endAt1
= "function review_init";
286 String endAt2
= "id=chap_select";
289 @SuppressWarnings("resource")
290 Scanner scan
= new Scanner(in
, "UTF-8");
291 scan
.useDelimiter("\\n");
292 while (scan
.hasNext()) {
293 String line
= scan
.next();
294 if (!ok
&& line
.contains(startAt
)) {
296 } else if (ok
&& (line
.contains(endAt1
) || line
.contains(endAt2
))) {
302 // First line may contain the title and chap name again
303 if (builder
.length() == 0) {
304 int pos
= line
.indexOf("<hr");
306 boolean chaptered
= false;
307 for (String lang
: Instance
.getConfig().getList(
308 Config
.CONF_CHAPTER
)) {
309 String chapterWord
= Instance
.getConfig()
310 .getStringX(Config
.CONF_CHAPTER
, lang
);
311 int posChap
= line
.indexOf(chapterWord
+ " ");
319 line
= line
.substring(pos
);
324 builder
.append(line
);
329 return builder
.toString();
333 protected boolean supports(URL url
) {
334 return "fanfiction.net".equals(url
.getHost())
335 || "www.fanfiction.net".equals(url
.getHost());