Merge branch 'subtree'
[fanfix.git] / src / be / nikiroo / fanfix / supported / Text.java
1 package be.nikiroo.fanfix.supported;
2
3 import java.io.File;
4 import java.io.IOException;
5 import java.io.InputStream;
6 import java.net.URISyntaxException;
7 import java.net.URL;
8 import java.util.AbstractMap;
9 import java.util.ArrayList;
10 import java.util.List;
11 import java.util.Map.Entry;
12 import java.util.Scanner;
13
14 import org.jsoup.nodes.Document;
15
16 import be.nikiroo.fanfix.Instance;
17 import be.nikiroo.fanfix.bundles.Config;
18 import be.nikiroo.fanfix.data.MetaData;
19 import be.nikiroo.utils.Image;
20 import be.nikiroo.utils.ImageUtils;
21 import be.nikiroo.utils.Progress;
22 import be.nikiroo.utils.streams.MarkableFileInputStream;
23
24 /**
25 * Support class for local stories encoded in textual format, with a few rules:
26 * <ul>
27 * <li>The title must be on the first line</li>
28 * <li>The author (preceded by nothing, "by " or "©") must be on the second
29 * line, possibly with the publication date in parenthesis (i.e., "
30 * <tt>By Unknown (3rd October 1998)</tt>")</li>
31 * <li>Chapters must be declared with "<tt>Chapter x</tt>" or "
32 * <tt>Chapter x: NAME OF THE CHAPTER</tt>", where "<tt>x</tt>" is the chapter
33 * number</li>
34 * <li>A description of the story must be given as chapter number 0</li>
35 * <li>A cover may be present, with the same filename but a PNG, JPEG or JPG
36 * extension</li>
37 * </ul>
38 *
39 * @author niki
40 */
41 class Text extends BasicSupport {
42 private File sourceFile;
43 private InputStream in;
44
45 protected File getSourceFile() {
46 return sourceFile;
47 }
48
49 protected InputStream getInput() {
50 if (in != null) {
51 try {
52 in.reset();
53 } catch (IOException e) {
54 Instance.getInstance().getTraceHandler().error(new IOException("Cannot reset the Text stream", e));
55 }
56
57 return in;
58 }
59
60 return null;
61 }
62
63 @Override
64 protected boolean isHtml() {
65 return false;
66 }
67
68 @Override
69 protected Document loadDocument(URL source) throws IOException {
70 try {
71 sourceFile = new File(source.toURI());
72 in = new MarkableFileInputStream(sourceFile);
73 } catch (URISyntaxException e) {
74 throw new IOException("Cannot load the text document: " + source);
75 }
76
77 return null;
78 }
79
80 @Override
81 protected MetaData getMeta() throws IOException {
82 MetaData meta = new MetaData();
83
84 meta.setTitle(getTitle());
85 meta.setAuthor(getAuthor());
86 meta.setDate(bsHelper.formatDate(getDate()));
87 meta.setTags(new ArrayList<String>());
88 meta.setUrl(getSourceFile().toURI().toURL().toString());
89 meta.setUuid(getSourceFile().toString());
90 meta.setLuid("");
91 meta.setLang(getLang()); // default is EN
92 meta.setSubject(getSourceFile().getParentFile().getName());
93 meta.setImageDocument(false);
94 meta.setCover(getCover(getSourceFile()));
95
96 return meta;
97 }
98
99 private String getLang() {
100 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
101 Scanner scan = new Scanner(getInput(), "UTF-8");
102 scan.useDelimiter("\\n");
103 scan.next(); // Title
104 scan.next(); // Author (Date)
105 String chapter0 = scan.next(); // empty or Chapter 0
106 while (chapter0.isEmpty()) {
107 chapter0 = scan.next();
108 }
109
110 String lang = detectChapter(chapter0, 0);
111 if (lang == null) {
112 // No description??
113 lang = detectChapter(chapter0, 1);
114 }
115
116 if (lang == null) {
117 lang = "en";
118 } else {
119 lang = lang.toLowerCase();
120 }
121
122 return lang;
123 }
124
125 private String getTitle() {
126 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
127 Scanner scan = new Scanner(getInput(), "UTF-8");
128 scan.useDelimiter("\\n");
129 return scan.next();
130 }
131
132 private String getAuthor() {
133 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
134 Scanner scan = new Scanner(getInput(), "UTF-8");
135 scan.useDelimiter("\\n");
136 scan.next();
137 String authorDate = scan.next();
138
139 String author = authorDate;
140 int pos = authorDate.indexOf('(');
141 if (pos >= 0) {
142 author = authorDate.substring(0, pos);
143 }
144
145 return bsHelper.fixAuthor(author);
146 }
147
148 private String getDate() {
149 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
150 Scanner scan = new Scanner(getInput(), "UTF-8");
151 scan.useDelimiter("\\n");
152 scan.next();
153 String authorDate = scan.next();
154
155 String date = "";
156 int pos = authorDate.indexOf('(');
157 if (pos >= 0) {
158 date = authorDate.substring(pos + 1).trim();
159 pos = date.lastIndexOf(')');
160 if (pos >= 0) {
161 date = date.substring(0, pos).trim();
162 }
163 }
164
165 return date;
166 }
167
168 @Override
169 protected String getDesc() throws IOException {
170 return getChapterContent(null, 0, null).trim();
171 }
172
173 protected Image getCover(File sourceFile) {
174 String path = sourceFile.getName();
175
176 for (String ext : new String[] { ".txt", ".text", ".story" }) {
177 if (path.endsWith(ext)) {
178 path = path.substring(0, path.length() - ext.length());
179 }
180 }
181
182 Image cover = bsImages.getImage(this, sourceFile.getParentFile(), path);
183 if (cover != null) {
184 try {
185 File tmp = Instance.getInstance().getTempFiles().createTempFile("test_cover_image");
186 ImageUtils.getInstance().saveAsImage(cover, tmp, "png");
187 tmp.delete();
188 } catch (IOException e) {
189 cover = null;
190 }
191 }
192
193 return cover;
194 }
195
196 @Override
197 protected List<Entry<String, URL>> getChapters(Progress pg)
198 throws IOException {
199 List<Entry<String, URL>> chaps = new ArrayList<Entry<String, URL>>();
200 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
201 Scanner scan = new Scanner(getInput(), "UTF-8");
202 scan.useDelimiter("\\n");
203 String line = "first is not empty";
204 while (scan.hasNext()) {
205 boolean prevLineEmpty = line.trim().isEmpty();
206 line = scan.next();
207 if (prevLineEmpty && detectChapter(line, chaps.size() + 1) != null) {
208 String chapName = Integer.toString(chaps.size() + 1);
209 int pos = line.indexOf(':');
210 if (pos >= 0 && pos + 1 < line.length()) {
211 chapName = line.substring(pos + 1).trim();
212 }
213
214 chaps.add(new AbstractMap.SimpleEntry<String, URL>(//
215 chapName, //
216 getSourceFile().toURI().toURL()));
217 }
218 }
219
220 return chaps;
221 }
222
223 @Override
224 protected String getChapterContent(URL source, int number, Progress pg)
225 throws IOException {
226 StringBuilder builder = new StringBuilder();
227 @SuppressWarnings("resource") // cannot close, or we loose getInput()!
228 Scanner scan = new Scanner(getInput(), "UTF-8");
229 scan.useDelimiter("\\n");
230 if (scan.hasNext())
231 scan.next(); // title
232 if (scan.hasNext())
233 scan.next(); // author
234 if (scan.hasNext())
235 scan.next(); // date or empty
236 Boolean inChap = null;
237 String line = "";
238 while (scan.hasNext()) {
239 if (number == 0 && !line.trim().isEmpty()) {
240 // We found pre-chapter content, we are checking for
241 // Chapter 0 (fake chapter) --> keep the content
242 if (inChap == null)
243 inChap = true;
244 }
245 line = scan.next();
246 if ((inChap == null || !inChap) && detectChapter(line, number) != null) {
247 inChap = true;
248 } else if (detectChapter(line, number + 1) != null) {
249 break;
250 } else if (inChap != null && inChap) {
251 builder.append(line);
252 builder.append("\n");
253 }
254 }
255
256 return builder.toString();
257 }
258
259 @Override
260 protected void close() {
261 InputStream in = getInput();
262 if (in != null) {
263 try {
264 in.close();
265 } catch (IOException e) {
266 Instance.getInstance().getTraceHandler()
267 .error(new IOException("Cannot close the text source file input", e));
268 }
269 }
270
271 super.close();
272 }
273
274 @Override
275 protected boolean supports(URL url) {
276 return supports(url, false);
277 }
278
279 /**
280 * Check if we supports this {@link URL}, that is, if the info file can be
281 * found OR not found.
282 * <p>
283 * It must also be a file, not another kind of URL.
284 *
285 * @param url
286 * the {@link URL} to check
287 * @param info
288 * TRUE to require the info file, FALSE to forbid the info file
289 *
290 * @return TRUE if it is supported
291 */
292 protected boolean supports(URL url, boolean info) {
293 if (!"file".equals(url.getProtocol())) {
294 return false;
295 }
296
297 boolean infoPresent = false;
298 File file;
299 try {
300 file = new File(url.toURI());
301 file = assureNoTxt(file);
302 file = new File(file.getPath() + ".info");
303 } catch (URISyntaxException e) {
304 Instance.getInstance().getTraceHandler().error(e);
305 file = null;
306 }
307
308 infoPresent = (file != null && file.exists());
309
310 return infoPresent == info;
311 }
312
313 /**
314 * Remove the ".txt" (or ".text") extension if it is present.
315 *
316 * @param file
317 * the file to process
318 *
319 * @return the same file or a copy of it without the ".txt" extension if it
320 * was present
321 */
322 protected File assureNoTxt(File file) {
323 for (String ext : new String[] { ".txt", ".text" }) {
324 if (file.getName().endsWith(ext)) {
325 file = new File(file.getPath().substring(0,
326 file.getPath().length() - ext.length()));
327 }
328 }
329
330 return file;
331 }
332
333 /**
334 * Check if the given line looks like the given starting chapter in a
335 * supported language, and return the language if it does (or NULL if not).
336 *
337 * @param line
338 * the line to check
339 * @param number
340 * the specific chapter number to check for
341 *
342 * @return the language or NULL
343 */
344 static private String detectChapter(String line, int number) {
345 line = line.toUpperCase();
346 for (String lang : Instance.getInstance().getConfig().getList(Config.CONF_CHAPTER)) {
347 String chapter = Instance.getInstance().getConfig().getStringX(Config.CONF_CHAPTER, lang);
348 if (chapter != null && !chapter.isEmpty()) {
349 chapter = chapter.toUpperCase() + " ";
350 if (line.startsWith(chapter)) {
351 // We want "[CHAPTER] [number]: [name]", with ": [name]"
352 // optional
353 String test = line.substring(chapter.length()).trim();
354
355 String possibleNum = test.trim();
356 if (possibleNum.indexOf(':') > 0) {
357 possibleNum = possibleNum.substring(0,
358 possibleNum.indexOf(':')).trim();
359 }
360
361 if (test.startsWith(Integer.toString(number))) {
362 test = test
363 .substring(Integer.toString(number).length())
364 .trim();
365 if (test.isEmpty() || test.startsWith(":")) {
366 return lang;
367 }
368 }
369 }
370 }
371 }
372
373 return null;
374 }
375 }