fix missing values for some old files
[nikiroo-utils.git] / supported / Text.java
CommitLineData
08fe2e33
NR
1package be.nikiroo.fanfix.supported;
2
3import java.io.File;
4import java.io.IOException;
5import java.io.InputStream;
6import java.net.URISyntaxException;
7import java.net.URL;
7445f856 8import java.util.AbstractMap;
08fe2e33
NR
9import java.util.ArrayList;
10import java.util.List;
11import java.util.Map.Entry;
12import java.util.Scanner;
13
7445f856
NR
14import org.jsoup.nodes.Document;
15
08fe2e33
NR
16import be.nikiroo.fanfix.Instance;
17import be.nikiroo.fanfix.bundles.Config;
32097898 18import be.nikiroo.fanfix.data.Chapter;
68686a37 19import be.nikiroo.fanfix.data.MetaData;
32097898 20import be.nikiroo.fanfix.data.Paragraph;
16a81ef7 21import be.nikiroo.utils.Image;
81b5e730 22import be.nikiroo.utils.ImageUtils;
ed08c171 23import be.nikiroo.utils.Progress;
8d59ce07 24import be.nikiroo.utils.streams.MarkableFileInputStream;
08fe2e33
NR
25
26/**
27 * Support class for local stories encoded in textual format, with a few rules:
28 * <ul>
29 * <li>The title must be on the first line</li>
30 * <li>The author (preceded by nothing, "by " or "©") must be on the second
31 * line, possibly with the publication date in parentheses (e.g., "
32 * <tt>By Unknown (3rd October 1998)</tt>")</li>
33 * <li>Chapters must be declared with "<tt>Chapter x</tt>" or "
34 * <tt>Chapter x: NAME OF THE CHAPTER</tt>", where "<tt>x</tt>" is the chapter
35 * number</li>
36 * <li>A description of the story must be given as chapter number 0</li>
37 * <li>A cover may be present, with the same filename but a PNG, JPEG or JPG
48f14dc9 38 * extension</li>
08fe2e33
NR
39 * </ul>
40 *
41 * @author niki
42 */
7445f856
NR
43class Text extends BasicSupport {
44 private File sourceFile;
45 private InputStream in;
46
47 protected File getSourceFile() {
48 return sourceFile;
49 }
50
51 protected InputStream getInput() {
52 if (in != null) {
53 try {
54 in.reset();
55 } catch (IOException e) {
d66deb8d 56 Instance.getInstance().getTraceHandler().error(new IOException("Cannot reset the Text stream", e));
7445f856
NR
57 }
58
59 return in;
60 }
61
62 return null;
63 }
64
08fe2e33
NR
65 @Override
66 protected boolean isHtml() {
67 return false;
68 }
69
08fe2e33 70 @Override
7445f856
NR
71 protected Document loadDocument(URL source) throws IOException {
72 try {
73 sourceFile = new File(source.toURI());
67837328 74 in = new MarkableFileInputStream(sourceFile);
7445f856
NR
75 } catch (URISyntaxException e) {
76 throw new IOException("Cannot load the text document: " + source);
77 }
78
79 return null;
80 }
81
82 @Override
83 protected MetaData getMeta() throws IOException {
68686a37
NR
84 MetaData meta = new MetaData();
85
7445f856
NR
86 meta.setTitle(getTitle());
87 meta.setAuthor(getAuthor());
88 meta.setDate(getDate());
68686a37 89 meta.setTags(new ArrayList<String>());
727108fe 90 meta.setSource(getType().getSourceName());
7445f856 91 meta.setUrl(getSourceFile().toURI().toURL().toString());
2206ef66 92 meta.setPublisher("");
7445f856 93 meta.setUuid(getSourceFile().toString());
68686a37 94 meta.setLuid("");
7445f856
NR
95 meta.setLang(getLang()); // default is EN
96 meta.setSubject(getSourceFile().getParentFile().getName());
68686a37
NR
97 meta.setType(getType().toString());
98 meta.setImageDocument(false);
7445f856 99 meta.setCover(getCover(getSourceFile()));
31e27ee3 100
68686a37 101 return meta;
08fe2e33
NR
102 }
103
7445f856 104 private String getLang() {
08fe2e33 105 @SuppressWarnings("resource")
7445f856 106 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33
NR
107 scan.useDelimiter("\\n");
108 scan.next(); // Title
109 scan.next(); // Author (Date)
110 String chapter0 = scan.next(); // empty or Chapter 0
111 while (chapter0.isEmpty()) {
112 chapter0 = scan.next();
113 }
114
22848428
NR
115 String lang = detectChapter(chapter0, 0);
116 if (lang == null) {
117 // No description??
118 lang = detectChapter(chapter0, 1);
119 }
120
08fe2e33 121 if (lang == null) {
276f95c6 122 lang = "en";
08fe2e33 123 } else {
276f95c6 124 lang = lang.toLowerCase();
08fe2e33
NR
125 }
126
127 return lang;
128 }
129
7445f856 130 private String getTitle() {
08fe2e33 131 @SuppressWarnings("resource")
7445f856 132 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33
NR
133 scan.useDelimiter("\\n");
134 return scan.next();
135 }
136
7445f856 137 private String getAuthor() {
08fe2e33 138 @SuppressWarnings("resource")
7445f856 139 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33
NR
140 scan.useDelimiter("\\n");
141 scan.next();
142 String authorDate = scan.next();
143
144 String author = authorDate;
145 int pos = authorDate.indexOf('(');
146 if (pos >= 0) {
147 author = authorDate.substring(0, pos);
148 }
149
8d59ce07 150 return bsHelper.fixAuthor(author);
08fe2e33
NR
151 }
152
7445f856 153 private String getDate() {
08fe2e33 154 @SuppressWarnings("resource")
7445f856 155 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33
NR
156 scan.useDelimiter("\\n");
157 scan.next();
158 String authorDate = scan.next();
159
160 String date = "";
161 int pos = authorDate.indexOf('(');
162 if (pos >= 0) {
163 date = authorDate.substring(pos + 1).trim();
164 pos = date.lastIndexOf(')');
165 if (pos >= 0) {
166 date = date.substring(0, pos).trim();
167 }
168 }
169
170 return date;
171 }
172
173 @Override
7445f856 174 protected String getDesc() throws IOException {
32097898
NR
175 String content = getChapterContent(null, 0, null).trim();
176 if (!content.isEmpty()) {
177 Chapter desc = bsPara.makeChapter(this, null, 0, "Description",
178 content, isHtml(), null);
179 StringBuilder builder = new StringBuilder();
180 for (Paragraph para : desc) {
181 if (builder.length() > 0) {
182 builder.append("\n");
183 }
184 builder.append(para.getContent());
185 }
186 }
187
188 return content;
08fe2e33
NR
189 }
190
31e27ee3 191 protected Image getCover(File sourceFile) {
7445f856 192 String path = sourceFile.getName();
08fe2e33
NR
193
194 for (String ext : new String[] { ".txt", ".text", ".story" }) {
195 if (path.endsWith(ext)) {
196 path = path.substring(0, path.length() - ext.length());
197 }
198 }
199
32097898 200 Image cover = bsImages.getImage(this, sourceFile.getParentFile(), path);
81b5e730
NR
201 if (cover != null) {
202 try {
d66deb8d 203 File tmp = Instance.getInstance().getTempFiles().createTempFile("test_cover_image");
81b5e730
NR
204 ImageUtils.getInstance().saveAsImage(cover, tmp, "png");
205 tmp.delete();
206 } catch (IOException e) {
207 cover = null;
208 }
209 }
210
211 return cover;
08fe2e33
NR
212 }
213
214 @Override
7445f856
NR
215 protected List<Entry<String, URL>> getChapters(Progress pg)
216 throws IOException {
08fe2e33
NR
217 List<Entry<String, URL>> chaps = new ArrayList<Entry<String, URL>>();
218 @SuppressWarnings("resource")
7445f856 219 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33 220 scan.useDelimiter("\\n");
08fe2e33
NR
221 boolean prevLineEmpty = false;
222 while (scan.hasNext()) {
223 String line = scan.next();
22848428
NR
224 if (prevLineEmpty && detectChapter(line, chaps.size() + 1) != null) {
225 String chapName = Integer.toString(chaps.size() + 1);
226 int pos = line.indexOf(':');
227 if (pos >= 0 && pos + 1 < line.length()) {
228 chapName = line.substring(pos + 1).trim();
229 }
08fe2e33 230
7445f856
NR
231 chaps.add(new AbstractMap.SimpleEntry<String, URL>(//
232 chapName, //
233 getSourceFile().toURI().toURL()));
08fe2e33
NR
234 }
235
236 prevLineEmpty = line.trim().isEmpty();
237 }
238
239 return chaps;
240 }
241
242 @Override
7445f856
NR
243 protected String getChapterContent(URL source, int number, Progress pg)
244 throws IOException {
08fe2e33
NR
245 StringBuilder builder = new StringBuilder();
246 @SuppressWarnings("resource")
7445f856 247 Scanner scan = new Scanner(getInput(), "UTF-8");
08fe2e33
NR
248 scan.useDelimiter("\\n");
249 boolean inChap = false;
08fe2e33
NR
250 while (scan.hasNext()) {
251 String line = scan.next();
32097898 252 if (!inChap && detectChapter(line, number) != null) {
68686a37 253 inChap = true;
32097898 254 } else if (detectChapter(line, number + 1) != null) {
68686a37
NR
255 break;
256 } else if (inChap) {
257 builder.append(line);
258 builder.append("\n");
08fe2e33 259 }
08fe2e33
NR
260 }
261
262 return builder.toString();
263 }
264
7445f856
NR
265 @Override
266 protected void close() {
267 InputStream in = getInput();
268 if (in != null) {
269 try {
270 in.close();
271 } catch (IOException e) {
d66deb8d
NR
272 Instance.getInstance().getTraceHandler()
273 .error(new IOException("Cannot close the text source file input", e));
7445f856
NR
274 }
275 }
276
277 super.close();
278 }
279
08fe2e33
NR
280 @Override
281 protected boolean supports(URL url) {
86d49dbc
NR
282 return supports(url, false);
283 }
284
285 /**
286 * Check if we supports this {@link URL}, that is, if the info file can be
287 * found OR not found.
3ddb5591
NR
288 * <p>
289 * It must also be a file, not another kind of URL.
86d49dbc
NR
290 *
291 * @param url
292 * the {@link URL} to check
293 * @param info
294 * TRUE to require the info file, FALSE to forbid the info file
295 *
296 * @return TRUE if it is supported
297 */
298 protected boolean supports(URL url, boolean info) {
3ddb5591
NR
299 if (!"file".equals(url.getProtocol())) {
300 return false;
301 }
08fe2e33 302
3ddb5591
NR
303 boolean infoPresent = false;
304 File file;
305 try {
306 file = new File(url.toURI());
307 file = assureNoTxt(file);
308 file = new File(file.getPath() + ".info");
309 } catch (URISyntaxException e) {
d66deb8d 310 Instance.getInstance().getTraceHandler().error(e);
3ddb5591 311 file = null;
08fe2e33
NR
312 }
313
3ddb5591
NR
314 infoPresent = (file != null && file.exists());
315
86d49dbc
NR
316 return infoPresent == info;
317 }
318
319 /**
31e27ee3 320 * Remove the ".txt" (or ".text") extension if it is present.
86d49dbc
NR
321 *
322 * @param file
323 * the file to process
324 *
325 * @return the same file or a copy of it without the ".txt" extension if it
326 * was present
327 */
328 protected File assureNoTxt(File file) {
31e27ee3
NR
329 for (String ext : new String[] { ".txt", ".text" }) {
330 if (file.getName().endsWith(ext)) {
331 file = new File(file.getPath().substring(0,
332 file.getPath().length() - ext.length()));
333 }
86d49dbc
NR
334 }
335
336 return file;
08fe2e33
NR
337 }
338
08fe2e33
NR
339 /**
340 * Check if the given line looks like the given starting chapter in a
341 * supported language, and return the language if it does (or NULL if not).
342 *
343 * @param line
344 * the line to check
32097898
NR
345 * @param number
346 * the specific chapter number to check for
08fe2e33
NR
347 *
348 * @return the language or NULL
349 */
7445f856 350 static private String detectChapter(String line, int number) {
08fe2e33 351 line = line.toUpperCase();
d66deb8d
NR
352 for (String lang : Instance.getInstance().getConfig().getList(Config.CONF_CHAPTER)) {
353 String chapter = Instance.getInstance().getConfig().getStringX(Config.CONF_CHAPTER, lang);
08fe2e33
NR
354 if (chapter != null && !chapter.isEmpty()) {
355 chapter = chapter.toUpperCase() + " ";
356 if (line.startsWith(chapter)) {
22848428
NR
357 // We want "[CHAPTER] [number]: [name]", with ": [name]"
358 // optional
359 String test = line.substring(chapter.length()).trim();
32097898
NR
360
361 String possibleNum = test.trim();
362 if (possibleNum.indexOf(':') > 0) {
363 possibleNum = possibleNum.substring(0,
364 possibleNum.indexOf(':')).trim();
365 }
366
22848428
NR
367 if (test.startsWith(Integer.toString(number))) {
368 test = test
369 .substring(Integer.toString(number).length())
370 .trim();
371 if (test.isEmpty() || test.startsWith(":")) {
372 return lang;
08fe2e33 373 }
08fe2e33
NR
374 }
375 }
376 }
377 }
378
379 return null;
380 }
381}