X-Git-Url: http://git.nikiroo.be/?p=nikiroo-utils.git;a=blobdiff_plain;f=src%2Fbe%2Fnikiroo%2Ffanfix%2Fsupported%2FEpub.java;h=82af11855fdc299226fe2f52ca536f17a07d1d00;hp=8ae4c6c37052c5569674804b3be5d4fa3244f343;hb=8d59ce0748baeeea0458bab49716ab4543aae439;hpb=e4fa48a0b617e0a5368e8e8589909ae93c340447 diff --git a/src/be/nikiroo/fanfix/supported/Epub.java b/src/be/nikiroo/fanfix/supported/Epub.java index 8ae4c6c..82af118 100644 --- a/src/be/nikiroo/fanfix/supported/Epub.java +++ b/src/be/nikiroo/fanfix/supported/Epub.java @@ -1,24 +1,23 @@ package be.nikiroo.fanfix.supported; import java.io.File; -import java.io.FileInputStream; import java.io.IOException; import java.io.InputStream; +import java.net.URISyntaxException; import java.net.URL; import java.net.URLDecoder; import java.util.ArrayList; -import java.util.List; -import java.util.Map.Entry; import java.util.zip.ZipEntry; import java.util.zip.ZipInputStream; +import org.jsoup.nodes.Document; + import be.nikiroo.fanfix.Instance; import be.nikiroo.fanfix.data.MetaData; import be.nikiroo.utils.IOUtils; import be.nikiroo.utils.Image; -import be.nikiroo.utils.MarkableFileInputStream; -import be.nikiroo.utils.Progress; import be.nikiroo.utils.StringUtils; +import be.nikiroo.utils.streams.MarkableFileInputStream; /** * Support class for EPUB files created with this program (as we need some @@ -27,196 +26,207 @@ import be.nikiroo.utils.StringUtils; * @author niki */ class Epub extends InfoText { - protected MetaData meta; - private File tmp; + private MetaData meta; + private File tmpDir; private String desc; private URL fakeSource; private InputStream fakeIn; - @Override - public String getSourceName() { - return "epub"; + public File getSourceFileOriginal() { + return super.getSourceFile(); } @Override - protected boolean supports(URL url) { - if (url.getPath().toLowerCase().endsWith(".epub")) { - return true; + protected File getSourceFile() { + try { + return new File(fakeSource.toURI()); + } catch (URISyntaxException e) { + Instance.getTraceHandler() + .error(new IOException( + "Cannot get the source file from the info-text URL", + e)); } - return false; - } - - @Override - protected MetaData getMeta(URL source, InputStream in) throws IOException { - return meta; + return null; } @Override - protected String getDesc(URL source, InputStream in) throws IOException { - if (desc != null) { - return desc; - } - + protected InputStream getInput() { if (fakeIn != null) { - fakeIn.reset(); - return super.getDesc(fakeSource, fakeIn); + try { + fakeIn.reset(); + } catch (IOException e) { + Instance.getTraceHandler() + .error(new IOException( + "Cannot reset the Epub Text stream", e)); + } + + return fakeIn; } return null; } @Override - protected List> getChapters(URL source, InputStream in, - Progress pg) throws IOException { - if (fakeIn != null) { - fakeIn.reset(); - return super.getChapters(fakeSource, fakeIn, pg); - } - - return null; + protected boolean supports(URL url) { + return url.getPath().toLowerCase().endsWith(".epub"); } @Override - protected String getChapterContent(URL source, InputStream in, int number, - Progress pg) throws IOException { - if (fakeIn != null) { - fakeIn.reset(); - return super.getChapterContent(fakeSource, fakeIn, number, pg); - } - - return null; + protected MetaData getMeta() throws IOException { + return meta; } @Override - protected void preprocess(URL source, InputStream in) throws IOException { - // Note: do NOT close this stream, as it would also close "in" - ZipInputStream zipIn = new ZipInputStream(in); - tmp = File.createTempFile("fanfic-reader-parser_", ".tmp"); - File tmpInfo = new File(tmp + ".info"); - fakeSource = tmp.toURI().toURL(); - Image cover = null; - - String url = source.toString(); - String title = null; - String author = null; - - for (ZipEntry entry = zipIn.getNextEntry(); entry != null; entry = zipIn - .getNextEntry()) { - if (!entry.isDirectory() - && entry.getName().startsWith(getDataPrefix())) { - String entryLName = entry.getName().toLowerCase(); - - boolean imageEntry = false; - for (String ext : getImageExt(false)) { - if (entryLName.endsWith(ext)) { - imageEntry = true; + protected Document loadDocument(URL source) throws IOException { + super.loadDocument(source); // prepares super.getSourceFile() and + // super.getInput() + + InputStream in = super.getInput(); + ZipInputStream zipIn = null; + try { + zipIn = new ZipInputStream(in); + tmpDir = Instance.getTempFiles().createTempDir( + "fanfic-reader-parser"); + File tmp = new File(tmpDir, "file.txt"); + File tmpInfo = new File(tmpDir, "file.info"); + + fakeSource = tmp.toURI().toURL(); + Image cover = null; + + String url; + try { + url = getSource().toURI().toURL().toString(); + } catch (URISyntaxException e1) { + url = getSource().toString(); + } + String title = null; + String author = null; + + for (ZipEntry entry = zipIn.getNextEntry(); entry != null; entry = zipIn + .getNextEntry()) { + if (!entry.isDirectory() + && entry.getName().startsWith(getDataPrefix())) { + String entryLName = entry.getName().toLowerCase(); + + boolean imageEntry = false; + for (String ext : bsImages.getImageExt(false)) { + if (entryLName.endsWith(ext)) { + imageEntry = true; + } } - } - if (entry.getName().equals(getDataPrefix() + "version")) { - // Nothing to do for now ("first" - // version is 3.0) - } else if (entryLName.endsWith(".info")) { - // Info file - IOUtils.write(zipIn, tmpInfo); - } else if (imageEntry) { - // Cover - if (getCover()) { - try { - cover = new Image(zipIn); - } catch (Exception e) { - Instance.getTraceHandler().error(e); + if (entry.getName().equals(getDataPrefix() + "version")) { + // Nothing to do for now ("first" + // version is 3.0) + } else if (entryLName.endsWith(".info")) { + // Info file + IOUtils.write(zipIn, tmpInfo); + } else if (imageEntry) { + // Cover + if (getCover()) { + try { + cover = new Image(zipIn); + } catch (Exception e) { + Instance.getTraceHandler().error(e); + } } - } - } else if (entry.getName().equals(getDataPrefix() + "URL")) { - String[] descArray = StringUtils - .unhtml(IOUtils.readSmallStream(zipIn)).trim() - .split("\n"); - if (descArray.length > 0) { - url = descArray[0].trim(); - } - } else if (entry.getName().equals(getDataPrefix() + "SUMMARY")) { - String[] descArray = StringUtils - .unhtml(IOUtils.readSmallStream(zipIn)).trim() - .split("\n"); - int skip = 0; - if (descArray.length > 1) { - title = descArray[0].trim(); - skip = 1; - if (descArray.length > 2 - && descArray[1].startsWith("©")) { - author = descArray[1].substring(1).trim(); - skip = 2; + } else if (entry.getName().equals(getDataPrefix() + "URL")) { + String[] descArray = StringUtils + .unhtml(IOUtils.readSmallStream(zipIn)).trim() + .split("\n"); + if (descArray.length > 0) { + url = descArray[0].trim(); + } + } else if (entry.getName().equals( + getDataPrefix() + "SUMMARY")) { + String[] descArray = StringUtils + .unhtml(IOUtils.readSmallStream(zipIn)).trim() + .split("\n"); + int skip = 0; + if (descArray.length > 1) { + title = descArray[0].trim(); + skip = 1; + if (descArray.length > 2 + && descArray[1].startsWith("©")) { + author = descArray[1].substring(1).trim(); + skip = 2; + } + } + this.desc = ""; + for (int i = skip; i < descArray.length; i++) { + this.desc += descArray[i].trim() + "\n"; } - } - this.desc = ""; - for (int i = skip; i < descArray.length; i++) { - this.desc += descArray[i].trim() + "\n"; - } - this.desc = this.desc.trim(); - } else { - // Hopefully the data file - IOUtils.write(zipIn, tmp); + this.desc = this.desc.trim(); + } else { + // Hopefully the data file + IOUtils.write(zipIn, tmp); + } } } - } - - if (requireInfo() && (!tmp.exists() || !tmpInfo.exists())) { - throw new IOException( - "file not supported (maybe not created with this program or corrupt)"); - } - if (tmp.exists()) { - this.fakeIn = new MarkableFileInputStream(new FileInputStream(tmp)); - } + if (requireInfo() && (!tmp.exists() || !tmpInfo.exists())) { + throw new IOException( + "file not supported (maybe not created with this program or corrupt)"); + } - if (tmpInfo.exists()) { - meta = InfoReader.readMeta(tmpInfo, true); - if (cover != null) { - meta.setCover(cover); + if (tmp.exists()) { + this.fakeIn = new MarkableFileInputStream(tmp); } - tmpInfo.delete(); - } else { - if (title == null || title.isEmpty()) { - title = new File(source.getPath()).getName(); - if (title.toLowerCase().endsWith(".cbz")) { - title = title.substring(0, title.length() - 4); + + if (tmpInfo.exists()) { + meta = InfoReader.readMeta(tmpInfo, true); + tmpInfo.delete(); + } else { + if (title == null || title.isEmpty()) { + title = getSourceFileOriginal().getName(); + if (title.toLowerCase().endsWith(".cbz")) { + title = title.substring(0, title.length() - 4); + } + title = URLDecoder.decode(title, "UTF-8").trim(); } - title = URLDecoder.decode(title, "UTF-8").trim(); + + meta = new MetaData(); + meta.setLang("en"); + meta.setTags(new ArrayList()); + meta.setSource(getType().getSourceName()); + meta.setUuid(url); + meta.setUrl(url); + meta.setTitle(title); + meta.setAuthor(author); + meta.setImageDocument(isImagesDocumentByDefault()); } - meta = new MetaData(); - meta.setLang("EN"); - meta.setTags(new ArrayList()); - meta.setSource(getSourceName()); - meta.setUuid(url); - meta.setUrl(url); - meta.setTitle(title); - meta.setAuthor(author); - meta.setImageDocument(isImagesDocumentByDefault()); + if (meta.getCover() == null) { + if (cover != null) { + meta.setCover(cover); + } else { + meta.setCover(InfoReader + .getCoverByName(getSourceFileOriginal().toURI() + .toURL())); + } + } + } finally { + if (zipIn != null) { + zipIn.close(); + } + if (in != null) { + in.close(); + } } + + return null; } @Override protected void close() { - if (tmp != null && tmp.exists()) { - if (!tmp.delete()) { - tmp.deleteOnExit(); - } + if (tmpDir != null) { + IOUtils.deltree(tmpDir); } - tmp = null; - - if (fakeIn != null) { - try { - fakeIn.close(); - } catch (Exception e) { - Instance.getTraceHandler().error(e); - } - } + tmpDir = null; super.close(); }