X-Git-Url: http://git.nikiroo.be/?a=blobdiff_plain;f=src%2Fbe%2Fnikiroo%2Futils%2FStringUtils.java;h=1ee9ac4b569001fda8036815fe8a43277e8e18ef;hb=ce3972ea1a7083d1f8ef17463fb48c5bfa7ebf73;hp=ed3c630e94b076d9e1a6d32fe0a7016130530af0;hpb=72c32e8891f0964080f957fb6f4ff332b2ca203f;p=nikiroo-utils.git

diff --git a/src/be/nikiroo/utils/StringUtils.java b/src/be/nikiroo/utils/StringUtils.java
index ed3c630..1ee9ac4 100644
--- a/src/be/nikiroo/utils/StringUtils.java
+++ b/src/be/nikiroo/utils/StringUtils.java
@@ -1,25 +1,22 @@
 package be.nikiroo.utils;
 
-import java.awt.Image;
-import java.awt.geom.AffineTransform;
-import java.awt.image.AffineTransformOp;
-import java.awt.image.BufferedImage;
-import java.io.ByteArrayInputStream;
-import java.io.ByteArrayOutputStream;
-import java.io.File;
 import java.io.IOException;
 import java.io.InputStream;
+import java.io.OutputStream;
+import java.io.UnsupportedEncodingException;
 import java.security.MessageDigest;
 import java.security.NoSuchAlgorithmException;
 import java.text.Normalizer;
 import java.text.Normalizer.Form;
 import java.text.ParseException;
 import java.text.SimpleDateFormat;
+import java.util.AbstractMap;
+import java.util.ArrayList;
 import java.util.Date;
+import java.util.List;
+import java.util.Map.Entry;
 import java.util.regex.Pattern;
 
-import javax.imageio.ImageIO;
-
 import org.unbescape.html.HtmlEscape;
 import org.unbescape.html.HtmlEscapeLevel;
 import org.unbescape.html.HtmlEscapeType;
@@ -32,19 +29,49 @@ import org.unbescape.html.HtmlEscapeType;
 public class StringUtils {
 	/**
 	 * This enum type will decide the alignment of a {@link String} when padding
-	 * is applied or if there is enough horizontal space for it to be aligned.
+	 * or justification is applied (if there is enough horizontal space for it
+	 * to be aligned).
 	 */
 	public enum Alignment {
 		/** Aligned at left. */
-		Beginning,
+		LEFT,
 		/** Centered. */
-		Center,
+		CENTER,
 		/** Aligned at right. */
-		End
+		RIGHT,
+		/** Full justified (to both left and right). */
+		JUSTIFY,
+
+		// Old Deprecated values:
+
+		/** DEPRECATED: please use LEFT. */
+		@Deprecated
+		Beginning,
+		/** DEPRECATED: please use CENTER. */
+		@Deprecated
+		Center,
+		/** DEPRECATED: please use RIGHT. */
+		@Deprecated
+		End;
+
+		/**
+		 * Return the non-deprecated version of this enum if needed (or return
+		 * self if not).
+		 * 
+		 * @return the non-deprecated value
+		 */
+		Alignment undeprecate() {
+			if (this == Beginning)
+				return LEFT;
+			if (this == Center)
+				return CENTER;
+			if (this == End)
+				return RIGHT;
+			return this;
+		}
 	}
 
-	static private Pattern marks = Pattern
-			.compile("[\\p{InCombiningDiacriticalMarks}\\p{IsLm}\\p{IsSk}]+");
+	static private Pattern marks = getMarks();
 
 	/**
 	 * Fix the size of the given {@link String} either with space-padding or by
@@ -58,7 +85,7 @@ public class StringUtils {
 	 * @return the resulting {@link String} of size <i>size</i>
 	 */
 	static public String padString(String text, int width) {
-		return padString(text, width, true, Alignment.Beginning);
+		return padString(text, width, true, null);
 	}
 
 	/**
@@ -74,13 +101,19 @@ public class StringUtils {
 	 *            cut the {@link String} shorter if needed
 	 * @param align
 	 *            align the {@link String} in this position if we have enough
-	 *            space
+	 *            space (default is Alignment.LEFT)
 	 * 
 	 * @return the resulting {@link String} of size <i>size</i> minimum
 	 */
 	static public String padString(String text, int width, boolean cut,
 			Alignment align) {
 
+		if (align == null) {
+			align = Alignment.LEFT;
+		}
+
+		align = align.undeprecate();
+
 		if (width >= 0) {
 			if (text == null)
 				text = "";
@@ -91,23 +124,23 @@ public class StringUtils {
 				if (cut)
 					text = text.substring(0, width);
 			} else if (diff > 0) {
-				if (diff < 2 && align != Alignment.End)
-					align = Alignment.Beginning;
+				if (diff < 2 && align != Alignment.RIGHT)
+					align = Alignment.LEFT;
 
 				switch (align) {
-				case Beginning:
-					text = text + new String(new char[diff]).replace('\0', ' ');
-					break;
-				case End:
+				case RIGHT:
 					text = new String(new char[diff]).replace('\0', ' ') + text;
 					break;
-				case Center:
-				default:
+				case CENTER:
 					int pad1 = (diff) / 2;
 					int pad2 = (diff + 1) / 2;
 					text = new String(new char[pad1]).replace('\0', ' ') + text
 							+ new String(new char[pad2]).replace('\0', ' ');
 					break;
+				case LEFT:
+				default:
+					text = text + new String(new char[diff]).replace('\0', ' ');
+					break;
 				}
 			}
 		}
@@ -115,6 +148,177 @@ public class StringUtils {
 		return text;
 	}
 
+	/**
+	 * Justify a text into width-sized (at the maximum) lines.
+	 * 
+	 * @param text
+	 *            the {@link String} to justify
+	 * @param width
+	 *            the maximum size of the resulting lines
+	 * 
+	 * @return a list of justified text lines
+	 */
+	static public List<String> justifyText(String text, int width) {
+		return justifyText(text, width, null);
+	}
+
+	/**
+	 * Justify a text into width-sized (at the maximum) lines.
+	 * 
+	 * @param text
+	 *            the {@link String} to justify
+	 * @param width
+	 *            the maximum size of the resulting lines
+	 * @param align
+	 *            align the lines in this position (default is
+	 *            Alignment.LEFT)
+	 * 
+	 * @return a list of justified text lines
+	 */
+	static public List<String> justifyText(String text, int width,
+			Alignment align) {
+		if (align == null) {
+			align = Alignment.LEFT;
+		}
+
+		align = align.undeprecate();
+
+		switch (align) {
+		case CENTER:
+			return StringJustifier.center(text, width);
+		case RIGHT:
+			return StringJustifier.right(text, width);
+		case JUSTIFY:
+			return StringJustifier.full(text, width);
+		case LEFT:
+		default:
+			return StringJustifier.left(text, width);
+		}
+	}
+
+	/**
+	 * Justify a text into width-sized (at the maximum) lines.
+	 * 
+	 * @param text
+	 *            the lines of text to justify
+	 * @param width
+	 *            the maximum size of the resulting lines
+	 * 
+	 * @return a list of justified text lines
+	 */
+	static public List<String> justifyText(List<String> text, int width) {
+		return justifyText(text, width, null);
+	}
+
+	/**
+	 * Justify a text into width-sized (at the maximum) lines.
+	 * 
+	 * @param text
+	 *            the lines of text to justify
+	 * @param width
+	 *            the maximum size of the resulting lines
+	 * @param align
+	 *            align the lines in this position (default is
+	 *            Alignment.LEFT)
+	 * 
+	 * @return a list of justified text lines
+	 */
+	static public List<String> justifyText(List<String> text, int width,
+			Alignment align) {
+		List<String> result = new ArrayList<String>();
+
+		// Content <-> Bullet spacing (null = no spacing)
+		List<Entry<String, String>> lines = new ArrayList<Entry<String, String>>();
+		StringBuilder previous = null;
+		StringBuilder tmp = new StringBuilder();
+		String previousItemBulletSpacing = null;
+		String itemBulletSpacing = null;
+		for (String inputLine : text) {
+			boolean previousLineComplete = true;
+
+			String current = inputLine.replace("\t", "    ");
+			itemBulletSpacing = getItemSpacing(current);
+			boolean bullet = isItemLine(current);
+			if ((previousItemBulletSpacing == null || itemBulletSpacing
+					.length() <= previousItemBulletSpacing.length()) && !bullet) {
+				itemBulletSpacing = null;
+			}
+
+			if (itemBulletSpacing != null) {
+				current = current.trim();
+				if (!current.isEmpty() && bullet) {
+					current = current.substring(1);
+				}
+				current = current.trim();
+				previousLineComplete = bullet;
+			} else {
+				tmp.setLength(0);
+				for (String word : current.split(" ")) {
+					if (word.isEmpty()) {
+						continue;
+					}
+
+					if (tmp.length() > 0) {
+						tmp.append(' ');
+					}
+					tmp.append(word.trim());
+				}
+				current = tmp.toString();
+
+				previousLineComplete = current.isEmpty()
+						|| previousItemBulletSpacing != null
+						|| (previous != null && isFullLine(previous))
+						|| isHrLine(current) || isHrLine(previous);
+			}
+
+			if (previous == null) {
+				previous = new StringBuilder();
+			} else {
+				if (previousLineComplete) {
+					lines.add(new AbstractMap.SimpleEntry<String, String>(
+							previous.toString(), previousItemBulletSpacing));
+					previous.setLength(0);
+					previousItemBulletSpacing = itemBulletSpacing;
+				} else {
+					previous.append(' ');
+				}
+			}
+
+			previous.append(current);
+
+		}
+
+		if (previous != null) {
+			lines.add(new AbstractMap.SimpleEntry<String, String>(previous
+					.toString(), previousItemBulletSpacing));
+		}
+
+		for (Entry<String, String> line : lines) {
+			String content = line.getKey();
+			String spacing = line.getValue();
+
+			String bullet = "- ";
+			if (spacing == null) {
+				bullet = "";
+				spacing = "";
+			}
+
+			if (spacing.length() > width + 3) {
+				spacing = "";
+			}
+
+			for (String subline : StringUtils.justifyText(content, width
+					- (spacing.length() + bullet.length()), align)) {
+				result.add(spacing + bullet + subline);
+				if (!bullet.isEmpty()) {
+					bullet = "  ";
+				}
+			}
+		}
+
+		return result;
+	}
+
 	/**
 	 * Sanitise the given input to make it more Terminal-friendly by removing
 	 * combining characters.
@@ -149,7 +353,9 @@ public class StringUtils {
 
 		if (removeAllAccents) {
 			input = Normalizer.normalize(input, Form.NFKD);
-			input = marks.matcher(input).replaceAll("");
+			if (marks != null) {
+				input = marks.matcher(input).replaceAll("");
+			}
 		}
 
 		input = Normalizer.normalize(input, Form.NFKC);
@@ -171,11 +377,15 @@ public class StringUtils {
 	}
 
 	/**
-	 * Convert between time in milliseconds to {@link String} in a "static" way
-	 * (to exchange data over the wire, for instance).
+	 * Convert between the time in milliseconds to a {@link String} in a "fixed"
+	 * way (to exchange data over the wire, for instance).
+	 * <p>
+	 * Precise to the second.
 	 * 
 	 * @param time
-	 *            the time in milliseconds
+	 *            the specified number of milliseconds since the standard base
+	 *            time known as "the epoch", namely January 1, 1970, 00:00:00
+	 *            GMT
 	 * 
 	 * @return the time as a {@link String}
 	 */
@@ -185,422 +395,669 @@ public class StringUtils {
 	}
 
 	/**
-	 * Convert between time as a {@link String} to milliseconds in a "static"
+	 * Convert between the time as a {@link String} to milliseconds in a "fixed"
 	 * way (to exchange data over the wire, for instance).
+	 * <p>
+	 * Precise to the second.
 	 * 
-	 * @param time
+	 * @param displayTime
 	 *            the time as a {@link String}
 	 * 
-	 * @return the time in milliseconds
+	 * @return the number of milliseconds since the standard base time known as
+	 *         "the epoch", namely January 1, 1970, 00:00:00 GMT (parse errors
+	 *         are reported through a {@link ParseException}, never as -1)
+	 * 
+	 * @throws ParseException
+	 *             in case of parse error
 	 */
-	static public long toTime(String display) {
+	static public long toTime(String displayTime) throws ParseException {
 		SimpleDateFormat sdf = new SimpleDateFormat("yyyy-MM-dd HH:mm:ss");
+		return sdf.parse(displayTime).getTime();
+	}
+
+	/**
+	 * Return a hash of the given {@link String}.
+	 * 
+	 * @param input
+	 *            the input data
+	 * 
+	 * @return the hash
+	 */
+	static public String getMd5Hash(String input) {
 		try {
-			return sdf.parse(display).getTime();
-		} catch (ParseException e) {
-			return -1;
+			MessageDigest md = MessageDigest.getInstance("MD5");
+			md.update(input.getBytes("UTF-8"));
+			byte byteData[] = md.digest();
+
+			StringBuffer hexString = new StringBuffer();
+			for (int i = 0; i < byteData.length; i++) {
+				String hex = Integer.toHexString(0xff & byteData[i]);
+				if (hex.length() == 1)
+					hexString.append('0');
+				hexString.append(hex);
+			}
+
+			return hexString.toString();
+		} catch (NoSuchAlgorithmException e) {
+			return input;
+		} catch (UnsupportedEncodingException e) {
+			return input;
 		}
 	}
 
 	/**
-	 * Convert the given {@link Image} object into a Base64 representation of
-	 * the same {@link Image}. object.
+	 * Remove the HTML content from the given input, and un-html-ize the rest.
+	 * 
+	 * @param html
+	 *            the HTML-encoded content
 	 * 
-	 * @param image
-	 *            the {@link Image} object to convert
+	 * @return the HTML-free equivalent content
+	 */
+	public static String unhtml(String html) {
+		StringBuilder builder = new StringBuilder();
+
+		int inTag = 0;
+		for (char car : html.toCharArray()) {
+			if (car == '<') {
+				inTag++;
+			} else if (car == '>') {
+				inTag--;
+			} else if (inTag <= 0) {
+				builder.append(car);
+			}
+		}
+
+		char nbsp = '\u00A0'; // non-breakable space (a special char)
+		char space = ' ';
+		return HtmlEscape.unescapeHtml(builder.toString()).replace(nbsp, space);
+	}
+
+	/**
+	 * Escape the given {@link String} so it can be used in XML, as content.
 	 * 
-	 * @return the Base64 representation
+	 * @param input
+	 *            the input {@link String}
 	 * 
-	 * @throws IOException
-	 *             in case of IO error
+	 * @return the escaped {@link String}
 	 */
-	static public String fromImage(BufferedImage image) throws IOException {
-		String imageString = null;
-		ByteArrayOutputStream out = new ByteArrayOutputStream();
+	public static String xmlEscape(String input) {
+		if (input == null) {
+			return "";
+		}
 
-		ImageIO.write(image, "jpeg", out);
-		byte[] imageBytes = out.toByteArray();
+		return HtmlEscape.escapeHtml(input,
+				HtmlEscapeType.HTML4_NAMED_REFERENCES_DEFAULT_TO_HEXA,
+				HtmlEscapeLevel.LEVEL_1_ONLY_MARKUP_SIGNIFICANT);
+	}
 
-		imageString = new String(Base64.encodeBytes(imageBytes));
+	/**
+	 * Escape the given {@link String} so it can be used in XML, as text content
+	 * inside double-quotes.
+	 * 
+	 * @param input
+	 *            the input {@link String}
+	 * 
+	 * @return the escaped {@link String}
+	 */
+	public static String xmlEscapeQuote(String input) {
+		if (input == null) {
+			return "";
+		}
 
-		out.close();
+		return HtmlEscape.escapeHtml(input,
+				HtmlEscapeType.HTML4_NAMED_REFERENCES_DEFAULT_TO_HEXA,
+				HtmlEscapeLevel.LEVEL_1_ONLY_MARKUP_SIGNIFICANT);
+	}
 
-		return imageString;
+	/**
+	 * Zip the data and then encode it into Base64.
+	 * 
+	 * @deprecated use {@link StringUtils#base64(byte[], boolean)} with the
+	 *             correct parameter instead
+	 * 
+	 * @param data
+	 *            the data
+	 * 
+	 * @return the Base64 zipped version
+	 */
+	@Deprecated
+	public static String zip64(String data) {
+		try {
+			return Base64.encodeBytes(data.getBytes("UTF-8"), Base64.GZIP);
+		} catch (IOException e) {
+			e.printStackTrace();
+			return null;
+		}
+	}
+
+	/**
+	 * Unconvert from Base64 then unzip the content.
+	 * 
+	 * @deprecated use {@link StringUtils#unbase64s(String, boolean)} with the
+	 *             correct parameter instead
+	 * 
+	 * @param data
+	 *            the data in Base64 format
+	 * 
+	 * @return the raw data
+	 * 
+	 * @throws IOException
+	 *             in case of I/O error
+	 */
+	@Deprecated
+	public static String unzip64(String data) throws IOException {
+		return new String(Base64.decode(data, Base64.GZIP), "UTF-8");
 	}
 
 	/**
-	 * Convert the given {@link File} image into a Base64 representation of the
-	 * same {@link File}.
+	 * Convert the given data to Base64 format.
 	 * 
-	 * @param file
-	 *            the {@link File} image to convert
+	 * @param data
+	 *            the data to convert
+	 * @param zip
+	 *            TRUE to also compress the data in GZIP format; remember that
+	 *            compressed and not-compressed content are different; you need
+	 *            to know which is which when decoding
 	 * 
-	 * @return the Base64 representation
+	 * @return the Base64 {@link String} representation of the data
 	 * 
 	 * @throws IOException
-	 *             in case of IO error
+	 *             in case of I/O errors
 	 */
-	static public String fromStream(InputStream in) throws IOException {
-		String fileString = null;
-		ByteArrayOutputStream out = new ByteArrayOutputStream();
+	public static String base64(String data, boolean zip) throws IOException {
+		return base64(data.getBytes("UTF-8"), zip);
+	}
 
-		byte[] buf = new byte[8192];
+	/**
+	 * Convert the given data to Base64 format.
+	 * 
+	 * @param data
+	 *            the data to convert
+	 * @param zip
+	 *            TRUE to also compress the data in GZIP format; remember that
+	 *            compressed and not-compressed content are different; you need
+	 *            to know which is which when decoding
+	 * 
+	 * @return the Base64 {@link String} representation of the data
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static String base64(byte[] data, boolean zip) throws IOException {
+		return Base64.encodeBytes(data, zip ? Base64.GZIP : Base64.NO_OPTIONS);
+	}
 
-		int c = 0;
-		while ((c = in.read(buf, 0, buf.length)) > 0) {
-			out.write(buf, 0, c);
+	/**
+	 * Convert the given data to Base64 format.
+	 * 
+	 * @param data
+	 *            the data to convert
+	 * @param zip
+	 *            TRUE to also compress the data in GZIP format; remember that
+	 *            compressed and not-compressed content are different; you need
+	 *            to know which is which when decoding
+	 * @param breakLines
+	 *            TRUE to break lines on every 76th character
+	 * 
+	 * @return a new {@link OutputStream} wrapping the given one
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static OutputStream base64(OutputStream data, boolean zip,
+			boolean breakLines) throws IOException {
+		OutputStream out = new Base64.OutputStream(data,
+				breakLines ? Base64.DO_BREAK_LINES & Base64.ENCODE
+						: Base64.ENCODE);
+
+		if (zip) {
+			out = new java.util.zip.GZIPOutputStream(out);
 		}
-		out.flush();
-		in.close();
 
-		fileString = new String(Base64.encodeBytes(out.toByteArray()));
-		out.close();
+		return out;
+	}
 
-		return fileString;
+	/**
+	 * Convert the given data to Base64 format.
+	 * 
+	 * @param data
+	 *            the data to convert
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format; take care
+	 *            about this flag, as it could easily cause errors in the
+	 *            returned content or an {@link IOException}
+	 * @param breakLines
+	 *            TRUE to break lines on every 76th character
+	 * 
+	 * @return a new {@link InputStream} wrapping the given one
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static InputStream base64(InputStream data, boolean zip,
+			boolean breakLines) throws IOException {
+		if (zip) {
+			data = new java.util.zip.GZIPInputStream(data);
+		}
+
+		return new Base64.InputStream(data, breakLines ? Base64.DO_BREAK_LINES
+				& Base64.ENCODE : Base64.ENCODE);
 	}
 
 	/**
-	 * Convert the given Base64 representation of an image into an {@link Image}
-	 * object.
+	 * Unconvert the given data from Base64 format back to a raw array of bytes.
+	 * <p>
+	 * Will automatically detect zipped data and also uncompress it before
+	 * returning, unless ZIP is false.
 	 * 
-	 * @param b64data
-	 *            the {@link Image} in Base64 format
+	 * @param data
+	 *            the data to unconvert
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format
+	 *            automatically; if set to FALSE, zipped data can be returned
 	 * 
-	 * @return the {@link Image} object
+	 * @return the raw data represented by the given Base64 {@link String},
+	 *         optionally compressed with GZIP
 	 * 
 	 * @throws IOException
-	 *             in case of IO error
+	 *             in case of I/O errors
 	 */
-	static public BufferedImage toImage(String b64data) throws IOException {
-		ByteArrayInputStream in = new ByteArrayInputStream(
-				Base64.decode(b64data));
-		return toImage(in);
+	public static byte[] unbase64(String data, boolean zip) throws IOException {
+		return Base64
+				.decode(data, zip ? Base64.NO_OPTIONS : Base64.DONT_GUNZIP);
 	}
 
 	/**
-	 * Convert the given {@link InputStream} (which must allow calls to
-	 * {@link InputStream#reset()}) into an {@link Image} object.
+	 * Unconvert the given data from Base64 format back to a raw array of bytes.
 	 * 
-	 * @param in
-	 *            the 'resetable' {@link InputStream}
+	 * @param data
+	 *            the data to unconvert
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format; take care
+	 *            about this flag, as it could easily cause errors in the
+	 *            returned content or an {@link IOException}
 	 * 
-	 * @return the {@link Image} object
+	 * @return a new {@link OutputStream} wrapping the given one
 	 * 
 	 * @throws IOException
-	 *             in case of IO error
+	 *             in case of I/O errors
 	 */
-	static public BufferedImage toImage(InputStream in) throws IOException {
-		int orientation;
-		try {
-			orientation = getExifTransorm(in);
-		} catch (Exception e) {
-			// no EXIF transform, ok
-			orientation = -1;
+	public static OutputStream unbase64(OutputStream data, boolean zip)
+			throws IOException {
+		OutputStream out = new Base64.OutputStream(data, Base64.DECODE);
+
+		if (zip) {
+			out = new java.util.zip.GZIPOutputStream(out);
 		}
 
-		in.reset();
-		BufferedImage image = ImageIO.read(in);
+		return out;
+	}
 
-		if (image == null) {
-			throw new IOException("Failed to convert input to image");
+	/**
+	 * Unconvert the given data from Base64 format back to a raw array of bytes.
+	 * 
+	 * @param data
+	 *            the data to unconvert
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format; take care
+	 *            about this flag, as it could easily cause errors in the
+	 *            returned content or an {@link IOException}
+	 * 
+	 * @return a new {@link InputStream} wrapping the given one
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static InputStream unbase64(InputStream data, boolean zip)
+			throws IOException {
+		if (zip) {
+			data = new java.util.zip.GZIPInputStream(data);
 		}
 
-		// Note: this code has been found on internet;
-		// thank you anonymous coder.
-		int width = image.getWidth();
-		int height = image.getHeight();
-		AffineTransform affineTransform = new AffineTransform();
-
-		switch (orientation) {
-		case 1:
-			break;
-		case 2: // Flip X
-			affineTransform.scale(-1.0, 1.0);
-			affineTransform.translate(-width, 0);
-			break;
-		case 3: // PI rotation
-			affineTransform.translate(width, height);
-			affineTransform.rotate(Math.PI);
-			break;
-		case 4: // Flip Y
-			affineTransform.scale(1.0, -1.0);
-			affineTransform.translate(0, -height);
-			break;
-		case 5: // - PI/2 and Flip X
-			affineTransform.rotate(-Math.PI / 2);
-			affineTransform.scale(-1.0, 1.0);
-			break;
-		case 6: // -PI/2 and -width
-			affineTransform.translate(height, 0);
-			affineTransform.rotate(Math.PI / 2);
-			break;
-		case 7: // PI/2 and Flip
-			affineTransform.scale(-1.0, 1.0);
-			affineTransform.translate(-height, 0);
-			affineTransform.translate(0, width);
-			affineTransform.rotate(3 * Math.PI / 2);
-			break;
-		case 8: // PI / 2
-			affineTransform.translate(0, width);
-			affineTransform.rotate(3 * Math.PI / 2);
-			break;
-		default:
-			affineTransform = null;
-			break;
-		}
+		return new Base64.InputStream(data, Base64.DECODE);
+	}
 
-		if (affineTransform != null) {
-			AffineTransformOp affineTransformOp = new AffineTransformOp(
-					affineTransform, AffineTransformOp.TYPE_BILINEAR);
+	/**
+	 * Unconvert the given data from Base64 format back to a raw array of bytes.
+	 * <p>
+	 * Will automatically detect zipped data and also uncompress it before
+	 * returning, unless ZIP is false.
+	 * 
+	 * @param data
+	 *            the data to unconvert
+	 * @param offset
+	 *            the offset at which to start taking the data (do not take the
+	 *            data before it into account)
+	 * @param count
+	 *            the number of bytes to take into account (do not process after
+	 *            this number of bytes has been processed)
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format
+	 *            automatically; if set to FALSE, zipped data can be returned
+	 * 
+	 * @return the raw data represented by the given Base64 {@link String}
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static byte[] unbase64(byte[] data, int offset, int count,
+			boolean zip) throws IOException {
+		return Base64.niki_decode(data, offset, count, zip ? Base64.NO_OPTIONS
+				: Base64.DONT_GUNZIP);
+	}
 
-			BufferedImage transformedImage = new BufferedImage(height, width,
-					image.getType());
-			transformedImage = affineTransformOp
-					.filter(image, transformedImage);
+	/**
+	 * Unconvert the given data from Base64 format back to a {@link String}.
+	 * <p>
+	 * Will automatically detect zipped data and also uncompress it before
+	 * returning, unless ZIP is false.
+	 * 
+	 * @param data
+	 *            the data to unconvert
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format
+	 *            automatically; if set to FALSE, zipped data can be returned
+	 * 
+	 * @return the {@link String} represented by the given Base64 {@link String}
+	 *         , optionally compressed with GZIP
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static String unbase64s(String data, boolean zip) throws IOException {
+		return new String(unbase64(data, zip), "UTF-8");
+	}
 
-			image = transformedImage;
-		}
-		//
+	/**
+	 * Unconvert the given data from Base64 format back into a {@link String}.
+	 * 
+	 * @param data
+	 *            the data to unconvert
+	 * @param offset
+	 *            the offset at which to start taking the data (do not take the
+	 *            data before it into account)
+	 * @param count
+	 *            the number of bytes to take into account (do not process after
+	 *            this number of bytes has been processed)
+	 * @param zip
+	 *            TRUE to also uncompress the data from a GZIP format; take care
+	 *            about this flag, as it could easily cause errors in the
+	 *            returned content or an {@link IOException}
+	 * 
+	 * @return the {@link String} represented by the given Base64 {@link String}
+	 *         , optionally compressed with GZIP
+	 * 
+	 * @throws IOException
+	 *             in case of I/O errors
+	 */
+	public static String unbase64s(byte[] data, int offset, int count,
+			boolean zip) throws IOException {
+		return new String(unbase64(data, offset, count, zip), "UTF-8");
+	}
 
-		return image;
+	/**
+	 * Return a display {@link String} for the given value, which can be
+	 * suffixed with "k", "M" or "G" depending upon the number, if big enough.
+	 * <p>
+	 * <p>
+	 * Examples:
+	 * <ul>
+	 * <li><tt>8 765</tt> becomes "8k"</li>
+	 * <li><tt>998 765</tt> becomes "998k"</li>
+	 * <li><tt>12 987 364</tt> becomes "12M"</li>
+	 * <li><tt>5 534 333 221</tt> becomes "5G"</li>
+	 * </ul>
+	 * 
+	 * @param value
+	 *            the value to convert
+	 * 
+	 * @return the display value
+	 */
+	public static String formatNumber(long value) {
+		return formatNumber(value, 0);
 	}
 
 	/**
-	 * Return a hash of the given {@link String}.
+	 * Return a display {@link String} for the given value, which can be
+	 * suffixed with "k", "M" or "G" depending upon the number, if big enough.
+	 * <p>
+	 * Examples (assuming decimalPositions = 1):
+	 * <ul>
+	 * <li><tt>8 765</tt> becomes "8.7k"</li>
+	 * <li><tt>998 765</tt> becomes "998.7k"</li>
+	 * <li><tt>12 987 364</tt> becomes "12.9M"</li>
+	 * <li><tt>5 534 333 221</tt> becomes "5.5G"</li>
+	 * </ul>
 	 * 
-	 * @param input
-	 *            the input data
+	 * @param value
+	 *            the value to convert
+	 * @param decimalPositions
+	 *            the number of decimal positions to keep
 	 * 
-	 * @return the hash
+	 * @return the display value
 	 */
-	static public String getHash(String input) {
-		try {
-			MessageDigest md = MessageDigest.getInstance("MD5");
-			md.update(input.getBytes());
-			byte byteData[] = md.digest();
+	public static String formatNumber(long value, int decimalPositions) {
+		long userValue = value;
+		String suffix = "";
+		long mult = 1;
+
+		if (value >= 1000000000l) {
+			mult = 1000000000l;
+			userValue = value / 1000000000l;
+			suffix = "G";
+		} else if (value >= 1000000l) {
+			mult = 1000000l;
+			userValue = value / 1000000l;
+			suffix = "M";
+		} else if (value >= 1000l) {
+			mult = 1000l;
+			userValue = value / 1000l;
+			suffix = "k";
+		}
 
-			StringBuffer hexString = new StringBuffer();
-			for (int i = 0; i < byteData.length; i++) {
-				String hex = Integer.toHexString(0xff & byteData[i]);
-				if (hex.length() == 1)
-					hexString.append('0');
-				hexString.append(hex);
+		String deci = "";
+		if (decimalPositions > 0) {
+			deci = Long.toString(value % mult);
+			int size = Long.toString(mult).length() - 1;
+			while (deci.length() < size) {
+				deci = "0" + deci;
 			}
 
-			return hexString.toString();
-		} catch (NoSuchAlgorithmException e) {
-			return input;
+			deci = deci.substring(0, Math.min(decimalPositions, deci.length()));
+			while (deci.length() < decimalPositions) {
+				deci += "0";
+			}
+
+			deci = "." + deci;
 		}
+
+		return Long.toString(userValue) + deci + suffix;
 	}
 
 	/**
-	 * Return the EXIF transformation flag of this image if any.
-	 * 
+	 * The reverse operation to {@link StringUtils#formatNumber(long)}: it will
+	 * read a "display" number that can contain a "M" or "k" suffix and return
+	 * the full value.
 	 * <p>
-	 * Note: this code has been found on internet; thank you anonymous coder.
-	 * </p>
+	 * Of course, the conversion to and from display form is lossy (example:
+	 * <tt>6870</tt> to "6.8k" to <tt>6800</tt>).
 	 * 
-	 * @param in
-	 *            the data {@link InputStream}
+	 * @param value
+	 *            the value in display form with possible "M" and "k" suffixes,
+	 *            can be NULL
 	 * 
-	 * @return the transformation flag if any
+	 * @return the value as a number, or 0 if not possible to convert
+	 */
+	public static long toNumber(String value) {
+		return toNumber(value, 0l);
+	}
+
+	/**
+	 * The reverse operation to {@link StringUtils#formatNumber(long)}: it will
+	 * read a "display" number that can contain a "M" or "k" suffix and return
+	 * the full value.
+	 * <p>
+	 * Of course, the conversion to and from display form is lossy (example:
+	 * <tt>6870</tt> to "6.8k" to <tt>6800</tt>).
 	 * 
-	 * @throws IOException
-	 *             in case of IO error
-	 */
-	static private int getExifTransorm(InputStream in) throws IOException {
-		int[] exif_data = new int[100];
-		int set_flag = 0;
-		int is_motorola = 0;
-
-		/* Read File head, check for JPEG SOI + Exif APP1 */
-		for (int i = 0; i < 4; i++)
-			exif_data[i] = in.read();
-
-		if (exif_data[0] != 0xFF || exif_data[1] != 0xD8
-				|| exif_data[2] != 0xFF || exif_data[3] != 0xE1)
-			return -2;
-
-		/* Get the marker parameter length count */
-		int length = (in.read() << 8 | in.read());
-
-		/* Length includes itself, so must be at least 2 */
-		/* Following Exif data length must be at least 6 */
-		if (length < 8)
-			return -1;
-		length -= 8;
-		/* Read Exif head, check for "Exif" */
-		for (int i = 0; i < 6; i++)
-			exif_data[i] = in.read();
-
-		if (exif_data[0] != 0x45 || exif_data[1] != 0x78
-				|| exif_data[2] != 0x69 || exif_data[3] != 0x66
-				|| exif_data[4] != 0 || exif_data[5] != 0)
-			return -1;
-
-		/* Read Exif body */
-		length = length > exif_data.length ? exif_data.length : length;
-		for (int i = 0; i < length; i++)
-			exif_data[i] = in.read();
-
-		if (length < 12)
-			return -1; /* Length of an IFD entry */
-
-		/* Discover byte order */
-		if (exif_data[0] == 0x49 && exif_data[1] == 0x49)
-			is_motorola = 0;
-		else if (exif_data[0] == 0x4D && exif_data[1] == 0x4D)
-			is_motorola = 1;
-		else
-			return -1;
-
-		/* Check Tag Mark */
-		if (is_motorola == 1) {
-			if (exif_data[2] != 0)
-				return -1;
-			if (exif_data[3] != 0x2A)
-				return -1;
-		} else {
-			if (exif_data[3] != 0)
-				return -1;
-			if (exif_data[2] != 0x2A)
-				return -1;
-		}
+	 * @param value
+	 *            the value in display form with possible "G", "M" and "k" suffixes,
+	 *            can be NULL
+	 * @param def
+	 *            the default value if it is not possible to convert the given
+	 *            value to a number
+	 * 
+	 * @return the value as a number, or <tt>def</tt> if not possible to convert
+	 */
+	public static long toNumber(String value, long def) {
+		long count = def;
+		if (value != null) {
+			value = value.trim().toLowerCase();
+			try {
+				long mult = 1;
+				if (value.endsWith("g")) {
+					value = value.substring(0, value.length() - 1).trim();
+					mult = 1000000000;
+				} else if (value.endsWith("m")) {
+					value = value.substring(0, value.length() - 1).trim();
+					mult = 1000000;
+				} else if (value.endsWith("k")) {
+					value = value.substring(0, value.length() - 1).trim();
+					mult = 1000;
+				}
 
-		/* Get first IFD offset (offset to IFD0) */
-		int offset;
-		if (is_motorola == 1) {
-			if (exif_data[4] != 0)
-				return -1;
-			if (exif_data[5] != 0)
-				return -1;
-			offset = exif_data[6];
-			offset <<= 8;
-			offset += exif_data[7];
-		} else {
-			if (exif_data[7] != 0)
-				return -1;
-			if (exif_data[6] != 0)
-				return -1;
-			offset = exif_data[5];
-			offset <<= 8;
-			offset += exif_data[4];
-		}
-		if (offset > length - 2)
-			return -1; /* check end of data segment */
-
-		/* Get the number of directory entries contained in this IFD */
-		int number_of_tags;
-		if (is_motorola == 1) {
-			number_of_tags = exif_data[offset];
-			number_of_tags <<= 8;
-			number_of_tags += exif_data[offset + 1];
-		} else {
-			number_of_tags = exif_data[offset + 1];
-			number_of_tags <<= 8;
-			number_of_tags += exif_data[offset];
-		}
-		if (number_of_tags == 0)
-			return -1;
-		offset += 2;
-
-		/* Search for Orientation Tag in IFD0 */
-		for (;;) {
-			if (offset > length - 12)
-				return -1; /* check end of data segment */
-			/* Get Tag number */
-			int tagnum;
-			if (is_motorola == 1) {
-				tagnum = exif_data[offset];
-				tagnum <<= 8;
-				tagnum += exif_data[offset + 1];
-			} else {
-				tagnum = exif_data[offset + 1];
-				tagnum <<= 8;
-				tagnum += exif_data[offset];
+				long deci = 0;
+				if (value.contains(".")) {
+					String[] tab = value.split("\\.");
+					if (tab.length != 2) {
+						throw new NumberFormatException(value);
+					}
+					double decimal = Double.parseDouble("0."
+							+ tab[tab.length - 1]);
+					deci = ((long) (mult * decimal));
+					value = tab[0];
+				}
+				count = mult * Long.parseLong(value) + deci;
+			} catch (Exception e) {
 			}
-			if (tagnum == 0x0112)
-				break; /* found Orientation Tag */
-			if (--number_of_tags == 0)
-				return -1;
-			offset += 12;
 		}
 
-		/* Get the Orientation value */
-		if (is_motorola == 1) {
-			if (exif_data[offset + 8] != 0)
-				return -1;
-			set_flag = exif_data[offset + 9];
-		} else {
-			if (exif_data[offset + 9] != 0)
-				return -1;
-			set_flag = exif_data[offset + 8];
-		}
-		if (set_flag > 8)
-			return -1;
+		return count;
+	}
 
-		return set_flag;
+	/**
+	 * The "remove accents" pattern.
+	 * 
+	 * @return the pattern, or NULL if a problem happens
+	 */
+	private static Pattern getMarks() {
+		try {
+			return Pattern
+					.compile("[\\p{InCombiningDiacriticalMarks}\\p{IsLm}\\p{IsSk}]+");
+		} catch (Exception e) {
+			// Can fail on Android...
+			return null;
+		}
 	}
 
+	//
+	// justify List<String> related:
+	//
+
 	/**
-	 * Remove the HTML content from the given input, and un-html-ize the rest.
+	 * Check if this line ends as a complete line (ends with a "." or similar).
+	 * <p>
+	 * Note that we consider an empty line as full, and a line ending with
+	 * spaces as not complete.
 	 * 
-	 * @param html
-	 *            the HTML-encoded content
+	 * @param line
+	 *            the line to check
 	 * 
-	 * @return the HTML-free equivalent content
+	 * @return TRUE if it does
 	 */
-	public static String unhtml(String html) {
-		StringBuilder builder = new StringBuilder();
+	static private boolean isFullLine(StringBuilder line) {
+		if (line.length() == 0) {
+			return true;
+		}
 
-		int inTag = 0;
-		for (char car : html.toCharArray()) {
-			if (car == '<') {
-				inTag++;
-			} else if (car == '>') {
-				inTag--;
-			} else if (inTag <= 0) {
-				builder.append(car);
-			}
+		char lastCar = line.charAt(line.length() - 1);
+		switch (lastCar) {
+		case '.': // points
+		case '?':
+		case '!':
+
+		case '\'': // quotes
+		case '‘':
+		case '’':
+
+		case '"': // double quotes
+		case '“':
+		case '”':
+		case '»':
+		case '«':
+			return true;
+		default:
+			return false;
 		}
+	}
 
-		return HtmlEscape.unescapeHtml(builder.toString());
+	/**
+	 * Check if this line represents an item in a list or description (i.e.,
+	 * check that it starts with spaces and its first non-space char is "-").
+	 * 
+	 * @param line
+	 *            the line to check
+	 * 
+	 * @return TRUE if it is
+	 */
+	static private boolean isItemLine(String line) {
+		String spacing = getItemSpacing(line);
+		return spacing != null && !spacing.isEmpty()
+				&& line.charAt(spacing.length()) == '-';
 	}
 
 	/**
-	 * Escape the given {@link String} so it can be used in XML, as content.
+	 * Return all the spaces that start this line (or Empty if none, or if the line only contains spaces).
 	 * 
-	 * @param input
-	 *            the input {@link String}
+	 * @param line
+	 *            the line to get the starting spaces from
 	 * 
-	 * @return the escaped {@link String}
+	 * @return the left spacing
 	 */
-	public static String xmlEscape(String input) {
-		if (input == null) {
-			return "";
+	static private String getItemSpacing(String line) {
+		int i;
+		for (i = 0; i < line.length(); i++) {
+			if (line.charAt(i) != ' ') {
+				return line.substring(0, i);
+			}
 		}
 
-		return HtmlEscape.escapeHtml(input,
-				HtmlEscapeType.HTML4_NAMED_REFERENCES_DEFAULT_TO_HEXA,
-				HtmlEscapeLevel.LEVEL_1_ONLY_MARKUP_SIGNIFICANT);
+		return "";
 	}
 
 	/**
-	 * Escape the given {@link String} so it can be used in XML, as text content
-	 * inside double-quotes.
+	 * Check if this line is a horizontal spacer line: 3+ chars, all among space, tab, *, -, _, ~, =, / and \.
 	 * 
-	 * @param input
-	 *            the input {@link String}
+	 * @param line
+	 *            the line to test
 	 * 
-	 * @return the escaped {@link String}
+	 * @return TRUE if it is
 	 */
-	public static String xmlEscapeQuote(String input) {
-		if (input == null) {
-			return "";
+	static private boolean isHrLine(CharSequence line) {
+		int count = 0;
+		if (line != null) {
+			for (int i = 0; i < line.length(); i++) {
+				char car = line.charAt(i);
+				if (car == ' ' || car == '\t' || car == '*' || car == '-'
+						|| car == '_' || car == '~' || car == '=' || car == '/'
+						|| car == '\\') {
+					count++;
+				} else {
+					return false;
+				}
+			}
 		}
 
-		return HtmlEscape.escapeHtml(input,
-				HtmlEscapeType.HTML4_NAMED_REFERENCES_DEFAULT_TO_HEXA,
-				HtmlEscapeLevel.LEVEL_1_ONLY_MARKUP_SIGNIFICANT);
+		return count > 2;
 	}
 }