StringUtils.java

   1 /*
   2  * Jexer - Java Text User Interface
   3  *
   4  * The MIT License (MIT)
   5  *
   6  * Copyright (C) 2019 Kevin Lamonte
   7  *
   8  * Permission is hereby granted, free of charge, to any person obtaining a
   9  * copy of this software and associated documentation files (the "Software"),
  10  * to deal in the Software without restriction, including without limitation
  11  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  12  * and/or sell copies of the Software, and to permit persons to whom the
  13  * Software is furnished to do so, subject to the following conditions:
  14  *
  15  * The above copyright notice and this permission notice shall be included in
  16  * all copies or substantial portions of the Software.
  17  *
  18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  21  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  23  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  24  * DEALINGS IN THE SOFTWARE.
  25  *
  26  * @author Kevin Lamonte [kevin.lamonte@gmail.com]
  27  * @version 1
  28  */
  29 package jexer.bits;
  30
  31 import java.util.List;
  32 import java.util.ArrayList;
  33 import java.util.Arrays;
  34
  35 /**
  36  * StringUtils contains methods to:
  37  *
  38  *    - Convert one or more long lines of strings into justified text
  39  *      paragraphs.
  40  *
  41  *    - Unescape C0 control codes.
  42  *
  43  *    - Read/write a line of RFC4180 comma-separated values strings to/from a
  44  *      list of strings.
  45  */
  46 public class StringUtils {
  47
  48     /**
  49      * Left-justify a string into a list of lines.
  50      *
  51      * @param str the string
  52      * @param n the maximum number of characters in a line
  53      * @return the list of lines
  54      */
  55     public static List<String> left(final String str, final int n) {
  56         List<String> result = new ArrayList<String>();
  57
  58         /*
  59          * General procedure:
  60          *
  61          *   1. Split on '\n' into paragraphs.
  62          *
  63          *   2. Scan each line, noting the position of the last
  64          *      beginning-of-a-word.
  65          *
  66          *   3. Chop at the last #2 if the next beginning-of-a-word exceeds
  67          *      n.
  68          *
  69          *   4. Return the lines.
  70          */
  71
  72         String [] rawLines = str.split("\n");
  73         for (int i = 0; i < rawLines.length; i++) {
  74             StringBuilder line = new StringBuilder();
  75             StringBuilder word = new StringBuilder();
  76             boolean inWord = false;
  77             for (int j = 0; j < rawLines[i].length(); j++) {
  78                 char ch = rawLines[i].charAt(j);
  79                 if ((ch == ' ') || (ch == '\t')) {
  80                     if (inWord == true) {
  81                         // We have just transitioned from a word to
  82                         // whitespace.  See if we have enough space to add
  83                         // the word to the line.
  84                         if (width(word.toString()) + width(line.toString()) > n) {
  85                             // This word will exceed the line length.  Wrap
  86                             // at it instead.
  87                             result.add(line.toString());
  88                             line = new StringBuilder();
  89                         }
  90                         if ((word.toString().startsWith(" "))
  91                             && (width(line.toString()) == 0)
  92                         ) {
  93                             line.append(word.substring(1));
  94                         } else {
  95                             line.append(word);
  96                         }
  97                         word = new StringBuilder();
  98                         word.append(ch);
  99                         inWord = false;
 100                     } else {
 101                         // We are in the whitespace before another word.  Do
 102                         // nothing.
 103                     }
 104                 } else {
 105                     if (inWord == true) {
 106                         // We are appending to a word.
 107                         word.append(ch);
 108                     } else {
 109                         // We have transitioned from whitespace to a word.
 110                         word.append(ch);
 111                         inWord = true;
 112                     }
 113                 }
 114             } // for (int j = 0; j < rawLines[i].length(); j++)
 115
 116             if (width(word.toString()) + width(line.toString()) > n) {
 117                 // This word will exceed the line length.  Wrap at it
 118                 // instead.
 119                 result.add(line.toString());
 120                 line = new StringBuilder();
 121             }
 122             if ((word.toString().startsWith(" "))
 123                 && (width(line.toString()) == 0)
 124             ) {
 125                 line.append(word.substring(1));
 126             } else {
 127                 line.append(word);
 128             }
 129             result.add(line.toString());
 130         } // for (int i = 0; i < rawLines.length; i++) {
 131
 132         return result;
 133     }
 134
 135     /**
 136      * Right-justify a string into a list of lines.
 137      *
 138      * @param str the string
 139      * @param n the maximum number of characters in a line
 140      * @return the list of lines
 141      */
 142     public static List<String> right(final String str, final int n) {
 143         List<String> result = new ArrayList<String>();
 144
 145         /*
 146          * Same as left(), but preceed each line with spaces to make it n
 147          * chars long.
 148          */
 149         List<String> lines = left(str, n);
 150         for (String line: lines) {
 151             StringBuilder sb = new StringBuilder();
 152             for (int i = 0; i < n - width(line); i++) {
 153                 sb.append(' ');
 154             }
 155             sb.append(line);
 156             result.add(sb.toString());
 157         }
 158
 159         return result;
 160     }
 161
 162     /**
 163      * Center a string into a list of lines.
 164      *
 165      * @param str the string
 166      * @param n the maximum number of characters in a line
 167      * @return the list of lines
 168      */
 169     public static List<String> center(final String str, final int n) {
 170         List<String> result = new ArrayList<String>();
 171
 172         /*
 173          * Same as left(), but preceed/succeed each line with spaces to make
 174          * it n chars long.
 175          */
 176         List<String> lines = left(str, n);
 177         for (String line: lines) {
 178             StringBuilder sb = new StringBuilder();
 179             int l = (n - width(line)) / 2;
 180             int r = n - width(line) - l;
 181             for (int i = 0; i < l; i++) {
 182                 sb.append(' ');
 183             }
 184             sb.append(line);
 185             for (int i = 0; i < r; i++) {
 186                 sb.append(' ');
 187             }
 188             result.add(sb.toString());
 189         }
 190
 191         return result;
 192     }
 193
 194     /**
 195      * Fully-justify a string into a list of lines.
 196      *
 197      * @param str the string
 198      * @param n the maximum number of characters in a line
 199      * @return the list of lines
 200      */
 201     public static List<String> full(final String str, final int n) {
 202         List<String> result = new ArrayList<String>();
 203
 204         /*
 205          * Same as left(), but insert spaces between words to make each line
 206          * n chars long.  The "algorithm" here is pretty dumb: it performs a
 207          * split on space and then re-inserts multiples of n between words.
 208          */
 209         List<String> lines = left(str, n);
 210         for (int lineI = 0; lineI < lines.size() - 1; lineI++) {
 211             String line = lines.get(lineI);
 212             String [] words = line.split(" ");
 213             if (words.length > 1) {
 214                 int charCount = 0;
 215                 for (int i = 0; i < words.length; i++) {
 216                     charCount += words[i].length();
 217                 }
 218                 int spaceCount = n - charCount;
 219                 int q = spaceCount / (words.length - 1);
 220                 int r = spaceCount % (words.length - 1);
 221                 StringBuilder sb = new StringBuilder();
 222                 for (int i = 0; i < words.length - 1; i++) {
 223                     sb.append(words[i]);
 224                     for (int j = 0; j < q; j++) {
 225                         sb.append(' ');
 226                     }
 227                     if (r > 0) {
 228                         sb.append(' ');
 229                         r--;
 230                     }
 231                 }
 232                 for (int j = 0; j < r; j++) {
 233                     sb.append(' ');
 234                 }
 235                 sb.append(words[words.length - 1]);
 236                 result.add(sb.toString());
 237             } else {
 238                 result.add(line);
 239             }
 240         }
 241         if (lines.size() > 0) {
 242             result.add(lines.get(lines.size() - 1));
 243         }
 244
 245         return result;
 246     }
 247
 248     /**
 249      * Convert raw strings into escaped strings that be splatted on the
 250      * screen.
 251      *
 252      * @param str the string
 253      * @return a string that can be passed into Screen.putStringXY()
 254      */
 255     public static String unescape(final String str) {
 256         StringBuilder sb = new StringBuilder();
 257         for (int i = 0; i < str.length(); i++) {
 258             char ch = str.charAt(i);
 259             if ((ch < 0x20) || (ch == 0x7F)) {
 260                 switch (ch) {
 261                 case '\b':
 262                     sb.append("\\b");
 263                     continue;
 264                 case '\f':
 265                     sb.append("\\f");
 266                     continue;
 267                 case '\n':
 268                     sb.append("\\n");
 269                     continue;
 270                 case '\r':
 271                     sb.append("\\r");
 272                     continue;
 273                 case '\t':
 274                     sb.append("\\t");
 275                     continue;
 276                 case 0x7f:
 277                     sb.append("^?");
 278                     continue;
 279                 default:
 280                     sb.append(' ');
 281                     continue;
 282                 }
 283             }
 284             sb.append(ch);
 285         }
 286         return sb.toString();
 287     }
 288
 289     /**
 290      * Read a line of RFC4180 comma-separated values (CSV) into a list of
 291      * strings.
 292      *
 293      * @param line the CSV line, with or without without line terminators
 294      * @return the list of strings
 295      */
 296     public static List<String> fromCsv(final String line) {
 297         List<String> result = new ArrayList<String>();
 298
 299         StringBuilder str = new StringBuilder();
 300         boolean quoted = false;
 301         boolean fieldQuoted = false;
 302
 303         for (int i = 0; i < line.length(); i++) {
 304             char ch = line.charAt(i);
 305
 306             /*
 307             System.err.println("ch '" + ch + "' str '" + str + "' " +
 308                 " fieldQuoted " + fieldQuoted + " quoted " + quoted);
 309              */
 310
 311             if (ch == ',') {
 312                 if (fieldQuoted && quoted) {
 313                     // Terminating a quoted field.
 314                     result.add(str.toString());
 315                     str = new StringBuilder();
 316                     quoted = false;
 317                     fieldQuoted = false;
 318                 } else if (fieldQuoted) {
 319                     // Still waiting to see the terminating quote for this
 320                     // field.
 321                     str.append(ch);
 322                 } else if (quoted) {
 323                     // An unmatched double-quote and comma.  This should be
 324                     // an invalid sequence.  We will treat it as a quote
 325                     // terminating the field.
 326                     str.append('\"');
 327                     result.add(str.toString());
 328                     str = new StringBuilder();
 329                     quoted = false;
 330                     fieldQuoted = false;
 331                 } else {
 332                     // A field separator.
 333                     result.add(str.toString());
 334                     str = new StringBuilder();
 335                     quoted = false;
 336                     fieldQuoted = false;
 337                 }
 338                 continue;
 339             }
 340
 341             if (ch == '\"') {
 342                 if ((str.length() == 0) && (!fieldQuoted)) {
 343                     // The opening quote to a quoted field.
 344                     fieldQuoted = true;
 345                 } else if (quoted) {
 346                     // This is a double-quote.
 347                     str.append('\"');
 348                     quoted = false;
 349                 } else {
 350                     // This is the beginning of a quote.
 351                     quoted = true;
 352                 }
 353                 continue;
 354             }
 355
 356             // Normal character, pass it on.
 357             str.append(ch);
 358         }
 359
 360         // Include the final field.
 361         result.add(str.toString());
 362
 363         return result;
 364     }
 365
 366     /**
 367      * Write a list of strings to on line of RFC4180 comma-separated values
 368      * (CSV).
 369      *
 370      * @param list the list of strings
 371      * @return the CSV line, without any line terminators
 372      */
 373     public static String toCsv(final List<String> list) {
 374         StringBuilder result = new StringBuilder();
 375         int i = 0;
 376         for (String str: list) {
 377
 378             if (!str.contains("\"") && !str.contains(",")) {
 379                 // Just append the string with a comma.
 380                 result.append(str);
 381             } else if (!str.contains("\"") && str.contains(",")) {
 382                 // Contains commas, but no quotes.  Just double-quote it.
 383                 result.append("\"");
 384                 result.append(str);
 385                 result.append("\"");
 386             } else if (str.contains("\"")) {
 387                 // Contains quotes and maybe commas.  Double-quote it and
 388                 // replace quotes inside.
 389                 result.append("\"");
 390                 for (int j = 0; j < str.length(); j++) {
 391                     char ch = str.charAt(j);
 392                     result.append(ch);
 393                     if (ch == '\"') {
 394                         result.append("\"");
 395                     }
 396                 }
 397                 result.append("\"");
 398             }
 399
 400             if (i < list.size() - 1) {
 401                 result.append(",");
 402             }
 403             i++;
 404         }
 405         return result.toString();
 406     }
 407
 408     /**
 409      * Determine display width of a Unicode code point.
 410      *
 411      * @param ch the code point, can be char
 412      * @return the number of text cell columns required to display this code
 413      * point, one of 0, 1, or 2
 414      */
 415     public static int width(final int ch) {
 416         /*
 417          * This routine is a modified version of mk_wcwidth() available
 418          * at: http://www.cl.cam.ac.uk/~mgk25/ucs/wcwidth.c
 419          *
 420          * The combining characters list has been omitted from this
 421          * implementation.  Hopefully no users will be impacted.
 422          */
 423
 424         // 8-bit control characters: width 0
 425         if (ch == 0) {
 426             return 0;
 427         }
 428         if ((ch < 32) || ((ch >= 0x7f) && (ch < 0xa0))) {
 429             return 0;
 430         }
 431
 432         // All others: either 1 or 2
 433         if ((ch >= 0x1100)
 434             && ((ch <= 0x115f)
 435                 // Hangul Jamo init. consonants
 436                 || (ch == 0x2329)
 437                 || (ch == 0x232a)
 438                 // CJK ... Yi
 439                 || ((ch >= 0x2e80) && (ch <= 0xa4cf) && (ch != 0x303f))
 440                 // Hangul Syllables
 441                 || ((ch >= 0xac00) && (ch <= 0xd7a3))
 442                 // CJK Compatibility Ideographs
 443                 || ((ch >= 0xf900) && (ch <= 0xfaff))
 444                 // Vertical forms
 445                 || ((ch >= 0xfe10) && (ch <= 0xfe19))
 446                 // CJK Compatibility Forms
 447                 || ((ch >= 0xfe30) && (ch <= 0xfe6f))
 448                 // Fullwidth Forms
 449                 || ((ch >= 0xff00) && (ch <= 0xff60))
 450                 || ((ch >= 0xffe0) && (ch <= 0xffe6))
 451                 || ((ch >= 0x20000) && (ch <= 0x2fffd))
 452                 || ((ch >= 0x30000) && (ch <= 0x3fffd))
 453                 // emoji
 454                 || ((ch >= 0x1f004) && (ch <= 0x1fffd))
 455             )
 456         ) {
 457             return 2;
 458         }
 459         return 1;
 460     }
 461
 462     /**
 463      * Determine display width of a string.  This ASSUMES that no characters
 464      * are combining.  Hopefully no users will be impacted.
 465      *
 466      * @param str the string
 467      * @return the number of text cell columns required to display this string
 468      */
 469     public static int width(final String str) {
 470         int n = 0;
 471         for (int i = 0; i < str.length();) {
 472             int ch = str.codePointAt(i);
 473             n += width(ch);
 474             i += Character.charCount(ch);
 475         }
 476         return n;
 477     }
 478
 479     /**
 480      * Check if character is in the CJK range.
 481      *
 482      * @param ch character to check
 483      * @return true if this character is in the CJK range
 484      */
 485     public static boolean isCjk(final int ch) {
 486         return ((ch >= 0x2e80) && (ch <= 0x9fff));
 487     }
 488
 489     /**
 490      * Check if character is in the emoji range.
 491      *
 492      * @param ch character to check
 493      * @return true if this character is in the emoji range
 494      */
 495     public static boolean isEmoji(final int ch) {
 496         return ((ch >= 0x1f004) && (ch <= 0x1fffd));
 497     }
 498
 499     // ------------------------------------------------------------------------
 500     // Base64 -----------------------------------------------------------------
 501     // ------------------------------------------------------------------------
 502
 503     /*
 504      * The Base64 encoder/decoder below is provided to support JDK 1.6 - JDK
 505      * 11.  It was taken from https://sourceforge.net/projects/migbase64/
 506      *
 507      * The following changes were made:
 508      *
 509      * - Code has been indented and long lines cut to fit within 80 columns.
 510      *
 511      * - Char, String, and "fast" byte functions removed.  byte versions
 512      *   retained and called toBase64()/fromBase64().
 513      *
 514      * - Enclosing braces added to blocks.
 515      */
 516
 517     /**
 518      * A very fast and memory efficient class to encode and decode to and
 519      * from BASE64 in full accordance with RFC 2045.<br><br> On Windows XP
 520      * sp1 with 1.4.2_04 and later ;), this encoder and decoder is about 10
 521      * times faster on small arrays (10 - 1000 bytes) and 2-3 times as fast
 522      * on larger arrays (10000 - 1000000 bytes) compared to
 523      * <code>sun.misc.Encoder()/Decoder()</code>.<br><br>
 524      *
 525      * On byte arrays the encoder is about 20% faster than Jakarta Commons
 526      * Base64 Codec for encode and about 50% faster for decoding large
 527      * arrays. This implementation is about twice as fast on very small
 528      * arrays (&lt 30 bytes). If source/destination is a <code>String</code>
 529      * this version is about three times as fast due to the fact that the
 530      * Commons Codec result has to be recoded to a <code>String</code> from
 531      * <code>byte[]</code>, which is very expensive.<br><br>
 532      *
 533      * This encode/decode algorithm doesn't create any temporary arrays as
 534      * many other codecs do, it only allocates the resulting array. This
 535      * produces less garbage and it is possible to handle arrays twice as
 536      * large as algorithms that create a temporary array. (E.g. Jakarta
 537      * Commons Codec). It is unknown whether Sun's
 538      * <code>sun.misc.Encoder()/Decoder()</code> produce temporary arrays but
 539      * since performance is quite low it probably does.<br><br>
 540      *
 541      * The encoder produces the same output as the Sun one except that the
 542      * Sun's encoder appends a trailing line separator if the last character
 543      * isn't a pad. Unclear why but it only adds to the length and is
 544      * probably a side effect. Both are in conformance with RFC 2045
 545      * though.<br> Commons codec seem to always att a trailing line
 546      * separator.<br><br>
 547      *
 548      * <b>Note!</b> The encode/decode method pairs (types) come in three
 549      * versions with the <b>exact</b> same algorithm and thus a lot of code
 550      * redundancy. This is to not create any temporary arrays for transcoding
 551      * to/from different format types. The methods not used can simply be
 552      * commented out.<br><br>
 553      *
 554      * There is also a "fast" version of all decode methods that works the
 555      * same way as the normal ones, but har a few demands on the decoded
 556      * input. Normally though, these fast verions should be used if the
 557      * source if the input is known and it hasn't bee tampered with.<br><br>
 558      *
 559      * If you find the code useful or you find a bug, please send me a note
 560      * at base64 @ miginfocom . com.
 561      *
 562      * Licence (BSD):
 563      * ==============
 564      *
 565      * Copyright (c) 2004, Mikael Grev, MiG InfoCom AB. (base64 @ miginfocom
 566      * . com) All rights reserved.
 567      *
 568      * Redistribution and use in source and binary forms, with or without
 569      * modification, are permitted provided that the following conditions are
 570      * met: Redistributions of source code must retain the above copyright
 571      * notice, this list of conditions and the following disclaimer.
 572      * Redistributions in binary form must reproduce the above copyright
 573      * notice, this list of conditions and the following disclaimer in the
 574      * documentation and/or other materials provided with the distribution.
 575      * Neither the name of the MiG InfoCom AB nor the names of its
 576      * contributors may be used to endorse or promote products derived from
 577      * this software without specific prior written permission.
 578      *
 579      * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 580      * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 581      * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 582      * A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT
 583      * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 584      * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 585      * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 586      * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 587      * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 588      * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 589      * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 590      *
 591      * @version 2.2
 592      * @author Mikael Grev
 593      *         Date: 2004-aug-02
 594      *         Time: 11:31:11
 595      */
 596
 597     private static final char[] CA = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/".toCharArray();
 598     private static final int[] IA = new int[256];
 599     static {
 600         Arrays.fill(IA, -1);
 601         for (int i = 0, iS = CA.length; i < iS; i++) {
 602             IA[CA[i]] = i;
 603         }
 604         IA['='] = 0;
 605     }
 606
 607     /**
 608      * Encodes a raw byte array into a BASE64 <code>byte[]</code>
 609      * representation i accordance with RFC 2045.
 610      * @param sArr The bytes to convert. If <code>null</code> or length 0
 611      * an empty array will be returned.
 612      * @return A BASE64 encoded array. Never <code>null</code>.
 613      */
 614     public final static String toBase64(byte[] sArr) {
 615         // Check special case
 616         int sLen = sArr != null ? sArr.length : 0;
 617         if (sLen == 0) {
 618             return "";
 619         }
 620
 621         final boolean lineSep = true;
 622
 623         int eLen = (sLen / 3) * 3;                              // Length of even 24-bits.
 624         int cCnt = ((sLen - 1) / 3 + 1) << 2;                   // Returned character count
 625         int dLen = cCnt + (lineSep ? (cCnt - 1) / 76 << 1 : 0); // Length of returned array
 626         byte[] dArr = new byte[dLen];
 627
 628         // Encode even 24-bits
 629         for (int s = 0, d = 0, cc = 0; s < eLen;) {
 630             // Copy next three bytes into lower 24 bits of int, paying
 631             // attension to sign.
 632             int i = (sArr[s++] & 0xff) << 16 | (sArr[s++] & 0xff) << 8 | (sArr[s++] & 0xff);
 633
 634             // Encode the int into four chars
 635             dArr[d++] = (byte) CA[(i >>> 18) & 0x3f];
 636             dArr[d++] = (byte) CA[(i >>> 12) & 0x3f];
 637             dArr[d++] = (byte) CA[(i >>> 6) & 0x3f];
 638             dArr[d++] = (byte) CA[i & 0x3f];
 639
 640             // Add optional line separator
 641             if (lineSep && ++cc == 19 && d < dLen - 2) {
 642                 dArr[d++] = '\r';
 643                 dArr[d++] = '\n';
 644                 cc = 0;
 645             }
 646         }
 647
 648         // Pad and encode last bits if source isn't an even 24 bits.
 649         int left = sLen - eLen; // 0 - 2.
 650         if (left > 0) {
 651             // Prepare the int
 652             int i = ((sArr[eLen] & 0xff) << 10) | (left == 2 ? ((sArr[sLen - 1] & 0xff) << 2) : 0);
 653
 654             // Set last four chars
 655             dArr[dLen - 4] = (byte) CA[i >> 12];
 656             dArr[dLen - 3] = (byte) CA[(i >>> 6) & 0x3f];
 657             dArr[dLen - 2] = left == 2 ? (byte) CA[i & 0x3f] : (byte) '=';
 658             dArr[dLen - 1] = '=';
 659         }
 660         try {
 661             return new String(dArr, "UTF-8");
 662         } catch (java.io.UnsupportedEncodingException e) {
 663             throw new IllegalArgumentException(e);
 664         }
 665
 666     }
 667
 668     /**
 669      * Decodes a BASE64 encoded byte array. All illegal characters will
 670      * be ignored and can handle both arrays with and without line
 671      * separators.
 672      * @param sArr The source array. Length 0 will return an empty
 673      * array. <code>null</code> will throw an exception.
 674      * @return The decoded array of bytes. May be of length 0. Will be
 675      * <code>null</code> if the legal characters (including '=') isn't
 676      * divideable by 4. (I.e. definitely corrupted).
 677      */
 678     public final static byte[] fromBase64(byte[] sArr) {
 679         // Check special case
 680         int sLen = sArr.length;
 681
 682         // Count illegal characters (including '\r', '\n') to know what
 683         // size the returned array will be, so we don't have to
 684         // reallocate & copy it later.
 685         int sepCnt = 0; // Number of separator characters. (Actually illegal characters, but that's a bonus...)
 686         for (int i = 0; i < sLen; i++) {
 687             // If input is "pure" (I.e. no line separators or illegal chars)
 688             // base64 this loop can be commented out.
 689             if (IA[sArr[i] & 0xff] < 0) {
 690                 sepCnt++;
 691             }
 692         }
 693
 694         // Check so that legal chars (including '=') are evenly
 695         // divideable by 4 as specified in RFC 2045.
 696         if ((sLen - sepCnt) % 4 != 0) {
 697             return null;
 698         }
 699
 700         int pad = 0;
 701         for (int i = sLen; i > 1 && IA[sArr[--i] & 0xff] <= 0;) {
 702             if (sArr[i] == '=') {
 703                 pad++;
 704             }
 705         }
 706
 707         int len = ((sLen - sepCnt) * 6 >> 3) - pad;
 708
 709         byte[] dArr = new byte[len];       // Preallocate byte[] of exact length
 710
 711         for (int s = 0, d = 0; d < len;) {
 712             // Assemble three bytes into an int from four "valid" characters.
 713             int i = 0;
 714             for (int j = 0; j < 4; j++) {   // j only increased if a valid char was found.
 715                 int c = IA[sArr[s++] & 0xff];
 716                 if (c >= 0) {
 717                     i |= c << (18 - j * 6);
 718                 } else {
 719                     j--;
 720                 }
 721             }
 722
 723             // Add the bytes
 724             dArr[d++] = (byte) (i >> 16);
 725             if (d < len) {
 726                 dArr[d++]= (byte) (i >> 8);
 727                 if (d < len) {
 728                     dArr[d++] = (byte) i;
 729                 }
 730             }
 731         }
 732
 733         return dArr;
 734     }
 735
 736 }