/* * @(#)Base64.java * * Copyright 2003-2004 Sun Microsystems, Inc. All Rights Reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistribution of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * * 2. Redistribution in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * Neither the name of Sun Microsystems, Inc. or the names of contributors may * be used to endorse or promote products derived from this software without * specific prior written permission. * * This software is provided "AS IS," without a warranty of any kind. ALL * EXPRESS OR IMPLIED CONDITIONS, REPRESENTATIONS AND WARRANTIES, INCLUDING * ANY IMPLIED WARRANTY OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE * OR NON-INFRINGEMENT, ARE HEREBY EXCLUDED. SUN MICROSYSTEMS, INC. ("SUN") * AND ITS LICENSORS SHALL NOT BE LIABLE FOR ANY DAMAGES SUFFERED BY LICENSEE * AS A RESULT OF USING, MODIFYING OR DISTRIBUTING THIS SOFTWARE OR ITS * DERIVATIVES. IN NO EVENT WILL SUN OR ITS LICENSORS BE LIABLE FOR ANY LOST * REVENUE, PROFIT OR DATA, OR FOR DIRECT, INDIRECT, SPECIAL, CONSEQUENTIAL, * INCIDENTAL OR PUNITIVE DAMAGES, HOWEVER CAUSED AND REGARDLESS OF THE THEORY * OF LIABILITY, ARISING OUT OF THE USE OF OR INABILITY TO USE THIS SOFTWARE, * EVEN IF SUN HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. * * You acknowledge that this software is not designed or intended for use in * the design, construction, operation or maintenance of any nuclear facility. */ package com.sun.xacml.attr; import java.io.IOException; import java.io.ByteArrayOutputStream; /** * Class that knows how to encode and decode Base64 values. Base64 * Content-Transfer-Encoding rules are defined in Section 6.8 of IETF RFC 2045 * <i>Multipurpose Internet Mail Extensions (MIME) Part One: Format of Internet * Message Bodies</i>, available at <a * href="ftp://ftp.isi.edu/in-notes/rfc2045.txt"> * <code>ftp://ftp.isi.edu/in-notes/rfc2045.txt</code></a>. * <p> * All methods of this class are static and thread-safe. * * @since 1.0 * @author Anne Anderson */ class Base64 { /* * ASCII white-space characters. These are the ones recognized by the * C and Java language [pre-processors]. */ private static final char SPACE = 0x20; /* space, or blank, character */ private static final char ETX = 0x04; /* end-of-text character */ private static final char VTAB = 0x0b; /* vertical tab character */ private static final char FF = 0x0c; /* form-feed character */ private static final char HTAB = 0x09; /* horizontal tab character */ private static final char LF = 0x0a; /* line feed character */ private static final char ALTLF = 0x13; /* line feed on some systems */ private static final char CR = 0x0d; /* carriage-return character */ /* * String used for BASE64 encoding and decoding. * * For index values 0-63, the character at each index is the Base-64 * encoded value of the index value. Index values beyond 63 are never * referenced during encoding, but are used in this implementation to * help in decoding. The character at index 64 is the Base64 pad * character '='. * * Charaters in index positions 0-64 MUST NOT be moved or altered, as * this will break the implementation. * * The characters after index 64 are white space characters that should be * ignored in Base64-encoded input strings while doing decoding. Note that * the white-space character set should include values used on various * platforms, since a Base64-encoded value may have been generated on a * non-Java platform. The values included here are those used in Java and * in C. * * The white-space character set may be modified without affecting the * implementation of the encoding algorithm. */ private static final String BASE64EncodingString = "ABCDEFGHIJ" + "KLMNOPQRST" + "UVWXYZabcd" + "efghijklmn" + "opqrstuvwx" + "yz01234567" + "89+/" + "=" + SPACE + ETX + VTAB + FF + HTAB + LF + ALTLF + CR; // Index of pad character in Base64EncodingString private static final int PAD_INDEX = 64; /* * The character in Base64EncodingString with the maximum * character value in Unicode. */ private static final int MAX_BASE64_CHAR = 'z'; /* * Array for mapping encoded characters to decoded values. * This array is initialized when needed by calling * initDecodeArray(). Only includes entries up to * MAX_BASE64_CHAR. */ private static int [] Base64DecodeArray = null; /* * State values used for decoding a quantum of four encoded input * characters as follows. * * Initial state: NO_CHARS_DECODED * NO_CHARS_DECODED: no characters have been decoded * on encoded char: decode char into output quantum; * new state: ONE_CHAR_DECODED * otherwise: Exception * ONE_CHAR_DECODED: one character has been decoded * on encoded char: decode char into output quantum; * new state: TWO_CHARS_DECODED * otherwise: Exception * TWO_CHARS_DECODED: two characters have been decoded * on encoded char: decode char into output quantum; * new state: THREE_CHARS_DECODED * on pad: write quantum byte 0 to output; * new state: PAD_THREE_READ * THREE_CHARS_DECODED: three characters have been decoded * on encoded char: decode char into output quantum; * write quantum bytes 0-2 to output; * new state: NO_CHARS_DECODED * on pad: write quantum bytes 0-1 to output; * new state: PAD_FOUR_READ * PAD_THREE_READ: pad character has been read as 3rd of 4 chars * on pad: new state: PAD_FOUR_READ * otherwise: Exception * PAD_FOUR_READ: pad character has been read as 4th of 4 char * on any char: Exception * * The valid terminal states are NO_CHARS_DECODED and PAD_FOUR_READ. */ private static final int NO_CHARS_DECODED = 0; private static final int ONE_CHAR_DECODED = 1; private static final int TWO_CHARS_DECODED = 2; private static final int THREE_CHARS_DECODED = 3; private static final int PAD_THREE_READ = 5; private static final int PAD_FOUR_READ = 6; /** * The maximum number of groups that should be encoded * onto a single line (so we don't exceed 76 characters * per line). */ private static final int MAX_GROUPS_PER_LINE = 76/4; /** * Encodes the input byte array into a Base64-encoded * <code>String</code>. The output <code>String</code> * has a CR LF (0x0d 0x0a) after every 76 bytes, but * not at the end. * <p> * <b>WARNING</b>: If the input byte array is modified * while encoding is in progress, the output is undefined. * * @param binaryValue the byte array to be encoded * * @return the Base64-encoded <code>String</code> */ public static String encode(byte[] binaryValue) { int binaryValueLen = binaryValue.length; // Estimated output length (about 1.4x input, due to CRLF) int maxChars = (binaryValueLen * 7) / 5; // Buffer for encoded output StringBuffer sb = new StringBuffer(maxChars); int groupsToEOL = MAX_GROUPS_PER_LINE; // Convert groups of 3 input bytes, with pad if < 3 in final for (int binaryValueNdx = 0; binaryValueNdx < binaryValueLen; binaryValueNdx += 3) { // Encode 1st 6-bit group int group1 = (binaryValue[binaryValueNdx] >> 2) & 0x3F; sb.append(BASE64EncodingString.charAt(group1)); // Encode 2nd 6-bit group int group2 = (binaryValue[binaryValueNdx] << 4) & 0x030; if ((binaryValueNdx+1) < binaryValueLen) { group2 = group2 | ((binaryValue[binaryValueNdx+1] >> 4) & 0xF); } sb.append(BASE64EncodingString.charAt(group2)); // Encode 3rd 6-bit group int group3; if ((binaryValueNdx+1) < binaryValueLen) { group3 = (binaryValue[binaryValueNdx+1] << 2) & 0x03C; if ((binaryValueNdx+2) < binaryValueLen) { group3 = group3 | ((binaryValue[binaryValueNdx+2] >> 6) & 0x3); } } else { group3 = PAD_INDEX; } sb.append(BASE64EncodingString.charAt(group3)); // Encode 4th 6-bit group int group4; if ((binaryValueNdx+2) < binaryValueLen) { group4 = binaryValue[binaryValueNdx+2] & 0x3F; } else { group4 = PAD_INDEX; } sb.append(BASE64EncodingString.charAt(group4)); // After every MAX_GROUPS_PER_LINE groups, insert CR LF. // Unless this is the final line, in which case we skip that. groupsToEOL = groupsToEOL - 1; if (groupsToEOL == 0) { groupsToEOL = MAX_GROUPS_PER_LINE; if ((binaryValueNdx+3) <= binaryValueLen) { sb.append(CR); sb.append(LF); } } } return sb.toString(); } /** * Initializes Base64DecodeArray, if this hasn't already been * done. */ private static synchronized void initDecodeArray() { if (Base64DecodeArray != null) { return; } int [] ourArray = new int [MAX_BASE64_CHAR+1]; for (int i = 0; i <= MAX_BASE64_CHAR; i++) { ourArray[i] = BASE64EncodingString.indexOf(i); } Base64DecodeArray = ourArray; } /** * Decodes a Base64-encoded <code>String</code>. The result * is returned in a byte array that should match the original * binary value (before encoding). Whitespace characters * in the input <code>String</code> are ignored. * <p> * If the <code>ignoreBadChars</code> parameter is * <code>true</code>, characters that are not allowed * in a BASE64-encoded string are ignored. Otherwise, * they cause an <code>IOException</code> to be raised. * * @param encoded a <code>String</code> containing a * Base64-encoded value * @param ignoreBadChars If <code>true</code>, bad characters * are ignored. Otherwise, they cause * an <code>IOException</code> to be * raised. * * @return a byte array containing the decoded value * * @throws IOException if the input <code>String</code> is not * a valid Base64-encoded value */ public static byte[] decode(String encoded, boolean ignoreBadChars) throws IOException { int encodedLen = encoded.length(); int maxBytes = (encodedLen/4)*3; /* Maximum possible output bytes */ ByteArrayOutputStream ba = /* Buffer for decoded output */ new ByteArrayOutputStream(maxBytes); byte[] quantum = new byte[3]; /* one output quantum */ // ensure Base64DecodeArray is initialized initDecodeArray(); /* * Every 4 encoded characters in input are converted to 3 bytes of * output. This is called one "quantum". Each encoded character is * mapped to one 6-bit unit of the output. Whitespace characters in * the input are passed over; they are not included in the output. */ int state = NO_CHARS_DECODED; for (int encodedNdx = 0; encodedNdx < encodedLen; encodedNdx++) { // Turn encoded char into decoded value int encodedChar = encoded.charAt(encodedNdx); int decodedChar; if (encodedChar > MAX_BASE64_CHAR) { decodedChar = -1; } else { decodedChar = Base64DecodeArray[encodedChar]; } // Handle white space and invalid characters if (decodedChar == -1) { if (ignoreBadChars) { continue; } throw new IOException("Invalid character"); } if (decodedChar > PAD_INDEX) { /* whitespace */ continue; } // Handle valid characters switch (state) { case NO_CHARS_DECODED: if (decodedChar == PAD_INDEX) { throw new IOException("Pad character in invalid position"); } quantum[0] = (byte) ((decodedChar << 2) & 0xFC); state = ONE_CHAR_DECODED; break; case ONE_CHAR_DECODED: if (decodedChar == PAD_INDEX) { throw new IOException("Pad character in invalid position"); } quantum[0] = (byte) (quantum[0] | ((decodedChar >> 4) & 0x3)); quantum[1] = (byte) ((decodedChar << 4) & 0xF0); state = TWO_CHARS_DECODED; break; case TWO_CHARS_DECODED: if (decodedChar == PAD_INDEX) { ba.write(quantum, 0, 1); state = PAD_THREE_READ; } else { quantum[1] = (byte) (quantum[1] | ((decodedChar >> 2) & 0x0F)); quantum[2] = (byte) ((decodedChar << 6) & 0xC0); state = THREE_CHARS_DECODED; } break; case THREE_CHARS_DECODED: if (decodedChar == PAD_INDEX) { ba.write(quantum, 0, 2); state = PAD_FOUR_READ; } else { quantum[2] = (byte) (quantum[2] | decodedChar); ba.write(quantum, 0, 3); state = NO_CHARS_DECODED; } break; case PAD_THREE_READ: if (decodedChar != PAD_INDEX) { throw new IOException("Missing pad character"); } state = PAD_FOUR_READ; break; case PAD_FOUR_READ: throw new IOException("Invalid input follows pad character"); } } // Test valid terminal states if (state != NO_CHARS_DECODED && state != PAD_FOUR_READ) { throw new IOException("Invalid sequence of input characters"); } return ba.toByteArray(); } }