/* |
|
* Copyright (c) 1995, 2001, Oracle and/or its affiliates. All rights reserved. |
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
|
* |
|
* This code is free software; you can redistribute it and/or modify it |
|
* under the terms of the GNU General Public License version 2 only, as |
|
* published by the Free Software Foundation. Oracle designates this |
|
* particular file as subject to the "Classpath" exception as provided |
|
* by Oracle in the LICENSE file that accompanied this code. |
|
* |
|
* This code is distributed in the hope that it will be useful, but WITHOUT |
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
|
* version 2 for more details (a copy is included in the LICENSE file that |
|
* accompanied this code). |
|
* |
|
* You should have received a copy of the GNU General Public License version |
|
* 2 along with this work; if not, write to the Free Software Foundation, |
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
|
* |
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
|
* or visit www.oracle.com if you need additional information or have any |
|
* questions. |
|
*/ |
|
package sun.misc; |
|
import java.io.PushbackInputStream; |
|
import java.io.OutputStream; |
|
import java.io.PrintStream; |
|
import java.io.IOException; |
|
/** |
|
* This class implements a Berkeley uu character decoder. This decoder |
|
* was made famous by the uudecode program. |
|
* |
|
* The basic character coding is algorithmic, taking 6 bits of binary |
|
* data and adding it to an ASCII ' ' (space) character. This converts |
|
* these six bits into a printable representation. Note that it depends |
|
* on the ASCII character encoding standard for english. Groups of three |
|
* bytes are converted into 4 characters by treating the three bytes |
|
* a four 6 bit groups, group 1 is byte 1's most significant six bits, |
|
* group 2 is byte 1's least significant two bits plus byte 2's four |
|
* most significant bits. etc. |
|
* |
|
* In this encoding, the buffer prefix is: |
|
* <pre> |
|
* begin [mode] [filename] |
|
* </pre> |
|
* |
|
* This is followed by one or more lines of the form: |
|
* <pre> |
|
* (len)(data)(data)(data) ... |
|
* </pre> |
|
* where (len) is the number of bytes on this line. Note that groupings |
|
* are always four characters, even if length is not a multiple of three |
|
* bytes. When less than three characters are encoded, the values of the |
|
* last remaining bytes is undefined and should be ignored. |
|
* |
|
* The last line of data in a uuencoded buffer is represented by a single |
|
* space character. This is translated by the decoding engine to a line |
|
* length of zero. This is immediately followed by a line which contains |
|
* the word 'end[newline]' |
|
* |
|
* If an error is encountered during decoding this class throws a |
|
* CEFormatException. The specific detail messages are: |
|
* |
|
* <pre> |
|
* "UUDecoder: No begin line." |
|
* "UUDecoder: Malformed begin line." |
|
* "UUDecoder: Short Buffer." |
|
* "UUDecoder: Bad Line Length." |
|
* "UUDecoder: Missing 'end' line." |
|
* </pre> |
|
* |
|
* @author Chuck McManis |
|
* @see CharacterDecoder |
|
* @see UUEncoder |
|
*/ |
|
public class UUDecoder extends CharacterDecoder { |
|
/** |
|
* This string contains the name that was in the buffer being decoded. |
|
*/ |
|
public String bufferName; |
|
/** |
|
* Represents UNIX(tm) mode bits. Generally three octal digits |
|
* representing read, write, and execute permission of the owner, |
|
* group owner, and others. They should be interpreted as the bit groups: |
|
* <pre> |
|
* (owner) (group) (others) |
|
* rwx rwx rwx (r = read, w = write, x = execute) |
|
*</pre> |
|
* |
|
*/ |
|
public int mode; |
|
/** |
|
* UU encoding specifies 3 bytes per atom. |
|
*/ |
|
protected int bytesPerAtom() { |
|
return (3); |
|
} |
|
/** |
|
* All UU lines have 45 bytes on them, for line length of 15*4+1 or 61 |
|
* characters per line. |
|
*/ |
|
protected int bytesPerLine() { |
|
return (45); |
|
} |
|
/** This is used to decode the atoms */ |
|
private byte decoderBuffer[] = new byte[4]; |
|
/** |
|
* Decode a UU atom. Note that if l is less than 3 we don't write |
|
* the extra bits, however the encoder always encodes 4 character |
|
* groups even when they are not needed. |
|
*/ |
|
protected void decodeAtom(PushbackInputStream inStream, OutputStream outStream, int l) |
|
throws IOException { |
|
int i, c1, c2, c3, c4; |
|
int a, b, c; |
|
StringBuffer x = new StringBuffer(); |
|
for (i = 0; i < 4; i++) { |
|
c1 = inStream.read(); |
|
if (c1 == -1) { |
|
throw new CEStreamExhausted(); |
|
} |
|
x.append((char)c1); |
|
decoderBuffer[i] = (byte) ((c1 - ' ') & 0x3f); |
|
} |
|
a = ((decoderBuffer[0] << 2) & 0xfc) | ((decoderBuffer[1] >>> 4) & 3); |
|
b = ((decoderBuffer[1] << 4) & 0xf0) | ((decoderBuffer[2] >>> 2) & 0xf); |
|
c = ((decoderBuffer[2] << 6) & 0xc0) | (decoderBuffer[3] & 0x3f); |
|
outStream.write((byte)(a & 0xff)); |
|
if (l > 1) { |
|
outStream.write((byte)( b & 0xff)); |
|
} |
|
if (l > 2) { |
|
outStream.write((byte)(c&0xff)); |
|
} |
|
} |
|
/** |
|
* For uuencoded buffers, the data begins with a line of the form: |
|
* begin MODE FILENAME |
|
* This line always starts in column 1. |
|
*/ |
|
protected void decodeBufferPrefix(PushbackInputStream inStream, OutputStream outStream) throws IOException { |
|
int c; |
|
StringBuffer q = new StringBuffer(32); |
|
String r; |
|
boolean sawNewLine; |
|
/* |
|
* This works by ripping through the buffer until it finds a 'begin' |
|
* line or the end of the buffer. |
|
*/ |
|
sawNewLine = true; |
|
while (true) { |
|
c = inStream.read(); |
|
if (c == -1) { |
|
throw new CEFormatException("UUDecoder: No begin line."); |
|
} |
|
if ((c == 'b') && sawNewLine){ |
|
c = inStream.read(); |
|
if (c == 'e') { |
|
break; |
|
} |
|
} |
|
sawNewLine = (c == '\n') || (c == '\r'); |
|
} |
|
/* |
|
* Now we think its begin, (we've seen ^be) so verify it here. |
|
*/ |
|
while ((c != '\n') && (c != '\r')) { |
|
c = inStream.read(); |
|
if (c == -1) { |
|
throw new CEFormatException("UUDecoder: No begin line."); |
|
} |
|
if ((c != '\n') && (c != '\r')) { |
|
q.append((char)c); |
|
} |
|
} |
|
r = q.toString(); |
|
if (r.indexOf(' ') != 3) { |
|
throw new CEFormatException("UUDecoder: Malformed begin line."); |
|
} |
|
mode = Integer.parseInt(r.substring(4,7)); |
|
bufferName = r.substring(r.indexOf(' ',6)+1); |
|
/* |
|
* Check for \n after \r |
|
*/ |
|
if (c == '\r') { |
|
c = inStream.read (); |
|
if ((c != '\n') && (c != -1)) |
|
inStream.unread (c); |
|
} |
|
} |
|
/** |
|
* In uuencoded buffers, encoded lines start with a character that |
|
* represents the number of bytes encoded in this line. The last |
|
* line of input is always a line that starts with a single space |
|
* character, which would be a zero length line. |
|
*/ |
|
protected int decodeLinePrefix(PushbackInputStream inStream, OutputStream outStream) throws IOException { |
|
int c; |
|
c = inStream.read(); |
|
if (c == ' ') { |
|
c = inStream.read(); /* discard the (first)trailing CR or LF */ |
|
c = inStream.read(); /* check for a second one */ |
|
if ((c != '\n') && (c != -1)) |
|
inStream.unread (c); |
|
throw new CEStreamExhausted(); |
|
} else if (c == -1) { |
|
throw new CEFormatException("UUDecoder: Short Buffer."); |
|
} |
|
c = (c - ' ') & 0x3f; |
|
if (c > bytesPerLine()) { |
|
throw new CEFormatException("UUDecoder: Bad Line Length."); |
|
} |
|
return (c); |
|
} |
|
/** |
|
* Find the end of the line for the next operation. |
|
* The following sequences are recognized as end-of-line |
|
* CR, CR LF, or LF |
|
*/ |
|
protected void decodeLineSuffix(PushbackInputStream inStream, OutputStream outStream) throws IOException { |
|
int c; |
|
while (true) { |
|
c = inStream.read(); |
|
if (c == -1) { |
|
throw new CEStreamExhausted(); |
|
} |
|
if (c == '\n') { |
|
break; |
|
} |
|
if (c == '\r') { |
|
c = inStream.read(); |
|
if ((c != '\n') && (c != -1)) { |
|
inStream.unread (c); |
|
} |
|
break; |
|
} |
|
} |
|
} |
|
/** |
|
* UUencoded files have a buffer suffix which consists of the word |
|
* end. This line should immediately follow the line with a single |
|
* space in it. |
|
*/ |
|
protected void decodeBufferSuffix(PushbackInputStream inStream, OutputStream outStream) throws IOException { |
|
int c; |
|
c = inStream.read(decoderBuffer); |
|
if ((decoderBuffer[0] != 'e') || (decoderBuffer[1] != 'n') || |
|
(decoderBuffer[2] != 'd')) { |
|
throw new CEFormatException("UUDecoder: Missing 'end' line."); |
|
} |
|
} |
|
} |