111 lines
4.1 KiB
Java
111 lines
4.1 KiB
Java
|
|
||
|
/*
|
||
|
* Janino - An embedded Java[TM] compiler
|
||
|
*
|
||
|
* Copyright (c) 2001-2010, Arno Unkrig
|
||
|
* All rights reserved.
|
||
|
*
|
||
|
* Redistribution and use in source and binary forms, with or without modification, are permitted provided that the
|
||
|
* following conditions are met:
|
||
|
*
|
||
|
* 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the
|
||
|
* following disclaimer.
|
||
|
* 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the
|
||
|
* following disclaimer in the documentation and/or other materials provided with the distribution.
|
||
|
* 3. The name of the author may not be used to endorse or promote products derived from this software without
|
||
|
* specific prior written permission.
|
||
|
*
|
||
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||
|
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
|
||
|
* THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
||
|
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||
|
* POSSIBILITY OF SUCH DAMAGE.
|
||
|
*/
|
||
|
|
||
|
package org.codehaus.janino;
|
||
|
|
||
|
import java.io.FilterReader;
|
||
|
import java.io.IOException;
|
||
|
import java.io.Reader;
|
||
|
|
||
|
/**
|
||
|
* A {@link FilterReader} that unescapes the "Unicode Escapes" as described in JLS7 3.10.6.
|
||
|
* <p>
|
||
|
* Notice that it is possible to formulate invalid escape sequences, e.g. "\u123g" ("g" is not a valid hex
|
||
|
* character). This is handled by throwing a {@link java.lang.RuntimeException}-derived {@link
|
||
|
* org.codehaus.janino.UnicodeUnescapeException}.
|
||
|
*/
|
||
|
public
|
||
|
class UnicodeUnescapeReader extends FilterReader {
|
||
|
|
||
|
public
|
||
|
UnicodeUnescapeReader(Reader in) { super(in); }
|
||
|
|
||
|
/**
|
||
|
* Override {@link FilterReader#read()}.
|
||
|
*
|
||
|
* @throws UnicodeUnescapeException Invalid escape sequence encountered
|
||
|
*/
|
||
|
@Override public int
|
||
|
read() throws IOException {
|
||
|
int c;
|
||
|
|
||
|
// Read next character.
|
||
|
if (this.unreadChar == -1) {
|
||
|
c = this.in.read();
|
||
|
} else {
|
||
|
c = this.unreadChar;
|
||
|
this.unreadChar = -1;
|
||
|
}
|
||
|
|
||
|
// Check for backslash-u escape sequence, preceeded with an even number
|
||
|
// of backslashes.
|
||
|
if (c != '\\' || this.oddPrecedingBackslashes) {
|
||
|
this.oddPrecedingBackslashes = false;
|
||
|
return c;
|
||
|
}
|
||
|
|
||
|
// Read one character ahead and check if it is a "u".
|
||
|
c = this.in.read();
|
||
|
if (c != 'u') {
|
||
|
this.unreadChar = c;
|
||
|
this.oddPrecedingBackslashes = true;
|
||
|
return '\\';
|
||
|
}
|
||
|
|
||
|
// Skip redundant "u"s.
|
||
|
do {
|
||
|
c = this.in.read();
|
||
|
if (c == -1) throw new UnicodeUnescapeException("Incomplete escape sequence");
|
||
|
} while (c == 'u');
|
||
|
|
||
|
// Decode escape sequence.
|
||
|
char[] ca = new char[4];
|
||
|
ca[0] = (char) c;
|
||
|
if (this.in.read(ca, 1, 3) != 3) throw new UnicodeUnescapeException("Incomplete escape sequence");
|
||
|
try {
|
||
|
return 0xffff & Integer.parseInt(new String(ca), 16);
|
||
|
} catch (NumberFormatException ex) {
|
||
|
throw new UnicodeUnescapeException("Invalid escape sequence \"\\u" + new String(ca) + "\"", ex);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/** Overrides {@link FilterReader#read(char[], int, int)}. */
|
||
|
@Override public int
|
||
|
read(char[] cbuf, int off, int len) throws IOException {
|
||
|
if (len == 0) return 0;
|
||
|
int res = 0;
|
||
|
do {
|
||
|
int c = this.read();
|
||
|
if (c == -1) break;
|
||
|
cbuf[off++] = (char) c;
|
||
|
} while (++res < len);
|
||
|
return res == 0 ? -1 : res;
|
||
|
}
|
||
|
|
||
|
private int unreadChar = -1; // -1 == none
|
||
|
private boolean oddPrecedingBackslashes;
|
||
|
}
|