diff options
author | Mark Spruiell <mes@zeroc.com> | 2002-08-28 01:16:24 +0000 |
---|---|---|
committer | Mark Spruiell <mes@zeroc.com> | 2002-08-28 01:16:24 +0000 |
commit | 71c8c443160e2dbaae3faec9fe3c0f0193d4d692 (patch) | |
tree | a6b61d979a34b2e791f97bb5f44f1220efa3b286 /java/src/IceInternal/StringUtil.java | |
parent | improving xerces workaround (diff) | |
download | ice-71c8c443160e2dbaae3faec9fe3c0f0193d4d692.tar.bz2 ice-71c8c443160e2dbaae3faec9fe3c0f0193d4d692.tar.xz ice-71c8c443160e2dbaae3faec9fe3c0f0193d4d692.zip |
adding encoding for references, identities
Diffstat (limited to 'java/src/IceInternal/StringUtil.java')
-rw-r--r-- | java/src/IceInternal/StringUtil.java | 270 |
1 files changed, 270 insertions, 0 deletions
diff --git a/java/src/IceInternal/StringUtil.java b/java/src/IceInternal/StringUtil.java index 8a64798de37..119506b3f96 100644 --- a/java/src/IceInternal/StringUtil.java +++ b/java/src/IceInternal/StringUtil.java @@ -75,4 +75,274 @@ public final class StringUtil return -1; } + + private static void + encodeChar(byte b, StringBuffer s, String special) + { + switch(b) + { + case (byte)'\\': + { + s.append("\\\\"); + break; + } + case (byte)'\'': + { + s.append("\\'"); + break; + } + case (byte)'"': + { + s.append("\\\""); + break; + } + case (byte)'\b': + { + s.append("\\b"); + break; + } + case (byte)'\f': + { + s.append("\\f"); + break; + } + case (byte)'\n': + { + s.append("\\n"); + break; + } + case (byte)'\r': + { + s.append("\\r"); + break; + } + case (byte)'\t': + { + s.append("\\t"); + break; + } + default: + { + if(b <= (byte)31 || b == (byte)127) // Bytes are signed in Java (-128 to 127) + { + s.append('\\'); + String octal = Integer.toOctalString(b); + // + // Add leading zeroes so that we avoid problems during + // decoding. For example, consider the encoded string + // \0013 (i.e., a character with value 1 followed by + // the character '3'). If the leading zeroes were omitted, + // the result would be incorrectly interpreted by the + // decoder as a single character with value 11. + // + for(int j = octal.length(); j < 3; j++) + { + s.append('0'); + } + s.append(octal); + } + else if(special != null && special.indexOf((char)b) != -1) + { + s.append('\\'); + encodeChar(b, s, null); + } + else + { + s.append((char)b); + } + } + } + } + + // + // Encodes a string into UTF8, escaping all characters outside the range [32-126] + // as well as any special characters determined by the caller. + // + public static String + encodeString(String s, String special) + { + byte[] bytes = null; + try + { + bytes = s.getBytes("UTF8"); + } + catch(java.io.UnsupportedEncodingException ex) + { + assert(false); + return null; + } + + StringBuffer result = new StringBuffer(bytes.length); + + for(int i = 0; i < bytes.length; i++) + { + encodeChar(bytes[i], result, special); + } + + return result.toString(); + } + + // + // Decodes a UTF8 string. Decoding starts at the given start position + // (inclusive) and stops at the given end position (exclusive). If the end + // position is zero, then the remainder of the string is used. Upon success, + // the result parameter holds the decoded string and true is returned. + // A return value of false indicates an error was detected in the encoding. + // + public static boolean + decodeString(String s, int start, int end, Ice.StringHolder result) + { + final int len = s.length(); + if(end == 0) + { + end = len; + } + assert(start >= 0); + assert(end <= len); + assert(start < end); + + byte[] bytes = new byte[len]; + int bc = 0; + while(start < end) + { + char ch = s.charAt(start); + if(ch == '\\') + { + start++; + if(start == end) + { + return false; // Missing character + } + ch = s.charAt(start); + switch(ch) + { + case '\\': + { + bytes[bc++] = (byte)'\\'; + break; + } + case '\'': + case '"': + { + bytes[bc++] = (byte)ch; + break; + } + case 'b': + { + bytes[bc++] = (byte)'\b'; + break; + } + case 'f': + { + bytes[bc++] = (byte)'\f'; + break; + } + case 'n': + { + bytes[bc++] = (byte)'\n'; + break; + } + case 'r': + { + bytes[bc++] = (byte)'\r'; + break; + } + case 't': + { + bytes[bc++] = (byte)'\t'; + break; + } + case '0': + case '1': + case '2': + case '3': + case '4': + case '5': + case '6': + case '7': + case '8': + case '9': + { + int count = 0; + int val = 0; + while(count < 3 && start < end && s.charAt(start) >= '0' && s.charAt(start) <= '9') + { + val <<= 3; + val |= s.charAt(start) - '0'; + start++; + count++; + } + if(val > 255) + { + return false; // Octal value out of range + } + bytes[bc++] = (byte)val; + continue; // don't increment start + } + default: + { + byte b = (byte)ch; + if(b <= (byte)31 || b == (byte)127) // Bytes are signed in Java (-128 to 127) + { + return false; // Malformed encoding + } + else + { + bytes[bc++] = b; + } + } + } + } + else + { + bytes[bc++] = (byte)ch; + } + start++; + } + + try + { + result.value = new String(bytes, 0, bc, "UTF8"); + } + catch(java.io.UnsupportedEncodingException ex) + { + assert(false); + } + + return true; + } + + public static int + checkQuote(String s) + { + return checkQuote(s, 0); + } + + // + // If a single or double quotation mark is found at the start position, + // then the position of the matching closing quote is returned. If no + // quotation mark is found at the start position, then 0 is returned. + // If no matching closing quote is found, then -1 is returned. + // + public static int + checkQuote(String s, int start) + { + char quoteChar = s.charAt(start); + if(quoteChar == '"' || quoteChar == '\'') + { + start++; + final int len = s.length(); + int pos; + while(start < len && (pos = s.indexOf(quoteChar, start)) != -1) + { + if(s.charAt(pos - 1) != '\\') + { + return pos; + } + start = pos + 1; + } + return -1; // Unmatched quote + } + return 0; // Not quoted + } } |