1
0
Fork 0
mirror of https://github.com/eclipse-cdt/cdt synced 2025-08-12 10:45:37 +02:00

Bug 307311: Incorrect string display when using non-ASCII characters

This commit is contained in:
Mathias Kunter 2012-02-01 21:49:48 -05:00 committed by Marc Khouzam
parent f360d64c77
commit a974434ec3
7 changed files with 923 additions and 110 deletions

View file

@ -1,5 +1,5 @@
/*******************************************************************************
* Copyright (c) 2000, 2009 QNX Software Systems and others.
* Copyright (c) 2000, 2012 QNX Software Systems and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
@ -8,6 +8,9 @@
* Contributors:
* QNX Software Systems - Initial API and implementation
* Wind River Systems - Modified for new DSF Reference Implementation
* Mathias Kunter - Modified for implementation of Bug 307311. Please
* find further implementation details within the
* MIStringHandler class.
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
@ -16,109 +19,27 @@ package org.eclipse.cdt.dsf.mi.service.command.output;
* GDB/MI const value represents a ios-c string.
*/
public class MIConst extends MIValue {
String cstring = ""; //$NON-NLS-1$
private String cstring = ""; //$NON-NLS-1$
public String getCString() {
return cstring;
}
public void setCString(String str) {
cstring = str;
}
/**
* Translate gdb c-string.
* Translates the C string value into a string which is suitable for display to a human.
* @return The translated string.
*/
public String getString() {
return getString(cstring);
return MIStringHandler.translateCString(cstring, true);
}
public static String getString(String str) {
StringBuffer buffer = new StringBuffer();
boolean escape = false;
for (int i = 0; i < str.length(); i++) {
char c = str.charAt(i);
if (c == '\\') {
if (escape) {
buffer.append(c);
escape = false;
} else {
escape = true;
}
} else {
if (escape) {
if (isIsoCSpecialChar(c)) {
buffer.append(isoC(c));
} else {
buffer.append('\\');
buffer.append(c);
}
} else {
buffer.append(c);
}
escape = false;
}
}
// If escape is still true it means that the
// last char was an '\'.
if (escape) {
buffer.append('\\');
}
return buffer.toString();
}
@Override
public String toString() {
return getCString();
}
/**
* Assuming that the precedent character was the
* escape sequence '\'
*/
private static String isoC(char c) {
String s = new Character(c).toString();
if (c == '"') {
s = "\""; //$NON-NLS-1$
} else if (c == '\'') {
s = "\'"; //$NON-NLS-1$
} else if (c == '?') {
s = "?"; //$NON-NLS-1$
} else if (c == 'a') {
s = "\007"; //$NON-NLS-1$
} else if (c == 'b') {
s = "\b"; //$NON-NLS-1$
} else if (c == 'f') {
s = "\f"; //$NON-NLS-1$
} else if (c == 'n') {
s = System.getProperty("line.separator", "\n"); //$NON-NLS-1$ //$NON-NLS-2$ $NON-NLS-2$
} else if (c == 'r') {
s = "\r"; //$NON-NLS-1$
} else if (c == 't') {
s = "\t"; //$NON-NLS-1$
} else if (c == 'v') {
s = "\013"; //$NON-NLS-1$
}
return s;
}
private static boolean isIsoCSpecialChar(char c) {
switch (c) {
case '"':
case '\'':
case '?':
case 'a':
case 'b':
case 'f':
case 'n':
case 'r':
case 't':
case 'v':
return true;
}
return false;
}
}

View file

@ -1,5 +1,5 @@
/*******************************************************************************
* Copyright (c) 2000, 2009 QNX Software Systems and others.
* Copyright (c) 2000, 2012 QNX Software Systems and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
@ -8,6 +8,7 @@
* Contributors:
* QNX Software Systems - Initial API and implementation
* Wind River Systems - Modified for new DSF Reference Implementation
* Mathias Kunter - use MIConst.getString which is for human consumption (Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
@ -32,7 +33,7 @@ public class MIDataEvaluateExpressionInfo extends MIInfo {
if (var.equals("value")) { //$NON-NLS-1$
MIValue value = results[i].getMIValue();
if (value instanceof MIConst) {
fValue = ((MIConst)value).getCString();
fValue = ((MIConst)value).getString();
}
}
}

View file

@ -1,5 +1,5 @@
/*******************************************************************************
* Copyright (c) 2000, 2009 QNX Software Systems and others.
* Copyright (c) 2000, 2012 QNX Software Systems and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
@ -8,6 +8,7 @@
* Contributors:
* QNX Software Systems - Initial API and implementation
* Wind River Systems - Modified for new DSF Reference Implementation
* Mathias Kunter - Don't always parse backslashes (Bug 367456, Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
@ -216,7 +217,9 @@ public class MIParser {
if (buffer.length() > 0 && buffer.charAt(0) == '"') {
buffer.deleteCharAt(0);
}
stream.setCString(translateCString(new FSB(buffer)));
// Don't parse any backslashes - backslashes within stream records
// aren't escaped.
stream.setCString(translateCString(new FSB(buffer), false));
oob = stream;
} else {
// Badly format MI line, just pass it to the user as target stream
@ -306,7 +309,9 @@ public class MIParser {
} else if (buffer.charAt(0) == '"') {
buffer.deleteCharAt(0);
MIConst cnst = new MIConst();
cnst.setCString(translateCString(buffer));
// Parse backslashes - backslashes within result
// and out of band records are escaped.
cnst.setCString(translateCString(buffer, true));
value = cnst;
}
}
@ -382,15 +387,20 @@ public class MIParser {
return list;
}
/*
* MI C-String rather MICOnst values are enclose in double quotes
* and any double quotes or backslash in the string are escaped.
* Assuming the starting double quote was removed.
* This method will stop at the closing double quote remove the extra
* backslach escaping and return the string __without__ the enclosing double quotes
* The orignal StringBuffer will move forward.
/**
* MI C-String rather MIConst values are enclosed in double quotes
* and any double quotes or backslashes in the string are escaped.
* Assuming the starting double quote was removed. This method will
* stop at the closing double quote, remove the extra backslash escaping
* and return the string __without__ the enclosing double quotes. The
* original string buffer will move forward.
* @param buffer The string buffer to read from.
* @param parseBackslashes Defines whether backslashes should be parsed.
* This parameter is necessary to differentiate between records which
* contain escaped backslashes and records which do not.
* @return The translated C string.
*/
private String translateCString(FSB buffer) {
private String translateCString(FSB buffer, boolean parseBackslashes) {
boolean escape = false;
boolean closingQuotes = false;
@ -402,7 +412,9 @@ public class MIParser {
if (c == '\\') {
if (escape) {
sb.append(c);
sb.append(c);
if (!parseBackslashes) {
sb.append(c);
}
escape = false;
} else {
escape = true;

View file

@ -1,5 +1,5 @@
/*******************************************************************************
* Copyright (c) 2000, 2009 QNX Software Systems and others.
* Copyright (c) 2000, 2012 QNX Software Systems and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
@ -8,6 +8,7 @@
* Contributors:
* QNX Software Systems - Initial API and implementation
* Wind River Systems - Modified for new DSF Reference Implementation
* Mathias Kunter - Modified to use the new MIStringHandler class (Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
@ -28,7 +29,8 @@ public abstract class MIStreamRecord extends MIOOBRecord {
}
public String getString () {
return MIConst.getString(getCString());
// Return the translated C string without escaping any special characters.
return MIStringHandler.translateCString(getCString(), false);
}
@Override

View file

@ -0,0 +1,487 @@
/*******************************************************************************
* Copyright (c) 2012 Mathias Kunter and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* Mathias Kunter - Initial Implementation (Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
import java.nio.ByteBuffer;
import java.nio.CharBuffer;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.CharsetEncoder;
import java.text.ParseException;
import java.util.EnumSet;
/**
* The MIStringHandler class provides several static functions to handle C and / or MI strings.
* @since 4.1
*/
public class MIStringHandler {
/**
* Defines special characters which are used within escape notations to represent a
* corresponding Unicode code point (i.e. character code). See the specialCodePoints
* list below on the same index for the corresponding code point.
*/
private static char[] specialChars = new char[] {
'a', // Alert (bell) character
'b', // Backspace character
'e', // GNU extension: Escape character
'E', // same as 'e'
'f', // Form feed character
'n', // New line character
'r', // Carriage return character
't', // Horizontal tabulation character
'v', // Vertical tabulation character
'\'', // Single quotation mark
'"', // Double quotation mark
'\\', // Backslash
'?' // Literal question mark
};
/**
* Defines special Unicode code points (i.e. character codes) which can be escaped by a
* corresponding special character. See the specialChars list above on the same index
* for the corresponding special character.
*/
private static int[] specialCodePoints = new int[] {
0x07, // corresponds to \a
0x08, // corresponds to \b
0x1B, // corresponds to \e
0x1B, // corresponds to \E
0x0C, // corresponds to \f
0x0A, // corresponds to \n
0x0D, // corresponds to \r
0x09, // corresponds to \t
0x0B, // corresponds to \v
0x27, // corresponds to \'
0x22, // corresponds to \"
0x5C, // corresponds to \\
0x3F // corresponds to \?
};
/**
* An internal helper enumeration which holds the current status while parsing an escaped
* text sequence.
*/
private enum EscapeStatus {
NONE,
BEGIN,
OCTAL_NUMBER,
HEX_NUMBER,
UNICODE_SHORT_NUMBER,
UNICODE_LONG_NUMBER,
VALID,
INVALID
}
/**
* An enumeration defining the escape sequences which should be parsed.
*/
public enum ParseFlags {
SPECIAL_CHARS,
OCTAL_NUMBERS,
HEX_NUMBERS,
UNICODE_SHORT_NUMBERS,
UNICODE_LONG_NUMBERS
}
/**
* Translates the given C string into a string suitable for display. This includes handling
* of escaped characters and different string encodings. This is necessary in order to correctly
* deal with non-ASCII strings.
* @param str The C string to translate.
* @param escapeChars Defines whether non-printable characters should be escaped within
* the translated string, or not.
* @return The translated string.
*/
public static String translateCString(String str, boolean escapeChars) {
if (escapeChars) {
// Don't parse the special character escape notations here. We can do this here because
// we want to keep them in their escaped form anyway, and because the following string
// transcoding process isn't affected by escaped special chars. By doing so we avoid
// caring about some nasty details of the special character escaping process: for
// example, single quotation marks are commonly only escaped within character constants,
// while double quotation marks are commonly only escaped within string constants. By
// not parsing the special character escape notations at all here, we just keep the
// original special character escaping provided by the given MI string.
str = parseString(str, EnumSet.complementOf(EnumSet.of(ParseFlags.SPECIAL_CHARS)));
} else {
// Parse all escaped characters.
str = parseString(str);
}
// Transcode the string in order to handle non-ASCII strings correctly.
str = transcodeString(str);
if (escapeChars) {
// Escape any non-printable characters again, as we want to be able to display them.
// However, don't escape any printable special chars, as they haven't been parsed before.
str = escapeString(str, false);
} else {
// No escaping necessary here. We however have to make sure that we use the correct line
// separation character sequence.
str = str.replace("\n", System.getProperty("line.separator", "\n")); //$NON-NLS-1$ //$NON-NLS-2$ //$NON-NLS-3$
}
return str;
}
/**
* Returns whether the given character is a special character, or not.
* @param c The character to test.
* @return The test result.
*/
public static boolean isSpecialChar(char c) {
for (int i = 0; i < specialChars.length; i++) {
if (specialChars[i] == c) {
return true;
}
}
return false;
}
/**
* Returns whether the given Unicode code point is a special code point, or not.
* @param codePoint The Unicode code point to test.
* @return The test result.
*/
public static boolean isSpecialCodePoint(int codePoint) {
for (int i = 0; i < specialCodePoints.length; i++) {
if (specialCodePoints[i] == codePoint) {
return true;
}
}
return false;
}
/**
* Parses the given special character into an Unicode code point.
* @param c The special character to parse.
* @return The parsed Unicode code point.
* @throws ParseException Thrown when the given character can't be parsed. This happens when it's
* not a special character.
*/
public static int parseSpecialChar(char c) throws ParseException {
for (int i = 0; i < specialChars.length; i++) {
if (specialChars[i] == c) {
return specialCodePoints[i];
}
}
throw new ParseException("The given character '" + c + "' is not a special character.", 0); //$NON-NLS-1$ //$NON-NLS-2$
}
/**
* Parses the given special Unicode code point into a character.
* @param codePoint The special Unicode code point to parse.
* @return The parsed character.
* @throws ParseException Thrown when the given Unicode code point can't be parsed. This happens
* when it's not a special code point.
*/
public static char parseSpecialCodePoint(int codePoint) throws ParseException {
for (int i = 0; i < specialCodePoints.length; i++) {
if (specialCodePoints[i] == codePoint) {
return specialChars[i];
}
}
throw new ParseException("The given Unicode code point " + codePoint + " is not a special code point.", 0); //$NON-NLS-1$ //$NON-NLS-2$
}
/**
* This is an overloaded function. See the Javadoc of the other function overload for details.
* @param str The string which should be parsed.
* @return The parsed string.
*/
public static String parseString(String str) {
return parseString(str, EnumSet.allOf(ParseFlags.class));
}
/**
* Parses any escaped characters and replaces them with their corresponding Unicode code points.
* This function parses all escape notations which are supported by gcc and / or gdb. Those are:</br></br>
*
* <ul>
* <li>Special char escape notations: \a, \b, \e, \E, \f, \n, \r, \t, \v, \', \", \\, and \?</li>
*
* <li>Octal escape notation: An initial backslash, followed by 1, 2, or 3 octal digits. Values
* above 0xFF are ignored. Octal escape notations may not use more than 3 octal digits.</li>
*
* <li>Hexadecimal escape notation: An initial backslash, followed by an "x" and 1 or more
* hexadecimal digits. Hexadecimal escape notations may not use more than 4 hexadecimal digits
* (although gcc accepts hexadecimal escape notations of any arbitrary length).</li>
*
* <li>Short Unicode escape notation: An initial backslash, followed by an "u" and exactly 4
* hexadecimal digits.</li>
*
* <li>Long Unicode escape notation: An initial backslash, followed by an "U" and exactly 8
* hexadecimal digits.</li>
* </ul>
* @param str The string which should be parsed.
* @param parseFlags The set of escape notations which should be parsed.
* @return The parsed string.
*/
public static String parseString(String str, EnumSet<ParseFlags> parseFlags) {
StringBuffer buffer = new StringBuffer();
StringBuffer escapeBuffer = new StringBuffer();
EscapeStatus escStatus = EscapeStatus.NONE;
for (int i = 0; i < str.length(); i++) {
char c = str.charAt(i);
boolean consumeChar = true;
boolean isLastChar = i == str.length() - 1;
if (escStatus == EscapeStatus.NONE) {
if (c == '\\') {
// Escaping begins. Reset the escape buffer.
escapeBuffer.setLength(0);
escapeBuffer.append(c);
escStatus = EscapeStatus.BEGIN;
}
} else if (escStatus == EscapeStatus.BEGIN) {
if (parseFlags.contains(ParseFlags.SPECIAL_CHARS) && isSpecialChar(c)) {
try {
buffer.appendCodePoint(parseSpecialChar(c));
escStatus = EscapeStatus.VALID;
} catch (ParseException e) {
// This is just for completeness. We will actually never catch any ParseException here
// since we already checked the character with isSpecialChar() before.
escapeBuffer.append(c);
escStatus = EscapeStatus.INVALID;
}
} else if (parseFlags.contains(ParseFlags.OCTAL_NUMBERS) && c >= '0' && c <= '7') {
escStatus = EscapeStatus.OCTAL_NUMBER;
// Don't consume this character right now - as this wouldn't work if it's the last character.
consumeChar = false;
} else if (parseFlags.contains(ParseFlags.HEX_NUMBERS) && c == 'x') {
escStatus = EscapeStatus.HEX_NUMBER;
} else if (parseFlags.contains(ParseFlags.UNICODE_SHORT_NUMBERS) && c == 'u') {
escStatus = EscapeStatus.UNICODE_SHORT_NUMBER;
} else if (parseFlags.contains(ParseFlags.UNICODE_LONG_NUMBERS) && c == 'U') {
escStatus = EscapeStatus.UNICODE_LONG_NUMBER;
} else {
escStatus = EscapeStatus.INVALID;
}
if (consumeChar) {
escapeBuffer.append(c);
}
} else if (escStatus == EscapeStatus.HEX_NUMBER) {
// Only consume this character if it belongs to the escape sequence.
consumeChar = (c >= '0' && c <= '9') || (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F');
if (consumeChar) {
escapeBuffer.append(c);
}
if (!consumeChar || isLastChar || escapeBuffer.length() == 6) {
// The escape sequence is terminated. Set the escape status to invalid until
// we know that it's actually valid.
escStatus = EscapeStatus.INVALID;
if (escapeBuffer.length() > 2) {
// Decode the hexadecimal number.
try {
int codePoint = Integer.parseInt(escapeBuffer.toString().substring(2), 16);
if (codePoint <= 0x10FFFF) {
buffer.appendCodePoint(codePoint);
escStatus = EscapeStatus.VALID;
}
} catch (NumberFormatException e) {
}
}
}
} else if (escStatus == EscapeStatus.UNICODE_SHORT_NUMBER || escStatus == EscapeStatus.UNICODE_LONG_NUMBER) {
// Only consume this character if it belongs to the escape sequence.
consumeChar = (c >= '0' && c <= '9') || (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F');
if (consumeChar) {
escapeBuffer.append(c);
}
int finalLength = escStatus == EscapeStatus.UNICODE_SHORT_NUMBER ? 6 : 10;
if (escapeBuffer.length() == finalLength) {
// The escape sequence is terminated. Set the escape status to invalid until
// we know that it's actually valid. Decode the hexadecimal number.
escStatus = EscapeStatus.INVALID;
try {
int codePoint = Integer.parseInt(escapeBuffer.toString().substring(2), 16);
if (codePoint <= 0x10FFFF) {
buffer.appendCodePoint(codePoint);
escStatus = EscapeStatus.VALID;
}
} catch (NumberFormatException e) {
}
} else if (!consumeChar || isLastChar) {
// The escape sequence is terminated and invalid.
escStatus = EscapeStatus.INVALID;
}
} else if (escStatus == EscapeStatus.OCTAL_NUMBER) {
// Only consume this character if it belongs to the escape sequence.
consumeChar = c >= '0' && c <= '7';
if (consumeChar) {
escapeBuffer.append(c);
}
if (!consumeChar || isLastChar || escapeBuffer.length() == 4) {
// The escape sequence is terminated. Set the escape status to invalid until
// we know that it's actually valid.
escStatus = EscapeStatus.INVALID;
if (escapeBuffer.length() > 1) {
// Decode the octal number.
try {
int codePoint = Integer.parseInt(escapeBuffer.toString().substring(1), 8);
if (codePoint <= 0xFF) {
buffer.appendCodePoint(codePoint);
escStatus = EscapeStatus.VALID;
}
} catch (NumberFormatException e) {
}
}
}
}
if (escStatus == EscapeStatus.NONE) {
// Current character isn't escaped - copy it over to the destination buffer.
buffer.append(c);
} else if (escStatus == EscapeStatus.VALID) {
escStatus = EscapeStatus.NONE;
} else if (escStatus == EscapeStatus.INVALID) {
buffer.append(escapeBuffer);
escStatus = EscapeStatus.NONE;
}
if (!consumeChar) {
// Don't consume the current character.
i--;
}
}
// Check for non-finished escape sequences at the end of the string.
if (escStatus != EscapeStatus.NONE) {
buffer.append(escapeBuffer);
}
// Convert the buffer into a string and return it.
return buffer.toString();
}
/**
* Transcodes the given string. This is done as follows:</br></br>
* 1) The given string is encoded into a binary byte buffer.</br></br>
* 2) It's tested whether this binary byte buffer seems to represent a string which is encoded as
* either ASCII, Latin-1, or UTF-8. If this is the case, the binary byte buffer is decoded back into
* a string and this string is returned. If the test is negative, the given string is returned without
* modification because its encoding can't be reliably determined in this case.
* The most important use case of this function is to transcode a string which is actually UTF-8 but has
* been incorrectly decoded as Latin-1 instead.
* @param str The string to transcode.
* @return The transcoded string.
*/
public static String transcodeString(String str) {
// Try to transcode the string from Latin-1 to UTF-8 (ASCII doesn't need to be explicitly
// considered here since Latin-1 is backwards compatible with ASCII). The transcoding will
// almost certainly only succeed if the string actually *is* encoded in UTF-8. If the
// transcoding fails, the string is simply left unchanged.
try {
// First, try to encode the string as Latin-1 in order to obtain the binary byte
// representation of the string.
CharsetEncoder latin1Encoder = Charset.forName("ISO-8859-1").newEncoder(); //$NON-NLS-1$
ByteBuffer stringBytes = latin1Encoder.encode(CharBuffer.wrap(str.toCharArray()));
// Next, try to decode the string as UTF-8. This will almost certainly only succeed
// if the string actually *is* encoded in UTF-8. Note that if the decoding fails,
// an exception is thrown before the str variable is assigned. The original string
// is therefore left unchanged in this case.
CharsetDecoder utf8Decoder = Charset.forName("UTF-8").newDecoder(); //$NON-NLS-1$
str = utf8Decoder.decode(stringBytes).toString();
} catch (Exception e) {
}
return str;
}
/**
* Escapes any non-printable characters as well as the printable special characters single quotation
* mark, double quotation mark, backslash, and literal question mark within the given string. Supports
* the entire Unicode code space.
* @param str The string which should be escaped.
* @return The escaped string.
*/
public static String escapeString(String str) {
return escapeString(str, true);
}
/**
* Escapes any non-printable characters within the given string. Supports the entire Unicode code space.
* @param str The string which should be escaped.
* @param escapePrintableSpecialChars Defines whether the printable special characters single
* quotation mark, double quotation mark, backslash, and literal question mark should be
* escaped as well, or not.
* @return The escaped string.
*/
public static String escapeString(String str, boolean escapePrintableSpecialChars) {
StringBuffer buffer = new StringBuffer();
for (int i = 0; i < str.length(); i++) {
// Get the current character code point. Note that using the Java "char" data type isn't
// sufficient here, as it can't handle all Unicode characters.
int codePoint = str.codePointAt(i);
if (Character.isSupplementaryCodePoint(codePoint)) {
i++;
}
// Check the code point type of the character in order to determine whether it's
// printable or not.
int codePointType = Character.getType(codePoint);
switch (codePointType) {
case Character.LINE_SEPARATOR:
case Character.PARAGRAPH_SEPARATOR:
case Character.CONTROL:
case Character.PRIVATE_USE:
case Character.SURROGATE:
case Character.UNASSIGNED:
// Non-printable character.
if (isSpecialCodePoint(codePoint)) {
// Escape by using the special character escape notation.
buffer.append('\\');
try {
buffer.append(parseSpecialCodePoint(codePoint));
} catch (ParseException e) {
buffer.appendCodePoint(codePoint);
}
} else if (codePoint == 0x00) {
// Escape the null character separately - don't use leading zeros.
buffer.append("\\0"); //$NON-NLS-1$
} else if (codePoint <= 0xFF) {
// Escape by using the octal escape notation.
buffer.append(String.format("\\%03o", codePoint)); //$NON-NLS-1$
} else if (codePoint <= 0xFFFF) {
// Escape by using the short Unicode escape notation.
buffer.append(String.format("\\u%04x", codePoint)); //$NON-NLS-1$
} else {
// Escape by using the long Unicode escape notation.
buffer.append(String.format("\\U%08x", codePoint)); //$NON-NLS-1$
}
break;
default:
// Printable character.
if (escapePrintableSpecialChars && isSpecialCodePoint(codePoint)) {
// Escape by using the special character escape notation.
buffer.append('\\');
try {
buffer.append(parseSpecialCodePoint(codePoint));
} catch (ParseException e) {
buffer.appendCodePoint(codePoint);
}
} else {
// Don't escape.
buffer.appendCodePoint(codePoint);
}
}
}
return buffer.toString();
}
}

View file

@ -1,5 +1,5 @@
/*******************************************************************************
* Copyright (c) 2000, 2009 QNX Software Systems and others.
* Copyright (c) 2000, 2012 QNX Software Systems and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
@ -8,6 +8,7 @@
* Contributors:
* QNX Software Systems - Initial API and implementation
* Wind River Systems - Modified for new DSF Reference Implementation
* Mathias Kunter - use MIConst.getString which is for human consumption (Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
@ -30,7 +31,7 @@ public class MIVarEvaluateExpressionInfo extends MIInfo {
if (var.equals("value")) { //$NON-NLS-1$
MIValue val = results[i].getMIValue();
if (val instanceof MIConst) {
value = ((MIConst)val).getCString();
value = ((MIConst)val).getString();
}
}
}

View file

@ -0,0 +1,389 @@
/*******************************************************************************
* Copyright (c) 2012 Mathias Kunter and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* Mathias Kunter - Initial Implementation (Bug 307311)
*******************************************************************************/
package org.eclipse.cdt.dsf.mi.service.command.output;
import java.text.ParseException;
import org.junit.Test;
import static org.junit.Assert.*;
import junit.framework.JUnit4TestAdapter;
public class MIStringHandlerTests {
@Test
public void testTranscodeString() {
// Test transcoding of an empty string.
assertEquals(MIStringHandler.transcodeString(""), ""); //$NON-NLS-1$ //$NON-NLS-2$
// Test transcoding of an ASCII string.
assertEquals(MIStringHandler.transcodeString("ASCII"), "ASCII"); //$NON-NLS-1$ //$NON-NLS-2$
// Test transcoding of Latin-1 strings.
assertEquals(MIStringHandler.transcodeString("\344"), "\344"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\344"), "abc\344"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("\344abc"), "\344abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\344def"), "abc\344def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\ndef\344ghi\tjkl"), "abc\ndef\344ghi\tjkl"); //$NON-NLS-1$ //$NON-NLS-2$
// Test transcoding of UTF-8 strings.
assertEquals(MIStringHandler.transcodeString("\303\244"), "\344"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\303\244"), "abc\344"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("\303\244abc"), "\344abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\303\244def"), "abc\344def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.transcodeString("abc\ndef\303\244ghi\tjkl"), "abc\ndef\344ghi\tjkl"); //$NON-NLS-1$ //$NON-NLS-2$
// Test transcoding of a string with unsupported encoding (here: UTF-16).
assertEquals(MIStringHandler.transcodeString("\u3090"), "\u3090"); //$NON-NLS-1$ //$NON-NLS-2$
}
@Test
public void testEscapeString() {
// Test escaping of an empty string.
assertEquals(MIStringHandler.escapeString(""), ""); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of a plain text string.
assertEquals(MIStringHandler.escapeString("abc"), "abc"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of strings which contain special chars.
assertEquals(MIStringHandler.escapeString("\n"), "\\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\n\b"), "\\n\\b"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\0\1\2\3\4\5\6\7\10\11\12\13\14\15\16\17"), "\\0\\001\\002\\003\\004\\005\\006\\a\\b\\t\\n\\v\\f\\r\\016\\017"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\33"), "\\e"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\\", true), "\\\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\\", false), "\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("'\t\\", true), "\\'\\t\\\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("'\t\\", false), "'\\t\\"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of strings which contain non-printable characters up to 0x7F.
assertEquals(MIStringHandler.escapeString("\0"), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\177"), "\\177"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\177"), "abc\\177"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\177abc"), "\\177abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\177def"), "abc\\177def"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of strings which contain non-printable characters up to 0xFF.
assertEquals(MIStringHandler.escapeString("\230"), "\\230"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\230"), "abc\\230"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\230abc"), "\\230abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\230def"), "abc\\230def"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of strings which contain non-printable characters up to 0xFFFF.
assertEquals(MIStringHandler.escapeString("\ud800"), "\\ud800"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\ud800"), "abc\\ud800"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\ud800abc"), "\\ud800abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\ud800def"), "abc\\ud800def"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of strings which contain non-printable characters up to 0x10FFFF.
assertEquals(MIStringHandler.escapeString("\udbff\udfff"), "\\U0010ffff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\udbff\udfff"), "abc\\U0010ffff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("\udbff\udfffabc"), "\\U0010ffffabc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\udbff\udfffdef"), "abc\\U0010ffffdef"); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of a string which contains all sorts of non-printable characters.
assertEquals(MIStringHandler.escapeString("abc\n\tdef\\ghi\njkl\177\230\n\ud800\udbff\udfff?mno\"", true), "abc\\n\\tdef\\\\ghi\\njkl\\177\\230\\n\\ud800\\U0010ffff\\?mno\\\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.escapeString("abc\n\tdef\\ghi\njkl\177\230\n\ud800\udbff\udfff?mno\"", false), "abc\\n\\tdef\\ghi\\njkl\\177\\230\\n\\ud800\\U0010ffff?mno\""); //$NON-NLS-1$ //$NON-NLS-2$
// Test escaping of an ill-formed UTF-16 Java string.
assertEquals(MIStringHandler.escapeString("abc\udbff"), "abc\\udbff"); //$NON-NLS-1$ //$NON-NLS-2$
}
@Test
public void testIsSpecialChar() {
// Testing non-special chars.
assertEquals(MIStringHandler.isSpecialChar('i'), false);
assertEquals(MIStringHandler.isSpecialChar('w'), false);
// Testing special chars.
assertEquals(MIStringHandler.isSpecialChar('a'), true);
assertEquals(MIStringHandler.isSpecialChar('n'), true);
assertEquals(MIStringHandler.isSpecialChar('t'), true);
assertEquals(MIStringHandler.isSpecialChar('\''), true);
assertEquals(MIStringHandler.isSpecialChar('\\'), true);
}
@Test
public void testIsSpecialCodePoint() {
// Testing non-special Unicode code points.
assertEquals(MIStringHandler.isSpecialCodePoint(0x69), false); // 'i' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x77), false); // 'w' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x61), false); // 'a' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x6E), false); // 'n' character
// Testing special Unicode code points.
assertEquals(MIStringHandler.isSpecialCodePoint(0x07), true); // '\a' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x0A), true); // '\n' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x09), true); // '\t' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x27), true); // '\'' character
assertEquals(MIStringHandler.isSpecialCodePoint(0x5C), true); // '\\' character
}
@Test
public void testParseSpecialChar() {
// Testing non-special chars. This actually should throw ParseExceptions.
try {
MIStringHandler.parseSpecialChar('i');
fail("No parsing exception thrown.");
} catch (ParseException e) {
}
try {
MIStringHandler.parseSpecialChar('w');
fail("No parsing exception thrown.");
} catch (ParseException e) {
}
try {
// Testing special chars.
assertEquals(MIStringHandler.parseSpecialChar('a'), 0x07);
assertEquals(MIStringHandler.parseSpecialChar('n'), 0x0A);
assertEquals(MIStringHandler.parseSpecialChar('t'), 0x09);
assertEquals(MIStringHandler.parseSpecialChar('\''), 0x27);
assertEquals(MIStringHandler.parseSpecialChar('\\'), 0x5C);
} catch (ParseException e) {
fail("Parsing exception thrown."); //$NON-NLS-1$
}
}
@Test
public void testParseSpecialCodePoint() {
try {
// Testing non-special Unicode code points. This actually should throw ParseExceptions.
try {
MIStringHandler.parseSpecialCodePoint(0x69);
fail("No parsing exception thrown.");
} catch (ParseException e) {
}
try {
MIStringHandler.parseSpecialCodePoint(0x77);
fail("No parsing exception thrown.");
} catch (ParseException e) {
}
// Testing special Unicode code points.
assertEquals(MIStringHandler.parseSpecialCodePoint(0x07), 'a');
assertEquals(MIStringHandler.parseSpecialCodePoint(0x0A), 'n');
assertEquals(MIStringHandler.parseSpecialCodePoint(0x09), 't');
assertEquals(MIStringHandler.parseSpecialCodePoint(0x27), '\'');
assertEquals(MIStringHandler.parseSpecialCodePoint(0x5C), '\\');
} catch (ParseException e) {
fail("Parsing exception thrown."); //$NON-NLS-1$
}
}
@Test
public void testParseString() {
// Test parsing of an empty string.
assertEquals(MIStringHandler.parseString(""), ""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString(""), ""); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of a plain text string.
assertEquals(MIStringHandler.parseString("abc"), "abc"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain valid special char escape notations.
assertEquals(MIStringHandler.parseString("\\n"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\\\"), "\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\'\\t\\\\"), "'\t\\"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain invalid special char escape notations.
assertEquals(MIStringHandler.parseString("\\w"), "\\w"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\"), "\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\"), "abc\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\www"), "\\www"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\www"), "abc\\www"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\'\\z\\\\"), "'\\z\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\'\\z\\"), "'\\z\\"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain valid octal escape notations.
assertEquals(MIStringHandler.parseString("\\141\\142\\143"), "abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\141\\142\\143\\0"), "abc\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\141\\142\\143\\12"), "abc\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\141\\\\142\\143\\\\"), "a\\142c\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\12"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\012"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("'\\011\\"), "'\t\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\177"), "\177"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\377"), "\377"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\3777"), "\3777"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\177"), "abc\177"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\177abc"), "\177abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\177def"), "abc\177def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\0"), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\1"), "\001"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\1a"), "\001a"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\18"), "\0018"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\01"), "\001"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\01a"), "\001a"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\001"), "\001"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\001a"), "\001a"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\0011"), "\0011"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\0011a"), "\0011a"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\1111"), "\1111"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain invalid octal escape notations.
assertEquals(MIStringHandler.parseString("\\400"), "\\400"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\4000"), "\\4000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\8"), "\\8"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\90"), "\\90"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\ 0"), "\\ 0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\141\\142\\143\\"), "abc\\"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain valid hexadecimal escape notations.
assertEquals(MIStringHandler.parseString("\\x0"), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\xa"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\xa0"), "\240"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\xag"), "\ng"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0a"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0a0"), "\240"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0ag"), "\ng"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x00a"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x00a0"), "\240"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x00ag"), "\ng"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x000a"), "\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x000a0"), "\n0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x000ag"), "\ng"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0000a"), "\0a"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0000a0"), "\0a0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x0000ag"), "\0ag"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\x20def"), "abc\u20def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\x20def\\xa"), "abc\u20def\n"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\x20ghi"), "abc ghi"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\x20ghi\\xa"), "abc ghi\n"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain invalid hexadecimal escape notations.
assertEquals(MIStringHandler.parseString("\\x"), "\\x"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\x"), "abc\\x"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\xwww"), "\\xwww"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x\\"), "\\x\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x 0"), "\\x 0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\x\\0"), "\\x\0"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain valid short Unicode escape notations.
assertEquals(MIStringHandler.parseString("\\u0000"), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u000f"), "\017"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u00ff"), "\377"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u0fff"), "\u0fff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\uffff"), "\uffff"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain invalid short Unicode escape notations.
assertEquals(MIStringHandler.parseString("\\u"), "\\u"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\u"), "abc\\u"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\uwww"), "\\uwww"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u\\"), "\\u\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u 0"), "\\u 0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u\\0"), "\\u\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u0"), "\\u0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u00"), "\\u00"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u000"), "\\u000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\u000g"), "\\u000g"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\ug"), "\\ug"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain valid long Unicode escape notations.
assertEquals(MIStringHandler.parseString("\\U00000000"), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0000000f"), "\017"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U000000ff"), "\377"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U00000fff"), "\u0fff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0000ffff"), "\uffff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U000fffff"), "\udbbf\udfff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0010ffff"), "\udbff\udfff"); //$NON-NLS-1$ //$NON-NLS-2$
// Test parsing of strings which contain invalid long Unicode escape notations.
assertEquals(MIStringHandler.parseString("\\U"), "\\U"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("abc\\U"), "abc\\U"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\Uwww"), "\\Uwww"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U\\"), "\\U\\"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U 0"), "\\U 0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U\\0"), "\\U\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0"), "\\U0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U00"), "\\U00"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U000"), "\\U000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0000"), "\\U0000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U00000"), "\\U00000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U000000"), "\\U000000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0000000"), "\\U0000000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0000000g"), "\\U0000000g"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U00110000"), "\\U00110000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U00f00000"), "\\U00f00000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\U0f000000"), "\\U0f000000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\Uf0000000"), "\\Uf0000000"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\Uffffffff"), "\\Uffffffff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\Ufffffff"), "\\Ufffffff"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.parseString("\\Ug"), "\\Ug"); //$NON-NLS-1$ //$NON-NLS-2$
}
@Test
public void testTranslateCString() {
// Test translating an empty string.
assertEquals(MIStringHandler.translateCString("", false), ""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("", true), ""); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating a plain text string.
assertEquals(MIStringHandler.translateCString("abc", false), "abc"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc", true), "abc"); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating strings which contain special chars and / or escaped special chars.
assertEquals(MIStringHandler.translateCString("\t", true), "\\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\t", false), "\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\t", true), "\\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\t", false), "\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\t\\t", true), "\\t\\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\t\\t", false), "\t\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\t\t", true), "\\t\\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\t\t", false), "\t\t"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("'\"", true), "'\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("'\"", false), "'\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\'\\\"", true), "\\'\\\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\'\\\"", false), "'\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("'\\\"", true), "'\\\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("'\\\"", false), "'\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\'\"", true), "\\'\""); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\'\"", false), "'\""); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating strings which contain hexadecimal escape notations.
assertEquals(MIStringHandler.translateCString("\\x0000", true), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\x0000", false), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\x31\\x32\\x33www", true), "abc123www"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\x0031\\x0032\\x0033www", true), "abc123www"); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating strings which contain octal escape notations.
assertEquals(MIStringHandler.translateCString("\\000", true), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\000", false), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\0", true), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\0", false), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\222def", true), "abc\\222def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\222def", false), "abc\222def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\303def", true), "abc\303def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\303def", false), "abc\303def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\303\\244def", true), "abc\344def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\"def", true), "abc\"def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\"def", false), "abc\"def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc'def", true), "abc'def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc'def", false), "abc'def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\\"def", true), "abc\\\"def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\\"def", false), "abc\"def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\'def", true), "abc\\'def"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\'def", false), "abc'def"); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating strings which contain short Unicode escape notations.
assertEquals(MIStringHandler.translateCString("\\u0000", true), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\u0000", false), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\u0031\\u0032\\u0033def", true), "abc123def"); //$NON-NLS-1$ //$NON-NLS-2$
// Test translating strings which contain long Unicode escape notations.
assertEquals(MIStringHandler.translateCString("\\U00000000", true), "\\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("\\U00000000", false), "\0"); //$NON-NLS-1$ //$NON-NLS-2$
assertEquals(MIStringHandler.translateCString("abc\\U00000031\\U00000032\\U00000033def", true), "abc123def"); //$NON-NLS-1$ //$NON-NLS-2$
}
public static junit.framework.Test suite() {
return new JUnit4TestAdapter(MIStringHandlerTests.class);
}
}