- Replaced StringUtils.unescape with a simpler implementation - Added BuiltinTypeMembers to allow the compiler control over its tags

7年前 · 6c510eb26b
--- a/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/BuiltinTypeMembers.java
+++ b/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/BuiltinTypeMembers.java
@@ -0,0 +1,34 @@
 
				
				+/*
			
 
				
				+ * To change this license header, choose License Headers in Project Properties.
			
 
				
				+ * To change this template file, choose Tools | Templates
			
 
				
				+ * and open the template in the editor.
			
 
				
				+ */
			
 
				
				+package org.openzen.zenscript.codemodel.type.member;
			
 
				
				+
			
 
				
				+import org.openzen.zenscript.codemodel.Modifiers;
			
 
				
				+import org.openzen.zenscript.codemodel.expression.ConstantIntExpression;
			
 
				
				+import org.openzen.zenscript.codemodel.member.CasterMember;
			
 
				
				+import org.openzen.zenscript.codemodel.member.builtin.ConstantGetterMember;
			
 
				
				+import org.openzen.zenscript.codemodel.type.BasicTypeID;
			
 
				
				+import org.openzen.zenscript.shared.CodePosition;
			
 
				
				+
			
 
				
				+/**
			
 
				
				+ *
			
 
				
				+ * @author Hoofdgebruiker
			
 
				
				+ */
			
 
				
				+public class BuiltinTypeMembers {
			
 
				
				+	public static final ConstantGetterMember INT_GET_MIN_VALUE = new ConstantGetterMember("MIN_VALUE", position -> new ConstantIntExpression(position, Integer.MIN_VALUE));
			
 
				
				+	public static final ConstantGetterMember INT_GET_MAX_VALUE = new ConstantGetterMember("MAX_VALUE", position -> new ConstantIntExpression(position, Integer.MAX_VALUE));
			
 
				
				+	
			
 
				
				+	public static final CasterMember INT_TO_BYTE = new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.BYTE);
			
 
				
				+	public static final CasterMember INT_TO_SBYTE = new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.SBYTE);
			
 
				
				+	public static final CasterMember INT_TO_SHORT = new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.SHORT);
			
 
				
				+	public static final CasterMember INT_TO_USHORT = new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.USHORT);
			
 
				
				+	public static final CasterMember INT_TO_UINT = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.UINT);
			
 
				
				+	public static final CasterMember INT_TO_LONG = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.LONG);
			
 
				
				+	public static final CasterMember INT_TO_ULONG = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.ULONG);
			
 
				
				+	public static final CasterMember INT_TO_FLOAT = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.FLOAT);
			
 
				
				+	public static final CasterMember INT_TO_DOUBLE = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.DOUBLE);
			
 
				
				+	public static final CasterMember INT_TO_CHAR = new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.CHAR);
			
 
				
				+	public static final CasterMember INT_TO_STRING = new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.STRING);
			
 
				
				+}
			
--- a/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/DefinitionMemberGroup.java
+++ b/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/DefinitionMemberGroup.java
@@ -225,6 +225,10 @@ public class DefinitionMemberGroup {
 
				
				 	
			
 
				
				 	public Expression call(CodePosition position, TypeScope scope, Expression target, CallArguments arguments, boolean allowStaticUsage) { // Picks a method through selectMethod, casts every argument to the picked method's parameter type, then delegates to method.call
			
 
				
				 		ICallableMember method = selectMethod(position, scope, arguments, true, allowStaticUsage);
			
 
				
				+		for (int i = 0; i < arguments.arguments.length; i++) { // rewrites the argument array in place, so the CallArguments object passed in by the caller is modified
			
 
				
				+			arguments.arguments[i] = arguments.arguments[i].castImplicit(position, scope, method.getHeader().parameters[i].type); // NOTE(review): indexes parameters[i] for every argument - assumes there are never more arguments than declared parameters (variadic calls?); also uses the header before withGenericArguments is applied - confirm both
			
 
				
				+		}
			
 
				
				+		
			
 
				
				 		FunctionHeader instancedHeader = method.getHeader().withGenericArguments(scope.getTypeRegistry(), arguments.typeArguments); // header with the call's type arguments applied
			
 
				
				 		return method.call(position, target, instancedHeader, arguments);
			
 
				
				 	}
			
--- a/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/TypeMemberBuilder.java
+++ b/CodeModel/src/main/java/org/openzen/zenscript/codemodel/type/member/TypeMemberBuilder.java
@@ -270,20 +270,20 @@ public class TypeMemberBuilder implements ITypeVisitor<Void> {
 
				
				 		registerArithmeticOperations(LONG, LONG);
			
 
				
				 		registerArithmeticOperations(FLOAT, FLOAT);
			
 
				
				 		registerArithmeticOperations(DOUBLE, DOUBLE);
			
 
				
				-		members.addGetter(new ConstantGetterMember("MIN_VALUE", position -> new ConstantIntExpression(position, Integer.MIN_VALUE)), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addGetter(new ConstantGetterMember("MAX_VALUE", position -> new ConstantIntExpression(position, Integer.MAX_VALUE)), TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addGetter(BuiltinTypeMembers.INT_GET_MIN_VALUE, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addGetter(BuiltinTypeMembers.INT_GET_MAX_VALUE, TypeMemberPriority.SPECIFIED);
			
 
				
				 		
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.BYTE), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.SBYTE), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.SHORT), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.USHORT), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.UINT), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.LONG), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.ULONG), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.FLOAT), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.DOUBLE), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, 0, BasicTypeID.CHAR), TypeMemberPriority.SPECIFIED);
			
 
				
				-		members.addCaster(new CasterMember(CodePosition.BUILTIN, Modifiers.MODIFIER_IMPLICIT, BasicTypeID.STRING), TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_BYTE, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_SBYTE, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_SHORT, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_USHORT, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_UINT, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_LONG, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_ULONG, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_FLOAT, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_DOUBLE, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_CHAR, TypeMemberPriority.SPECIFIED);
			
 
				
				+		members.addCaster(BuiltinTypeMembers.INT_TO_STRING, TypeMemberPriority.SPECIFIED);
			
 
				
				 	}
			
 
				
				 
			
 
				
				 	private void visitUInt() {
			
--- a/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaBytecodeImplementation.java
+++ b/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaBytecodeImplementation.java
@@ -0,0 +1,16 @@
 
				
				+/*
			
 
				
				+ * To change this license header, choose License Headers in Project Properties.
			
 
				
				+ * To change this template file, choose Tools | Templates
			
 
				
				+ * and open the template in the editor.
			
 
				
				+ */
			
 
				
				+package org.openzen.zenscript.javabytecode;
			
 
				
				+
			
 
				
				+import org.openzen.zenscript.javabytecode.compiler.JavaWriter;
			
 
				
				+
			
 
				
				+/**
			
 
				
				+ *
			
 
				
				+ * @author Hoofdgebruiker
			
 
				
				+ */
			
 
				
				+public interface JavaBytecodeImplementation {
			
 
				
				+	public void compile(JavaWriter writer);
			
 
				
				+}
			
--- a/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaCompiler.java
+++ b/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaCompiler.java
@@ -12,6 +12,7 @@ import org.objectweb.asm.Opcodes;
 
				
				 import org.openzen.zenscript.codemodel.HighLevelDefinition;
			
 
				
				 import org.openzen.zenscript.codemodel.ScriptBlock;
			
 
				
				 import org.openzen.zenscript.codemodel.statement.Statement;
			
 
				
				+import org.openzen.zenscript.codemodel.type.member.BuiltinTypeMembers;
			
 
				
				 import org.openzen.zenscript.javabytecode.compiler.JavaStatementVisitor;
			
 
				
				 import org.openzen.zenscript.javabytecode.compiler.JavaWriter;
			
 
				
				 import org.openzen.zenscript.shared.SourceFile;
			
@@ -21,6 +22,24 @@ import org.openzen.zenscript.shared.SourceFile;
 
				
				  * @author Hoofdgebruiker
			
 
				
				  */
			
 
				
				 public class JavaCompiler {
			
 
				
				+	static { // Runs once when JavaCompiler is loaded: attaches the Java back-end tags to the shared BuiltinTypeMembers instances
			
 
				
				+		JavaClassInfo jInteger = new JavaClassInfo("java/lang/Integer"); // internal (slash-separated) class name
			
 
				
				+		BuiltinTypeMembers.INT_GET_MIN_VALUE.setTag(JavaFieldInfo.class, new JavaFieldInfo(jInteger, "MIN_VALUE", "I")); // field info for java/lang/Integer.MIN_VALUE, descriptor I (int)
			
 
				
				+		BuiltinTypeMembers.INT_GET_MAX_VALUE.setTag(JavaFieldInfo.class, new JavaFieldInfo(jInteger, "MAX_VALUE", "I")); // field info for java/lang/Integer.MAX_VALUE, descriptor I (int)
			
 
				
				+		
			
 
				
				+		BuiltinTypeMembers.INT_TO_BYTE.setTag(JavaBytecodeImplementation.class, writer -> writer.i2b()); // NOTE(review): if i2b() emits the JVM I2B opcode it sign-extends; byte sits next to a separate sbyte type, so an unsigned byte may need masking instead - confirm
			
 
				
				+		BuiltinTypeMembers.INT_TO_SBYTE.setTag(JavaBytecodeImplementation.class, writer -> writer.i2b());
			
 
				
				+		BuiltinTypeMembers.INT_TO_SHORT.setTag(JavaBytecodeImplementation.class, writer -> writer.i2s());
			
 
				
				+		BuiltinTypeMembers.INT_TO_USHORT.setTag(JavaBytecodeImplementation.class, writer -> writer.i2s()); // NOTE(review): same call as the signed short cast; an unsigned 16-bit target would normally be zero-extended - confirm
			
 
				
				+		BuiltinTypeMembers.INT_TO_UINT.setTag(JavaBytecodeImplementation.class, writer -> {}); // emits nothing: the value on the stack is left as it is
			
 
				
				+		BuiltinTypeMembers.INT_TO_LONG.setTag(JavaBytecodeImplementation.class, writer -> writer.i2l());
			
 
				
				+		BuiltinTypeMembers.INT_TO_ULONG.setTag(JavaBytecodeImplementation.class, writer -> writer.i2l());
			
 
				
				+		BuiltinTypeMembers.INT_TO_FLOAT.setTag(JavaBytecodeImplementation.class, writer -> writer.i2f());
			
 
				
				+		BuiltinTypeMembers.INT_TO_DOUBLE.setTag(JavaBytecodeImplementation.class, writer -> writer.i2d());
			
 
				
				+		BuiltinTypeMembers.INT_TO_CHAR.setTag(JavaBytecodeImplementation.class, writer -> writer.i2s()); // NOTE(review): a JVM char is unsigned 16-bit, so I2C would be expected rather than I2S - confirm, and check whether JavaWriter offers i2c()
			
 
				
				+		BuiltinTypeMembers.INT_TO_STRING.setTag(JavaMethodInfo.class, new JavaMethodInfo(jInteger, "toString", "(I)Ljava/lang/String;", true)); // Integer.toString(int), registered with isStatic = true
			
 
				
				+	}
			
 
				
				+	
			
 
				
				 	private final JavaModule target;
			
 
				
				 	private final List<String> scriptBlockNames = new ArrayList<>();
			
 
				
				 	private final ClassWriter scriptsClassWriter;
			
--- a/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaMethodInfo.java
+++ b/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/JavaMethodInfo.java
@@ -13,10 +13,16 @@ public class JavaMethodInfo {
 
				
				 	public final JavaClassInfo javaClass;
			
 
				
				 	public final String name;
			
 
				
				 	public final String signature;
			
 
				
				+	public final boolean isStatic;
			
 
				
				 	
			
 
				
				 	public JavaMethodInfo(JavaClassInfo javaClass, String name, String signature) { // three-argument overload kept for existing callers
			
 
				
				+		this(javaClass, name, signature, false); // delegates with isStatic = false
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	public JavaMethodInfo(JavaClassInfo javaClass, String name, String signature, boolean isStatic) { // full constructor: stores all four values in the public final fields
			
 
				
				 		this.javaClass = javaClass;
			
 
				
				 		this.name = name;
			
 
				
				 		this.signature = signature;
			
 
				
				+		this.isStatic = isStatic; // true when the method is a static method
			
 
				
				 	}
			
 
				
				 }
			
--- a/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/compiler/JavaExpressionVisitor.java
+++ b/JavaBytecodeCompiler/src/main/java/org/openzen/zenscript/javabytecode/compiler/JavaExpressionVisitor.java
@@ -1,6 +1,7 @@
 
				
				 package org.openzen.zenscript.javabytecode.compiler;

			
 
				
				 

			
 
				
				 import org.openzen.zenscript.codemodel.expression.*;

			
 
				
				+import org.openzen.zenscript.javabytecode.JavaBytecodeImplementation;

			
 
				
				 import org.openzen.zenscript.javabytecode.JavaFieldInfo;

			
 
				
				 import org.openzen.zenscript.javabytecode.JavaMethodInfo;

			
 
				
				 

			
@@ -29,20 +30,32 @@ public class JavaExpressionVisitor implements ExpressionVisitor<Void> {
 
				
				 

			
 
				
				     @Override

			
 
				
				     public Void visitCall(CallExpression expression) {

			
 
				
				-

			
 
				
				         expression.target.accept(this);

			
 
				
				         for (Expression argument : expression.arguments.arguments) {

			
 
				
				             argument.accept(this);

			
 
				
				         }

			
 
				
				 		

			
 
				
				+		JavaBytecodeImplementation implementation = expression.member.getTag(JavaBytecodeImplementation.class);

			
 
				
				+		if (implementation != null) {

			
 
				
				+			implementation.compile(javaWriter);

			
 
				
				+			return null;

			
 
				
				+		}

			
 
				
				+		

			
 
				
				 		JavaMethodInfo methodInfo = expression.member.getTag(JavaMethodInfo.class);

			
 
				
				 		if (methodInfo == null)

			
 
				
				 			throw new IllegalStateException("Call target has no method info!");

			
 
				
				 		

			
 
				
				-        javaWriter.invokeVirtual(

			
 
				
				-				methodInfo.javaClass.internalClassName,

			
 
				
				-				methodInfo.name,

			
 
				
				-				methodInfo.signature);

			
 
				
				+		if (methodInfo.isStatic) {

			
 
				
				+			javaWriter.invokeStatic(

			
 
				
				+					methodInfo.javaClass.internalClassName,

			
 
				
				+					methodInfo.name,

			
 
				
				+					methodInfo.signature);

			
 
				
				+		} else {

			
 
				
				+			javaWriter.invokeVirtual(

			
 
				
				+					methodInfo.javaClass.internalClassName,

			
 
				
				+					methodInfo.name,

			
 
				
				+					methodInfo.signature);

			
 
				
				+		}

			
 
				
				 		

			
 
				
				         return null;

			
 
				
				     }

			
--- a/Parser/src/main/java/org/openzen/zenscript/parser/expression/ParsedExpression.java
+++ b/Parser/src/main/java/org/openzen/zenscript/parser/expression/ParsedExpression.java
@@ -29,7 +29,7 @@ import org.openzen.zenscript.parser.type.IParsedType;
 
				
				 import org.openzen.zenscript.shared.CodePosition;
			
 
				
				 import org.openzen.zenscript.shared.CompileException;
			
 
				
				 import org.openzen.zenscript.shared.CompileExceptionCode;
			
 
				
				-import static org.openzen.zenscript.shared.StringUtils.unescapeString;
			
 
				
				+import static org.openzen.zenscript.shared.StringUtils.unescape;
			
 
				
				 
			
 
				
				 /**
			
 
				
				  *
			
@@ -315,7 +315,7 @@ public abstract class ParsedExpression {
 
				
				 						indexString2 = parser.optional(T_STRING_DQ);
			
 
				
				 					
			
 
				
				 					if (indexString2 != null) {
			
 
				
				-						base = new ParsedExpressionMember(position, base, unescapeString(indexString2.content), Collections.emptyList());
			
 
				
				+						base = new ParsedExpressionMember(position, base, unescape(indexString2.content), Collections.emptyList());
			
 
				
				 					} else {
			
 
				
				 						ZSToken last = parser.next();
			
 
				
				 						throw new ParseException(last, "Invalid expression, last token: " + last.content);
			
@@ -364,7 +364,7 @@ public abstract class ParsedExpression {
 
				
				 			case T_STRING_DQ:
			
 
				
				 				return new ParsedExpressionString(
			
 
				
				 						position,
			
 
				
				-						unescapeString(parser.next().content));
			
 
				
				+						unescape(parser.next().content));
			
 
				
				 			case T_IDENTIFIER: {
			
 
				
				 				String name = parser.next().content;
			
 
				
				 				List<IParsedType> genericParameters = IParsedType.parseGenericParameters(parser);
			
--- a/ScriptingExample/scripts/helloworld.zs
+++ b/ScriptingExample/scripts/helloworld.zs
@@ -1 +1,2 @@
 
				
				 println("Hello world!");
			
 
				
				+println(5);
			
--- a/Shared/src/main/java/org/openzen/zenscript/shared/StringUtils.java
+++ b/Shared/src/main/java/org/openzen/zenscript/shared/StringUtils.java
@@ -5,390 +5,316 @@
 
				
				  */
			
 
				
				 package org.openzen.zenscript.shared;
			
 
				
				 
			
 
				
				+import java.io.IOException;
			
 
				
				+import java.io.InputStream;
			
 
				
				+import java.util.Collection;
			
 
				
				+import java.util.HashMap;
			
 
				
				+import java.util.Map;
			
 
				
				+import java.util.Properties;
			
 
				
				+import java.util.logging.Level;
			
 
				
				+import java.util.logging.Logger;
			
 
				
				+import java.util.regex.Pattern;
			
 
				
				+
			
 
				
				 /**
			
 
				
				  *
			
 
				
				  * @author Hoofdgebruiker
			
 
				
				  */
			
 
				
				 public class StringUtils {
			
 
				
				+	private static final Map<String, CharacterEntity> NAMED_CHARACTER_ENTITIES;
			
 
				
				+	private static final Pattern MATCH_ACCENTS = Pattern.compile("\\p{M}");
			
 
				
				+	
			
 
				
				+	static
			
 
				
				+	{
			
 
				
				+		NAMED_CHARACTER_ENTITIES = new HashMap<>();
			
 
				
				+		
			
 
				
				+		Properties properties = new Properties();
			
 
				
				+		try {
			
 
				
				+			InputStream input = String.class.getResourceAsStream("/org/openzen/zenscript/shared/characterEntities.properties");
			
 
				
				+			if (input != null)
			
 
				
				+				properties.load(input);
			
 
				
				+			else
			
 
				
				+				System.out.println("Warning: could not load character entities");
			
 
				
				+		} catch (IOException ex) {
			
 
				
				+			Logger.getLogger(StringUtils.class.getName()).log(Level.SEVERE, null, ex);
			
 
				
				+		}
			
 
				
				+		
			
 
				
				+		for (Object okey : properties.keySet()) {
			
 
				
				+			String key = okey.toString();
			
 
				
				+			char value = (char) Integer.parseInt(properties.getProperty(key));
			
 
				
				+			CharacterEntity entity = new CharacterEntity(key, value);
			
 
				
				+			NAMED_CHARACTER_ENTITIES.put(entity.stringValue, entity);
			
 
				
				+		}
			
 
				
				+	}
			
 
				
				 	
			
 
				
				 	/**
			
 
				
				+	 * Left pads (prefixes) a string with characters until it reaches the given string
			
 
				
				+	 * length. Does not do anything if the string length &gt;= given length.
			
 
				
				 	 * 
			
 
				
				-	 * unescape_perl_string()
			
 
				
				-	 * 
			
 
				
				-	 * Tom Christiansen <tchrist@perl.com> Sun Nov 28 12:55:24 MST 2010
			
 
				
				-	 * 
			
 
				
				-	 * It's completely ridiculous that there's no standard unescape_java_string
			
 
				
				-	 * function. Since I have to do the damn thing myself, I might as well make
			
 
				
				-	 * it halfway useful by supporting things Java was too stupid to consider in
			
 
				
				-	 * strings:
			
 
				
				-	 * 
			
 
				
				-	 * => "?" items are additions to Java string escapes but normal in Java
			
 
				
				-	 * regexes
			
 
				
				-	 * 
			
 
				
				-	 * => "!" items are also additions to Java regex escapes
			
 
				
				-	 * 
			
 
				
				-	 * Standard singletons: ?\a ?\e \f \n \r \t
			
 
				
				-	 * 
			
 
				
				-	 * NB: \b is unsupported as backspace so it can pass-through to the regex
			
 
				
				-	 * translator untouched; I refuse to make anyone doublebackslash it as
			
 
				
				-	 * doublebackslashing is a Java idiocy I desperately wish would die out.
			
 
				
				-	 * There are plenty of other ways to write it:
			
 
				
				+	 * @param value value to be padded
			
 
				
				+	 * @param length desired string length
			
 
				
				+	 * @param c padding character
			
 
				
				+	 * @return padded string
			
 
				
				+	 */
			
 
				
				+	public static String lpad(String value, int length, char c)
			
 
				
				+	{
			
 
				
				+		if (value.length() >= length)
			
 
				
				+			return value;
			
 
				
				+		
			
 
				
				+		return times(c, length - value.length()) + value;
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Right pads (suffixes) a string with characters until it reaches the given
			
 
				
				+	 * string length. Does not do anything if the string length &gt;= given length.
			
 
				
				 	 * 
			
 
				
				-	 * \cH, \12, \012, \x08 \x{8}, \u0008, \U00000008
			
 
				
				+	 * @param value value to be padded
			
 
				
				+	 * @param length desired string length
			
 
				
				+	 * @param c padding character
			
 
				
				+	 * @return padded string
			
 
				
				+	 */
			
 
				
				+	public static String rpad(String value, int length, char c)
			
 
				
				+	{
			
 
				
				+		if (value.length() >= length)
			
 
				
				+			return value;
			
 
				
				+		
			
 
				
				+		return value + times(c, length - value.length());
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Constructs a string with count times the given character.
			
 
				
				 	 * 
			
 
				
				-	 * Octal escapes: \0 \0N \0NN \N \NN \NNN Can range up to !\777 not \377
			
 
				
				+	 * @param c filling character
			
 
				
				+	 * @param count character count
			
 
				
				+	 * @return string value
			
 
				
				+	 */
			
 
				
				+	public static String times(char c, int count)
			
 
				
				+	{
			
 
				
				+		char[] value = new char[count];
			
 
				
				+		for (int i = 0; i < count; i++) {
			
 
				
				+			value[i] = c;
			
 
				
				+		}
			
 
				
				+		return new String(value);
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Unescapes a string escaped in one of following ways:
			
 
				
				 	 * 
			
 
				
				-	 * TODO: add !\o{NNNNN} last Unicode is 4177777 maxint is 37777777777
			
 
				
				+	 * <ul>
			
 
				
				+	 * <li>A string escaped with single quotes (<code>'Hello "my" world'</code>)</li>
			
 
				
				+	 * <li>A string escaped with double quotes (<code>"Hello 'my' world"</code>)</li>
			
 
				
				+	 * <li>A near-literal string (<code>@"C:\Program Files\"</code>) in which escape sequences
			
 
				
				+	 * aren't processed but the " character cannot occur</li>
			
 
				
				+	 * </ul>
			
 
				
				 	 * 
			
 
				
				-	 * Control chars: ?\cX Means: ord(X) ^ ord('@')
			
 
				
				+	 * The following escape sequences are recognized:
			
 
				
				+	 * <ul>
			
 
				
				+	 * <li>\\</li>
			
 
				
				+	 * <li>\'</li>
			
 
				
				+	 * <li>\"</li>
			
 
				
				+	 * <li>\&amp;namedCharacterEntity; (note that although redundant, \&amp;#ddd; and \&amp;#xXXXX; are also allowed)</li>
			
 
				
				+	 * <li>\t</li>
			
 
				
				+	 * <li>\n</li>
			
 
				
				+	 * <li>\r</li>
			
 
				
				+	 * <li>\b</li>
			
 
				
				+	 * <li>\f</li>
			
 
				
				+	 * <li>&#92;uXXXX for Unicode code points (exactly four hex digits)</li>
			
 
				
				+	 * </ul>
			
 
				
				 	 * 
			
 
				
				-	 * Old hex escapes: \xXX unbraced must be 2 xdigits
			
 
				
				+	 * @param escapedString escaped string
			
 
				
				+	 * @return unescaped string
			
 
				
				+	 */
			
 
				
				+	public static String unescape(String escapedString)
			
 
				
				+	{
			
 
				
				+		if (escapedString.length() < 2)
			
 
				
				+			throw new IllegalArgumentException("String is not quoted");
			
 
				
				+		
			
 
				
				+		boolean isLiteral = escapedString.charAt(0) == '@';
			
 
				
				+		if (isLiteral)
			
 
				
				+			escapedString = escapedString.substring(1);
			
 
				
				+		
			
 
				
				+		if (escapedString.charAt(0) != '"' && escapedString.charAt(0) != '\'')
			
 
				
				+			throw new IllegalArgumentException("String is not quoted");
			
 
				
				+		
			
 
				
				+		char quoteCharacter = escapedString.charAt(0);
			
 
				
				+		if (escapedString.charAt(escapedString.length() - 1) != quoteCharacter)
			
 
				
				+			throw new IllegalArgumentException("Unbalanced quotes");
			
 
				
				+		
			
 
				
				+		if (isLiteral)
			
 
				
				+			return escapedString.substring(1, escapedString.length() - 1);
			
 
				
				+		
			
 
				
				+		StringBuilder result = new StringBuilder(escapedString.length() - 2);
			
 
				
				+		
			
 
				
				+		for (int i = 1; i < escapedString.length() - 1; i++) {
			
 
				
				+			if (escapedString.charAt(i) == '\\') {
			
 
				
				+				if (i >= escapedString.length() - 1)
			
 
				
				+					throw new IllegalArgumentException("Unfinished escape sequence");
			
 
				
				+				
			
 
				
				+				switch (escapedString.charAt(i + 1)) {
			
 
				
				+					case '\\': i++; result.append('\\'); break;
			
 
				
				+					case '&':
			
 
				
				+						CharacterEntity characterEntity = readCharacterEntity(escapedString, i + 1);
			
 
				
				+						i += characterEntity.stringValue.length() + 2;
			
 
				
				+						result.append(characterEntity.charValue);
			
 
				
				+						break;
			
 
				
				+					case 't': i++; result.append('\t'); break;
			
 
				
				+					case 'r': i++; result.append('\r'); break;
			
 
				
				+					case 'n': i++; result.append('\n'); break;
			
 
				
				+					case 'b': i++; result.append('\b'); break;
			
 
				
				+					case 'f': i++; result.append('\f'); break;
			
 
				
				+					case '"': i++; result.append('\"'); break;
			
 
				
				+					case '\'': i++; result.append('\''); break;
			
 
				
				+					case 'u':
			
 
				
				+						if (i >= escapedString.length() - 5)
			
 
				
				+							throw new IllegalArgumentException("Unfinished escape sequence");
			
 
				
				+						int hex0 = readHexCharacter(escapedString.charAt(i + 2));
			
 
				
				+						int hex1 = readHexCharacter(escapedString.charAt(i + 3));
			
 
				
				+						int hex2 = readHexCharacter(escapedString.charAt(i + 4));
			
 
				
				+						int hex3 = readHexCharacter(escapedString.charAt(i + 5));
			
 
				
				+						i += 5;
			
 
				
				+						result.append((hex0 << 12) | (hex1 << 8) | (hex2 << 4) | hex3);
			
 
				
				+					default:
			
 
				
				+						throw new IllegalArgumentException("Illegal escape sequence");
			
 
				
				+				}
			
 
				
				+			}
			
 
				
				+			else
			
 
				
				+				result.append(escapedString.charAt(i));
			
 
				
				+		}
			
 
				
				+		
			
 
				
				+		return result.toString();
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Escapes special characters in the given string, including the quote character passed as <code>quote</code>.
			
 
				
				+	 * Adds opening and closing quotes.
			
 
				
				 	 * 
			
 
				
				-	 * Perl hex escapes: !\x{XXX} braced may be 1-8 xdigits NB: proper Unicode
			
 
				
				-	 * never needs more than 6, as highest valid codepoint is 0x10FFFF, not
			
 
				
				-	 * maxint 0xFFFFFFFF
			
 
				
				+	 * @param value value to be escaped
			
 
				
				+	 * @param quote character (' or ")
			
 
				
				+	 * @param escapeUnicode true to escape any non-ascii value, false to leave them be
			
 
				
				+	 * @return escaped value
			
 
				
				+	 */
			
 
				
				+	public static String escape(String value, char quote, boolean escapeUnicode)
			
 
				
				+	{
			
 
				
				+		StringBuilder output = new StringBuilder();
			
 
				
				+		output.append(quote);
			
 
				
				+		for (char c : value.toCharArray()) {
			
 
				
				+			switch (c) {
			
 
				
				+				case '"': if (quote == '"') output.append("\\\""); break;
			
 
				
				+				case '\'': if (quote == '\'') output.append("\\\'"); break;
			
 
				
				+				case '\n': output.append("\\n"); break;
			
 
				
				+				case '\r': output.append("\\r"); break;
			
 
				
				+				case '\t': output.append("\\t"); break;
			
 
				
				+				default:
			
 
				
				+					if (escapeUnicode && c > 127) {
			
 
				
				+						output.append("\\u");
			
 
				
				+						output.append(lpad(Integer.toHexString(c), 4, '0'));
			
 
				
				+					} else {
			
 
				
				+						output.append(c);
			
 
				
				+					}
			
 
				
				+			}
			
 
				
				+		}
			
 
				
				+		
			
 
				
				+		output.append(quote);
			
 
				
				+		return output.toString();
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Reads a single hex digit and converts it to a value 0-15.
			
 
				
				 	 * 
			
 
				
				-	 * Lame Java escape: \[IDIOT JAVA PREPROCESSOR]uXXXX must be exactly 4
			
 
				
				-	 * xdigits;
			
 
				
				+	 * @param hex hex digit
			
 
				
				+	 * @return converted value
			
 
				
				+	 */
			
 
				
				+	public static int readHexCharacter(char hex)
			
 
				
				+	{
			
 
				
				+		if (hex >= '0' && hex <= '9')
			
 
				
				+			return hex - '0';
			
 
				
				+		
			
 
				
				+		if (hex >= 'A' && hex <= 'F')
			
 
				
				+			return hex - 'A' + 10;
			
 
				
				+		
			
 
				
				+		if (hex >= 'a' && hex <= 'f')
			
 
				
				+			return hex - 'a' + 10;
			
 
				
				+		
			
 
				
				+		throw new IllegalArgumentException("Illegal hex character: " + hex);
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Retrieves all official named character entities.
			
 
				
				 	 * 
			
 
				
				-	 * I can't write XXXX in this comment where it belongs because the damned
			
 
				
				-	 * Java Preprocessor can't mind its own business. Idiots!
			
 
				
				+	 * @return named character entities
			
 
				
				+	 */
			
 
				
				+	public static Collection<CharacterEntity> getNamedCharacterEntities()
			
 
				
				+	{
			
 
				
				+		return NAMED_CHARACTER_ENTITIES.values();
			
 
				
				+	}
			
 
				
				+	
			
 
				
				+	/**
			
 
				
				+	 * Reads a single character entity (formatted as &amp;characterEntity;) at the
			
 
				
				+	 * given string offset.
			
 
				
				 	 * 
			
 
				
				-	 * Lame Python escape: !\UXXXXXXXX must be exactly 8 xdigits
			
 
				
				+	 * The following formats are supported:
			
 
				
				+	 * <ul>
			
 
				
				+	 * <li>&amp;namedCharacterEntity;</li>
			
 
				
				+	 * <li>&amp;#ddd</li>
			
 
				
				+	 * <li>&amp;#xXXXX</li>
			
 
				
				+	 * </ul>
			
 
				
				 	 * 
			
 
				
				-	 * TODO: Perl translation escapes: \Q \U \L \E \[IDIOT JAVA PREPROCESSOR]u
			
 
				
				-	 * \l These are not so important to cover if you're passing the result to
			
 
				
				-	 * Pattern.compile(), since it handles them for you further downstream. Hm,
			
 
				
				-	 * what about \[IDIOT JAVA PREPROCESSOR]u?
			
 
				
				+	 * The returned value includes the character entity, without the enclosing
			
 
				
				+	 * &amp; and ; characters.
			
 
				
				 	 * 
			
 
				
				-	 * @param oldstr
			
 
				
				-	 * @return
			
 
				
				+	 * @param str string value to search in
			
 
				
				+	 * @param offset offset to look at
			
 
				
				+	 * @return character entity
			
 
				
				+	 * @throws IllegalArgumentException if the given string does not contain a
			
 
				
				+	 *	valid character entity at the given position
			
 
				
				 	 */
			
 
				
				-	public static String unescapeString(String oldstr) {
			
 
				
				-		if ((oldstr.charAt(0) != '"' || oldstr.charAt(oldstr.length() - 1) != '"')
			
 
				
				-				&& (oldstr.charAt(0) != '\'' || oldstr.charAt(oldstr.length() - 1) != '\'')) {
			
 
				
				-			// TODO: error
			
 
				
				-			// throw new TweakerExecuteException("Not a valid string constant: "
			
 
				
				-			// + oldstr);
			
 
				
				-		}
			
 
				
				-		oldstr = oldstr.substring(1, oldstr.length() - 1);
			
 
				
				-
			
 
				
				-		/*
			
 
				
				-		 * In contrast to fixing Java's broken regex charclasses, this one need
			
 
				
				-		 * be no bigger, as unescaping shrinks the string here, where in the
			
 
				
				-		 * other one, it grows it.
			
 
				
				-		 */
			
 
				
				-
			
 
				
				-		StringBuilder newstr = new StringBuilder(oldstr.length());
			
 
				
				-
			
 
				
				-		boolean saw_backslash = false;
			
 
				
				-
			
 
				
				-		for (int i = 0; i < oldstr.length(); i++) {
			
 
				
				-			int cp = oldstr.codePointAt(i);
			
 
				
				-			if (oldstr.codePointAt(i) > Character.MAX_VALUE) {
			
 
				
				-				i++;
			
 
				
				-				/**** WE HATES UTF-16! WE HATES IT FOREVERSES!!! ****/
			
 
				
				-			}
			
 
				
				-
			
 
				
				-			if (!saw_backslash) {
			
 
				
				-				if (cp == '\\') {
			
 
				
				-					saw_backslash = true;
			
 
				
				-				} else {
			
 
				
				-					newstr.append(Character.toChars(cp));
			
 
				
				-				}
			
 
				
				-				continue; /* switch */
			
 
				
				-			}
			
 
				
				-
			
 
				
				-			if (cp == '\\') {
			
 
				
				-				saw_backslash = false;
			
 
				
				-				newstr.append('\\');
			
 
				
				-				continue; /* switch */
			
 
				
				-			}
			
 
				
				-
			
 
				
				-			switch (cp) {
			
 
				
				-
			
 
				
				-				case 'r':
			
 
				
				-					newstr.append('\r');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				case 'n':
			
 
				
				-					newstr.append('\n');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				case 'f':
			
 
				
				-					newstr.append('\f');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				/* PASS a \b THROUGH!! */
			
 
				
				-				case 'b':
			
 
				
				-					newstr.append("\\b");
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				case 't':
			
 
				
				-					newstr.append('\t');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				case 'a':
			
 
				
				-					newstr.append('\007');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				case 'e':
			
 
				
				-					newstr.append('\033');
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				-				/*
			
 
				
				-				 * A "control" character is what you get when you xor its
			
 
				
				-				 * codepoint with '@'==64. This only makes sense for ASCII, and
			
 
				
				-				 * may not yield a "control" character after all.
			
 
				
				-				 * 
			
 
				
				-				 * Strange but true: "\c{" is ";", "\c}" is "=", etc.
			
 
				
				-				 */
			
 
				
				-				case 'c': {
			
 
				
				-					if (++i == oldstr.length()) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException("trailing \\c");
			
 
				
				-					}
			
 
				
				-					cp = oldstr.codePointAt(i);
			
 
				
				-					/*
			
 
				
				-					 * don't need to grok surrogates, as next line blows them up
			
 
				
				-					 */
			
 
				
				-					if (cp > 0x7f) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "expected ASCII after \\c");
			
 
				
				-					}
			
 
				
				-					newstr.append(Character.toChars(cp ^ 64));
			
 
				
				-					break; /* switch */
			
 
				
				-				}
			
 
				
				-
			
 
				
				-				case '8':
			
 
				
				-				case '9':
			
 
				
				-					// TODO: error
			
 
				
				-					// throw new TweakerExecuteException("illegal octal digit");
			
 
				
				-					/* NOTREACHED */
			
 
				
				-
			
 
				
				-					/*
			
 
				
				-					 * may be 0 to 2 octal digits following this one so back up
			
 
				
				-					 * one for fallthrough to next case; unread this digit and
			
 
				
				-					 * fall through to next case.
			
 
				
				-					 */
			
 
				
				-				case '1':
			
 
				
				-				case '2':
			
 
				
				-				case '3':
			
 
				
				-				case '4':
			
 
				
				-				case '5':
			
 
				
				-				case '6':
			
 
				
				-				case '7':
			
 
				
				-					--i;
			
 
				
				-					/* FALLTHROUGH */
			
 
				
				-
			
 
				
				-					/*
			
 
				
				-					 * Can have 0, 1, or 2 octal digits following a 0 this
			
 
				
				-					 * permits larger values than octal 377, up to octal 777.
			
 
				
				-					 */
			
 
				
				-				case '0': {
			
 
				
				-					if (i + 1 == oldstr.length()) {
			
 
				
				-						/* found \0 at end of string */
			
 
				
				-						newstr.append(Character.toChars(0));
			
 
				
				-						break; /* switch */
			
 
				
				-					}
			
 
				
				-					i++;
			
 
				
				-					int digits = 0;
			
 
				
				-					int j;
			
 
				
				-					for (j = 0; j <= 2; j++) {
			
 
				
				-						if (i + j == oldstr.length()) {
			
 
				
				-							break; /* for */
			
 
				
				-						}
			
 
				
				-						/* safe because will unread surrogate */
			
 
				
				-						int ch = oldstr.charAt(i + j);
			
 
				
				-						if (ch < '0' || ch > '7') {
			
 
				
				-							break; /* for */
			
 
				
				-						}
			
 
				
				-						digits++;
			
 
				
				-					}
			
 
				
				-					if (digits == 0) {
			
 
				
				-						--i;
			
 
				
				-						newstr.append('\0');
			
 
				
				-						break; /* switch */
			
 
				
				-					}
			
 
				
				-					int value = 0;
			
 
				
				-					try {
			
 
				
				-						value = Integer
			
 
				
				-							.parseInt(oldstr.substring(i, i + digits), 8);
			
 
				
				-					} catch (NumberFormatException nfe) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "invalid octal value for \\0 escape");
			
 
				
				-					}
			
 
				
				-					newstr.append(Character.toChars(value));
			
 
				
				-					i += digits - 1;
			
 
				
				-					break; /* switch */
			
 
				
				-				} /* end case '0' */
			
 
				
				-
			
 
				
				-				case 'x': {
			
 
				
				-					if (i + 2 > oldstr.length()) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "string too short for \\x escape");
			
 
				
				-					}
			
 
				
				-					i++;
			
 
				
				-					boolean saw_brace = false;
			
 
				
				-					if (oldstr.charAt(i) == '{') {
			
 
				
				-						/* ^^^^^^ ok to ignore surrogates here */
			
 
				
				-						i++;
			
 
				
				-						saw_brace = true;
			
 
				
				-					}
			
 
				
				-					int j;
			
 
				
				-					for (j = 0; j < 8; j++) {
			
 
				
				-
			
 
				
				-						if (!saw_brace && j == 2) {
			
 
				
				-							break; /* for */
			
 
				
				-						}
			
 
				
				-
			
 
				
				-						/*
			
 
				
				-						 * ASCII test also catches surrogates
			
 
				
				-						 */
			
 
				
				-						int ch = oldstr.charAt(i + j);
			
 
				
				-						if (ch > 127) {
			
 
				
				-							// TODO: error
			
 
				
				-							// throw new TweakerExecuteException(
			
 
				
				-							// "illegal non-ASCII hex digit in \\x escape");
			
 
				
				-						}
			
 
				
				-
			
 
				
				-						if (saw_brace && ch == '}') {
			
 
				
				-							break; /* for */
			
 
				
				-						}
			
 
				
				-
			
 
				
				-						if (!((ch >= '0' && ch <= '9') || (ch >= 'a' && ch <= 'f') || (ch >= 'A' && ch <= 'F'))) {
			
 
				
				-							// TODO: error
			
 
				
				-							// throw new TweakerExecuteException(String.format(
			
 
				
				-							// "illegal hex digit #%d '%c' in \\x", ch, ch));
			
 
				
				-						}
			
 
				
				-
			
 
				
				-					}
			
 
				
				-					if (j == 0) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "empty braces in \\x{} escape");
			
 
				
				-					}
			
 
				
				-					int value = 0;
			
 
				
				-					try {
			
 
				
				-						value = Integer.parseInt(oldstr.substring(i, i + j), 16);
			
 
				
				-					} catch (NumberFormatException nfe) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "invalid hex value for \\x escape");
			
 
				
				-					}
			
 
				
				-					newstr.append(Character.toChars(value));
			
 
				
				-					if (saw_brace) {
			
 
				
				-						j++;
			
 
				
				-					}
			
 
				
				-					i += j - 1;
			
 
				
				-					break; /* switch */
			
 
				
				-				}
			
 
				
				-
			
 
				
				-				case 'u': {
			
 
				
				-					if (i + 4 > oldstr.length()) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "string too short for \\u escape");
			
 
				
				-					}
			
 
				
				-					i++;
			
 
				
				-					int j;
			
 
				
				-					for (j = 0; j < 4; j++) {
			
 
				
				-						/* this also handles the surrogate issue */
			
 
				
				-						if (oldstr.charAt(i + j) > 127) {
			
 
				
				-							// TODO: error
			
 
				
				-							// throw new TweakerExecuteException(
			
 
				
				-							// "illegal non-ASCII hex digit in \\u escape");
			
 
				
				-						}
			
 
				
				-					}
			
 
				
				-					int value = 0;
			
 
				
				-					try {
			
 
				
				-						value = Integer.parseInt(oldstr.substring(i, i + j), 16);
			
 
				
				-					} catch (NumberFormatException nfe) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "invalid hex value for \\u escape");
			
 
				
				-					}
			
 
				
				-					newstr.append(Character.toChars(value));
			
 
				
				-					i += j - 1;
			
 
				
				-					break; /* switch */
			
 
				
				-				}
			
 
				
				-
			
 
				
				-				case 'U': {
			
 
				
				-					if (i + 8 > oldstr.length()) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "string too short for \\U escape");
			
 
				
				-					}
			
 
				
				-					i++;
			
 
				
				-					int j;
			
 
				
				-					for (j = 0; j < 8; j++) {
			
 
				
				-						/* this also handles the surrogate issue */
			
 
				
				-						if (oldstr.charAt(i + j) > 127) {
			
 
				
				-							// TODO: error
			
 
				
				-							// throw new TweakerExecuteException(
			
 
				
				-							// "illegal non-ASCII hex digit in \\U escape");
			
 
				
				-						}
			
 
				
				-					}
			
 
				
				-					int value = 0;
			
 
				
				-					try {
			
 
				
				-						value = Integer.parseInt(oldstr.substring(i, i + j), 16);
			
 
				
				-					} catch (NumberFormatException nfe) {
			
 
				
				-						// TODO: error
			
 
				
				-						// throw new TweakerExecuteException(
			
 
				
				-						// "invalid hex value for \\U escape");
			
 
				
				-					}
			
 
				
				-					newstr.append(Character.toChars(value));
			
 
				
				-					i += j - 1;
			
 
				
				-					break; /* switch */
			
 
				
				-				}
			
 
				
				-
			
 
				
				-				default:
			
 
				
				-					newstr.append('\\');
			
 
				
				-					newstr.append(Character.toChars(cp));
			
 
				
				-					/*
			
 
				
				-					 * say(String.format(
			
 
				
				-					 * "DEFAULT unrecognized escape %c passed through", cp));
			
 
				
				-					 */
			
 
				
				-					break; /* switch */
			
 
				
				-
			
 
				
				+	public static CharacterEntity readCharacterEntity(String str, int offset)
				+	{
				+		// The shortest possible entity ("&lt;") needs four characters starting at
				+		// offset; a negative offset is rejected here as well so that it surfaces as
				+		// the documented IllegalArgumentException instead of an index error.
				+		if (offset < 0 || offset + 3 >= str.length())
				+			throw new IllegalArgumentException("Not a proper character entity");
				+		if (str.charAt(offset) != '&')
				+			throw new IllegalArgumentException("Not a proper character entity");
				+		
				+		int semi = str.indexOf(';', offset);
				+		if (semi < 0)
				+			throw new IllegalArgumentException("Not a proper character entity");
				+		
				+		// Entity text without the enclosing '&' and ';'.
				+		String entity = str.substring(offset + 1, semi);
				+		if (entity.isEmpty())
				+			throw new IllegalArgumentException("Not a proper character entity");
				+		
				+		// Named entities take precedence; a single lookup is enough.
				+		CharacterEntity named = NAMED_CHARACTER_ENTITIES.get(entity);
				+		if (named != null)
				+			return named;
				+		
				+		if (entity.charAt(0) == '#') {
				+			if (entity.length() < 2)
				+				throw new IllegalArgumentException("Not a proper character entity");
				+			
				+			// Integer.parseInt signals malformed digits with NumberFormatException,
				+			// which is itself an IllegalArgumentException.
				+			int ivalue;
				+			// The 'x' marker must be looked up in the entity text, not at the fixed
				+			// index 1 of the whole input string.
				+			if (entity.charAt(1) == 'x') {
				+				// hex character entity: "#x" followed by at least one hex digit
				+				if (entity.length() < 3)
				+					throw new IllegalArgumentException("Not a proper character entity");
				+				
				+				ivalue = Integer.parseInt(entity.substring(2), 16);
				+			} else {
				+				// decimal character entity
				+				ivalue = Integer.parseInt(entity.substring(1));
				 			}
				+			
				+			// CharacterEntity stores a single char, so refuse values that the cast
				+			// below would silently truncate.
				+			if (ivalue < Character.MIN_VALUE || ivalue > Character.MAX_VALUE)
				+				throw new IllegalArgumentException("Character entity out of range: " + entity);
				+			
				+			return new CharacterEntity(entity, (char) ivalue);
				-			saw_backslash = false;
				-		}
				-
				-		/* weird to leave one at the end */
				-		if (saw_backslash) {
				-			newstr.append('\\');
				 		}
				 		
				-		String result = newstr.toString();
				-		return result;
				+		throw new IllegalArgumentException("Not a valid named character entity");
				 	}
			
 
				
				-
			
 
				
				-	/*
			
 
				
				-	 * Return a string "U+XX.XXX.XXXX" etc, where each XX set is the xdigits of
			
 
				
				-	 * the logical Unicode code point. No bloody brain-damaged UTF-16 surrogate
			
 
				
				-	 * crap, just true logical characters.
			
 
				
				-	 */
			
 
				
				-	private static String uniplus(String s) {
			
 
				
				-		if (s.length() == 0) {
			
 
				
				-			return "";
			
 
				
				-		}
			
 
				
				-		/* This is just the minimum; sb will grow as needed. */
			
 
				
				-		StringBuilder sb = new StringBuilder(2 + 3 * s.length());
			
 
				
				-		sb.append("U+");
			
 
				
				-		for (int i = 0; i < s.length(); i++) {
			
 
				
				-			sb.append(String.format("%X", s.codePointAt(i)));
			
 
				
				-			if (s.codePointAt(i) > Character.MAX_VALUE) {
			
 
				
				-				i++;
			
 
				
				-				/**** WE HATES UTF-16! WE HATES IT FOREVERSES!!! ****/
			
 
				
				-			}
			
 
				
				-			if (i + 1 < s.length()) {
			
 
				
				-				sb.append(".");
			
 
				
				-			}
			
 
				
				+	
			
 
				
				+	public static class CharacterEntity // pairs the text of a character entity with the character it denotes
				+	{
				+		public char charValue; // character this entity stands for
				+		public String stringValue; // entity text; readCharacterEntity passes it without the enclosing & and ;
				+		
				+		public CharacterEntity(String stringValue, char charValue) // note: text first, character second
				+		{
				+			this.charValue = charValue;
				+			this.stringValue = stringValue;
				 		}
				-		return sb.toString();
				 	}
			
 
				
				 }
			
--- a/src/main/resources/org/openzen/zenscript/shared/characterEntities.properties
+++ b/src/main/resources/org/openzen/zenscript/shared/characterEntities.properties
@@ -0,0 +1,266 @@
 
				
				+quot=34
			
 
				
				+amp=38
			
 
				
				+apos=39
			
 
				
				+lt=60
			
 
				
				+gt=62
			
 
				
				+
			
 
				
				+nbsp=160
			
 
				
				+iexcl=161
			
 
				
				+cent=162
			
 
				
				+pound=163
			
 
				
				+curren=164
			
 
				
				+yen=165
			
 
				
				+brvbar=166
			
 
				
				+sect=167
			
 
				
				+uml=168
			
 
				
				+copy=169
			
 
				
				+ordf=170
			
 
				
				+laquo=171
			
 
				
				+not=172
			
 
				
				+shy=173
			
 
				
				+reg=174
			
 
				
				+macr=175
			
 
				
				+deg=176
			
 
				
				+plusmn=177
			
 
				
				+sup2=178
			
 
				
				+sup3=179
			
 
				
				+acute=180
			
 
				
				+micro=181
			
 
				
				+para=182
			
 
				
				+middot=183
			
 
				
				+cedil=184
			
 
				
				+sup1=185
			
 
				
				+ordm=186
			
 
				
				+raquo=187
			
 
				
				+frac14=188
			
 
				
				+frac12=189
			
 
				
				+frac34=190
			
 
				
				+iquest=191
			
 
				
				+
			
 
				
				+Agrave=192
			
 
				
				+Aacute=193
			
 
				
				+Acirc=194
			
 
				
				+Atilde=195
			
 
				
				+Auml=196
			
 
				
				+Aring=197
			
 
				
				+AElig=198
			
 
				
				+Ccedil=199
			
 
				
				+Egrave=200
			
 
				
				+Eacute=201
			
 
				
				+Ecirc=202
			
 
				
				+Euml=203
			
 
				
				+Igrave=204
			
 
				
				+Iacute=205
			
 
				
				+Icirc=206
			
 
				
				+Iuml=207
			
 
				
				+ETH=208
			
 
				
				+Ntilde=209
			
 
				
				+Ograve=210
			
 
				
				+Oacute=211
			
 
				
				+Ocirc=212
			
 
				
				+Otilde=213
			
 
				
				+Ouml=214
			
 
				
				+times=215
			
 
				
				+Oslash=216
			
 
				
				+Ugrave=217
			
 
				
				+Uacute=218
			
 
				
				+Ucirc=219
			
 
				
				+Uuml=220
			
 
				
				+Yacute=221
			
 
				
				+THORN=222
			
 
				
				+szlig=223
			
 
				
				+agrave=224
			
 
				
				+aacute=225
			
 
				
				+acirc=226
			
 
				
				+atilde=227
			
 
				
				+auml=228
			
 
				
				+aring=229
			
 
				
				+aelig=230
			
 
				
				+ccedil=231
			
 
				
				+egrave=232
			
 
				
				+eacute=233
			
 
				
				+ecirc=234
			
 
				
				+euml=235
			
 
				
				+igrave=236
			
 
				
				+iacute=237
			
 
				
				+icirc=238
			
 
				
				+iuml=239
			
 
				
				+eth=240
			
 
				
				+ntilde=241
			
 
				
				+ograve=242
			
 
				
				+oacute=243
			
 
				
				+ocirc=244
			
 
				
				+otilde=245
			
 
				
				+ouml=246
			
 
				
				+divide=247
			
 
				
				+oslash=248
			
 
				
				+ugrave=249
			
 
				
				+uacute=250
			
 
				
				+ucirc=251
			
 
				
				+uuml=252
			
 
				
				+yacute=253
			
 
				
				+thorn=254
			
 
				
				+yuml=255
			
 
				
				+
			
 
				
				+OElig=338
			
 
				
				+oelig=339
			
 
				
				+Scaron=352
			
 
				
				+scaron=353
			
 
				
				+Yuml=376
			
 
				
				+
			
 
				
				+fnof=402
			
 
				
				+
			
 
				
				+circ=710
			
 
				
				+tilde=732
			
 
				
				+
			
 
				
				+Alpha=913
			
 
				
				+Beta=914
			
 
				
				+Gamma=915
			
 
				
				+Delta=916
			
 
				
				+Epsilon=917
			
 
				
				+Zeta=918
			
 
				
				+Eta=919
			
 
				
				+Theta=920
			
 
				
				+Iota=921
			
 
				
				+Kappa=922
			
 
				
				+Lambda=923
			
 
				
				+Mu=924
			
 
				
				+Nu=925
			
 
				
				+Xi=926
			
 
				
				+Omicron=927
			
 
				
				+Pi=928
			
 
				
				+Rho=929
			
 
				
				+Sigma=931
			
 
				
				+Tau=932
			
 
				
				+Upsilon=933
			
 
				
				+Phi=934
			
 
				
				+Chi=935
			
 
				
				+Psi=936
			
 
				
				+Omega=937
			
 
				
				+
			
 
				
				+alpha=945
			
 
				
				+beta=946
			
 
				
				+gamma=947
			
 
				
				+delta=948
			
 
				
				+epsilon=949
			
 
				
				+zeta=950
			
 
				
				+eta=951
			
 
				
				+theta=952
			
 
				
				+iota=953
			
 
				
				+kappa=954
			
 
				
				+lambda=955
			
 
				
				+mu=956
			
 
				
				+nu=957
			
 
				
				+xi=958
			
 
				
				+omicron=959
			
 
				
				+pi=960
			
 
				
				+rho=961
			
 
				
				+sigmaf=962
			
 
				
				+sigma=963
			
 
				
				+tau=964
			
 
				
				+upsilon=965
			
 
				
				+phi=966
			
 
				
				+chi=967
			
 
				
				+psi=968
			
 
				
				+omega=969
			
 
				
				+thetasym=977
			
 
				
				+upsih=978
			
 
				
				+piv=982
			
 
				
				+
			
 
				
				+ensp=8194
			
 
				
				+emsp=8195
			
 
				
				+thinsp=8201
			
 
				
				+zwnj=8204
			
 
				
				+zwj=8205
			
 
				
				+lrm=8206
			
 
				
				+rlm=8207
			
 
				
				+ndash=8211
			
 
				
				+mdash=8212
			
 
				
				+lsquo=8216
			
 
				
				+rsquo=8217
			
 
				
				+sbquo=8218
			
 
				
				+ldquo=8220
			
 
				
				+rdquo=8221
			
 
				
				+bdquo=8222
			
 
				
				+dagger=8224
			
 
				
				+Dagger=8225
			
 
				
				+bull=8226
			
 
				
				+hellip=8230
			
 
				
				+permil=8240
			
 
				
				+prime=8242
			
 
				
				+Prime=8243
			
 
				
				+lsaquo=8249
			
 
				
				+rsaquo=8250
			
 
				
				+oline=8254
			
 
				
				+frasl=8260
			
 
				
				+
			
 
				
				+euro=8364
			
 
				
				+
			
 
				
				+image=8465
			
 
				
				+weierp=8472
			
 
				
				+real=8476
			
 
				
				+trade=8482
			
 
				
				+alefsym=8501
			
 
				
				+
			
 
				
				+larr=8592
			
 
				
				+uarr=8593
			
 
				
				+rarr=8594
			
 
				
				+darr=8595
			
 
				
				+harr=8596
			
 
				
				+crarr=8629
			
 
				
				+lArr=8656
			
 
				
				+uArr=8657
			
 
				
				+rArr=8658
			
 
				
				+dArr=8659
			
 
				
				+hArr=8660
			
 
				
				+
			
 
				
				+forall=8704
			
 
				
				+part=8706
			
 
				
				+exist=8707
			
 
				
				+empty=8709
			
 
				
				+nabla=8711
			
 
				
				+isin=8712
			
 
				
				+notin=8713
			
 
				
				+ni=8715
			
 
				
				+prod=8719
			
 
				
				+sum=8721
			
 
				
				+minus=8722
			
 
				
				+lowast=8727
			
 
				
				+radic=8730
			
 
				
				+prop=8733
			
 
				
				+infin=8734
			
 
				
				+ang=8736
			
 
				
				+and=8743
			
 
				
				+or=8744
			
 
				
				+cap=8745
			
 
				
				+cup=8746
			
 
				
				+int=8747
			
 
				
				+there4=8756
			
 
				
				+sim=8764
			
 
				
				+cong=8773
			
 
				
				+asymp=8776
			
 
				
				+ne=8800
			
 
				
				+equiv=8801
			
 
				
				+le=8804
			
 
				
				+ge=8805
			
 
				
				+sub=8834
			
 
				
				+sup=8835
			
 
				
				+nsub=8836
			
 
				
				+sube=8838
			
 
				
				+supe=8839
			
 
				
				+oplus=8853
			
 
				
				+otimes=8855
			
 
				
				+perp=8869
			
 
				
				+sdot=8901
			
 
				
				+
			
 
				
				+lceil=8968
			
 
				
				+rceil=8969
			
 
				
				+lfloor=8970
			
 
				
				+rfloor=8971
			
 
				
				+lang=9001
			
 
				
				+rang=9002
			
 
				
				+loz=9674
			
 
				
				+spades=9824
			
 
				
				+clubs=9827
			
 
				
				+hearts=9829
			
 
				
				+diams=9830