[Jython-checkins] SF.net SVN: jython:[6488] branches/newstr/src

SourceForge Headquarters 225 Broadway Suite 1600 San Diego, CA 92101 +1 (858) 422-6466

Revision: 6488
          http://jython.svn.sourceforge.net/jython/?rev=6488&view=rev
Author:   zyasoft
Date:     2009-06-21 03:17:50 +0000 (Sun, 21 Jun 2009)

Log Message:
-----------
Added PyNew* versions of PyString and PyUnicode to enable incremental refactoring.

Modified Paths:
--------------
    branches/newstr/src/templates/mappings

Added Paths:
-----------
    branches/newstr/src/org/python/core/PyNewString.java
    branches/newstr/src/org/python/core/PyNewStringDerived.java
    branches/newstr/src/org/python/core/PyNewUnicode.java
    branches/newstr/src/org/python/core/PyNewUnicodeDerived.java
    branches/newstr/src/templates/newstr.derived
    branches/newstr/src/templates/newunicode.derived

Added: branches/newstr/src/org/python/core/PyNewString.java
===================================================================

--- branches/newstr/src/org/python/core/PyNewString.java	                        (rev 0)
+++ branches/newstr/src/org/python/core/PyNewString.java	2009-06-21 03:17:50 UTC (rev 6488)
@@ -0,0 +1,3104 @@
+/// Copyright (c) Corporation for National Research Initiatives
+package org.python.core;
+
+import java.math.BigInteger;
+
+import org.python.core.util.ExtraMath;
+import org.python.core.util.StringUtil;
+import org.python.expose.ExposedMethod;
+import org.python.expose.ExposedNew;
+import org.python.expose.ExposedType;
+import org.python.expose.MethodType;
+
+
+/**
+ * A builtin python string.
+ */
+@ExposedType(name = "newstr")
+public class PyNewString extends PyBaseString
+{
+    public static final PyType TYPE = PyType.fromClass(PyNewString.class);
+    protected String string;
+    protected transient boolean interned=false;
+
+    // for PyJavaClass.init()
+    public PyNewString() {
+        this(TYPE, "");
+    }
+
+    public PyNewString(PyType subType, String string) {
+        super(subType);
+        if (string == null) {
+            throw new IllegalArgumentException(
+                            "Cannot create PyString from null!");
+        }
+        this.string = string;
+    }
+
+    public PyNewString(String string) {
+        this(TYPE, string);
+    }
+
+    public PyNewString(char c) {
+        this(TYPE,String.valueOf(c));
+    }
+
+    PyNewString(StringBuilder buffer) {
+        this(TYPE, new String(buffer));
+    }
+    
+    /**
+     * Creates a PyString from an already interned String. Just means it won't
+     * be reinterned if used in a place that requires interned Strings.
+     */
+    public static PyNewString fromInterned(String interned) {
+        PyNewString str = new PyNewString(TYPE, interned);
+        str.interned = true;
+        return str;
+    }
+
+    @ExposedNew
+    final static PyObject str_new(PyNewWrapper new_, boolean init, PyType subtype,
+            PyObject[] args, String[] keywords) {
+        ArgParser ap = new ArgParser("str", args, keywords, new String[] { "object" }, 0);
+        PyObject S = ap.getPyObject(0, null);
+        if(new_.for_type == subtype) {
+            if(S == null) {
+                return new PyNewString("");
+            }
+            return new PyNewString(S.__str__().toString());
+        } else {
+            if (S == null) {
+                return new PyNewStringDerived(subtype, "");
+            }
+            return new PyNewStringDerived(subtype, S.__str__().toString());
+        }
+    }
+
+    public int[] toCodePoints() {
+        int n = string.length();
+        int[] codePoints = new int[n];
+        for (int i = 0; i < n; i++) {
+            codePoints[i] = string.charAt(i);
+        }
+        return codePoints;
+    }
+    
+    public String substring(int start, int end) {
+        return string.substring(start, end);
+    }
+    
+    public PyString __str__() {
+        return str___str__();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___str___doc) 
+    final PyString str___str__() {
+        return new PyString(string);
+    }
+
+    public PyUnicode __unicode__() {
+        return new PyUnicode(string);
+    }
+
+    public int __len__() {
+        return str___len__();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___len___doc)
+    final int str___len__() {
+        return string.length();
+    }
+
+    public String toString() {
+        return string;
+    }
+
+    public String internedString() {
+        if (interned)
+            return string;
+        else {
+            string = string.intern();
+            interned = true;
+            return string;
+        }
+    }
+
+    public PyString __repr__() {
+        return str___repr__();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___repr___doc)
+    final PyString str___repr__() {
+        return new PyString(encode_UnicodeEscape(string, true));
+    }
+
+    private static char[] hexdigit = "0123456789abcdef".toCharArray();
+
+    public static String encode_UnicodeEscape(String str,
+                                              boolean use_quotes)
+    {
+        int size = str.length();
+        StringBuilder v = new StringBuilder(str.length());
+
+        char quote = 0;
+
+        if (use_quotes) {
+            quote = str.indexOf('\'') >= 0 &&
+                             str.indexOf('"') == -1 ? '"' : '\'';
+            v.append(quote);
+        }
+
+        for (int i = 0; size-- > 0; ) {
+            int ch = str.charAt(i++);
+            /* Escape quotes */
+            if (use_quotes && (ch == quote || ch == '\\')) {
+                v.append('\\');
+                v.append((char) ch);
+                continue;
+            }
+                /* Map UTF-16 surrogate pairs to Unicode \UXXXXXXXX escapes */
+                else if (ch >= 0xD800 && ch < 0xDC00) {
+                    char ch2 = str.charAt(i++);
+                    size--;
+                    if (ch2 >= 0xDC00 && ch2 <= 0xDFFF) {
+                    int ucs = (((ch & 0x03FF) << 10) | (ch2 & 0x03FF)) + 0x00010000;
+                    v.append('\\');
+                    v.append('U');
+                    v.append(hexdigit[(ucs >> 28) & 0xf]);
+                    v.append(hexdigit[(ucs >> 24) & 0xf]);
+                    v.append(hexdigit[(ucs >> 20) & 0xf]);
+                    v.append(hexdigit[(ucs >> 16) & 0xf]);
+                    v.append(hexdigit[(ucs >> 12) & 0xf]);
+                    v.append(hexdigit[(ucs >> 8) & 0xf]);
+                    v.append(hexdigit[(ucs >> 4) & 0xf]);
+                    v.append(hexdigit[ucs & 0xf]);
+                    continue;
+                    }
+                    /* Fall through: isolated surrogates are copied as-is */
+                    i--;
+                    size++;
+                }
+            /* Map 16-bit characters to '\\uxxxx' */
+             if (ch >= 256) {
+                v.append('\\');
+                v.append('u');
+                v.append(hexdigit[(ch >> 12) & 0xf]);
+                v.append(hexdigit[(ch >> 8) & 0xf]);
+                v.append(hexdigit[(ch >> 4) & 0xf]);
+                v.append(hexdigit[ch & 15]);
+            }
+             /* Map special whitespace to '\t', \n', '\r' */
+            else if (ch == '\t') v.append("\\t");
+            else if (ch == '\n') v.append("\\n");
+            else if (ch == '\r') v.append("\\r");
+            /* Map non-printable US ASCII to '\ooo' */
+            else if (ch < ' ' || ch >= 127) {
+                v.append('\\');
+                v.append('x');
+                v.append(hexdigit[(ch >> 4) & 0xf]);
+                v.append(hexdigit[ch & 0xf]);
+            }
+            /* Copy everything else as-is */
+            else
+                v.append((char) ch);
+        }
+        if (use_quotes)
+            v.append(quote);
+        return v.toString();
+    }
+
+    private static ucnhashAPI pucnHash = null;
+
+    
+    public static String decode_UnicodeEscape(String str,
+                                              int start,
+                                              int end,
+                                              String errors,
+                                              boolean unicode) {
+        StringBuilder v = new StringBuilder(end - start);
+        for(int s = start; s < end;) {
+            char ch = str.charAt(s);
+            /* Non-escape characters are interpreted as Unicode ordinals */
+            if(ch != '\\') {
+                v.append(ch);
+                s++;
+                continue;
+            }
+            int loopStart = s;
+            /* \ - Escapes */
+            s++;
+            if(s == end) {
+                s = codecs.insertReplacementAndGetResume(v,
+                                                         errors,
+                                                         "unicodeescape",
+                                                         str,
+                                                         loopStart,
+                                                         s + 1,
+                                                         "\\ at end of string");
+                continue;
+            }
+            ch = str.charAt(s++);
+            switch(ch){
+                /* \x escapes */
+                case '\n':
+                    break;
+                case '\\':
+                    v.append('\\');
+                    break;
+                case '\'':
+                    v.append('\'');
+                    break;
+                case '\"':
+                    v.append('\"');
+                    break;
+                case 'b':
+                    v.append('\b');
+                    break;
+                case 'f':
+                    v.append('\014');
+                    break; /* FF */
+                case 't':
+                    v.append('\t');
+                    break;
+                case 'n':
+                    v.append('\n');
+                    break;
+                case 'r':
+                    v.append('\r');
+                    break;
+                case 'v':
+                    v.append('\013');
+                    break; /* VT */
+                case 'a':
+                    v.append('\007');
+                    break; /* BEL, not classic C */
+                /* \OOO (octal) escapes */
+                case '0':
+                case '1':
+                case '2':
+                case '3':
+                case '4':
+                case '5':
+                case '6':
+                case '7':
+                    int x = Character.digit(ch, 8);
+                    for(int j = 0; j < 2 && s < end; j++, s++) {
+                        ch = str.charAt(s);
+                        if(ch < '0' || ch > '7')
+                            break;
+                        x = (x << 3) + Character.digit(ch, 8);
+                    }
+                    v.append((char)x);
+                    break;
+                case 'x':
+                    s = hexescape(v, errors, 2, s, str, end, "truncated \\xXX");
+                    break;
+                case 'u':
+                    if(!unicode) {
+                        v.append('\\');
+                        v.append('u');
+                        break;
+                    }
+                    s = hexescape(v,
+                                  errors,
+                                  4,
+                                  s,
+                                  str,
+                                  end,
+                                  "truncated \\uXXXX");
+                    break;
+                case 'U':
+                    if(!unicode) {
+                        v.append('\\');
+                        v.append('U');
+                        break;
+                    }
+                    s = hexescape(v,
+                                  errors,
+                                  8,
+                                  s,
+                                  str,
+                                  end,
+                                  "truncated \\UXXXXXXXX");
+                    break;
+                case 'N':
+                    if(!unicode) {
+                        v.append('\\');
+                        v.append('N');
+                        break;
+                    }
+                    /*
+                     * Ok, we need to deal with Unicode Character Names now,
+                     * make sure we've imported the hash table data...
+                     */
+                    if(pucnHash == null) {
+                        PyObject mod = imp.importName("ucnhash", true);
+                        mod = mod.__call__();
+                        pucnHash = (ucnhashAPI)mod.__tojava__(Object.class);
+                        if(pucnHash.getCchMax() < 0)
+                            throw Py.UnicodeError("Unicode names not loaded");
+                    }
+                    if(str.charAt(s) == '{') {
+                        int startName = s + 1;
+                        int endBrace = startName;
+                        /*
+                         * look for either the closing brace, or we exceed the
+                         * maximum length of the unicode character names
+                         */
+                        int maxLen = pucnHash.getCchMax();
+                        while(endBrace < end && str.charAt(endBrace) != '}'
+                                && (endBrace - startName) <= maxLen) {
+                            endBrace++;
+                        }
+                        if(endBrace != end && str.charAt(endBrace) == '}') {
+                            int value = pucnHash.getValue(str,
+                                                          startName,
+                                                          endBrace);
+                            if(storeUnicodeCharacter(value, v)) {
+                                s = endBrace + 1;
+                            } else {
+                                s = codecs.insertReplacementAndGetResume(v,
+                                                                         errors,
+                                                                         "unicodeescape",
+                                                                         str,
+                                                                         loopStart,
+                                                                         endBrace + 1,
+                                                                         "illegal Unicode character");
+                            }
+                        } else {
+                            s = codecs.insertReplacementAndGetResume(v,
+                                                                     errors,
+                                                                     "unicodeescape",
+                                                                     str,
+                                                                     loopStart,
+                                                                     endBrace,
+                                                                     "malformed \\N character escape");
+                        }
+                        break;
+                    } else {
+                        s = codecs.insertReplacementAndGetResume(v,
+                                                                 errors,
+                                                                 "unicodeescape",
+                                                                 str,
+                                                                 loopStart,
+                                                                 s + 1,
+                                                                 "malformed \\N character escape");
+                    }
+                    break;
+                default:
+                    v.append('\\');
+                    v.append(str.charAt(s - 1));
+                    break;
+            }
+        }
+        return v.toString();
+    }
+
+    private static int hexescape(StringBuilder partialDecode,
+                                 String errors,
+                                 int digits,
+                                 int hexDigitStart,
+                                 String str,
+                                 int size,
+                                 String errorMessage) {
+        if(hexDigitStart + digits > size) {
+            return codecs.insertReplacementAndGetResume(partialDecode,
+                                                        errors,
+                                                        "unicodeescape",
+                                                        str,
+                                                        hexDigitStart - 2,
+                                                        size,
+                                                        errorMessage);
+        }
+        int i = 0;
+        int x = 0;
+        for(; i < digits; ++i) {
+            char c = str.charAt(hexDigitStart + i);
+            int d = Character.digit(c, 16);
+            if(d == -1) {
+                return codecs.insertReplacementAndGetResume(partialDecode,
+                                                            errors,
+                                                            "unicodeescape",
+                                                            str,
+                                                            hexDigitStart - 2,
+                                                            hexDigitStart + i + 1,
+                                                            errorMessage);
+            }
+            x = (x << 4) & ~0xF;
+            if(c >= '0' && c <= '9')
+                x += c - '0';
+            else if(c >= 'a' && c <= 'f')
+                x += 10 + c - 'a';
+            else
+                x += 10 + c - 'A';
+        }
+        if(storeUnicodeCharacter(x, partialDecode)) {
+            return hexDigitStart + i;
+        } else {
+            return codecs.insertReplacementAndGetResume(partialDecode,
+                                                        errors,
+                                                        "unicodeescape",
+                                                        str,
+                                                        hexDigitStart - 2,
+                                                        hexDigitStart + i + 1,
+                                                        "illegal Unicode character");
+        }
+    }
+
+    /*pass in an int since this can be a UCS-4 character */
+    private static boolean storeUnicodeCharacter(int value,
+            StringBuilder partialDecode) {
+        if (value < 0 || (value >= 0xD800 && value <= 0xDFFF)) {
+            return false;
+        } else if (value <= PySystemState.maxunicode) {
+            partialDecode.appendCodePoint(value);
+            return true;
+        }
+        return false;
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___getitem___doc)
+    final PyObject str___getitem__(PyObject index) {
+        PyObject ret = seq___finditem__(index);
+        if (ret == null) {
+            throw Py.IndexError("string index out of range");
+        }
+        return ret;
+    }
+    
+    //XXX: need doc
+    @ExposedMethod(defaults = "null")
+    final PyObject str___getslice__(PyObject start, PyObject stop, PyObject step) {
+        return seq___getslice__(start, stop, step);
+    }
+
+    public int __cmp__(PyObject other) {
+        return str___cmp__(other);
+    }
+
+    @ExposedMethod(type = MethodType.CMP)
+    final int str___cmp__(PyObject other) {
+        if (!(other instanceof PyNewString))
+            return -2;
+
+        int c = string.compareTo(((PyNewString)other).string);
+        return c < 0 ? -1 : c > 0 ? 1 : 0;
+    }
+
+    public PyObject __eq__(PyObject other) {
+        return str___eq__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___eq___doc)
+    final PyObject str___eq__(PyObject other) {
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.equals(s) ? Py.True : Py.False;
+    }
+
+    public PyObject __ne__(PyObject other) {
+        return str___ne__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___ne___doc)
+    final PyObject str___ne__(PyObject other) {
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.equals(s) ? Py.False : Py.True;
+    }
+    
+    public PyObject __lt__(PyObject other) {
+        return str___lt__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___lt___doc)
+    final PyObject str___lt__(PyObject other){
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.compareTo(s) < 0 ? Py.True : Py.False;
+    }
+
+    public PyObject __le__(PyObject other) {
+        return str___le__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___le___doc)
+    final PyObject str___le__(PyObject other){
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.compareTo(s) <= 0 ? Py.True : Py.False;
+    }
+
+    public PyObject __gt__(PyObject other) {
+        return str___gt__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___gt___doc)
+    final PyObject str___gt__(PyObject other){
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.compareTo(s) > 0 ? Py.True : Py.False;
+    }
+
+    public PyObject __ge__(PyObject other) {
+        return str___ge__(other);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___ge___doc)
+    final PyObject str___ge__(PyObject other){
+        String s = coerce(other);
+        if (s == null)
+            return null;
+        return string.compareTo(s) >= 0 ? Py.True : Py.False;
+    }
+
+    private static String coerce(PyObject o) {
+        if (o instanceof PyNewString)
+            return o.toString();
+        return null;
+    }
+
+    public int hashCode() {
+        return str___hash__();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___hash___doc)
+    final int str___hash__() {
+        return string.hashCode();
+    }
+
+    /**
+     * @return a byte array with one byte for each char in this object's
+     *         underlying String. Each byte contains the low-order bits of its
+     *         corresponding char.
+     */
+    public byte[] toBytes() {
+        return StringUtil.toBytes(string);
+    }
+
+    public Object __tojava__(Class<?> c) {
+        if (c.isAssignableFrom(String.class)) {
+            return string;
+        }
+
+        if (c == Character.TYPE || c == Character.class)
+            if (string.length() == 1)
+                return new Character(string.charAt(0));
+
+        if (c.isArray()) {
+            if (c.getComponentType() == Byte.TYPE)
+                return toBytes();
+            if (c.getComponentType() == Character.TYPE)
+                return string.toCharArray();
+        }
+
+        if (c.isInstance(this))
+            return this;
+
+        return Py.NoConversion;
+    }
+
+    protected PyObject pyget(int i) {
+        return Py.newString(string.charAt(i));
+    }
+
+    protected PyObject getslice(int start, int stop, int step) {
+        if (step > 0 && stop < start)
+            stop = start;
+        if (step == 1)
+            return fromSubstring(start, stop);
+        else {
+            int n = sliceLength(start, stop, step);
+            char new_chars[] = new char[n];
+            int j = 0;
+            for (int i=start; j<n; i+=step)
+                new_chars[j++] = string.charAt(i);
+
+            return createInstance(new String(new_chars), true);
+        }
+    }
+
+    public PyNewString createInstance(String str) {
+        return new PyNewString(str);
+    }
+
+    protected PyNewString createInstance(String str, boolean isBasic) {
+        // ignore isBasic, doesn't apply to PyString, just PyNewUnicode
+        return new PyNewString(str);
+    } 
+    
+    public boolean __contains__(PyObject o) {
+        return str___contains__(o);
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___contains___doc)
+    final boolean str___contains__(PyObject o) {
+        if (!(o instanceof PyNewString))
+            throw Py.TypeError("'in <string>' requires string as left operand");
+        PyNewString other = (PyNewString) o;
+        return string.indexOf(other.string) >= 0;
+    }
+
+    protected PyObject repeat(int count) {
+        if(count < 0) {
+            count = 0;
+        }
+        int s = string.length();
+        if((long)s * count > Integer.MAX_VALUE) {
+            // Since Strings store their data in an array, we can't make one
+            // longer than Integer.MAX_VALUE. Without this check we get
+            // NegativeArraySize exceptions when we create the array on the
+            // line with a wrapped int.
+            throw Py.OverflowError("max str len is " + Integer.MAX_VALUE);
+        }
+        char new_chars[] = new char[s * count];
+        for(int i = 0; i < count; i++) {
+            string.getChars(0, s, new_chars, i * s);
+        }
+        return createInstance(new String(new_chars));
+    }
+
+    @Override
+    public PyObject __mul__(PyObject o) {
+        return str___mul__(o);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___mul___doc)
+    final PyObject str___mul__(PyObject o) {
+        if (!o.isIndex()) {
+            return null;
+        }
+        return repeat(o.asIndex(Py.OverflowError));
+    }
+    
+    @Override
+    public PyObject __rmul__(PyObject o) {
+        return str___rmul__(o);
+    }
+
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___rmul___doc)
+    final PyObject str___rmul__(PyObject o) {
+        if (!o.isIndex()) {
+            return null;
+        }
+        return repeat(o.asIndex(Py.OverflowError));
+    }
+
+    public PyObject __add__(PyObject other) {
+        return str___add__(other);
+    }
+    
+    @ExposedMethod(type = MethodType.BINARY, doc = BuiltinDocs.str___add___doc)
+    final PyObject str___add__(PyObject other) {
+        if (other instanceof PyNewUnicode) {
+            return decode().__add__(other);
+        }
+        if (other instanceof PyNewString) {
+            PyNewString otherStr = (PyNewString)other;
+            return new PyNewString(string.concat(otherStr.string));
+        }
+        return null;
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str___getnewargs___doc)
+    final PyTuple str___getnewargs__() {
+        return new PyTuple(new PyNewString(this.string));
+    }
+
+    public PyTuple __getnewargs__() {
+        return str___getnewargs__();
+    }
+
+    public PyObject __mod__(PyObject other) {
+        return str___mod__(other);
+    }
+    
+    @ExposedMethod(doc = BuiltinDocs.str___mod___doc)
+    public PyObject str___mod__(PyObject other){
+        StringFormatter fmt = new StringFormatter(string, false);
+        return fmt.format(other);
+    }
+
+    public PyObject __int__() {
+        try
+        {
+            return Py.newInteger(atoi(10));
+        } catch (PyException e) {
+            if (e.match(Py.OverflowError)) {
+                return atol(10);
+            }
+            throw e;
+        }
+    }
+
+    public PyObject __long__() {
+        return atol(10);
+    }
+
+    public PyFloat __float__() {
+        return new PyFloat(atof());
+    }
+
+    public PyObject __pos__() {
+      throw Py.TypeError("bad operand type for unary +");
+    }
+
+    public PyObject __neg__() {
+      throw Py.TypeError("bad operand type for unary -");
+    }
+
+    public PyObject __invert__() {
+      throw Py.TypeError("bad operand type for unary ~");
+    }
+
+    @SuppressWarnings("fallthrough")
+    public PyComplex __complex__() {
+        boolean got_re = false;
+        boolean got_im = false;
+        boolean done = false;
+        boolean sw_error = false;
+
+        int s = 0;
+        int n = string.length();
+        while (s < n && Character.isSpaceChar(string.charAt(s)))
+            s++;
+
+        if (s == n) {
+            throw Py.ValueError("empty string for complex()");
+        }
+
+        double z = -1.0;
+        double x = 0.0;
+        double y = 0.0;
+
+        int sign = 1;
+        do {
+            char c = string.charAt(s);
+            switch (c) {
+            case '-':
+                sign = -1;
+                /* Fallthrough */
+            case '+':
+                if (done || s+1 == n) {
+                    sw_error = true;
+                    break;
+                }
+                //  a character is guaranteed, but it better be a digit
+                //  or J or j
+                c = string.charAt(++s);  //  eat the sign character
+                                         //  and check the next
+                if  (!Character.isDigit(c) && c!='J' && c!='j')
+                    sw_error = true;
+                break;
+
+            case 'J':
+            case 'j':
+                if (got_im || done) {
+                    sw_error = true;
+                    break;
+                }
+                if  (z < 0.0) {
+                    y = sign;
+                } else {
+                    y = sign * z;
+                }
+                got_im = true;
+                done = got_re;
+                sign = 1;
+                s++; // eat the J or j
+                break;
+
+            case ' ':
+                while (s < n && Character.isSpaceChar(string.charAt(s)))
+                    s++;
+                if (s != n)
+                    sw_error = true;
+                break;
+
+            default:
+                boolean digit_or_dot = (c == '.' || Character.isDigit(c));
+                if (!digit_or_dot) {
+                    sw_error = true;
+                    break;
+                }
+                int end = endDouble(string, s);
+                z = Double.valueOf(string.substring(s, end)).doubleValue();
+                if (z == Double.POSITIVE_INFINITY) {
+                	throw Py.ValueError(String.format("float() out of range: %.150s", string));
+                }
+
+                s=end;
+                if (s < n) {
+                    c = string.charAt(s);
+                    if  (c == 'J' || c == 'j') {
+                        break;
+                    }
+                }
+                if  (got_re) {
+                   sw_error = true;
+                   break;
+                }
+
+                /* accept a real part */
+                x = sign * z;
+                got_re = true;
+                done = got_im;
+                z = -1.0;
+                sign = 1;
+                break;
+
+             }  /* end of switch  */
+
+        } while (s < n && !sw_error);
+
+        if (sw_error) {
+            throw Py.ValueError("malformed string for complex() " +
+                                string.substring(s));
+        }
+
+        return new PyComplex(x,y);
+    }
+
+    private int endDouble(String string, int s) {
+        int n = string.length();
+        while (s < n) {
+            char c = string.charAt(s++);
+            if (Character.isDigit(c))
+                continue;
+            if (c == '.')
+                continue;
+            if (c == 'e' || c == 'E') {
+                if (s < n) {
+                    c = string.charAt(s);
+                    if (c == '+' || c == '-')
+                        s++;
+                    continue;
+                }
+            }
+            return s-1;
+        }
+        return s;
+    }
+
+    // Add in methods from string module
+    public String lower() {
+        return str_lower();
+    }
+    
+    @ExposedMethod(doc = BuiltinDocs.str_lower_doc)
+    final String str_lower() {
+        return string.toLowerCase();
+    }
+
+    public String upper() {
+        return str_upper();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_upper_doc)
+    final String str_upper() {
+        return string.toUpperCase();
+    }
+
+    public String title() {
+        return str_title();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_title_doc)
+    final String str_title() {
+        char[] chars = string.toCharArray();
+        int n = chars.length;
+
+        boolean previous_is_cased = false;
+        for (int i = 0; i < n; i++) {
+            char ch = chars[i];
+            if (previous_is_cased)
+                chars[i] = Character.toLowerCase(ch);
+            else
+                chars[i] = Character.toTitleCase(ch);
+
+            if (Character.isLowerCase(ch) ||
+                   Character.isUpperCase(ch) ||
+                   Character.isTitleCase(ch))
+                previous_is_cased = true;
+            else
+                previous_is_cased = false;
+        }
+        return new String(chars);
+    }
+
+    public String swapcase() {
+        return str_swapcase();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_swapcase_doc)
+    final String str_swapcase() {
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+        for (int i=0; i<n; i++) {
+            char c = chars[i];
+            if (Character.isUpperCase(c)) {
+                chars[i] = Character.toLowerCase(c);
+            }
+            else if (Character.isLowerCase(c)) {
+                chars[i] = Character.toUpperCase(c);
+            }
+        }
+        return new String(chars);
+    }
+
+    public String strip() {
+        return str_strip(null);
+    }
+
+    public String strip(String sep) {
+        return str_strip(sep);
+    }
+
+    @ExposedMethod(defaults = "null", doc = BuiltinDocs.str_strip_doc)
+    final String str_strip(String sep) {
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+        int start=0;
+        if (sep == null)
+            while (start < n && Character.isWhitespace(chars[start]))
+                start++;
+        else
+            while (start < n && sep.indexOf(chars[start]) >= 0)
+                start++;
+
+        int end=n-1;
+        if (sep == null)
+            while (end >= 0 && Character.isWhitespace(chars[end]))
+                end--;
+        else
+            while (end >= 0 && sep.indexOf(chars[end]) >= 0)
+                end--;
+
+        if (end >= start) {
+            return (end < n-1 || start > 0)
+                ? string.substring(start, end+1) : string;
+        } else {
+            return "";
+        }
+    }
+
+    public String lstrip() {
+        return str_lstrip(null);
+    }
+    
+    public String lstrip(String sep) {
+        return str_lstrip(sep);
+    }
+
+    @ExposedMethod(defaults = "null", doc = BuiltinDocs.str_lstrip_doc)
+    final String str_lstrip(String sep) {
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+        int start=0;
+        if (sep == null)
+            while (start < n && Character.isWhitespace(chars[start]))
+                start++;
+        else
+            while (start < n && sep.indexOf(chars[start]) >= 0)
+                start++;
+
+        return (start > 0) ? string.substring(start, n) : string;
+    }
+
+    public String rstrip(String sep) {
+        return str_rstrip(sep);
+    }
+    
+    @ExposedMethod(defaults = "null", doc = BuiltinDocs.str_rstrip_doc)
+    final String str_rstrip(String sep) {
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+        int end=n-1;
+        if (sep == null)
+            while (end >= 0 && Character.isWhitespace(chars[end]))
+                end--;
+        else
+            while (end >= 0 && sep.indexOf(chars[end]) >= 0)
+                end--;
+
+        return (end < n-1) ? string.substring(0, end+1) : string;
+    }
+
+
+    public PyList split() {
+        return str_split(null, -1);
+    }
+
+    public PyList split(String sep) {
+        return str_split(sep, -1);
+    }
+
+    public PyList split(String sep, int maxsplit) {
+        return str_split(sep, maxsplit);
+    }
+
+    @ExposedMethod(defaults = {"null", "-1"}, doc = BuiltinDocs.str_split_doc)
+    final PyList str_split(String sep, int maxsplit) {
+        if (sep != null) {
+            if (sep.length() == 0) {
+                throw Py.ValueError("empty separator");
+            }
+            return splitfields(sep, maxsplit);
+        }
+
+        PyList list = new PyList();
+
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+
+        if (maxsplit < 0)
+            maxsplit = n;
+
+        int splits=0;
+        int index=0;
+        while (index < n && splits < maxsplit) {
+            while (index < n && Character.isWhitespace(chars[index]))
+                index++;
+            if (index == n)
+                break;
+            int start = index;
+
+            while (index < n && !Character.isWhitespace(chars[index]))
+                index++;
+            list.append(fromSubstring(start, index));
+            splits++;
+        }
+        while (index < n && Character.isWhitespace(chars[index]))
+            index++;
+        if (index < n) {
+            list.append(fromSubstring(index, n));
+        }
+        return list;
+    }
+
+    public PyList rsplit() {
+        return str_rsplit(null, -1);
+    }
+
+    public PyList rsplit(String sep) {
+        return str_rsplit(sep, -1);
+    }
+
+    public PyList rsplit(String sep, int maxsplit) {
+        return str_rsplit(sep, maxsplit);
+    }
+
+    @ExposedMethod(defaults = {"null", "-1"}, doc = BuiltinDocs.str_rsplit_doc)
+    final PyList str_rsplit(String sep, int maxsplit) {
+        if (sep != null) {
+            if (sep.length() == 0) {
+                throw Py.ValueError("empty separator");
+            }
+            PyList list = rsplitfields(sep, maxsplit);
+            list.reverse();
+            return list;
+        }
+
+        PyList list = new PyList();
+        char[] chars = string.toCharArray();
+
+        if (maxsplit < 0) {
+            maxsplit = chars.length;
+        }
+
+        int splits = 0;
+        int i = chars.length - 1;
+
+        while (i > -1 && Character.isWhitespace(chars[i])) {
+            i--;
+        }
+        if (i == -1) {
+            return list;
+        }
+
+        while (splits < maxsplit) {
+            while (i > -1 && Character.isWhitespace(chars[i])) {
+                i--;
+            }
+            if (i == -1) {
+                break;
+            }
+
+            int nextWsChar = i;
+            while (nextWsChar > -1 && !Character.isWhitespace(chars[nextWsChar])) {
+                nextWsChar--;
+            }
+            if (nextWsChar == -1) {
+                break;
+            }
+
+            splits++;
+            list.add(fromSubstring(nextWsChar + 1, i + 1));
+            i = nextWsChar;
+        }
+        while (i > -1 && Character.isWhitespace(chars[i])) {
+            i--;
+        }
+        if (i > -1) {
+            list.add(fromSubstring(0,i+1));
+        }
+        list.reverse();
+        return list;
+    }
+
+    public PyTuple partition(PyObject sepObj) {
+        return str_partition(sepObj);
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_partition_doc)
+    final PyTuple str_partition(PyObject sepObj) {
+        String sep;
+
+        if (sepObj instanceof PyNewUnicode) {
+            return unicodePartition(sepObj);
+        } else if (sepObj instanceof PyNewString) {
+            sep = ((PyNewString)sepObj).string;
+        } else {
+            throw Py.TypeError("expected a character buffer object");
+        }
+
+        if (sep.length() == 0) {
+            throw Py.ValueError("empty separator");
+        }
+
+        int index = string.indexOf(sep);
+        if (index != -1) {
+            return new PyTuple(fromSubstring(0, index), sepObj,
+                               fromSubstring(index + sep.length(), string.length()));
+        } else {
+            return new PyTuple(this, Py.EmptyString, Py.EmptyString);
+        }
+    }
+
+    final PyTuple unicodePartition(PyObject sepObj) {
+        PyUnicode strObj = __unicode__();
+        String str = strObj.string;
+
+        // Will throw a TypeError if not a basestring
+        String sep = sepObj.asString();
+        sepObj = sepObj.__unicode__();
+
+        if (sep.length() == 0) {
+            throw Py.ValueError("empty separator");
+        }
+
+        int index = str.indexOf(sep);
+        if (index != -1) {
+            return new PyTuple(strObj.fromSubstring(0, index), sepObj,
+                               strObj.fromSubstring(index + sep.length(), str.length()));
+        } else {
+            PyUnicode emptyUnicode = Py.newUnicode("");
+            return new PyTuple(this, emptyUnicode, emptyUnicode);
+        }
+    }
+
+    public PyTuple rpartition(PyObject sepObj) {
+        return str_rpartition(sepObj);
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_rpartition_doc)
+    final PyTuple str_rpartition(PyObject sepObj) {
+        String sep;
+
+        if (sepObj instanceof PyNewUnicode) {
+            return unicodePartition(sepObj);
+        } else if (sepObj instanceof PyNewString) {
+            sep = ((PyNewString)sepObj).string;
+        } else {
+            throw Py.TypeError("expected a character buffer object");
+        }
+
+        if (sep.length() == 0) {
+            throw Py.ValueError("empty separator");
+        }
+
+        int index = string.lastIndexOf(sep);
+        if (index != -1) {
+            return new PyTuple(fromSubstring(0, index), sepObj,
+                               fromSubstring(index + sep.length(), string.length()));
+        } else {
+            return new PyTuple(Py.EmptyString, Py.EmptyString, this);
+        }
+    }
+
+    final PyTuple unicodeRpartition(PyObject sepObj) {
+        PyUnicode strObj = __unicode__();
+        String str = strObj.string;
+
+        // Will throw a TypeError if not a basestring
+        String sep = sepObj.asString();
+        sepObj = sepObj.__unicode__();
+
+        if (sep.length() == 0) {
+            throw Py.ValueError("empty separator");
+        }
+
+        int index = str.lastIndexOf(sep);
+        if (index != -1) {
+            return new PyTuple(strObj.fromSubstring(0, index), sepObj,
+                               strObj.fromSubstring(index + sep.length(), str.length()));
+        } else {
+            PyUnicode emptyUnicode = Py.newUnicode("");
+            return new PyTuple(emptyUnicode, emptyUnicode, this);
+        }
+    }
+
+    private PyList splitfields(String sep, int maxsplit) {
+        PyList list = new PyList();
+
+        int length = string.length();
+        if (maxsplit < 0)
+            maxsplit = length + 1;
+
+        int lastbreak = 0;
+        int splits = 0;
+        int sepLength = sep.length();
+        int index;
+        if((sep.length() == 0) && (maxsplit != 0)) {
+            index = string.indexOf(sep, lastbreak);
+            list.append(fromSubstring(lastbreak, index));
+            splits++;
+        }
+        while (splits < maxsplit) {
+            index = string.indexOf(sep, lastbreak);
+            if (index == -1)
+                break;
+            if(sep.length() == 0)
+                index++;
+            splits += 1;
+            list.append(fromSubstring(lastbreak, index));
+            lastbreak = index + sepLength;
+        }
+        if (lastbreak <= length) {
+            list.append(fromSubstring(lastbreak, length));
+        }
+        return list;
+    }
+
+    private PyList rsplitfields(String sep, int maxsplit) {
+        PyList list = new PyList();
+
+        int length = string.length();
+        if (maxsplit < 0) {
+            maxsplit = length + 1;
+        }
+
+        int lastbreak = length;
+        int splits = 0;
+        int index = length;
+        int sepLength = sep.length();
+
+        while (index > 0 && splits < maxsplit) {
+            int i = string.lastIndexOf(sep, index - sepLength);
+            if (i == index) {
+                i -= sepLength;
+            }
+            if (i < 0) {
+                break;
+            }
+            splits++;
+            list.append(fromSubstring(i + sepLength, lastbreak));
+            lastbreak = i;
+            index = i;
+
+        }
+        list.append(fromSubstring(0, lastbreak));
+        return list;
+    }
+
+    public PyList splitlines() {
+        return str_splitlines(false);
+    }
+
+    public PyList splitlines(boolean keepends) {
+        return str_splitlines(keepends);
+    }
+
+    @ExposedMethod(defaults = "false", doc = BuiltinDocs.str_splitlines_doc)
+    final PyList str_splitlines(boolean keepends) {
+        PyList list = new PyList();
+
+        char[] chars = string.toCharArray();
+        int n=chars.length;
+
+        int j = 0;
+        for (int i = 0; i < n; ) {
+            /* Find a line and append it */
+            while (i < n && chars[i] != '\n' && chars[i] != '\r' &&
+                    Character.getType(chars[i]) != Character.LINE_SEPARATOR)
+                i++;
+
+            /* Skip the line break reading CRLF as one line break */
+            int eol = i;
+            if (i < n) {
+                if (chars[i] == '\r' && i + 1 < n && chars[i+1] == '\n')
+                    i += 2;
+                else
+                    i++;
+                if (keepends)
+                    eol = i;
+            }
+            list.append(fromSubstring(j, eol));
+            j = i;
+        }
+        if (j < n) {
+            list.append(fromSubstring(j, n));
+        }
+        return list;
+    }
+
+    protected PyNewString fromSubstring(int begin, int end) {
+        return createInstance(string.substring(begin, end), true);
+    }
+
+    public int index(String sub) {
+        return str_index(sub, 0, null);
+    }
+
+    public int index(String sub, int start) {
+        return str_index(sub, start, null);
+    }
+
+    public int index(String sub, int start, int end) {
+        return str_index(sub, start, Py.newInteger(end));
+    }
+
+    @ExposedMethod(defaults = {"0", "null"}, doc = BuiltinDocs.str_index_doc)
+    final int str_index(String sub, int start, PyObject end) {
+        int index = str_find(sub, start, end);
+        if (index == -1)
+            throw Py.ValueError("substring not found in string.index");
+        return index;
+    }
+
+    public int rindex(String sub) {
+        return str_rindex(sub, 0, null);
+    }
+
+    public int rindex(String sub, int start) {
+        return str_rindex(sub, start, null);
+    }
+
+    public int rindex(String sub, int start, int end) {
+        return str_rindex(sub, start, Py.newInteger(end));
+    }
+
+    @ExposedMethod(defaults = {"0", "null"}, doc = BuiltinDocs.str_rindex_doc)
+    final int str_rindex(String sub, int start, PyObject end) {
+        int index = str_rfind(sub, start, end);
+        if(index == -1)
+            throw Py.ValueError("substring not found in string.rindex");
+        return index;
+    }
+
+    public int count(String sub) {
+        return str_count(sub, 0, null);
+    }
+
+    public int count(String sub, int start) {
+        return str_count(sub, start, null);
+    }
+
+    public int count(String sub, int start, int end) {
+        return str_count(sub, start, Py.newInteger(end));
+    }
+    
+    @ExposedMethod(defaults = {"0", "null"}, doc = BuiltinDocs.str_count_doc)
+    final int str_count(String sub, int start, PyObject end) {
+        int[] indices = translateIndices(start, end);
+        int n = sub.length();
+        if(n == 0) {
+            if (start > string.length()) {
+                return 0;
+            }
+            return indices[1] - indices[0] + 1;
+        }
+        int count = 0;
+        while(true){
+            int index = string.indexOf(sub, indices[0]);
+            indices[0] = index + n;
+            if(indices[0] > indices[1] || index == -1) {
+                break;
+            }
+            count++;
+        }
+        return count;
+    }
+
+    public int find(String sub) {
+        return str_find(sub, 0, null);
+    }
+
+    public int find(String sub, int start) {
+        return str_find(sub, start, null);
+    }
+
+    public int find(String sub, int start, int end) {
+        return str_find(sub, start, Py.newInteger(end));
+    }
+
+    @ExposedMethod(defaults = {"0", "null"}, doc = BuiltinDocs.str_find_doc)
+    final int str_find(String sub, int start, PyObject end) {
+        int[] indices = translateIndices(start, end);
+        int index = string.indexOf(sub, indices[0]);
+        if (index < start || index > indices[1]) {
+            return -1;
+        }
+        return index;
+    }
+
+    public int rfind(String sub) {
+        return str_rfind(sub, 0, null);
+    }
+
+    public int rfind(String sub, int start) {
+        return str_rfind(sub, start, null);
+    }
+
+    public int rfind(String sub, int start, int end) {
+        return str_rfind(sub, start, Py.newInteger(end));
+    }
+
+    @ExposedMethod(defaults = {"0", "null"}, doc = BuiltinDocs.str_rfind_doc)
+    final int str_rfind(String sub, int start, PyObject end) {
+        int[] indices = translateIndices(start, end);
+        int index = string.lastIndexOf(sub, indices[1] - sub.length());
+        if (index < start) {
+            return -1;
+        }
+        return index;
+    }
+
+    public double atof() {
+        StringBuilder s = null;
+        int n = string.length();
+        for (int i = 0; i < n; i++) {
+            char ch = string.charAt(i);
+            if (ch == '\u0000') {
+                throw Py.ValueError("null byte in argument for float()");
+            }
+            if (Character.isDigit(ch)) {
+                if (s == null)
+                    s = new StringBuilder(string);
+                int val = Character.digit(ch, 10);
+                s.setCharAt(i, Character.forDigit(val, 10));
+            }
+        }
+        String sval = string;
+        if (s != null)
+            sval = s.toString();
+        try {
+            // Double.valueOf allows format specifier ("d" or "f") at the end
+            String lowSval = sval.toLowerCase();
+            if (lowSval.equals("nan")) return Double.NaN;
+            else if (lowSval.equals("inf")) return Double.POSITIVE_INFINITY;
+            else if (lowSval.equals("-inf")) return Double.NEGATIVE_INFINITY;
+            
+            if (lowSval.endsWith("d") || lowSval.endsWith("f")) {
+                throw new NumberFormatException("format specifiers not allowed");
+            }
+            return Double.valueOf(sval).doubleValue();
+        }
+        catch (NumberFormatException exc) {
+            throw Py.ValueError("invalid literal for __float__: "+string);
+        }
+    }
+
+    public int atoi() {
+        return atoi(10);
+    }
+
+    public int atoi(int base) {
+        if ((base != 0 && base < 2) || (base > 36)) {
+            throw Py.ValueError("invalid base for atoi()");
+        }
+
+        int b = 0;
+        int e = string.length();
+
+        while (b < e && Character.isWhitespace(string.charAt(b)))
+            b++;
+
+        while (e > b && Character.isWhitespace(string.charAt(e-1)))
+            e--;
+
+        char sign = 0;
+        if (b < e) {
+            sign = string.charAt(b);
+            if (sign == '-' || sign == '+') {
+                b++;
+                while (b < e && Character.isWhitespace(string.charAt(b))) b++;
+            }
+
+            if (base == 0 || base == 16) {
+                if (string.charAt(b) == '0') {
+                    if (b < e-1 &&
+                           Character.toUpperCase(string.charAt(b+1)) == 'X') {
+                        base = 16;
+                        b += 2;
+                    } else {
+                        if (base == 0)
+                            base = 8;
+                    }
+                }
+            }
+        }
+
+        if (base == 0)
+            base = 10;
+
+        String s = string;
+        if (b > 0 || e < string.length())
+            s = string.substring(b, e);
+
+        try {
+            BigInteger bi;
+            if (sign == '-') {
+                bi = new BigInteger("-" + s, base);
+            } else
+                bi = new BigInteger(s, base);
+            if (bi.compareTo(PyInteger.maxInt) > 0 || bi.compareTo(PyInteger.minInt) < 0) {
+                throw Py.OverflowError("long int too large to convert to int");
+            }
+            return bi.intValue();
+        } catch (NumberFormatException exc) {
+            throw Py.ValueError("invalid literal for int() with base " + base + ": " + string);
+        } catch (StringIndexOutOfBoundsException exc) {
+            throw Py.ValueError("invalid literal for int() with base " + base + ": " + string);
+        }
+    }
+
+    public PyLong atol() {
+        return atol(10);
+    }
+
+    public PyLong atol(int base) {
+        String str = string;
+        int b = 0;
+        int e = str.length();
+
+        while (b < e && Character.isWhitespace(str.charAt(b)))
+            b++;
+
+        while (e > b && Character.isWhitespace(str.charAt(e-1)))
+            e--;
+
+
+        char sign = 0;
+        if (b < e) {
+            sign = string.charAt(b);
+            if (sign == '-' || sign == '+') {
+                b++;
+                while (b < e && Character.isWhitespace(str.charAt(b))) b++;
+            }
+
+
+            if (base == 0 || base == 16) {
+                if (string.charAt(b) == '0') {
+                    if (b < e-1 &&
+                           Character.toUpperCase(string.charAt(b+1)) == 'X') {
+                        base = 16;
+                        b += 2;
+                    } else {
+                        if (base == 0)
+                            base = 8;
+                    }
+                }
+            }
+        }
+        if (base == 0)
+            base = 10;
+
+        if (base < 2 || base > 36)
+            throw Py.ValueError("invalid base for long literal:" + base);
+
+        // if the base >= 22, then an 'l' or 'L' is a digit!
+        if (base < 22 && e > b && (str.charAt(e-1) == 'L' || str.charAt(e-1) == 'l'))
+            e--;
+        
+        if (b > 0 || e < str.length())
+            str = str.substring(b, e);
+        
+        try {
+            java.math.BigInteger bi = null;
+            if (sign == '-')
+                bi = new java.math.BigInteger("-" + str, base);
+            else
+                bi = new java.math.BigInteger(str, base);
+            return new PyLong(bi);
+        } catch (NumberFormatException exc) {
+            if (this instanceof PyNewUnicode) {
+                // TODO: here's a basic issue: do we use the BigInteger constructor
+                // above, or add an equivalent to CPython's PyNewUnicode_EncodeDecimal;
+                // we should note that the current error string does not quite match
+                // CPython regardless of the codec, that's going to require some more work
+                throw Py.UnicodeEncodeError("decimal", "codec can't encode character",
+                        0,0, "invalid decimal Unicode string");
+            }
+            else {
+            throw Py.ValueError("invalid literal for long() with base " + base + ": " + string);
+            }
+        } catch (StringIndexOutOfBoundsException exc) {
+            throw Py.ValueError("invalid literal for long() with base " + base + ": " + string);
+        }
+    }
+
+    private static String padding(int n, char pad) {
+        char[] chars = new char[n];
+        for (int i=0; i<n; i++)
+            chars[i] = pad;
+        return new String(chars);
+    }
+
+    private static char parse_fillchar(String function, String fillchar) {
+        if (fillchar == null) { return ' '; }
+        if (fillchar.length() != 1) {
+            throw Py.TypeError(function + "() argument 2 must be char, not str");
+        }
+        return fillchar.charAt(0);
+    }
+    
+    public String ljust(int width) {
+        return str_ljust(width, null);
+    }
+
+    public String ljust(int width, String padding) {
+        return str_ljust(width, padding);
+    }
+    
+    @ExposedMethod(defaults="null", doc = BuiltinDocs.str_ljust_doc)
+    final String str_ljust(int width, String fillchar) {
+        char pad = parse_fillchar("ljust", fillchar);
+        int n = width-string.length();
+        if (n <= 0)
+            return string;
+        return string+padding(n, pad);
+    }
+
+    public String rjust(int width) {
+        return str_rjust(width, null);
+    }
+
+    @ExposedMethod(defaults="null", doc = BuiltinDocs.str_rjust_doc)
+    final String str_rjust(int width, String fillchar) {
+        char pad = parse_fillchar("rjust", fillchar);
+        int n = width-string.length();
+        if (n <= 0)
+            return string;
+        return padding(n, pad)+string;
+    }
+
+    public String center(int width) {
+        return str_center(width, null);
+    }
+
+    @ExposedMethod(defaults="null", doc = BuiltinDocs.str_center_doc)
+    final String str_center(int width, String fillchar) {
+        char pad = parse_fillchar("center", fillchar);
+        int n = width-string.length();
+        if (n <= 0)
+            return string;
+        int half = n/2;
+        if (n%2 > 0 &&  width%2 > 0)
+            half += 1;
+        
+        return padding(half, pad)+string+padding(n-half, pad);
+    }
+
+    public String zfill(int width) {
+        return str_zfill(width);
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_zfill_doc)
+    final String str_zfill(int width) {
+        String s = string;
+        int n = s.length();
+        if (n >= width)
+            return s;
+        char[] chars = new char[width];
+        int nzeros = width-n;
+        int i=0;
+        int sStart=0;
+        if (n > 0) {
+            char start = s.charAt(0);
+            if (start == '+' || start == '-') {
+                chars[0] = start;
+                i += 1;
+                nzeros++;
+                sStart=1;
+            }
+        }
+        for(;i<nzeros; i++) {
+            chars[i] = '0';
+        }
+        s.getChars(sStart, s.length(), chars, i);
+        return new String(chars);
+    }
+
+    public String expandtabs() {
+        return str_expandtabs(8);
+    }
+
+    public String expandtabs(int tabsize) {
+        return str_expandtabs(tabsize);
+    }
+
+    @ExposedMethod(defaults = "8", doc = BuiltinDocs.str_expandtabs_doc)
+    final String str_expandtabs(int tabsize) {
+        String s = string;
+        StringBuilder buf = new StringBuilder((int)(s.length()*1.5));
+        char[] chars = s.toCharArray();
+        int n = chars.length;
+        int position = 0;
+
+        for(int i=0; i<n; i++) {
+            char c = chars[i];
+            if (c == '\t') {
+                int spaces = tabsize-position%tabsize;
+                position += spaces;
+                while (spaces-- > 0) {
+                    buf.append(' ');
+                }
+                continue;
+            }
+            if (c == '\n' || c == '\r') {
+                position = -1;
+            }
+            buf.append(c);
+            position++;
+        }
+        return buf.toString();
+    }
+
+    public String capitalize() {
+        return str_capitalize();
+    }
+
+    @ExposedMethod(doc = BuiltinDocs.str_capitalize_doc)
+    final String str_capitalize() {
+        if (string.length() == 0)
+            return string;
+        String first = string.substring(0,1).toUpperCase();
+        return first.concat(string.substring(1).toLowerCase());
+    }
+
+    @ExposedMethod(defaults = "null", doc = BuiltinDocs.str_replace_doc)
+    final PyNewString str_replace(PyObject oldPiece, PyObject newPiece, PyObject maxsplit) {
+        if(!(oldPiece instanceof PyNewString) || !(newPiece instanceof PyNewString)) {
+            throw Py.TypeError("str or unicode required for replace");
+        }
+
+        return replace((PyNewString)oldPiece, (PyNewString)newPiece, maxsplit == null ? -1 : maxsplit.asInt());
+    }
+    
+    protected PyNewString replace(PyNewString oldPiece, PyNewString newPiece, int maxsplit) {
+        int len = string.length();
+        int old_len = oldPiece.string.length();
+        if (len == 0) {
+            if (max...
 
[truncated message content]