LiteralParser.cs - This C# code is a Python interpreter imp…

/IronPython_2_6/Src/IronPython/Runtime/LiteralParser.cs

# · C# · 619 lines · 508 code · 64 blank · 47 comment · 188 complexity · 28d7ab60e1c4636b5eecdd5200790386 MD5 · raw file

/* ****************************************************************************

 *

 * Copyright (c) Microsoft Corporation. 

 *

 * This source code is subject to terms and conditions of the Microsoft Public License. A 

 * copy of the license can be found in the License.html file at the root of this distribution. If 

 * you cannot locate the  Microsoft Public License, please send an email to 

 * dlr@microsoft.com. By using this source code in any fashion, you are agreeing to be bound 

 * by the terms of the Microsoft Public License.

 *

 * You must not remove this notice, or any other, from this software.

 *

 *

 * ***************************************************************************/



using System;

using System.Collections.Generic;

using System.Diagnostics;

using System.Globalization;

using System.Text;



using IronPython.Runtime.Operations;



using Microsoft.Scripting.Utils;



#if CLR2

using Microsoft.Scripting.Math;

using Complex = Microsoft.Scripting.Math.Complex64;

#else

using System.Numerics;

#endif



namespace IronPython.Runtime {

    /// <summary>

    /// Summary description for ConstantValue.

    /// </summary>

    public static class LiteralParser {

        public static string ParseString(string text, bool isRaw, bool isUni) {

            return ParseString(text, isRaw, isUni, true);

        }

        public static string ParseString(string text, bool isRaw, bool isUni, bool complete) {

            Debug.Assert(text != null);



            if (isRaw && !isUni) return text;



            //PERFORMANCE-ISSUE ??? maybe optimize for the 0-escapes case

            StringBuilder buf = new StringBuilder(text.Length);

            int i = 0;

            int l = text.Length;

            int val;

            while (i < l) {

                char ch = text[i++];

                if (ch == '\\') {

                    if (i >= l) {

                        if (!complete) {

                            break;

                        } else if (isRaw) {

                            buf.Append('\\');

                            break;

                        } else {

                            throw PythonOps.ValueError("Trailing \\ in string");

                        }

                    }

                    ch = text[i++];



                    if (ch == 'u' || ch == 'U') {

                        int len = (ch == 'u') ? 4 : 8;

                        int max = 16;

                        if (isUni) {

                            if (TryParseInt(text, i, len, max, out val)) {

                                buf.Append((char)val);

                                i += len;

                            } else {

                                throw PythonOps.UnicodeEncodeError(@"'unicodeescape' codec can't decode bytes in position {0}: truncated \uXXXX escape", i);

                            }

                        } else {

                            buf.Append('\\');

                            buf.Append(ch);

                        }

                    } else {

                        if (isRaw) {

                            buf.Append('\\');

                            buf.Append(ch);

                            continue;

                        }

                        switch (ch) {

                            case 'a': buf.Append('\a'); continue;

                            case 'b': buf.Append('\b'); continue;

                            case 'f': buf.Append('\f'); continue;

                            case 'n': buf.Append('\n'); continue;

                            case 'r': buf.Append('\r'); continue;

                            case 't': buf.Append('\t'); continue;

                            case 'v': buf.Append('\v'); continue;

                            case '\\': buf.Append('\\'); continue;

                            case '\'': buf.Append('\''); continue;

                            case '\"': buf.Append('\"'); continue;

                            case '\r': if (i < l && text[i] == '\n') i++; continue;

                            case '\n': continue;

                            case 'x': //hex

                                if (!TryParseInt(text, i, 2, 16, out val)) {

                                    goto default;

                                }

                                buf.Append((char)val);

                                i += 2;

                                continue;

                            case '0':

                            case '1':

                            case '2':

                            case '3':

                            case '4':

                            case '5':

                            case '6':

                            case '7': {

                                    int onechar;

                                    val = ch - '0';

                                    if (i < l && HexValue(text[i], out onechar) && onechar < 8) {

                                        val = val * 8 + onechar;

                                        i++;

                                        if (i < l && HexValue(text[i], out onechar) && onechar < 8) {

                                            val = val * 8 + onechar;

                                            i++;

                                        }

                                    }

                                }



                                buf.Append((char)val);

                                continue;

                            default:

                                buf.Append("\\");

                                buf.Append(ch);

                                continue;

                        }

                    }

                } else {

                    buf.Append(ch);

                }

            }



            return buf.ToString();

        }



        internal static List<byte> ParseBytes(string text, bool isRaw, bool complete) {

            Debug.Assert(text != null);



            //PERFORMANCE-ISSUE ??? maybe optimize for the 0-escapes case

            List<byte> buf = new List<byte>(text.Length);



            int i = 0;

            int l = text.Length;

            int val;

            while (i < l) {

                char ch = text[i++];

                if (!isRaw && ch == '\\') {

                    if (i >= l) {

                        if (!complete) {

                            break;

                        } else {

                            throw PythonOps.ValueError("Trailing \\ in string");

                        }

                    }

                    ch = text[i++];

                    switch (ch) {

                        case 'a': buf.Add((byte)'\a'); continue;

                        case 'b': buf.Add((byte)'\b'); continue;

                        case 'f': buf.Add((byte)'\f'); continue;

                        case 'n': buf.Add((byte)'\n'); continue;

                        case 'r': buf.Add((byte)'\r'); continue;

                        case 't': buf.Add((byte)'\t'); continue;

                        case 'v': buf.Add((byte)'\v'); continue;

                        case '\\': buf.Add((byte)'\\'); continue;

                        case '\'': buf.Add((byte)'\''); continue;

                        case '\"': buf.Add((byte)'\"'); continue;

                        case '\r': if (i < l && text[i] == '\n') i++; continue;

                        case '\n': continue;

                        case 'x': //hex

                            if (!TryParseInt(text, i, 2, 16, out val)) {

                                goto default;

                            }

                            buf.Add((byte)val);

                            i += 2;

                            continue;

                        case '0':

                        case '1':

                        case '2':

                        case '3':

                        case '4':

                        case '5':

                        case '6':

                        case '7': {

                                int onechar;

                                val = ch - '0';

                                if (i < l && HexValue(text[i], out onechar) && onechar < 8) {

                                    val = val * 8 + onechar;

                                    i++;

                                    if (i < l && HexValue(text[i], out onechar) && onechar < 8) {

                                        val = val * 8 + onechar;

                                        i++;

                                    }

                                }

                            }



                            buf.Add((byte)val);

                            continue;

                        default:

                            buf.Add((byte)'\\');

                            buf.Add((byte)ch);

                            continue;

                    }

                    

                } else {

                    buf.Add((byte)ch);

                }

            }            



            return buf;

        }



        private static bool HexValue(char ch, out int value) {

            switch (ch) {

                case '0':

                case '\x660': value = 0; break;

                case '1':

                case '\x661': value = 1; break;

                case '2':

                case '\x662': value = 2; break;

                case '3':

                case '\x663': value = 3; break;

                case '4':

                case '\x664': value = 4; break;

                case '5':

                case '\x665': value = 5; break;

                case '6':

                case '\x666': value = 6; break;

                case '7':

                case '\x667': value = 7; break;

                case '8':

                case '\x668': value = 8; break;

                case '9':

                case '\x669': value = 9; break;

                default:

                    if (ch >= 'a' && ch <= 'z') {

                        value = ch - 'a' + 10;

                    } else if (ch >= 'A' && ch <= 'Z') {

                        value = ch - 'A' + 10;

                    } else {

                        value = -1;

                        return false;

                    }

                    break;

            }

            return true;

        }



        private static int HexValue(char ch) {

            int value;

            if (!HexValue(ch, out value)) {

                throw new ArgumentException("bad char for integer value: " + ch);

            }

            return value;

        }



        private static int CharValue(char ch, int b) {

            int val = HexValue(ch);

            if (val >= b) {

                throw new ArgumentException(String.Format("bad char for the integer value: '{0}' (base {1})", ch, b));

            }

            return val;

        }



        private static bool ParseInt(string text, int b, out int ret) {

            ret = 0;

            long m = 1;

            for (int i = text.Length - 1; i >= 0; i--) {

                // avoid the exception here.  Not only is throwing it expensive,

                // but loading the resources for it is also expensive 

                long lret = (long)ret + m * CharValue(text[i], b);

                if (Int32.MinValue <= lret && lret <= Int32.MaxValue) {

                    ret = (int)lret;

                } else {

                    return false;

                }



                m *= b;

                if (Int32.MinValue > m || m > Int32.MaxValue) {

                    return false;

                }

            }

            return true;

        }



        private static bool TryParseInt(string text, int start, int length, int b, out int value) {

            value = 0;

            if (start + length > text.Length) {

                return false;

            }

            for (int i = start, end = start + length; i < end; i++) {

                int onechar;

                if (HexValue(text[i], out onechar) && onechar < b) {

                    value = value * b + onechar;

                } else {

                    return false;

                }

            }

            return true;

        }



        public static object ParseInteger(string text, int b) {

            Debug.Assert(b != 0);

            int iret;

            if (!ParseInt(text, b, out iret)) {

                BigInteger ret = ParseBigInteger(text, b);

                if (!ret.AsInt32(out iret)) {

                    return ret;

                }

            }

            return iret;

        }



        public static object ParseIntegerSign(string text, int b) {

            int start = 0, end = text.Length, saveb = b;

            short sign = 1;



            if (b < 0 || b == 1 || b > 36) {

                throw new ArgumentException("base must be >= 2 and <= 36");

            }



            ParseIntegerStart(text, ref b, ref start, end, ref sign);



            int ret = 0;

            try {

                int saveStart = start;

                for (; ; ) {

                    int digit;

                    if (start >= end) {

                        if (saveStart == start) {

                            throw new ArgumentException("Invalid integer literal");

                        }

                        break;

                    }

                    if (!HexValue(text[start], out digit)) break;

                    if (!(digit < b)) {

                        if (text[start] == 'l' || text[start] == 'L') {

                            break;

                        }

                        throw new ArgumentException("Invalid integer literal");

                    }



                    checked {

                        // include sign here so that System.Int32.MinValue won't overflow

                        ret = ret * b + sign * digit;

                    }

                    start++;

                }

            } catch (OverflowException) {

                return ParseBigIntegerSign(text, saveb);

            }



            ParseIntegerEnd(text, start, end);



            return ret;

        }



        private static void ParseIntegerStart(string text, ref int b, ref int start, int end, ref short sign) {

            //  Skip whitespace

            while (start < end && Char.IsWhiteSpace(text, start)) start++;

            //  Sign?

            if (start < end) {

                switch (text[start]) {

                    case '-':

                        sign = -1;

                        goto case '+';

                    case '+':

                        start++;

                        break;

                }

            }

            //  Skip whitespace

            while (start < end && Char.IsWhiteSpace(text, start)) start++;



            //  Determine base

            if (b == 0) {

                if (start < end && text[start] == '0') {

                    start++;

                    // Hex, oct, or bin

                    b = 8;

                    if (start < end) {

                        if (text[start] == 'x' || text[start] == 'X') {

                            start++;

                            b = 16;

                        } else if (text[start] == 'o' || text[start] == 'O') {

                            start++;

                        } else if (text[start] == 'b' || text[start] == 'B') {

                            start++;

                            b = 2;

                        }

                    }

                } else {

                    b = 10;

                }

            }

        }



        private static void ParseIntegerEnd(string text, int start, int end) {

            //  Skip whitespace

            while (start < end && Char.IsWhiteSpace(text, start)) start++;



            if (start < end) {

                throw new ArgumentException("invalid integer number literal");

            }

        }



        public static BigInteger ParseBigInteger(string text, int b) {

            Debug.Assert(b != 0);

            BigInteger ret = BigInteger.Zero;

            BigInteger m = BigInteger.One;



            int i = text.Length - 1;

            if (text[i] == 'l' || text[i] == 'L') i -= 1;



            int groupMax = 7;

            if (b <= 10) groupMax = 9;// 2 147 483 647



            while (i >= 0) {

                // extract digits in a batch

                int smallMultiplier = 1;

                uint uval = 0;



                for (int j = 0; j < groupMax && i >= 0; j++) {

                    uval = (uint)(CharValue(text[i--], b) * smallMultiplier + uval);

                    smallMultiplier *= b;

                }



                // this is more generous than needed

                ret += m * (BigInteger)uval;

                if (i >= 0) m = m * (smallMultiplier);

            }



            return ret;

        }



        public static BigInteger ParseBigIntegerSign(string text, int b) {

            int start = 0, end = text.Length;

            short sign = 1;



            if (b < 0 || b == 1 || b > 36) {

                throw new ArgumentException("base must be >= 2 and <= 36");

            }



            ParseIntegerStart(text, ref b, ref start, end, ref sign);



            BigInteger ret = BigInteger.Zero;

            int saveStart = start;

            for (; ; ) {

                int digit;

                if (start >= end) {

                    if (start == saveStart) {

                        throw new ArgumentException("Invalid integer literal");

                    }

                    break;

                }

                if (!HexValue(text[start], out digit)) break;

                if (!(digit < b)) {

                    if (text[start] == 'l' || text[start] == 'L') {

                        break;

                    }

                    throw new ArgumentException("Invalid integer literal");

                }

                ret = ret * b + digit;

                start++;

            }



            if (start < end && (text[start] == 'l' || text[start] == 'L')) {

                start++;

            }



            ParseIntegerEnd(text, start, end);



            return sign < 0 ? -ret : ret;

        }





        public static double ParseFloat(string text) {

            try {

                //

                // Strings that end with '\0' is the specific case that CLR libraries allow,

                // however Python doesn't. Since we use CLR floating point number parser,

                // we must check explicitly for the strings that end with '\0'

                //

                if (text != null && text.Length > 0 && text[text.Length - 1] == '\0') {

                    throw PythonOps.ValueError("null byte in float literal");

                }

                return ParseFloatNoCatch(text);

            } catch (OverflowException) {

                return text.lstrip().StartsWith("-") ? Double.NegativeInfinity : Double.PositiveInfinity;

            }

        }



        private static double ParseFloatNoCatch(string text) {

            string s = ReplaceUnicodeDigits(text);

            switch (s.lower().lstrip()) {

                case "nan":

                case "+nan":

                case "-nan":

                    return double.NaN;

                case "inf":

                case "+inf":

                    return double.PositiveInfinity;

                case "-inf":

                    return double.NegativeInfinity;

                default:

                    // pass NumberStyles to disallow ,'s in float strings.

                    double res = double.Parse(s, NumberStyles.Float, System.Globalization.CultureInfo.InvariantCulture);

                    return (res == 0.0 && text.lstrip().StartsWith("-")) ? DoubleOps.NegativeZero : res;

            }

        }



        private static string ReplaceUnicodeDigits(string text) {

            StringBuilder replacement = null;

            for (int i = 0; i < text.Length; i++) {

                if (text[i] >= '\x660' && text[i] <= '\x669') {

                    if (replacement == null) replacement = new StringBuilder(text);

                    replacement[i] = (char)(text[i] - '\x660' + '0');

                }

            }

            if (replacement != null) {

                text = replacement.ToString();

            }

            return text;

        }



        // ParseComplex helpers

        private static char[] signs = new char[] { '+', '-' };

        private static Exception ExnMalformed() {

            return PythonOps.ValueError("complex() arg is a malformed string");

        }



        public static Complex ParseComplex(string s) {

            // remove no-meaning spaces and convert to lowercase

            string text = s.Trim().ToLower();

            if (String.IsNullOrEmpty(text)) {

                throw PythonOps.ValueError("complex() arg is an empty string");

            }

            if (text.IndexOf(' ') != -1) {

                throw ExnMalformed();

            }



            // remove 1 layer of parens

            if (text.StartsWith("(") && text.EndsWith(")")) {

                text = text.Substring(1, text.Length - 2);

            }



            try {

                int len = text.Length;

                string real, imag;



                if (text[len - 1] == 'j') {

                    // last sign delimits real and imaginary...

                    int signPos = text.LastIndexOfAny(signs);

                    // ... unless it's after 'e', so we bypass up to 2 of those here

                    for (int i = 0; signPos > 0 && text[signPos - 1] == 'e'; i++) {

                        if (i == 2) {

                            // too many 'e's

                            throw ExnMalformed();

                        }

                        signPos = text.Substring(0, signPos - 1).LastIndexOfAny(signs);

                    }



                    // no real component

                    if (signPos < 0) {

                        return MathUtils.MakeImaginary((len == 1) ? 1 : ParseFloatNoCatch(text.Substring(0, len - 1)));

                    }



                    real = text.Substring(0, signPos);

                    imag = text.Substring(signPos, len - signPos - 1);

                    if (imag.Length == 1) {

                        imag += "1"; // convert +/- to +1/-1

                    }

                } else {

                    // 'j' delimits real and imaginary

                    string[] splitText = text.Split(new char[] { 'j' });



                    // no imaginary component

                    if (splitText.Length == 1) {

                        return MathUtils.MakeReal(ParseFloatNoCatch(text));

                    }



                    // there should only be one j

                    if (splitText.Length != 2) {

                        throw ExnMalformed();

                    }

                    real = splitText[1];

                    imag = splitText[0];



                    // a sign must follow the 'j'

                    if (!(real.StartsWith("+") || real.StartsWith("-"))) {

                        throw ExnMalformed();

                    }

                }



                return new Complex(String.IsNullOrEmpty(real) ? 0 : ParseFloatNoCatch(real), ParseFloatNoCatch(imag));

            } catch (OverflowException) {

                throw PythonOps.ValueError("complex() literal too large to convert");

            } catch {

                throw ExnMalformed();

            }

        }



        public static Complex ParseImaginary(string text) {

            try {

                return MathUtils.MakeImaginary(double.Parse(

                    text.Substring(0, text.Length - 1),

                    System.Globalization.CultureInfo.InvariantCulture.NumberFormat

                    ));

            } catch (OverflowException) {

                return new Complex(0, Double.PositiveInfinity);

            }

        }

    }

}
Summary ✨

This C# code is a Python interpreter implementation, providing methods for parsing and evaluating Python expressions, including arithmetic operations, complex numbers, and string manipulation. It includes functions for parsing strings, replacing Unicode digits, and handling exceptions, allowing it to execute Python-like code in C#. The code provides a way to run Python scripts or interact with Python from within a C# application.
Tech Fingerprint

.NET Base Class Library
Alerts (11)

'static' Mutable static field detected; use readonly or const to prevent race conditions
37 38 41 608
'switch (' Switch statement detected; include a default case for robustness
86
Complexity hotspot; lines 340 to 342 (total complexity: 6)
340 341 342
Complexity hotspot; lines 461 to 463 (total complexity: 6)
461 462 463