plist-cil/plist-cil/ASCIIPropertyListParser.cs

// plist-cil - An open source library to parse and generate property lists for .NET
// Copyright (C) 2015 Natalia Portillo
//
// This code is based on:
// plist - An open source library to parse and generate property lists
// Copyright (C) 2014 Daniel Dreibrodt
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.

using System;
using System.Collections.Generic;
using System.IO;
using System.Text;
using System.Text.RegularExpressions;

namespace Claunia.PropertyList
{
    /// <summary>
    ///     <para>
    ///         Parser for ASCII property lists. Supports Apple OS X/iOS and GnuStep/NeXTSTEP format.
    ///         This parser is based on the recursive descent paradigm, but the underlying grammar
    ///         is not explicitly defined.
    ///     </para>
    ///     <para>
    ///         Resources on ASCII property list format:
    ///     </para>
    ///     <para>
    ///         https://developer.apple.com/library/mac/#documentation/Cocoa/Conceptual/PropertyLists/OldStylePlists/OldStylePLists.html
    ///     </para>
    ///     <para>
    ///         Property List Programming Guide - Old-Style ASCII Property Lists
    ///     </para>
    ///     <para>
    ///         http://www.gnustep.org/resources/documentation/Developer/Base/Reference/NSPropertyList.html
    ///     </para>
    ///     <para>
    ///         GnuStep - NSPropertyListSerialization class documentation
    ///     </para>
    /// </summary>
    /// @author Daniel Dreibrodt
    /// @author Natalia Portillo
    public class ASCIIPropertyListParser
    {
        /// <summary>
        ///     A space
        /// </summary>
        public const char WHITESPACE_SPACE = ' ';
        /// <summary>
        ///     A tabulator
        /// </summary>
        public const char WHITESPACE_TAB = '\t';
        /// <summary>
        ///     A newline
        /// </summary>
        public const char WHITESPACE_NEWLINE = '\n';
        /// <summary>
        ///     A carriage return
        /// </summary>
        public const char WHITESPACE_CARRIAGE_RETURN = '\r';

        /// <summary>
        ///     Token of NSArray start
        /// </summary>
        public const char ARRAY_BEGIN_TOKEN = '(';
        /// <summary>
        ///     Token of NSArray end
        /// </summary>
        public const char ARRAY_END_TOKEN = ')';
        /// <summary>
        ///     Token of NSArray item delimiter
        /// </summary>
        public const char ARRAY_ITEM_DELIMITER_TOKEN = ',';

        /// <summary>
        ///     Token of NSDictionary start
        /// </summary>
        public const char DICTIONARY_BEGIN_TOKEN = '{';
        /// <summary>
        ///     Token of NSDictionary end
        /// </summary>
        public const char DICTIONARY_END_TOKEN = '}';
        /// <summary>
        ///     Token of NSDictionary assignment
        /// </summary>
        public const char DICTIONARY_ASSIGN_TOKEN = '=';
        /// <summary>
        ///     Token of NSDictionary item delimiter
        /// </summary>
        public const char DICTIONARY_ITEM_DELIMITER_TOKEN = ';';

        /// <summary>
        ///     Token of quoted NSString start
        /// </summary>
        public const char QUOTEDSTRING_BEGIN_TOKEN = '"';
        /// <summary>
        ///     Token of quoted NSString end
        /// </summary>
        public const char QUOTEDSTRING_END_TOKEN = '"';
        /// <summary>
        ///     Token of quoted NSString escaped character
        /// </summary>
        public const char QUOTEDSTRING_ESCAPE_TOKEN = '\\';

        /// <summary>
        ///     Token of NSData start
        /// </summary>
        public const char DATA_BEGIN_TOKEN = '<';
        /// <summary>
        ///     Token of NSData end
        /// </summary>
        public const char DATA_END_TOKEN = '>';

        /// <summary>
        ///     Token of GSObject start
        /// </summary>
        public const char DATA_GSOBJECT_BEGIN_TOKEN = '*';
        /// <summary>
        ///     Token of GSDate start
        /// </summary>
        public const char DATA_GSDATE_BEGIN_TOKEN = 'D';
        /// <summary>
        ///     Token of GSBoolean start
        /// </summary>
        public const char DATA_GSBOOL_BEGIN_TOKEN = 'B';
        /// <summary>
        ///     Token for GSBoolean's <c>true</c>
        /// </summary>
        public const char DATA_GSBOOL_TRUE_TOKEN = 'Y';
        /// <summary>
        ///     Token for GSBoolean's <c>false</c>
        /// </summary>
        public const char DATA_GSBOOL_FALSE_TOKEN = 'N';
        /// <summary>
        ///     Token for GSInteger
        /// </summary>
        public const char DATA_GSINT_BEGIN_TOKEN = 'I';
        /// <summary>
        ///     Token for GSReal
        /// </summary>
        public const char DATA_GSREAL_BEGIN_TOKEN = 'R';

        /// <summary>
        ///     Token for NSDate date field delimiter
        /// </summary>
        public const char DATE_DATE_FIELD_DELIMITER = '-';
        /// <summary>
        ///     Token for NSDate time field delimiter
        /// </summary>
        public const char DATE_TIME_FIELD_DELIMITER = ':';
        /// <summary>
        ///     Token for GSDate date and time delimiter
        /// </summary>
        public const char DATE_GS_DATE_TIME_DELIMITER = ' ';
        /// <summary>
        ///     Token for NSDate date and time delimiter
        /// </summary>
        public const char DATE_APPLE_DATE_TIME_DELIMITER = 'T';
        /// <summary>
        ///     Token for NSDate end
        /// </summary>
        public const char DATE_APPLE_END_TOKEN = 'Z';

        /// <summary>
        ///     Token for comment start
        /// </summary>
        public const char COMMENT_BEGIN_TOKEN = '/';
        /// <summary>
        ///     Second token for multiline comment
        /// </summary>
        public const char MULTILINE_COMMENT_SECOND_TOKEN = '*';
        /// <summary>
        ///     Second token for singleline comment
        /// </summary>
        public const char SINGLELINE_COMMENT_SECOND_TOKEN = '/';
        /// <summary>
        ///     End token for multiline comment
        /// </summary>
        public const char MULTILINE_COMMENT_END_TOKEN = '/';

        /// <summary>
        ///     Property list source data, as characters. Assigned by the constructor that takes the
        ///     property list content and read by all Accept/Expect/Read helpers at position <see cref="index" />.
        /// </summary>
        char[] data;
        /// <summary>
        ///     Current parsing index into <see cref="data" />. Reset to 0 by <see cref="Parse()" /> and
        ///     advanced by the Skip/Read helpers.
        /// </summary>
        int index;

        /// <summary>
        ///     Only allow subclasses to change instantiation.
        ///     This constructor does not assign any source data.
        /// </summary>
        protected ASCIIPropertyListParser() { }

        /// <summary>
        ///     Initializes a parser that will read from the supplied characters.
        /// </summary>
        /// <param name="propertyListContent">The characters of the property list that is to be parsed.</param>
        ASCIIPropertyListParser(char[] propertyListContent)
        {
            // The array is stored as-is (no copy is made)
            this.data = propertyListContent;
        }

        /// <summary>
        ///     Parses an ASCII property list file.
        /// </summary>
        /// <param name="f">The ASCII property list file.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        /// <exception cref="IOException">When an error occurred while reading from the input stream.</exception>
        public static NSObject Parse(FileInfo f)
        {
            // This method opens the stream, so it is also responsible for closing it;
            // Parse(Stream) deliberately leaves the stream open for its caller.
            using(FileStream fs = f.OpenRead())
            {
                return Parse(fs);
            }
        }

        /// <summary>
        ///     Reads the given stream through <c>PropertyListParser.ReadAll</c> and parses the
        ///     resulting bytes as an ASCII property list.
        /// </summary>
        /// <param name="fs">The input stream that points to the property list's data.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        /// <exception cref="IOException">When an error occurs while reading from the stream.</exception>
        public static NSObject Parse(Stream fs)
        {
            // The stream is not closed here - that is the responsibility of the code that calls Parse
            byte[] contents = PropertyListParser.ReadAll(fs);

            return Parse(contents);
        }

        /// <summary>
        ///     Parses an ASCII property list held in a byte array.
        ///     The whole array is viewed as a span and handed to the span-based overload.
        /// </summary>
        /// <param name="bytes">The ASCII property list data.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        public static NSObject Parse(byte[] bytes)
        {
            ReadOnlySpan<byte> wholeArray = bytes.AsSpan();

            return Parse(wholeArray);
        }

        /// <summary>
        ///     Parses an ASCII property list from a section of a byte array.
        /// </summary>
        /// <param name="bytes">The array containing the ASCII property list data.</param>
        /// <param name="offset">The index in <paramref name="bytes" /> at which the property list starts.</param>
        /// <param name="count">The number of bytes that make up the property list.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        public static NSObject Parse(byte[] bytes, int offset, int count)
        {
            ReadOnlySpan<byte> section = bytes.AsSpan(offset, count);

            return Parse(section);
        }

        /// <summary>
        ///     Decodes the given bytes as UTF-8 text and parses that text as an ASCII property list.
        /// </summary>
        /// <param name="bytes">The ASCII property list data.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        public static NSObject Parse(ReadOnlySpan<byte> bytes)
        {
            string text;

            // Without NATIVE_SPAN the span is copied into an array before it is decoded
            #if NATIVE_SPAN
            text = Encoding.UTF8.GetString(bytes);
            #else
            text = Encoding.UTF8.GetString(bytes.ToArray());
            #endif

            return ParseString(text);
        }

        /// <summary>
        ///     Parses an ASCII property list given as a string.
        /// </summary>
        /// <param name="value">The ASCII property list data.</param>
        /// <returns>The root object of the property list. This is usually a NSDictionary but can also be a NSArray.</returns>
        /// <exception cref="FormatException">When an error occurs during parsing.</exception>
        public static NSObject ParseString(string value)
        {
            char[] content = value.ToCharArray();

            return new ASCIIPropertyListParser(content).Parse();
        }

        /// <summary>
        ///     Tests whether the input, starting at the current parsing position, matches the
        ///     given symbols one after another. The parsing position is not moved.
        /// </summary>
        /// <returns>Whether the given tokens occur at the current parsing position.</returns>
        /// <param name="sequence">The sequence of tokens to look for.</param>
        bool AcceptSequence(params char[] sequence)
        {
            int offset = 0;

            foreach(char expected in sequence)
            {
                // Stop at the first mismatch; later positions are not inspected
                if(data[index + offset] != expected) return false;

                offset++;
            }

            return true;
        }

        /// <summary>
        ///     Tests whether the symbol at the current parsing position equals any of the given symbols.
        ///     The parsing position is not moved.
        /// </summary>
        /// <param name="acceptableSymbols">The symbols to check.</param>
        /// <returns>Whether one of the symbols can be accepted or not.</returns>
        bool Accept(params char[] acceptableSymbols)
        {
            foreach(char candidate in acceptableSymbols)
            {
                if(data[index] == candidate) return true;
            }

            return false;
        }

        /// <summary>
        ///     Tests whether the symbol at the current parsing position equals the given symbol.
        ///     The parsing position is not moved.
        /// </summary>
        /// <param name="acceptableSymbol">The symbol to check.</param>
        /// <returns>Whether the symbol can be accepted or not.</returns>
        bool Accept(char acceptableSymbol)
        {
            char current = data[index];

            return current == acceptableSymbol;
        }

        /// <summary>
        ///     Requires that one of the given symbols is present at the current parsing position.
        ///     The parsing position is not moved.
        /// </summary>
        /// <param name="expectedSymbols">The expected symbols.</param>
        /// <exception cref="FormatException">If none of the expected symbols could be found.</exception>
        void Expect(params char[] expectedSymbols)
        {
            if(Accept(expectedSymbols)) return;

            // Build "Expected 'a' or 'b' ... but found 'x'"
            StringBuilder message = new StringBuilder("Expected '");
            message.Append(expectedSymbols[0]).Append("'");

            for(int i = 1; i < expectedSymbols.Length; i++)
                message.Append(" or '").Append(expectedSymbols[i]).Append("'");

            message.Append(" but found '").Append(data[index]).Append("'");

            throw new FormatException(string.Format("{0} at {1}", message.ToString(), index));
        }

        /// <summary>
        ///     Requires that the given symbol is present at the current parsing position.
        ///     The parsing position is not moved.
        /// </summary>
        /// <param name="expectedSymbol">The expected symbol.</param>
        /// <exception cref="FormatException">If the expected symbol could not be found.</exception>
        void Expect(char expectedSymbol)
        {
            if(Accept(expectedSymbol)) return;

            string message = string.Format("Expected '{0}' but found '{1}' at {2}", expectedSymbol, data[index],
                                           index);

            throw new FormatException(message);
        }

        /// <summary>
        ///     Consumes the given symbol: verifies it is at the current parsing position and then
        ///     moves the position one symbol forward.
        /// </summary>
        /// <param name="symbol">The symbol to read.</param>
        /// <exception cref="FormatException">If the expected symbol could not be read.</exception>
        void Read(char symbol)
        {
            Expect(symbol);
            Skip();
        }

        /// <summary>
        ///     Moves the parsing position one symbol forward without inspecting the input.
        /// </summary>
        void Skip()
        {
            index += 1;
        }

        /// <summary>
        ///     Moves the parsing position forward by several symbols without inspecting the input.
        /// </summary>
        /// <param name="numSymbols">The amount of symbols to skip.</param>
        void Skip(int numSymbols)
        {
            index = index + numSymbols;
        }

        /// <summary>
        ///     Skips all whitespaces and comments from the current parsing position onward.
        ///     Both single line comments ("//...") and multi line comments ("/* ... */") are skipped.
        /// </summary>
        void SkipWhitespacesAndComments()
        {
            bool commentSkipped;
            do
            {
                commentSkipped = false;

                //Skip whitespaces
                while(Accept(WHITESPACE_CARRIAGE_RETURN, WHITESPACE_NEWLINE, WHITESPACE_SPACE, WHITESPACE_TAB)) Skip();

                //Skip single line comments "//..."
                if(AcceptSequence(COMMENT_BEGIN_TOKEN, SINGLELINE_COMMENT_SECOND_TOKEN))
                {
                    Skip(2);

                    //Advance to the end of the line; the comment text is not needed, so it is not collected
                    while(!Accept(WHITESPACE_CARRIAGE_RETURN, WHITESPACE_NEWLINE)) Skip();

                    commentSkipped = true;
                }
                //Skip multi line comments "/* ... */"
                else if(AcceptSequence(COMMENT_BEGIN_TOKEN, MULTILINE_COMMENT_SECOND_TOKEN))
                {
                    Skip(2);

                    //Advance until the closing "*/" is at the current position, then step over it
                    while(!AcceptSequence(MULTILINE_COMMENT_SECOND_TOKEN, MULTILINE_COMMENT_END_TOKEN)) Skip();

                    Skip(2);
                    commentSkipped = true;
                }
            }
            while(commentSkipped); //if a comment was skipped more whitespace or another comment can follow, so skip again
        }

        /// <summary>
        ///     Reads input until one of the given symbols is found.
        ///     The parsing position is left on the terminating symbol, which is not part of the result.
        /// </summary>
        /// <returns>The input until one the given symbols.</returns>
        /// <param name="symbols">The symbols that can occur after the string to read.</param>
        string ReadInputUntil(params char[] symbols)
        {
            int start = index;

            while(!Accept(symbols)) Skip();

            // Copy the consumed range in one step instead of appending character by character
            return new string(data, start, index - start);
        }

        /// <summary>
        ///     Reads input until the given symbol is found.
        ///     The parsing position is left on the terminating symbol, which is not part of the result.
        /// </summary>
        /// <returns>The input until the given symbol.</returns>
        /// <param name="symbol">The symbol that can occur after the string to read.</param>
        string ReadInputUntil(char symbol)
        {
            int start = index;

            while(!Accept(symbol)) Skip();

            // Copy the consumed range in one step instead of appending character by character
            return new string(data, start, index - start);
        }

        /// <summary>
        ///     Parses the property list from the beginning and returns the root object
        ///     of the property list.
        /// </summary>
        /// <returns>The root object of the property list. This can either be a NSDictionary or a NSArray.</returns>
        /// <exception cref="FormatException">
        ///     When an error occurred during parsing, including when the end of the input is reached unexpectedly.
        /// </exception>
        public NSObject Parse()
        {
            index = 0;

            try
            {
                //Skip Unicode byte order mark (BOM).
                //Text decoded from UTF-8 carries the BOM as the single character U+FEFF.
                if(data.Length >= 1 && data[0] == '\uFEFF') Skip();
                //Also accept the BOM when its three raw bytes were each turned into one character
                else if(data.Length >= 3 && (data[0] & 0xFF) == 0xEF && (data[1] & 0xFF) == 0xBB &&
                        (data[2] & 0xFF) == 0xBF) Skip(3);

                //The leading skip and check run inside the try block so that empty or
                //whitespace-only input is reported as a FormatException as well
                SkipWhitespacesAndComments();
                Expect(DICTIONARY_BEGIN_TOKEN, ARRAY_BEGIN_TOKEN, COMMENT_BEGIN_TOKEN);

                return ParseObject();
            }
            catch(IndexOutOfRangeException ex)
            {
                throw new FormatException(string.Format("Reached end of input unexpectedly at {0}.", index), ex);
            }
        }

        /// <summary>
        ///     Parses the object that starts at the current parsing position, choosing the
        ///     concrete parser from the first symbol.
        /// </summary>
        /// <returns>The parsed NSObject.</returns>
        /// <seealso cref="ASCIIPropertyListParser.index" />
        NSObject ParseObject()
        {
            char first = data[index];

            if(first == ARRAY_BEGIN_TOKEN) return ParseArray();

            if(first == DICTIONARY_BEGIN_TOKEN) return ParseDictionary();

            if(first == DATA_BEGIN_TOKEN) return ParseData();

            if(first == QUOTEDSTRING_BEGIN_TOKEN)
            {
                string quoted = ParseQuotedString();

                //apple dates are quoted strings of length 20 and after the 4 year digits a dash is found
                bool looksLikeDate = quoted.Length == 20 && quoted[4] == DATE_DATE_FIELD_DELIMITER;

                if(looksLikeDate)
                {
                    try { return new NSDate(quoted); }
                    catch(Exception)
                    {
                        //not a date? --> fall through and return it as a string
                    }
                }

                return new NSString(quoted);
            }

            //unquoted token starting with 0-9 -> may be a date
            if(first >= '0' && first <= '9') return ParseDateString();

            //anything else -> plain unquoted string
            return new NSString(ParseString());
        }

        /// <summary>
        ///     Parses an array from the current parsing position.
        ///     The current position must be on the array begin token, which is skipped without being checked.
        /// </summary>
        /// <returns>The array found at the parsing position.</returns>
        NSArray ParseArray()
        {
            List<NSObject> items = new List<NSObject>();

            //Step over the begin token and anything ignorable behind it
            Skip();
            SkipWhitespacesAndComments();

            while(!Accept(ARRAY_END_TOKEN))
            {
                items.Add(ParseObject());
                SkipWhitespacesAndComments();

                //without a delimiter the array must end here
                if(!Accept(ARRAY_ITEM_DELIMITER_TOKEN)) break;

                Skip();
                SkipWhitespacesAndComments();
            }

            //the end token is mandatory
            Read(ARRAY_END_TOKEN);

            return new NSArray(items.ToArray());
        }

        /// <summary>
        ///     Parses a dictionary from the current parsing position.
        ///     The current position must be on the dictionary begin token, which is skipped without being checked.
        /// </summary>
        /// <returns>The dictionary found at the parsing position.</returns>
        NSDictionary ParseDictionary()
        {
            NSDictionary result = new NSDictionary();

            //Step over the begin token and anything ignorable behind it
            Skip();
            SkipWhitespacesAndComments();

            while(!Accept(DICTIONARY_END_TOKEN))
            {
                //Key: quoted or plain string
                string key = Accept(QUOTEDSTRING_BEGIN_TOKEN) ? ParseQuotedString() : ParseString();
                SkipWhitespacesAndComments();

                //Assignment token
                Read(DICTIONARY_ASSIGN_TOKEN);
                SkipWhitespacesAndComments();

                //Value
                NSObject value = ParseObject();
                result.Add(key, value);
                SkipWhitespacesAndComments();

                //Every entry is terminated by the item delimiter
                Read(DICTIONARY_ITEM_DELIMITER_TOKEN);
                SkipWhitespacesAndComments();
            }

            //Step over the end token
            Skip();

            return result;
        }

        /// <summary>
        ///     Parses a data object from the current parsing position.
        ///     This can either be a NSData object (hexadecimal digits between the data tokens) or a
        ///     GnuStep typed value (boolean, date, integer or real) that is returned as NSNumber or NSDate.
        ///     The current position must be on the data begin token, which is skipped without being checked.
        /// </summary>
        /// <returns>The data object found at the parsing position.</returns>
        NSObject ParseData()
        {
            //Step over the begin token
            Skip();

            if(!Accept(DATA_GSOBJECT_BEGIN_TOKEN))
            {
                //Plain data: hexadecimal digits, whitespace in between is ignored
                string hex = Regex.Replace(ReadInputUntil(DATA_END_TOKEN), "\\s+", "");

                byte[] payload = new byte[hex.Length / 2];
                for(int pos = 0; pos < payload.Length; pos++)
                    payload[pos] = (byte)Convert.ToInt32(hex.Substring(pos * 2, 2), 16);

                NSObject data = new NSData(payload);

                //Step over the end token
                Skip();

                return data;
            }

            //GnuStep typed value: the '*' is followed by a type symbol
            Skip();
            Expect(DATA_GSBOOL_BEGIN_TOKEN, DATA_GSDATE_BEGIN_TOKEN, DATA_GSINT_BEGIN_TOKEN,
                   DATA_GSREAL_BEGIN_TOKEN);

            NSObject typed;
            switch(data[index])
            {
                case DATA_GSBOOL_BEGIN_TOKEN:
                {
                    //Boolean: a single Y or N follows the type symbol
                    Skip();
                    Expect(DATA_GSBOOL_TRUE_TOKEN, DATA_GSBOOL_FALSE_TOKEN);
                    typed = new NSNumber(Accept(DATA_GSBOOL_TRUE_TOKEN));
                    //Step over the Y/N symbol
                    Skip();
                    break;
                }
                case DATA_GSDATE_BEGIN_TOKEN:
                {
                    //Date: everything up to the end token is the date text
                    Skip();
                    typed = new NSDate(ReadInputUntil(DATA_END_TOKEN));
                    break;
                }
                default:
                {
                    //Integer or real: everything up to the end token is the number text
                    Skip();
                    typed = new NSNumber(ReadInputUntil(DATA_END_TOKEN));
                    break;
                }
            }

            //The end token is mandatory
            Read(DATA_END_TOKEN);

            return typed;
        }

        /// <summary>
        ///     Reads a plain string and tries to interpret it as a date.
        ///     Only strings with a dash as fifth character are tried; when the NSDate cannot be
        ///     created from the string, the string itself is returned.
        /// </summary>
        /// <returns>A NSDate if the string represents such an object. Otherwise a NSString is returned.</returns>
        NSObject ParseDateString()
        {
            string token = ParseString();

            bool dashAfterYear = token.Length > 4 && token[4] == DATE_DATE_FIELD_DELIMITER;

            if(!dashAfterYear) return new NSString(token);

            try { return new NSDate(token); }
            catch(Exception)
            {
                //Not a date after all, so hand it back as a plain string
                return new NSString(token);
            }
        }

        /// <summary>
        ///     Parses a plain (unquoted) string from the current parsing position.
        ///     The string ends before the next whitespace, array or dictionary item delimiter,
        ///     assignment token or array end token.
        /// </summary>
        /// <returns>The string found at the current parsing position.</returns>
        string ParseString()
        {
            char[] terminators =
            {
                WHITESPACE_SPACE, WHITESPACE_TAB, WHITESPACE_NEWLINE, WHITESPACE_CARRIAGE_RETURN,
                ARRAY_ITEM_DELIMITER_TOKEN, DICTIONARY_ITEM_DELIMITER_TOKEN, DICTIONARY_ASSIGN_TOKEN,
                ARRAY_END_TOKEN
            };

            return ReadInputUntil(terminators);
        }

        /// <summary>
        ///     Parses a quoted string from the current parsing position.
        ///     The current position must be on the quoted string begin token, which is skipped without being checked.
        ///     After the call the position is behind the closing quotation mark.
        /// </summary>
        /// <returns>The quoted string found at the parsing position with all special characters unescaped.</returns>
        /// <exception cref="FormatException">
        ///     If the text between the quotation marks could not be unescaped. The original error is
        ///     available as the inner exception.
        /// </exception>
        string ParseQuotedString()
        {
            //Skip begin token
            Skip();
            int  start              = index;
            bool unescapedBackslash = true;

            //Read from opening quotation marks to closing quotation marks and skip escaped quotation marks.
            //unescapedBackslash tracks whether a preceding backslash is itself escaped, so that in
            //a sequence such as \\" the quotation mark still ends the string.
            while(data[index] != QUOTEDSTRING_END_TOKEN ||
                  (data[index - 1] == QUOTEDSTRING_ESCAPE_TOKEN && unescapedBackslash))
            {
                if(Accept(QUOTEDSTRING_ESCAPE_TOKEN))
                    unescapedBackslash = !(data[index - 1] == QUOTEDSTRING_ESCAPE_TOKEN && unescapedBackslash);
                Skip();
            }

            //The raw content is one contiguous range of the input, so copy it in a single step
            string quotedString = new string(data, start, index - start);

            string unescapedString;
            try { unescapedString = ParseQuotedString(quotedString); }
            catch(Exception ex)
            {
                throw new FormatException(string.Format("The quoted string could not be parsed at {0}.", index),
                                          ex);
            }

            //skip end token
            Skip();
            return unescapedString;
        }

        /// <summary>
        ///     Parses a string according to the format specified for ASCII property lists.
        ///     Such strings can contain escape sequences which are unescaped in this method:
        ///     <c>\\</c>, <c>\"</c>, <c>\b</c>, <c>\n</c>, <c>\r</c>, <c>\t</c>, <c>\U</c> or <c>\u</c> followed by
        ///     four hexadecimal digits, and a backslash followed by three octal digits.
        ///     All other characters are copied unchanged.
        /// </summary>
        /// <returns>The unescaped string.</returns>
        /// <param name="s">
        ///     The escaped string according to the ASCII property list format, without leading and trailing quotation
        ///     marks.
        /// </param>
        /// <exception cref="FormatException">If an escape sequence is incomplete or contains an invalid digit.</exception>
        public static string ParseQuotedString(string s)
        {
            StringBuilder unescaped = new StringBuilder(s.Length);

            using(IEnumerator<char> c = ((IEnumerable<char>)s).GetEnumerator())
            {
                while(c.MoveNext())
                {
                    if(c.Current == '\\')
                        //An escaped sequence is following; the helper consumes its characters
                        unescaped.Append(ParseEscapedSequence(c));
                    else
                        //Any other character is taken over as it is. Characters are appended directly,
                        //so the two halves of a surrogate pair stay together.
                        unescaped.Append(c.Current);
                }
            }

            return unescaped.ToString();
        }

        /// <summary>
        ///     Unescapes an escaped character sequence, e.g. \\u00FC.
        /// </summary>
        /// <returns>The unescaped character as a string.</returns>
        /// <param name="iterator">
        ///     The string character iterator positioned on the backslash; the characters of the
        ///     escape sequence are consumed from it.
        /// </param>
        /// <exception cref="FormatException">If the escape sequence is incomplete or contains an invalid digit.</exception>
        static string ParseEscapedSequence(IEnumerator<char> iterator)
        {
            char c = NextEscapeChar(iterator);

            switch(c)
            {
                case '\\': return "\\";
                case '"':  return "\"";
                case 'b':  return "\b";
                case 'n':  return "\n";
                case 'r':  return "\r";
                case 't':  return "\t";
                case 'U':
                case 'u':
                {
                    //4 digit hex value of one UTF-16 code unit
                    int codeUnit = 0;
                    for(int i = 0; i < 4; i++)
                        codeUnit = (codeUnit << 4) | EscapeDigitValue(NextEscapeChar(iterator), 16);

                    return ((char)codeUnit).ToString();
                }
                default:
                {
                    //3 digit octal value; the character already read is the first digit
                    int code = EscapeDigitValue(c, 8);
                    for(int i = 0; i < 2; i++) code = (code << 3) | EscapeDigitValue(NextEscapeChar(iterator), 8);

                    //Only the low eight bits are used, so values above \377 wrap around
                    return ((char)(code & 0xFF)).ToString();
                }
            }
        }

        /// <summary>
        ///     Advances the iterator and returns the next character of an escape sequence.
        /// </summary>
        /// <returns>The character the iterator was advanced to.</returns>
        /// <param name="iterator">The iterator over the escaped string.</param>
        /// <exception cref="FormatException">If the string ends before the escape sequence is complete.</exception>
        static char NextEscapeChar(IEnumerator<char> iterator)
        {
            if(!iterator.MoveNext()) throw new FormatException("Incomplete escape sequence in quoted string.");

            return iterator.Current;
        }

        /// <summary>
        ///     Converts one digit of an escape sequence to its numeric value.
        /// </summary>
        /// <returns>The value of the digit, between 0 and <paramref name="radix" /> - 1.</returns>
        /// <param name="digit">The digit character (0-9, a-f or A-F).</param>
        /// <param name="radix">The base of the number the digit belongs to, at most 16.</param>
        /// <exception cref="FormatException">If the character is not a digit of the given base.</exception>
        static int EscapeDigitValue(char digit, int radix)
        {
            int value;

            if(digit >= '0' && digit <= '9') value      = digit - '0';
            else if(digit >= 'a' && digit <= 'f') value = digit - 'a' + 10;
            else if(digit >= 'A' && digit <= 'F') value = digit - 'A' + 10;
            else value                                  = -1;

            if(value < 0 || value >= radix)
                throw new FormatException(string.Format("Invalid digit '{0}' in escape sequence.", digit));

            return value;
        }

        /// <summary>
        ///     Checks whether every character of the given text has a code of at most 0x7F.
        /// </summary>
        /// <param name="text">The text to check.</param>
        /// <returns><c>true</c> if no character is above 0x7F (also for an empty text), otherwise <c>false</c>.</returns>
        internal static bool IsASCIIEncodable(string text)
        {
            for(int i = 0; i < text.Length; i++)
            {
                if(text[i] > 0x7F) return false;
            }

            return true;
        }
    }
}