diff --git a/Claunia.Encoding.Tests/Claunia.Encoding.Tests.csproj b/Claunia.Encoding.Tests/Claunia.Encoding.Tests.csproj index f57d0f9..9fb0e2d 100644 --- a/Claunia.Encoding.Tests/Claunia.Encoding.Tests.csproj +++ b/Claunia.Encoding.Tests/Claunia.Encoding.Tests.csproj @@ -8,7 +8,7 @@ Claunia.Encoding.Tests Claunia.Encoding.Tests v4.5 - 1.5 + 1.6 true diff --git a/Claunia.Encoding.sln b/Claunia.Encoding.sln index b940aef..112f2b5 100644 --- a/Claunia.Encoding.sln +++ b/Claunia.Encoding.sln @@ -29,6 +29,6 @@ Global $2.TabsToSpaces = True $0.CSharpFormattingPolicy = $3 $3.scope = text/x-csharp - version = 1.5 + version = 1.6 EndGlobalSection EndGlobal diff --git a/Claunia.Encoding/Claunia.Encoding.csproj b/Claunia.Encoding/Claunia.Encoding.csproj index 86745f8..242767c 100644 --- a/Claunia.Encoding/Claunia.Encoding.csproj +++ b/Claunia.Encoding/Claunia.Encoding.csproj @@ -13,7 +13,7 @@ Profile136 true Claunia.Encoding - 1.5 + 1.6 Natalia Portillo true Natalia Portillo @@ -22,8 +22,8 @@ Claunia.Encoding Library to provide codepage conversion to and from archaic and old computer systems and Unicode. https://raw.githubusercontent.com/claunia/Claunia.Encoding/master/LICENSE.MIT - 1.5 - Added GEM character set. + 1.6 + Added GEOS character set. true @@ -50,6 +50,7 @@ + diff --git a/Claunia.Encoding/Encoding.cs b/Claunia.Encoding/Encoding.cs index ae3945c..62dcc50 100644 --- a/Claunia.Encoding/Encoding.cs +++ b/Claunia.Encoding/Encoding.cs @@ -60,6 +60,10 @@ namespace Claunia.Encoding /// Static instance for the GEM encoding /// public static System.Text.Encoding GemEncoding = new Gem(); + /// + /// Static instance for the GEM encoding + /// + public static System.Text.Encoding GeosEncoding = new Geos(); /// /// Gets a value indicating whether the current encoding can be used by browser clients for displaying content. diff --git a/Claunia.Encoding/Geos.cs b/Claunia.Encoding/Geos.cs new file mode 100644 index 0000000..eb86088 --- /dev/null +++ b/Claunia.Encoding/Geos.cs @@ -0,0 +1,742 @@ +// +// Geos.cs +// +// Author: +// Natalia Portillo +// +// Copyright © 2016-2018 Natalia Portillo +// +// Permission is hereby granted, free of charge, to any person obtaining a copy +// of this software and associated documentation files (the "Software"), to deal +// in the Software without restriction, including without limitation the rights +// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +// copies of the Software, and to permit persons to whom the Software is +// furnished to do so, subject to the following conditions: +// +// The above copyright notice and this permission notice shall be included in +// all copies or substantial portions of the Software. +// +// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN +// THE SOFTWARE. + +using System; + +namespace Claunia.Encoding +{ + /// + /// Represents an GEOS character encoding of Unicode characters. + /// + public class Geos : Encoding + { + const string _bodyname = "geos"; + const int _codepage = 0; + const string _encodingname = "Western European (GEOS)"; + const string _headername = "geos"; + const string _webname = ""; + const int _windowsCodepage = 0; + + const bool browserDisplay = false; + const bool browserSave = false; + const bool mailNewsDisplay = false; + const bool mailNewsSave = false; + const bool readOnly = false; + const bool singleByte = true; + + /// + /// The GEOS to Unicode character map. + /// In the GEOS character map application lots of positions appears as '\u002E' ('.' period) in normal (non-symbol) + /// fonts. + /// + static readonly char[] GeosTable = + { + // 0x00 + '\u0000', '\u0001', '\u0002', '\u0003', '\u0004', '\u0005', '\u0006', '\u0007', + // 0x08 + '\u0008', '\u0009', '\u000A', '\u000B', '\u000C', '\u000D', '\u000E', '\u000F', + // 0x10 + '\u0010', '\u0011', '\u0012', '\u0013', '\u0014', '\u0015', '\u0016', '\u0017', + // 0x18 + '\u0018', '\u0019', '\u001A', '\u001B', '\u001C', '\u001D', '\u001E', '\u001F', + // 0x20 + '\u0020', '\u0021', '\u0022', '\u0023', '\u0024', '\u0025', '\u0026', '\u0027', + // 0x28 + '\u0028', '\u0029', '\u002A', '\u002B', '\u002C', '\u002D', '\u002E', '\u002F', + // 0x30 + '\u0030', '\u0031', '\u0032', '\u0033', '\u0034', '\u0035', '\u0036', '\u0037', + // 0x38 + '\u0038', '\u0039', '\u003A', '\u003B', '\u003C', '\u003D', '\u003E', '\u003F', + // 0x40 + '\u0040', '\u0041', '\u0042', '\u0043', '\u0044', '\u0045', '\u0046', '\u0047', + // 0x48 + '\u0048', '\u0049', '\u004A', '\u004B', '\u004C', '\u004D', '\u004E', '\u004F', + // 0x50 + '\u0050', '\u0051', '\u0052', '\u0053', '\u0054', '\u0055', '\u0056', '\u0057', + // 0x58 + '\u0058', '\u0059', '\u005A', '\u005B', '\u005C', '\u005D', '\u005E', '\u005F', + // 0x60 + '\u0060', '\u0061', '\u0062', '\u0063', '\u0064', '\u0065', '\u0066', '\u0067', + // 0x68 + '\u0068', '\u0069', '\u006A', '\u006B', '\u006C', '\u006D', '\u006E', '\u006F', + // 0x70 + '\u0070', '\u0071', '\u0072', '\u0073', '\u0074', '\u0075', '\u0076', '\u0077', + // 0x78 + '\u0078', '\u0079', '\u007A', '\u007B', '\u007C', '\u007D', '\u007E', '\u007F', + // 0x80 + '\u00C4', '\u00C5', '\u00C7', '\u00C9', '\u00D1', '\u00D6', '\u00DC', '\u00E1', + // 0x88 + '\u00E0', '\u00E2', '\u00E4', '\u00E3', '\u00E5', '\u00E7', '\u00E9', '\u00E8', + // 0x90 + '\u00EA', '\u00EB', '\u00ED', '\u00EC', '\u00EE', '\u00EF', '\u00F1', '\u00F3', + // 0x98 + '\u00F2', '\u00F4', '\u00F5', '\u00FA', '\u00F9', '\u00FB', '\u00FC', '\u2020', + // 0xA0 + '\u00B0', '\u00A2', '\u00A3', '\u00A7', '\u00B7', '\u00B6', '\u00DF', '\u00AE', + // 0xA8 + '\u00A9', '\u2122', '\u0022', '\u0027', '\u002E', '\u00C6', '\u00D8', '\u221E', + // 0xB0 + '\u00B1', '\u2264', '\u2265', '\u00A5', '\u00B5', '\u002E', '\u002E', '\u002E', + // 0xB8 + '\u03C0', '\u002E', '\u00AA', '\u00BA', '\u03A9', '\u00E6', '\u00F8', '\u00BF', + // 0xC0 + '\u00A1', '\u00AC', '\u221A', '\u0192', '\u2248', '\u002E', '\u00AB', '\u00BB', + // 0xC8 + '\u2026', '\u00A0', '\u00C0', '\u00C3', '\u00D5', '\u0152', '\u0153', '\u2013', + // 0xD0 + '\u2014', '\u201C', '\u201D', '\u2018', '\u2019', '\u00F7', '\u002E', '\u00FF', + // 0xD8 + '\u0178', '\u002E', '\u00A4', '\u2039', '\u203A', '\u00FD', '\u00DD', '\u2021', + // 0xE0 + '\u002E', '\u201A', '\u201E', '\u2030', '\u00C2', '\u00CA', '\u00C1', '\u00CB', + // 0xE8 + '\u00C8', '\u00CD', '\u00CE', '\u00CF', '\u00CC', '\u00D3', '\u00D4', '\u002E', + // 0xF0 + '\u00D2', '\u00DA', '\u00D9', '\u00B9', '\u20C6', '\u20DC', '\u00AF', '\u02C7', + // 0xF8 + '\u00B7', '\u00B0', '\u00B8', '\u2032', '\u02DB', '\u02D8', '\u00A0', '\u002E' + }; + + /// + /// Gets a value indicating whether the current encoding can be used by browser clients for displaying content. + /// + public override bool IsBrowserDisplay => browserDisplay; + + /// + /// Gets a value indicating whether the current encoding can be used by browser clients for saving content. + /// + public override bool IsBrowserSave => browserSave; + + /// + /// Gets a value indicating whether the current encoding can be used by mail and news clients for displaying content. + /// + public override bool IsMailNewsDisplay => mailNewsDisplay; + + /// + /// Gets a value indicating whether the current encoding can be used by mail and news clients for saving content. + /// + public override bool IsMailNewsSave => mailNewsSave; + + /// + /// Gets a value indicating whether the current encoding is read-only. + /// + /// The is single byte. + public override bool IsReadOnly => readOnly; + + /// + /// Gets a value indicating whether the current encoding uses single-byte code points. + /// + public override bool IsSingleByte => singleByte; + + /// + /// Gets the code page identifier of the current Encoding. + /// + public override int CodePage => _codepage; + + /// + /// Gets a name for the current encoding that can be used with mail agent body tags + /// + public override string BodyName => _bodyname; + + /// + /// Gets a name for the current encoding that can be used with mail agent header tags + /// + public override string HeaderName => _headername; + + /// + /// Ggets the name registered with the Internet Assigned Numbers Authority (IANA) for the current encoding. + /// + public override string WebName => _webname; + + /// + /// Gets the human-readable description of the current encoding. + /// + public override string EncodingName => _encodingname; + + /// + /// Gets the Windows operating system code page that most closely corresponds to the current encoding. + /// + public override int WindowsCodePage => _windowsCodepage; + + /// + /// Calculates the number of bytes produced by encoding the characters in the specified . + /// + /// The number of bytes produced by encoding the specified characters. + /// The containing the set of characters to encode. + public override int GetByteCount(string s) + { + if(s == null) throw new ArgumentNullException(nameof(s)); + + return s.Length; + } + + /// + /// Calculates the number of bytes produced by encoding a set of characters from the specified character array. + /// + /// The number of bytes produced by encoding the specified characters. + /// The character array containing the set of characters to encode. + /// The index of the first character to encode. + /// The number of characters to encode. + public override int GetByteCount(char[] chars, int index, int count) + { + if(chars == null) throw new ArgumentNullException(nameof(chars)); + + if(index < 0 || index >= chars.Length) throw new ArgumentOutOfRangeException(nameof(index)); + + if(count < 0 || index + count > chars.Length) throw new ArgumentOutOfRangeException(nameof(index)); + + return count; + } + + /// + /// Calculates the number of bytes produced by encoding all the characters in the specified character array. + /// + /// The number of bytes produced by encoding all the characters in the specified character array. + /// The character array containing the characters to encode. + public override int GetByteCount(char[] chars) + { + if(chars == null) throw new ArgumentNullException(nameof(chars)); + + return chars.Length; + } + + /// + /// Encodes a set of characters from the specified into the specified byte array. + /// + /// The actual number of bytes written into bytes. + /// The containing the set of characters to encode. + /// The index of the first character to encode. + /// The number of characters to encode. + /// The byte array to contain the resulting sequence of bytes. + /// The index at which to start writing the resulting sequence of bytes. + public override int GetBytes(string s, int charIndex, int charCount, byte[] bytes, int byteIndex) + { + return GetBytes(s.ToCharArray(), charIndex, charCount, bytes, byteIndex); + } + + /// + /// Encodes all the characters in the specified string into a sequence of bytes. + /// + /// A byte array containing the results of encoding the specified set of characters. + /// The string containing the characters to encode. + public override byte[] GetBytes(string s) + { + if(s == null) throw new ArgumentNullException(nameof(s)); + + return GetBytes(s.ToCharArray(), 0, s.Length); + } + + /// + /// Encodes a set of characters from the specified character array into the specified byte array. + /// + /// The actual number of bytes written into bytes. + /// The character array containing the set of characters to encode. + /// The index of the first character to encode. + /// The number of characters to encode. + /// The byte array to contain the resulting sequence of bytes. + /// The index at which to start writing the resulting sequence of bytes. + public override int GetBytes(char[] chars, int charIndex, int charCount, byte[] bytes, int byteIndex) + { + if(chars == null) throw new ArgumentNullException(nameof(chars)); + + if(bytes == null) throw new ArgumentNullException(nameof(bytes)); + + if(charIndex < 0) throw new ArgumentOutOfRangeException(nameof(charIndex)); + + if(charCount < 0) throw new ArgumentOutOfRangeException(nameof(charCount)); + + if(byteIndex < 0) throw new ArgumentOutOfRangeException(nameof(byteIndex)); + + if(charIndex >= chars.Length) throw new ArgumentOutOfRangeException(nameof(charIndex)); + + if(charCount + charIndex > chars.Length) throw new ArgumentOutOfRangeException(nameof(charCount)); + + if(byteIndex >= bytes.Length) throw new ArgumentOutOfRangeException(nameof(byteIndex)); + + if(byteIndex + charCount > bytes.Length) throw new ArgumentException(nameof(bytes)); + + byte[] temp = GetBytes(chars, charIndex, charCount); + + for(int i = 0; i < temp.Length; i++) bytes[i + byteIndex] = temp[i]; + + return charCount; + } + + /// + /// Encodes a set of characters from the specified character array into a sequence of bytes. + /// + /// A byte array containing the results of encoding the specified set of characters. + /// The character array containing the set of characters to encode. + /// The index of the first character to encode. + /// The number of characters to encode. + public override byte[] GetBytes(char[] chars, int index, int count) + { + if(chars == null) throw new ArgumentNullException(nameof(chars)); + + if(index < 0) throw new ArgumentOutOfRangeException(nameof(index)); + + if(count < 0) throw new ArgumentOutOfRangeException(nameof(count)); + + if(count + index > chars.Length) throw new ArgumentOutOfRangeException(nameof(count)); + + byte[] bytes = new byte[count]; + + for(int i = 0; i < count; i++) bytes[i] = GetByte(chars[index + i]); + + return bytes; + } + + /// + /// Encodes all the characters in the specified character array into a sequence of bytes. + /// + /// A byte array containing the results of encoding the specified set of characters. + /// The character array containing the characters to encode. + public override byte[] GetBytes(char[] chars) + { + return GetBytes(chars, 0, chars.Length); + } + + /// + /// Calculates the number of characters produced by decoding all the bytes in the specified byte array. + /// + /// The number of characters produced by decoding the specified sequence of bytes. + /// The byte array containing the sequence of bytes to decode. + public override int GetCharCount(byte[] bytes) + { + return GetCharCount(bytes, 0, bytes.Length); + } + + /// + /// Calculates the number of characters produced by decoding a sequence of bytes from the specified byte array. + /// + /// The number of characters produced by decoding the specified sequence of bytes. + /// The byte array containing the sequence of bytes to decode. + /// The index of the first byte to decode. + /// The number of bytes to decode. + public override int GetCharCount(byte[] bytes, int index, int count) + { + if(bytes == null) throw new ArgumentNullException(nameof(bytes)); + + if(index < 0) throw new ArgumentOutOfRangeException(nameof(index)); + + if(count < 0) throw new ArgumentOutOfRangeException(nameof(count)); + + if(count + index > bytes.Length) throw new ArgumentOutOfRangeException(nameof(count)); + + return count; + } + + /// + /// Decodes a sequence of bytes from the specified byte array into the specified character array. + /// + /// The actual number of characters written into chars. + /// The byte array containing the sequence of bytes to decode. + /// The index of the first byte to decode. + /// The number of bytes to decode. + /// The character array to contain the resulting set of characters. + /// The index at which to start writing the resulting set of characters. + public override int GetChars(byte[] bytes, int byteIndex, int byteCount, char[] chars, int charIndex) + { + if(bytes == null) throw new ArgumentNullException(nameof(bytes)); + + if(chars == null) throw new ArgumentNullException(nameof(chars)); + + if(byteIndex < 0) throw new ArgumentOutOfRangeException(nameof(byteIndex)); + + if(byteCount < 0) throw new ArgumentOutOfRangeException(nameof(byteCount)); + + if(charIndex < 0) throw new ArgumentOutOfRangeException(nameof(charIndex)); + + if(byteIndex >= bytes.Length) throw new ArgumentOutOfRangeException(nameof(byteIndex)); + + if(byteCount + byteIndex > bytes.Length) throw new ArgumentOutOfRangeException(nameof(byteCount)); + + if(charIndex >= chars.Length) throw new ArgumentOutOfRangeException(nameof(charIndex)); + + if(charIndex + byteCount > chars.Length) throw new ArgumentException(nameof(chars)); + + char[] temp = GetChars(bytes, byteIndex, byteCount); + + for(int i = 0; i < temp.Length; i++) chars[i + charIndex] = temp[i]; + + return byteCount; + } + + /// + /// Decodes all the bytes in the specified byte array into a set of characters. + /// + /// A character array containing the results of decoding the specified sequence of bytes. + /// The byte array containing the sequence of bytes to decode. + public override char[] GetChars(byte[] bytes) + { + return GetChars(bytes, 0, bytes.Length); + } + + /// + /// Decodes a sequence of bytes from the specified byte array into a set of characters. + /// + /// The chars. + /// The byte array containing the sequence of bytes to decode. + /// The index of the first byte to decode. + /// The number of bytes to decode. + public override char[] GetChars(byte[] bytes, int index, int count) + { + if(bytes == null) throw new ArgumentNullException(nameof(bytes)); + + if(index < 0) throw new ArgumentOutOfRangeException(nameof(index)); + + if(count < 0) throw new ArgumentOutOfRangeException(nameof(count)); + + if(count + index > bytes.Length) throw new ArgumentOutOfRangeException(nameof(count)); + + char[] chars = new char[count]; + + for(int i = 0; i < count; i++) chars[i] = GetChar(bytes[index + i]); + + return chars; + } + + /// + /// Calculates the maximum number of bytes produced by encoding the specified number of characters. + /// + /// The maximum number of bytes produced by encoding the specified number of characters. + /// The number of characters to encode. + public override int GetMaxByteCount(int charCount) + { + if(charCount < 0) throw new ArgumentOutOfRangeException(nameof(charCount)); + + return charCount; + } + + /// + /// Calculates the maximum number of characters produced by decoding the specified number of bytes. + /// + /// The maximum number of characters produced by decoding the specified number of bytes. + /// The number of bytes to decode. + public override int GetMaxCharCount(int byteCount) + { + if(byteCount < 0) throw new ArgumentOutOfRangeException(nameof(byteCount)); + + return byteCount; + } + + /// + /// Returns a sequence of bytes that specifies the encoding used. + /// + /// A byte array of length zero, as a preamble is not required. + public override byte[] GetPreamble() + { + return new byte[0]; + } + + /// + /// Decodes all the bytes in the specified byte array into a string. + /// + /// A string that contains the results of decoding the specified sequence of bytes. + /// The byte array containing the sequence of bytes to decode. + public string GetString(byte[] bytes) + { + return GetString(bytes, 0, bytes.Length); + } + + /// + /// Decodes a sequence of bytes from the specified byte array into a string. + /// + /// A string that contains the results of decoding the specified sequence of bytes. + /// The byte array containing the sequence of bytes to decode. + /// The index of the first byte to decode. + /// The number of bytes to decode. + public override string GetString(byte[] bytes, int index, int count) + { + return new string(GetChars(bytes, index, count)); + } + + /// + /// Converts a GEOS character to an Unicode character + /// + /// Unicode character. + /// GEOS character. + static char GetChar(byte character) + { + return GeosTable[character]; + } + + /// + /// Converts a Unicode character to an GEOS character + /// + /// GEOS character. + /// Unicode character. + static byte GetByte(char character) + { + switch(character) + { + case '\u0000': return 0x00; + case '\u0001': return 0x01; + case '\u0002': return 0x02; + case '\u0003': return 0x03; + case '\u0004': return 0x04; + case '\u0005': return 0x05; + case '\u0006': return 0x06; + case '\u0007': return 0x07; + case '\u0008': return 0x08; + case '\u0009': return 0x09; + case '\u000A': return 0x0A; + case '\u000B': return 0x0B; + case '\u000C': return 0x0C; + case '\u000D': return 0x0D; + case '\u000E': return 0x0E; + case '\u000F': return 0x0F; + case '\u0010': return 0x10; + case '\u0011': return 0x11; + case '\u0012': return 0x12; + case '\u0013': return 0x13; + case '\u0014': return 0x14; + case '\u0015': return 0x15; + case '\u0016': return 0x16; + case '\u0017': return 0x17; + case '\u0018': return 0x18; + case '\u0019': return 0x19; + case '\u001A': return 0x1A; + case '\u001B': return 0x1B; + case '\u001C': return 0x1C; + case '\u001D': return 0x1D; + case '\u001E': return 0x1E; + case '\u001F': return 0x1F; + case '\u0020': return 0x20; + case '\u0021': return 0x21; + case '\u0022': return 0x22; + case '\u0023': return 0x23; + case '\u0024': return 0x24; + case '\u0025': return 0x25; + case '\u0026': return 0x26; + case '\u0027': return 0x27; + case '\u0028': return 0x28; + case '\u0029': return 0x29; + case '\u002A': return 0x2A; + case '\u002B': return 0x2B; + case '\u002C': return 0x2C; + case '\u002D': return 0x2D; + case '\u002E': return 0x2E; + case '\u002F': return 0x2F; + case '\u0030': return 0x30; + case '\u0031': return 0x31; + case '\u0032': return 0x32; + case '\u0033': return 0x33; + case '\u0034': return 0x34; + case '\u0035': return 0x35; + case '\u0036': return 0x36; + case '\u0037': return 0x37; + case '\u0038': return 0x38; + case '\u0039': return 0x39; + case '\u003A': return 0x3A; + case '\u003B': return 0x3B; + case '\u003C': return 0x3C; + case '\u003D': return 0x3D; + case '\u003E': return 0x3E; + case '\u003F': return 0x3F; + case '\u0040': return 0x40; + case '\u0041': return 0x41; + case '\u0042': return 0x42; + case '\u0043': return 0x43; + case '\u0044': return 0x44; + case '\u0045': return 0x45; + case '\u0046': return 0x46; + case '\u0047': return 0x47; + case '\u0048': return 0x48; + case '\u0049': return 0x49; + case '\u004A': return 0x4A; + case '\u004B': return 0x4B; + case '\u004C': return 0x4C; + case '\u004D': return 0x4D; + case '\u004E': return 0x4E; + case '\u004F': return 0x4F; + case '\u0050': return 0x50; + case '\u0051': return 0x51; + case '\u0052': return 0x52; + case '\u0053': return 0x53; + case '\u0054': return 0x54; + case '\u0055': return 0x55; + case '\u0056': return 0x56; + case '\u0057': return 0x57; + case '\u0058': return 0x58; + case '\u0059': return 0x59; + case '\u005A': return 0x5A; + case '\u005B': return 0x5B; + case '\u005C': return 0x5C; + case '\u005D': return 0x5D; + case '\u005E': return 0x5E; + case '\u005F': return 0x5F; + case '\u0060': return 0x60; + case '\u0061': return 0x61; + case '\u0062': return 0x62; + case '\u0063': return 0x63; + case '\u0064': return 0x64; + case '\u0065': return 0x65; + case '\u0066': return 0x66; + case '\u0067': return 0x67; + case '\u0068': return 0x68; + case '\u0069': return 0x69; + case '\u006A': return 0x6A; + case '\u006B': return 0x6B; + case '\u006C': return 0x6C; + case '\u006D': return 0x6D; + case '\u006E': return 0x6E; + case '\u006F': return 0x6F; + case '\u0070': return 0x70; + case '\u0071': return 0x71; + case '\u0072': return 0x72; + case '\u0073': return 0x73; + case '\u0074': return 0x74; + case '\u0075': return 0x75; + case '\u0076': return 0x76; + case '\u0077': return 0x77; + case '\u0078': return 0x78; + case '\u0079': return 0x79; + case '\u007A': return 0x7A; + case '\u007B': return 0x7B; + case '\u007C': return 0x7C; + case '\u007D': return 0x7D; + case '\u007E': return 0x7E; + case '\u007F': return 0x7F; + case '\u00C4': return 0x80; + case '\u00C5': return 0x81; + case '\u00C7': return 0x82; + case '\u00C9': return 0x83; + case '\u00D1': return 0x84; + case '\u00D6': return 0x85; + case '\u00DC': return 0x86; + case '\u00E1': return 0x87; + case '\u00E0': return 0x88; + case '\u00E2': return 0x89; + case '\u00E4': return 0x8A; + case '\u00E3': return 0x8B; + case '\u00E5': return 0x8C; + case '\u00E7': return 0x8D; + case '\u00E9': return 0x8E; + case '\u00E8': return 0x8F; + case '\u00EA': return 0x90; + case '\u00EB': return 0x91; + case '\u00ED': return 0x92; + case '\u00EC': return 0x93; + case '\u00EE': return 0x94; + case '\u00EF': return 0x95; + case '\u00F1': return 0x96; + case '\u00F3': return 0x97; + case '\u00F2': return 0x98; + case '\u00F4': return 0x99; + case '\u00F5': return 0x9A; + case '\u00FA': return 0x9B; + case '\u00F9': return 0x9C; + case '\u00FB': return 0x9D; + case '\u00FC': return 0x9E; + case '\u2020': return 0x9F; + case '\u00B0': return 0xA0; + case '\u00A2': return 0xA1; + case '\u00A3': return 0xA2; + case '\u00A7': return 0xA3; + case '\u00B7': return 0xA4; + case '\u00B6': return 0xA5; + case '\u00DF': return 0xA6; + case '\u00AE': return 0xA7; + case '\u00A9': return 0xA8; + case '\u2122': return 0xA9; + case '\u00C6': return 0xAD; + case '\u00D8': return 0xAE; + case '\u221E': return 0xAF; + case '\u00B1': return 0xB0; + case '\u2264': return 0xB1; + case '\u2265': return 0xB2; + case '\u00A5': return 0xB3; + case '\u00B5': return 0xB4; + case '\u03C0': return 0xB8; + case '\u00AA': return 0xBA; + case '\u00BA': return 0xBB; + case '\u03A9': return 0xBC; + case '\u00E6': return 0xBD; + case '\u00F8': return 0xBE; + case '\u00BF': return 0xBF; + case '\u00A1': return 0xC0; + case '\u00AC': return 0xC1; + case '\u221A': return 0xC2; + case '\u0192': return 0xC3; + case '\u2248': return 0xC4; + case '\u00AB': return 0xC6; + case '\u00BB': return 0xC7; + case '\u2026': return 0xC8; + case '\u00A0': return 0xC9; + case '\u00C0': return 0xCA; + case '\u00C3': return 0xCB; + case '\u00D5': return 0xCC; + case '\u0152': return 0xCD; + case '\u0153': return 0xCE; + case '\u2013': return 0xCF; + case '\u2014': return 0xD0; + case '\u201C': return 0xD1; + case '\u201D': return 0xD2; + case '\u2018': return 0xD3; + case '\u2019': return 0xD4; + case '\u00F7': return 0xD5; + case '\u00FF': return 0xD7; + case '\u0178': return 0xD8; + case '\u05A4': return 0xDA; + case '\u2039': return 0xDB; + case '\u203A': return 0xDC; + case '\u00FD': return 0xDD; + case '\u00DD': return 0xDE; + case '\u2021': return 0xDF; + case '\u201A': return 0xE1; + case '\u201E': return 0xE2; + case '\u2030': return 0xE3; + case '\u00C2': return 0xE4; + case '\u00CA': return 0xE5; + case '\u00C1': return 0xE6; + case '\u00CB': return 0xE7; + case '\u00C8': return 0xE8; + case '\u00CD': return 0xE9; + case '\u00CE': return 0xEA; + case '\u00CF': return 0xEB; + case '\u00CC': return 0xEC; + case '\u00D3': return 0xED; + case '\u00D4': return 0xEE; + case '\u00D2': return 0xF0; + case '\u00DA': return 0xF1; + case '\u00D9': return 0xF2; + case '\u00B9': return 0xF3; + case '\u20C6': return 0xF4; + case '\u20DC': return 0xF5; + case '\u00AF': return 0xF6; + case '\u02C7': return 0xF7; + case '\u00B8': return 0xFA; + case '\u2032': return 0xFB; + case '\u02DB': return 0xFC; + case '\u02D8': return 0xFD; + default: + // Fallback to '?' + return 0x3F; + } + } + } +} \ No newline at end of file diff --git a/README.md b/README.md index 810d9d5..4f7ecb5 100644 --- a/README.md +++ b/README.md @@ -14,6 +14,7 @@ Supported encodings * Commodore PET Standard Code for Information Interchange (PETSCII) * DEC Radix-50 * GEM Character Set +* GEOS Character Set * MacArabic * MacCentralEuropean * MacCroatian