mirror of
https://github.com/claunia/Claunia.Encoding.git
synced 2025-12-16 19:24:43 +00:00
397 lines
13 KiB
C#
397 lines
13 KiB
C#
//
|
|
// Geos.cs
|
|
//
|
|
// Author:
|
|
// Natalia Portillo <claunia@claunia.com>
|
|
//
|
|
// Copyright © 2016-2021 Natalia Portillo
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
namespace Claunia.Encoding
|
|
{
|
|
/// <summary>Represents an GEOS character encoding of Unicode characters.</summary>
|
|
public class Geos : SingleByteEncoding
|
|
{
|
|
public override string BodyName => "geos";
|
|
public override int CodePage => 0;
|
|
public override string EncodingName => "Western European (GEOS)";
|
|
public override string HeaderName => "geos";
|
|
public override string WebName => "";
|
|
public override int WindowsCodePage => 0;
|
|
|
|
public override bool IsBrowserDisplay => false;
|
|
public override bool IsBrowserSave => false;
|
|
public override bool IsMailNewsDisplay => false;
|
|
public override bool IsMailNewsSave => false;
|
|
public override bool IsReadOnly => false;
|
|
public override bool IsSingleByte => true;
|
|
|
|
/// <summary>
|
|
/// The GEOS to Unicode character map. In the GEOS character map application lots of positions appears as '\u002E'
|
|
/// ('.' period) in normal (non-symbol) fonts.
|
|
/// </summary>
|
|
protected override char[] CharTable => new[]
|
|
{
|
|
// 0x00
|
|
'\u0000', '\u0001', '\u0002', '\u0003', '\u0004', '\u0005', '\u0006', '\u0007',
|
|
|
|
// 0x08
|
|
'\u0008', '\u0009', '\u000A', '\u000B', '\u000C', '\u000D', '\u000E', '\u000F',
|
|
|
|
// 0x10
|
|
'\u0010', '\u0011', '\u0012', '\u0013', '\u0014', '\u0015', '\u0016', '\u0017',
|
|
|
|
// 0x18
|
|
'\u0018', '\u0019', '\u001A', '\u001B', '\u001C', '\u001D', '\u001E', '\u001F',
|
|
|
|
// 0x20
|
|
'\u0020', '\u0021', '\u0022', '\u0023', '\u0024', '\u0025', '\u0026', '\u0027',
|
|
|
|
// 0x28
|
|
'\u0028', '\u0029', '\u002A', '\u002B', '\u002C', '\u002D', '\u002E', '\u002F',
|
|
|
|
// 0x30
|
|
'\u0030', '\u0031', '\u0032', '\u0033', '\u0034', '\u0035', '\u0036', '\u0037',
|
|
|
|
// 0x38
|
|
'\u0038', '\u0039', '\u003A', '\u003B', '\u003C', '\u003D', '\u003E', '\u003F',
|
|
|
|
// 0x40
|
|
'\u0040', '\u0041', '\u0042', '\u0043', '\u0044', '\u0045', '\u0046', '\u0047',
|
|
|
|
// 0x48
|
|
'\u0048', '\u0049', '\u004A', '\u004B', '\u004C', '\u004D', '\u004E', '\u004F',
|
|
|
|
// 0x50
|
|
'\u0050', '\u0051', '\u0052', '\u0053', '\u0054', '\u0055', '\u0056', '\u0057',
|
|
|
|
// 0x58
|
|
'\u0058', '\u0059', '\u005A', '\u005B', '\u005C', '\u005D', '\u005E', '\u005F',
|
|
|
|
// 0x60
|
|
'\u0060', '\u0061', '\u0062', '\u0063', '\u0064', '\u0065', '\u0066', '\u0067',
|
|
|
|
// 0x68
|
|
'\u0068', '\u0069', '\u006A', '\u006B', '\u006C', '\u006D', '\u006E', '\u006F',
|
|
|
|
// 0x70
|
|
'\u0070', '\u0071', '\u0072', '\u0073', '\u0074', '\u0075', '\u0076', '\u0077',
|
|
|
|
// 0x78
|
|
'\u0078', '\u0079', '\u007A', '\u007B', '\u007C', '\u007D', '\u007E', '\u007F',
|
|
|
|
// 0x80
|
|
'\u00C4', '\u00C5', '\u00C7', '\u00C9', '\u00D1', '\u00D6', '\u00DC', '\u00E1',
|
|
|
|
// 0x88
|
|
'\u00E0', '\u00E2', '\u00E4', '\u00E3', '\u00E5', '\u00E7', '\u00E9', '\u00E8',
|
|
|
|
// 0x90
|
|
'\u00EA', '\u00EB', '\u00ED', '\u00EC', '\u00EE', '\u00EF', '\u00F1', '\u00F3',
|
|
|
|
// 0x98
|
|
'\u00F2', '\u00F4', '\u00F5', '\u00FA', '\u00F9', '\u00FB', '\u00FC', '\u2020',
|
|
|
|
// 0xA0
|
|
'\u00B0', '\u00A2', '\u00A3', '\u00A7', '\u00B7', '\u00B6', '\u00DF', '\u00AE',
|
|
|
|
// 0xA8
|
|
'\u00A9', '\u2122', '\u0022', '\u0027', '\u002E', '\u00C6', '\u00D8', '\u221E',
|
|
|
|
// 0xB0
|
|
'\u00B1', '\u2264', '\u2265', '\u00A5', '\u00B5', '\u002E', '\u002E', '\u002E',
|
|
|
|
// 0xB8
|
|
'\u03C0', '\u002E', '\u00AA', '\u00BA', '\u03A9', '\u00E6', '\u00F8', '\u00BF',
|
|
|
|
// 0xC0
|
|
'\u00A1', '\u00AC', '\u221A', '\u0192', '\u2248', '\u002E', '\u00AB', '\u00BB',
|
|
|
|
// 0xC8
|
|
'\u2026', '\u00A0', '\u00C0', '\u00C3', '\u00D5', '\u0152', '\u0153', '\u2013',
|
|
|
|
// 0xD0
|
|
'\u2014', '\u201C', '\u201D', '\u2018', '\u2019', '\u00F7', '\u002E', '\u00FF',
|
|
|
|
// 0xD8
|
|
'\u0178', '\u002E', '\u00A4', '\u2039', '\u203A', '\u00FD', '\u00DD', '\u2021',
|
|
|
|
// 0xE0
|
|
'\u002E', '\u201A', '\u201E', '\u2030', '\u00C2', '\u00CA', '\u00C1', '\u00CB',
|
|
|
|
// 0xE8
|
|
'\u00C8', '\u00CD', '\u00CE', '\u00CF', '\u00CC', '\u00D3', '\u00D4', '\u002E',
|
|
|
|
// 0xF0
|
|
'\u00D2', '\u00DA', '\u00D9', '\u00B9', '\u20C6', '\u20DC', '\u00AF', '\u02C7',
|
|
|
|
// 0xF8
|
|
'\u00B7', '\u00B0', '\u00B8', '\u2032', '\u02DB', '\u02D8', '\u00A0', '\u002E'
|
|
};
|
|
|
|
/// <summary>Converts a Unicode character to an GEOS character</summary>
|
|
/// <returns>GEOS character.</returns>
|
|
/// <param name="character">Unicode character.</param>
|
|
private protected override byte GetByte(char character) => character switch
|
|
{
|
|
'\u0000' => 0x00,
|
|
'\u0001' => 0x01,
|
|
'\u0002' => 0x02,
|
|
'\u0003' => 0x03,
|
|
'\u0004' => 0x04,
|
|
'\u0005' => 0x05,
|
|
'\u0006' => 0x06,
|
|
'\u0007' => 0x07,
|
|
'\u0008' => 0x08,
|
|
'\u0009' => 0x09,
|
|
'\u000A' => 0x0A,
|
|
'\u000B' => 0x0B,
|
|
'\u000C' => 0x0C,
|
|
'\u000D' => 0x0D,
|
|
'\u000E' => 0x0E,
|
|
'\u000F' => 0x0F,
|
|
'\u0010' => 0x10,
|
|
'\u0011' => 0x11,
|
|
'\u0012' => 0x12,
|
|
'\u0013' => 0x13,
|
|
'\u0014' => 0x14,
|
|
'\u0015' => 0x15,
|
|
'\u0016' => 0x16,
|
|
'\u0017' => 0x17,
|
|
'\u0018' => 0x18,
|
|
'\u0019' => 0x19,
|
|
'\u001A' => 0x1A,
|
|
'\u001B' => 0x1B,
|
|
'\u001C' => 0x1C,
|
|
'\u001D' => 0x1D,
|
|
'\u001E' => 0x1E,
|
|
'\u001F' => 0x1F,
|
|
'\u0020' => 0x20,
|
|
'\u0021' => 0x21,
|
|
'\u0022' => 0x22,
|
|
'\u0023' => 0x23,
|
|
'\u0024' => 0x24,
|
|
'\u0025' => 0x25,
|
|
'\u0026' => 0x26,
|
|
'\u0027' => 0x27,
|
|
'\u0028' => 0x28,
|
|
'\u0029' => 0x29,
|
|
'\u002A' => 0x2A,
|
|
'\u002B' => 0x2B,
|
|
'\u002C' => 0x2C,
|
|
'\u002D' => 0x2D,
|
|
'\u002E' => 0x2E,
|
|
'\u002F' => 0x2F,
|
|
'\u0030' => 0x30,
|
|
'\u0031' => 0x31,
|
|
'\u0032' => 0x32,
|
|
'\u0033' => 0x33,
|
|
'\u0034' => 0x34,
|
|
'\u0035' => 0x35,
|
|
'\u0036' => 0x36,
|
|
'\u0037' => 0x37,
|
|
'\u0038' => 0x38,
|
|
'\u0039' => 0x39,
|
|
'\u003A' => 0x3A,
|
|
'\u003B' => 0x3B,
|
|
'\u003C' => 0x3C,
|
|
'\u003D' => 0x3D,
|
|
'\u003E' => 0x3E,
|
|
'\u003F' => 0x3F,
|
|
'\u0040' => 0x40,
|
|
'\u0041' => 0x41,
|
|
'\u0042' => 0x42,
|
|
'\u0043' => 0x43,
|
|
'\u0044' => 0x44,
|
|
'\u0045' => 0x45,
|
|
'\u0046' => 0x46,
|
|
'\u0047' => 0x47,
|
|
'\u0048' => 0x48,
|
|
'\u0049' => 0x49,
|
|
'\u004A' => 0x4A,
|
|
'\u004B' => 0x4B,
|
|
'\u004C' => 0x4C,
|
|
'\u004D' => 0x4D,
|
|
'\u004E' => 0x4E,
|
|
'\u004F' => 0x4F,
|
|
'\u0050' => 0x50,
|
|
'\u0051' => 0x51,
|
|
'\u0052' => 0x52,
|
|
'\u0053' => 0x53,
|
|
'\u0054' => 0x54,
|
|
'\u0055' => 0x55,
|
|
'\u0056' => 0x56,
|
|
'\u0057' => 0x57,
|
|
'\u0058' => 0x58,
|
|
'\u0059' => 0x59,
|
|
'\u005A' => 0x5A,
|
|
'\u005B' => 0x5B,
|
|
'\u005C' => 0x5C,
|
|
'\u005D' => 0x5D,
|
|
'\u005E' => 0x5E,
|
|
'\u005F' => 0x5F,
|
|
'\u0060' => 0x60,
|
|
'\u0061' => 0x61,
|
|
'\u0062' => 0x62,
|
|
'\u0063' => 0x63,
|
|
'\u0064' => 0x64,
|
|
'\u0065' => 0x65,
|
|
'\u0066' => 0x66,
|
|
'\u0067' => 0x67,
|
|
'\u0068' => 0x68,
|
|
'\u0069' => 0x69,
|
|
'\u006A' => 0x6A,
|
|
'\u006B' => 0x6B,
|
|
'\u006C' => 0x6C,
|
|
'\u006D' => 0x6D,
|
|
'\u006E' => 0x6E,
|
|
'\u006F' => 0x6F,
|
|
'\u0070' => 0x70,
|
|
'\u0071' => 0x71,
|
|
'\u0072' => 0x72,
|
|
'\u0073' => 0x73,
|
|
'\u0074' => 0x74,
|
|
'\u0075' => 0x75,
|
|
'\u0076' => 0x76,
|
|
'\u0077' => 0x77,
|
|
'\u0078' => 0x78,
|
|
'\u0079' => 0x79,
|
|
'\u007A' => 0x7A,
|
|
'\u007B' => 0x7B,
|
|
'\u007C' => 0x7C,
|
|
'\u007D' => 0x7D,
|
|
'\u007E' => 0x7E,
|
|
'\u007F' => 0x7F,
|
|
'\u00C4' => 0x80,
|
|
'\u00C5' => 0x81,
|
|
'\u00C7' => 0x82,
|
|
'\u00C9' => 0x83,
|
|
'\u00D1' => 0x84,
|
|
'\u00D6' => 0x85,
|
|
'\u00DC' => 0x86,
|
|
'\u00E1' => 0x87,
|
|
'\u00E0' => 0x88,
|
|
'\u00E2' => 0x89,
|
|
'\u00E4' => 0x8A,
|
|
'\u00E3' => 0x8B,
|
|
'\u00E5' => 0x8C,
|
|
'\u00E7' => 0x8D,
|
|
'\u00E9' => 0x8E,
|
|
'\u00E8' => 0x8F,
|
|
'\u00EA' => 0x90,
|
|
'\u00EB' => 0x91,
|
|
'\u00ED' => 0x92,
|
|
'\u00EC' => 0x93,
|
|
'\u00EE' => 0x94,
|
|
'\u00EF' => 0x95,
|
|
'\u00F1' => 0x96,
|
|
'\u00F3' => 0x97,
|
|
'\u00F2' => 0x98,
|
|
'\u00F4' => 0x99,
|
|
'\u00F5' => 0x9A,
|
|
'\u00FA' => 0x9B,
|
|
'\u00F9' => 0x9C,
|
|
'\u00FB' => 0x9D,
|
|
'\u00FC' => 0x9E,
|
|
'\u2020' => 0x9F,
|
|
'\u00B0' => 0xA0,
|
|
'\u00A2' => 0xA1,
|
|
'\u00A3' => 0xA2,
|
|
'\u00A7' => 0xA3,
|
|
'\u00B7' => 0xA4,
|
|
'\u00B6' => 0xA5,
|
|
'\u00DF' => 0xA6,
|
|
'\u00AE' => 0xA7,
|
|
'\u00A9' => 0xA8,
|
|
'\u2122' => 0xA9,
|
|
'\u00C6' => 0xAD,
|
|
'\u00D8' => 0xAE,
|
|
'\u221E' => 0xAF,
|
|
'\u00B1' => 0xB0,
|
|
'\u2264' => 0xB1,
|
|
'\u2265' => 0xB2,
|
|
'\u00A5' => 0xB3,
|
|
'\u00B5' => 0xB4,
|
|
'\u03C0' => 0xB8,
|
|
'\u00AA' => 0xBA,
|
|
'\u00BA' => 0xBB,
|
|
'\u03A9' => 0xBC,
|
|
'\u00E6' => 0xBD,
|
|
'\u00F8' => 0xBE,
|
|
'\u00BF' => 0xBF,
|
|
'\u00A1' => 0xC0,
|
|
'\u00AC' => 0xC1,
|
|
'\u221A' => 0xC2,
|
|
'\u0192' => 0xC3,
|
|
'\u2248' => 0xC4,
|
|
'\u00AB' => 0xC6,
|
|
'\u00BB' => 0xC7,
|
|
'\u2026' => 0xC8,
|
|
'\u00A0' => 0xC9,
|
|
'\u00C0' => 0xCA,
|
|
'\u00C3' => 0xCB,
|
|
'\u00D5' => 0xCC,
|
|
'\u0152' => 0xCD,
|
|
'\u0153' => 0xCE,
|
|
'\u2013' => 0xCF,
|
|
'\u2014' => 0xD0,
|
|
'\u201C' => 0xD1,
|
|
'\u201D' => 0xD2,
|
|
'\u2018' => 0xD3,
|
|
'\u2019' => 0xD4,
|
|
'\u00F7' => 0xD5,
|
|
'\u00FF' => 0xD7,
|
|
'\u0178' => 0xD8,
|
|
'\u05A4' => 0xDA,
|
|
'\u2039' => 0xDB,
|
|
'\u203A' => 0xDC,
|
|
'\u00FD' => 0xDD,
|
|
'\u00DD' => 0xDE,
|
|
'\u2021' => 0xDF,
|
|
'\u201A' => 0xE1,
|
|
'\u201E' => 0xE2,
|
|
'\u2030' => 0xE3,
|
|
'\u00C2' => 0xE4,
|
|
'\u00CA' => 0xE5,
|
|
'\u00C1' => 0xE6,
|
|
'\u00CB' => 0xE7,
|
|
'\u00C8' => 0xE8,
|
|
'\u00CD' => 0xE9,
|
|
'\u00CE' => 0xEA,
|
|
'\u00CF' => 0xEB,
|
|
'\u00CC' => 0xEC,
|
|
'\u00D3' => 0xED,
|
|
'\u00D4' => 0xEE,
|
|
'\u00D2' => 0xF0,
|
|
'\u00DA' => 0xF1,
|
|
'\u00D9' => 0xF2,
|
|
'\u00B9' => 0xF3,
|
|
'\u20C6' => 0xF4,
|
|
'\u20DC' => 0xF5,
|
|
'\u00AF' => 0xF6,
|
|
'\u02C7' => 0xF7,
|
|
'\u00B8' => 0xFA,
|
|
'\u2032' => 0xFB,
|
|
'\u02DB' => 0xFC,
|
|
'\u02D8' => 0xFD,
|
|
_ => 0x3F
|
|
};
|
|
}
|
|
} |