-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathcode_pages_id.go
129 lines (113 loc) · 3.68 KB
/
code_pages_id.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
package cpd
const (
// ASCII is the uint16 identifier with IANA name US-ASCII (MIME: US-ASCII).
// ANSI X3.4-1986
// Reference: RFC2046
ASCII IDCodePage = 3
// ISOLatinCyrillic is the MIB identifier with IANA name ISO_8859-5:1988 (MIME: ISO-8859-5).
//
// ISO-IR: International Register of Escape Sequences
// Note: The current registration authority is IPSJ/ITSCJ, Japan.
// Reference: RFC1345
ISOLatinCyrillic IDCodePage = 8
// UTF8 is the uint16 identifier with IANA name UTF-8.
//
// rfc3629
// Reference: RFC3629
UTF8 IDCodePage = 106
// Unicode is the uint16 identifier with IANA name ISO-10646-UCS-2.
//
// the 2-octet Basic Multilingual Plane, aka Unicode
// this needs to specify network byte order: the standard
// does not specify (it is a 16-bit integer space)
Unicode IDCodePage = 1000
// UnicodeASCII is the uint16 identifier with IANA name ISO-10646-UCS-Basic.
//
// ASCII subset of Unicode. Basic Latin = collection 1
// See ISO 10646, Appendix A
UnicodeASCII IDCodePage = 1002
// UTF7 is the uint16 identifier with IANA name UTF-7.
//
// rfc2152
// Reference: RFC2152
UTF7 IDCodePage = 1012
// UTF16BE is the uint16 identifier with IANA name UTF-16BE.
//
// rfc2781
// Reference: RFC2781
UTF16BE IDCodePage = 1013
// UTF16LE is the uint16 identifier with IANA name UTF-16LE.
//
// rfc2781
// Reference: RFC2781
UTF16LE IDCodePage = 1014
// UTF32 is the uint16 identifier with IANA name UTF-32.
//
// https://www.unicode.org/unicode/reports/tr19/
UTF32 IDCodePage = 1017
// UTF32BE is the uint16 identifier with IANA name UTF-32BE.
//
// https://www.unicode.org/unicode/reports/tr19/
UTF32BE IDCodePage = 1018
// UTF32LE is the uint16 identifier with IANA name UTF-32LE.
//
// https://www.unicode.org/unicode/reports/tr19/
UTF32LE IDCodePage = 1019
// KOI8R is the uint16 identifier with IANA name KOI8-R (MIME: KOI8-R).
//
// rfc1489 , based on GOST-19768-74, ISO-6937/8,
// INIS-Cyrillic, ISO-5427.
// Reference: RFC1489
KOI8R IDCodePage = 2084
// CP866 is the uint16 identifier with IANA name IBM866.
//
// IBM NLDG Volume 2 (SE09-8002-03) August 1994
CP866 IDCodePage = 2086
// CP1251 is the uint16 identifier with IANA name windows-1251.
//
// Microsoft http://www.iana.org/assignments/charset-reg/windows-1251
CP1251 IDCodePage = 2251
// Windows1252 is the uint16 identifier with IANA name windows-1252.
//
// Microsoft http://www.iana.org/assignments/charset-reg/windows-1252
Windows1252 IDCodePage = 2252
)
var nameMap = map[string]IDCodePage{
"unicode-1-1-utf-8": UTF8,
"utf-8": UTF8,
"utf8": UTF8,
"866": CP866,
"cp-866": CP866,
"cp866": CP866,
"csibm866": CP866,
"ibm866": CP866,
"csisolatincyrillic": ISOLatinCyrillic,
"cyrillic": ISOLatinCyrillic,
"iso-8859-5": ISOLatinCyrillic,
"iso-ir-144": ISOLatinCyrillic,
"iso8859-5": ISOLatinCyrillic,
"iso88595": ISOLatinCyrillic,
"iso_8859-5": ISOLatinCyrillic,
"iso_8859-5:1988": ISOLatinCyrillic,
"cskoi8r": KOI8R,
"koi": KOI8R,
"koi8": KOI8R,
"koi-8": KOI8R,
"koi8-r": KOI8R,
"koi8_r": KOI8R,
"koi8-ru": KOI8R,
"koi8-u": KOI8R,
"cp1251": CP1251,
"cp-1251": CP1251,
"win1251": CP1251,
"win-1251": CP1251,
"windows-1251": CP1251,
"windows1251": CP1251,
"x-cp1251": CP1251,
"utf-16be": UTF16BE,
"utf16be": UTF16BE,
"utf-16": UTF16LE,
"utf16": UTF16LE,
"utf-16le": UTF16LE,
"utf16le": UTF16LE,
}