JSON
Character Encoding Standards - JSON
Character encoding standards are specifications for representing characters as digital data in computers. Various schemes exist including ASCII, UTF-8, UTF-16, Shift_JIS, and EUC-JP, each with different character sets, byte structures, and compatibility characteristics. While UTF-8 has become the international standard widely adopted today, legacy encodings like Shift_JIS and EUC-JP are still used in Japanese computing environments.
character encoding
Unicode
UTF-8
ASCII
Shift_JIS
EUC-JP
charset
internationalization
[
{
"code": "ASCII",
"slug": "ascii",
"name": "ASCII",
"description": "American Standard Code for Information Interchange. Represents alphanumeric characters and symbols in 7 bits.",
"yearIntroduced": 1963,
"byteStructure": "固定長(1バイト、7ビット使用)",
"maxCharacters": 128,
"asciiCompatible": true,
"japaneseSupport": false,
"usage": "legacy"
},
{
"code": "UTF-8",
"slug": "utf-8",
"name": "UTF-8",
"description": "Variable-length Unicode encoding. ASCII-compatible and represents characters worldwide.",
"yearIntroduced": 1993,
"byteStructure": "可変長(1〜4バイト)",
"maxCharacters": 1114112,
"asciiCompatible": true,
"japaneseSupport": true,
"usage": "standard"
},
{
"code": "UTF-16",
"slug": "utf-16",
"name": "UTF-16",
"description": "16-bit Unicode encoding. Widely used in Windows and Java.",
"yearIntroduced": 1996,
"byteStructure": "可変長(2または4バイト)",
"maxCharacters": 1114112,
"asciiCompatible": false,
"japaneseSupport": true,
"usage": "system"
},
{
"code": "UTF-32",
"slug": "utf-32",
"name": "UTF-32",
"description": "Fixed-length 32-bit Unicode encoding. Used for internal processing.",
"yearIntroduced": 1996,
"byteStructure": "固定長(4バイト)",
"maxCharacters": 1114112,
"asciiCompatible": false,
"japaneseSupport": true,
"usage": "internal"
},
{
"code": "Shift_JIS",
"slug": "shift-jis",
"name": "Shift_JIS",
"description": "Legacy Japanese encoding. Widely used in Windows systems.",
"yearIntroduced": 1978,
"byteStructure": "可変長(1〜2バイト)",
"maxCharacters": 10000,
"asciiCompatible": false,
"japaneseSupport": true,
"usage": "legacy"
},
{
"code": "EUC-JP",
"slug": "euc-jp",
"name": "EUC-JP",
"description": "Japanese encoding used in Unix/Linux. ASCII-compatible.",
"yearIntroduced": 1988,
"byteStructure": "可変長(1〜3バイト)",
"maxCharacters": 11000,
"asciiCompatible": true,
"japaneseSupport": true,
"usage": "legacy"
},
{
"code": "ISO-2022-JP",
"slug": "iso-2022-jp",
"name": "ISO-2022-JP",
"description": "7-bit escape sequence Japanese encoding. Used in email.",
"yearIntroduced": 1983,
"byteStructure": "7ビット可変長(エスケープシーケンス使用)",
"maxCharacters": 10000,
"asciiCompatible": true,
"japaneseSupport": true,
"usage": "legacy"
},
{
"code": "GB2312",
"slug": "gb2312",
"name": "GB2312",
"description": "National standard encoding for Simplified Chinese.",
"yearIntroduced": 1980,
"byteStructure": "可変長(1〜2バイト)",
"maxCharacters": 7445,
"asciiCompatible": false,
"japaneseSupport": false,
"usage": "legacy"
},
{
"code": "Big5",
"slug": "big5",
"name": "Big5",
"description": "Traditional Chinese encoding used in Taiwan and Hong Kong.",
"yearIntroduced": 1984,
"byteStructure": "可変長(1〜2バイト)",
"maxCharacters": 13000,
"asciiCompatible": false,
"japaneseSupport": false,
"usage": "legacy"
},
{
"code": "Windows-1252",
"slug": "windows-1252",
"name": "Windows-1252",
"description": "Western European encoding used in Windows.",
"yearIntroduced": 1992,
"byteStructure": "固定長(1バイト)",
"maxCharacters": 256,
"asciiCompatible": true,
"japaneseSupport": false,
"usage": "legacy"
}
]