Add CJK codecs support as discussed on python-dev. (SF #873597)

Several style fixes were suggested by Martin v. Loewis and
Marc-Andre Lemburg. Thanks!
This commit is contained in:
Hye-Shik Chang 2004-01-17 14:29:29 +00:00
parent cd1f7430cb
commit 3e2a306920
88 changed files with 43278 additions and 34 deletions

View file

@ -212,15 +212,6 @@ The others represent the BOM in UTF-8 and UTF-32 encodings.
\end{datadesc}
\begin{seealso}
\seeurl{http://sourceforge.net/projects/python-codecs/}{A
SourceForge project working on additional support for Asian
codecs for use with Python. They are in the early stages of
development at the time of this writing --- look in their
FTP area for downloadable files.}
\end{seealso}
\subsection{Codec Base Classes}
The \module{codecs} module defines a set of base classes which define the
@ -553,6 +544,10 @@ exist:
{646, us-ascii}
{English}
\lineiii{big5}
{big5_tw, csbig5}
{Traditional Chinese}
\lineiii{cp037}
{IBM037, IBM039}
{English}
@ -633,6 +628,18 @@ exist:
{}
{Greek}
\lineiii{cp932}
{932, ms932, mskanji, ms_kanji}
{Japanese}
\lineiii{cp949}
{949, ms949, uhc}
{Korean}
\lineiii{cp950}
{950, ms950}
{Traditional Chinese}
\lineiii{cp1006}
{}
{Urdu}
@ -681,6 +688,59 @@ exist:
{windows-1258}
{Vietnamese}
\lineiii{euc_jp}
{eucjp, ujis, u_jis}
{Japanese}
\lineiii{euc_jisx0213}
{jisx0213, eucjisx0213}
{Japanese}
\lineiii{euc_kr}
{euckr, korean, ksc5601, ks_c_5601, ks_c_5601_1987, ksx1001, ks_x_1001}
{Korean}
\lineiii{gb2312}
{chinese, csiso58gb231280, euc_cn, euccn, eucgb2312_cn, gb2312_1980,
gb2312_80, iso_ir_58}
{Simplified Chinese}
\lineiii{gbk}
{936, cp936, ms936}
{Unified Chinese}
\lineiii{gb18030}
{gb18030_2000}
{Unified Chinese}
\lineiii{hz}
{hzgb, hz_gb, hz_gb_2312}
{Simplified Chinese}
\lineiii{iso2022_jp}
{csiso2022jp, iso2022jp, iso_2022_jp}
{Japanese}
\lineiii{iso2022_jp_1}
{iso2022jp_1, iso_2022_jp_1}
{Japanese}
\lineiii{iso2022_jp_2}
{iso2022jp_2, iso_2022_jp_2}
{Japanese, Korean, Simplified Chinese, Western Europe, Greek}
\lineiii{iso2022_jp_3}
{iso2022jp_3, iso_2022_jp_3}
{Japanese}
\lineiii{iso2022_jp_ext}
{iso2022jp_ext, iso_2022_jp_ext}
{Japanese}
\lineiii{iso2022_kr}
{csiso2022kr, iso2022kr, iso_2022_kr}
{Korean}
\lineiii{latin_1}
{iso-8859-1, iso8859-1, 8859, cp819, latin, latin1, L1}
{West Europe}
@ -733,6 +793,10 @@ exist:
{iso-8859-15}
{Western Europe}
\lineiii{johab}
{cp1361, ms1361}
{Korean}
\lineiii{koi8_r}
{}
{Russian}
@ -765,6 +829,14 @@ exist:
{macturkish}
{Turkish}
\lineiii{shift_jis}
{csshiftjis, shiftjis, sjis, s_jis}
{Japanese}
\lineiii{shift_jisx0213}
{shiftjisx0213, sjisx0213, s_jisx0213}
{Japanese}
\lineiii{utf_16}
{U16, utf16}
{all languages}