From e03c7787b98f406d65714b0e7c9509131ac5828a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Martin=20v=2E=20L=C3=B6wis?= Date: Mon, 22 Nov 2010 10:53:46 +0000 Subject: [PATCH] Issue #10459: Update CJK character names to Unicode 5.2. --- Misc/NEWS | 2 ++ Modules/unicodedata.c | 5 +++-- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS index cb9e4897163..9edc91d925f 100644 --- a/Misc/NEWS +++ b/Misc/NEWS @@ -13,6 +13,8 @@ Core and Builtins Library ------- +- Issue #10459: Update CJK character names to Unicode 5.2. + - Issue #4493: urllib2 adds '/' in front of path components which does not start with '/. Common behavior exhibited by browsers and other clients. diff --git a/Modules/unicodedata.c b/Modules/unicodedata.c index 77f36377c78..b4af29071af 100644 --- a/Modules/unicodedata.c +++ b/Modules/unicodedata.c @@ -869,8 +869,9 @@ is_unified_ideograph(Py_UCS4 code) { return ( (0x3400 <= code && code <= 0x4DB5) || /* CJK Ideograph Extension A */ - (0x4E00 <= code && code <= 0x9FBB) || /* CJK Ideograph */ - (0x20000 <= code && code <= 0x2A6D6));/* CJK Ideograph Extension B */ + (0x4E00 <= code && code <= 0x9FCB) || /* CJK Ideograph, Unicode 5.2 */ + (0x20000 <= code && code <= 0x2A6D6) || /* CJK Ideograph Extension B */ + (0x2A700 <= code && code <= 0x2B734)); /* CJK Ideograph Extension C */ } static int