[KoCo-CVS] [Commit] cjkcodecs/tools genmap_tchinese.py
Brought to you by:
perky
From: Hye-Shik C. <pe...@us...> - 2003-06-19 17:49:07
|
perky       03/06/19 10:49:01

Modified:    tools    genmap_tchinese.py
Log:
Fix some big5 mappings to give more roundtrip compatibility.

Revision  Changes    Path
1.4       +18 -1     cjkcodecs/tools/genmap_tchinese.py

Index: genmap_tchinese.py
===================================================================
RCS file: /cvsroot/koco/cjkcodecs/tools/genmap_tchinese.py,v
retrieving revision 1.3
retrieving revision 1.4
diff -u -r1.3 -r1.4
--- genmap_tchinese.py  10 Jun 2003 11:12:12 -0000  1.3
+++ genmap_tchinese.py  19 Jun 2003 17:49:01 -0000  1.4
@@ -26,7 +26,7 @@
 # IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 # POSSIBILITY OF SUCH DAMAGE.
 #
-# $Id: genmap_tchinese.py,v 1.3 2003/06/10 11:12:12 perky Exp $
+# $Id: genmap_tchinese.py,v 1.4 2003/06/19 17:49:01 perky Exp $
 #
 
 from genmap_support import *
@@ -54,6 +54,19 @@
 print "Loading Mapping File..."
 cp950decmap = loadmap(cp950map)
 big5decmap = loadmap(big5map)
+
+# big5 mapping fix (see doc/NOTES.big5)
+for m in """\
+0xA15A 0x2574
+0xA1C3 0xFFE3
+0xA1C5 0x02CD
+0xA1FE 0xFF0F
+0xA240 0xFF3C
+0xA2CC 0x5341
+0xA2CE 0x5345""".splitlines():
+    bcode, ucode = map(eval, m.split())
+    big5decmap[bcode >> 8][bcode & 0xff] = ucode
+
 big5encmap, cp950encmap = {}, {}
 for c1, m in cp950decmap.items():
     for c2, code in m.items():
@@ -73,6 +86,10 @@
             del cp950encmap[code >> 8][code & 0xff]
             if not cp950encmap[code >> 8]:
                 del cp950encmap[code >>8]
+
+# fix unicode->big5 duplicated mapping priority
+big5encmap[0x53][0x41] = 0xA451
+big5encmap[0x53][0x45] = 0xA4CA
 
 omap = open('map_big5.h', 'w')
 printcopyright(omap)
|