forked from len0rd/rockbox
We used 16-bit variables to store the 'character code' everywhere, but this won't let us represent anything beyond U+FFFF. This patch changes those variables to a custom type that can be 32 or 16 bits depending on the build, and adjusts numerous internal APIs and data structures to match. This includes: * utf8decode() and friends * font manipulation, caching, rendering, and generation * on-screen keyboard * FAT filesystem (parsing and generating utf16 LFNs) * WIN32 simulator platform code Note that this patch doesn't _enable_ >16bit unicode support; a followup patch will turn that on for appropriate targets. Appears to work on: * hosted linux, native, linux simulator in both 16/32-bit modes. Needs testing on: * windows and macos simulator (16bit+32bit) Change-Id: Iba111b27d2433019b6bff937cf1ebd2c4353a0e8
103 lines
2.5 KiB
C
103 lines
2.5 KiB
C
/***************************************************************************
 *             __________               __   ___.
 *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
 *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
 *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
 *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
 *                     \/            \/     \/    \/            \/
 *
 *
 * Copyright (C) 2006 by Frank Dischner
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 * KIND, either express or implied.
 *
 ****************************************************************************/
|
|
#include "config.h"
|
|
#include "hangul.h"
|
|
|
|
/*
 * Jamo lookup table: one row per code point in the range 0x3131..0x3163,
 * indexed by (code point - 0x3131).
 *
 * Each row holds three numbers for that code point:
 *   [0] lead number   (1..19), 0 if it cannot be used as a lead
 *   [1] vowel number  (1..21), 0 if it is not a vowel
 *   [2] tail number   (1..27), 0 if it cannot be used as a tail
 */
const char jamo_table[51][3] = {
    /* lead, vowel, tail */

    /* 0x3131..0x314e: rows with a lead and/or tail number */
    {  1,  0,  1 },   /* 0x3131 */
    {  2,  0,  2 },   /* 0x3132 */
    {  0,  0,  3 },   /* 0x3133 */
    {  3,  0,  4 },   /* 0x3134 */
    {  0,  0,  5 },   /* 0x3135 */
    {  0,  0,  6 },   /* 0x3136 */
    {  4,  0,  7 },   /* 0x3137 */
    {  5,  0,  0 },   /* 0x3138 */
    {  6,  0,  8 },   /* 0x3139 */
    {  0,  0,  9 },   /* 0x313a */
    {  0,  0, 10 },   /* 0x313b */
    {  0,  0, 11 },   /* 0x313c */
    {  0,  0, 12 },   /* 0x313d */
    {  0,  0, 13 },   /* 0x313e */
    {  0,  0, 14 },   /* 0x313f */
    {  0,  0, 15 },   /* 0x3140 */
    {  7,  0, 16 },   /* 0x3141 */
    {  8,  0, 17 },   /* 0x3142 */
    {  9,  0,  0 },   /* 0x3143 */
    {  0,  0, 18 },   /* 0x3144 */
    { 10,  0, 19 },   /* 0x3145 */
    { 11,  0, 20 },   /* 0x3146 */
    { 12,  0, 21 },   /* 0x3147 */
    { 13,  0, 22 },   /* 0x3148 */
    { 14,  0,  0 },   /* 0x3149 */
    { 15,  0, 23 },   /* 0x314a */
    { 16,  0, 24 },   /* 0x314b */
    { 17,  0, 25 },   /* 0x314c */
    { 18,  0, 26 },   /* 0x314d */
    { 19,  0, 27 },   /* 0x314e */

    /* 0x314f..0x3163: rows with only a vowel number */
    {  0,  1,  0 },   /* 0x314f */
    {  0,  2,  0 },   /* 0x3150 */
    {  0,  3,  0 },   /* 0x3151 */
    {  0,  4,  0 },   /* 0x3152 */
    {  0,  5,  0 },   /* 0x3153 */
    {  0,  6,  0 },   /* 0x3154 */
    {  0,  7,  0 },   /* 0x3155 */
    {  0,  8,  0 },   /* 0x3156 */
    {  0,  9,  0 },   /* 0x3157 */
    {  0, 10,  0 },   /* 0x3158 */
    {  0, 11,  0 },   /* 0x3159 */
    {  0, 12,  0 },   /* 0x315a */
    {  0, 13,  0 },   /* 0x315b */
    {  0, 14,  0 },   /* 0x315c */
    {  0, 15,  0 },   /* 0x315d */
    {  0, 16,  0 },   /* 0x315e */
    {  0, 17,  0 },   /* 0x315f */
    {  0, 18,  0 },   /* 0x3160 */
    {  0, 19,  0 },   /* 0x3161 */
    {  0, 20,  0 },   /* 0x3162 */
    {  0, 21,  0 },   /* 0x3163 */
};
|
|
|
|
/* takes three jamo chars and joins them into one hangul */
|
|
ucschar_t hangul_join(ucschar_t lead, ucschar_t vowel, ucschar_t tail)
|
|
{
|
|
ucschar_t ch = 0xfffd;
|
|
|
|
if (lead < 0x3131 || lead > 0x3163)
|
|
return ch;
|
|
lead = jamo_table[lead-0x3131][0];
|
|
|
|
if (vowel < 0x3131 || vowel > 0x3163)
|
|
return ch;
|
|
vowel = jamo_table[vowel-0x3131][1];
|
|
|
|
if (tail) {
|
|
if (tail < 0x3131 || tail > 0x3163)
|
|
return ch;
|
|
tail = jamo_table[tail-0x3131][2];
|
|
if (!tail)
|
|
return ch;
|
|
}
|
|
|
|
if (lead && vowel)
|
|
ch = tail + (vowel - 1)*28 + (lead - 1)*588 + 44032;
|
|
|
|
return ch;
|
|
}
|