1
0
Fork 0
forked from len0rd/rockbox
foxbox/firmware/hangul.c
Solomon Peachy a2c10f6189 unicode: Support characters beyond the first unicode plane
We used 16-bit variables to store the 'character code' everywhere but
this won't let us represent anything beyond U+FFFF.

This patch changes those variables to a custom type that can be 32 or 16
bits depending on the build, and adjusts numerous internal APIs and
data structures to match.  This includes:

 * utf8decode() and friends
 * font manipulation, caching, rendering, and generation
 * on-screen keyboard
 * FAT filesystem (parsing and generating utf16 LFNs)
 * WIN32 simulator platform code

Note that this patch doesn't _enable_ >16bit unicode support; a followup
patch will turn that on for appropriate targets.

Appears to work on:

  * hosted linux, native, linux simulator in both 16/32-bit modes.

Needs testing on:

  * windows and macos simulator (16bit+32bit)

Change-Id: Iba111b27d2433019b6bff937cf1ebd2c4353a0e8
2025-09-12 09:24:30 -04:00

103 lines
2.5 KiB
C

/***************************************************************************
* __________ __ ___.
* Open \______ \ ____ ____ | | _\_ |__ _______ ___
* Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
* Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
* Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
* \/ \/ \/ \/ \/
*
*
* Copyright (C) 2006 by Frank Dischner
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
* KIND, either express or implied.
*
****************************************************************************/
#include "config.h"
#include "hangul.h"
/*
 * Lookup table for the 51 code points 0x3131..0x3163, indexed by
 * (code point - 0x3131).
 *
 * Each row is {lead, vowel, tail}: the 1-based position of that jamo when
 * it is used as a leading consonant, a vowel, or a trailing consonant.
 * A 0 entry means the jamo cannot be used in that role.
 */
const char jamo_table[51][3] = {
    /* rows usable as lead and/or tail; the vowel column is always 0 */
    [0x00] = { 1,  0,  1},  /* U+3131 */
    [0x01] = { 2,  0,  2},  /* U+3132 */
    [0x02] = { 0,  0,  3},  /* U+3133 */
    [0x03] = { 3,  0,  4},  /* U+3134 */
    [0x04] = { 0,  0,  5},  /* U+3135 */
    [0x05] = { 0,  0,  6},  /* U+3136 */
    [0x06] = { 4,  0,  7},  /* U+3137 */
    [0x07] = { 5,  0,  0},  /* U+3138 */
    [0x08] = { 6,  0,  8},  /* U+3139 */
    [0x09] = { 0,  0,  9},  /* U+313A */
    [0x0a] = { 0,  0, 10},  /* U+313B */
    [0x0b] = { 0,  0, 11},  /* U+313C */
    [0x0c] = { 0,  0, 12},  /* U+313D */
    [0x0d] = { 0,  0, 13},  /* U+313E */
    [0x0e] = { 0,  0, 14},  /* U+313F */
    [0x0f] = { 0,  0, 15},  /* U+3140 */
    [0x10] = { 7,  0, 16},  /* U+3141 */
    [0x11] = { 8,  0, 17},  /* U+3142 */
    [0x12] = { 9,  0,  0},  /* U+3143 */
    [0x13] = { 0,  0, 18},  /* U+3144 */
    [0x14] = {10,  0, 19},  /* U+3145 */
    [0x15] = {11,  0, 20},  /* U+3146 */
    [0x16] = {12,  0, 21},  /* U+3147 */
    [0x17] = {13,  0, 22},  /* U+3148 */
    [0x18] = {14,  0,  0},  /* U+3149 */
    [0x19] = {15,  0, 23},  /* U+314A */
    [0x1a] = {16,  0, 24},  /* U+314B */
    [0x1b] = {17,  0, 25},  /* U+314C */
    [0x1c] = {18,  0, 26},  /* U+314D */
    [0x1d] = {19,  0, 27},  /* U+314E */

    /* rows usable as vowel only; lead and tail columns are always 0 */
    [0x1e] = { 0,  1,  0},  /* U+314F */
    [0x1f] = { 0,  2,  0},  /* U+3150 */
    [0x20] = { 0,  3,  0},  /* U+3151 */
    [0x21] = { 0,  4,  0},  /* U+3152 */
    [0x22] = { 0,  5,  0},  /* U+3153 */
    [0x23] = { 0,  6,  0},  /* U+3154 */
    [0x24] = { 0,  7,  0},  /* U+3155 */
    [0x25] = { 0,  8,  0},  /* U+3156 */
    [0x26] = { 0,  9,  0},  /* U+3157 */
    [0x27] = { 0, 10,  0},  /* U+3158 */
    [0x28] = { 0, 11,  0},  /* U+3159 */
    [0x29] = { 0, 12,  0},  /* U+315A */
    [0x2a] = { 0, 13,  0},  /* U+315B */
    [0x2b] = { 0, 14,  0},  /* U+315C */
    [0x2c] = { 0, 15,  0},  /* U+315D */
    [0x2d] = { 0, 16,  0},  /* U+315E */
    [0x2e] = { 0, 17,  0},  /* U+315F */
    [0x2f] = { 0, 18,  0},  /* U+3160 */
    [0x30] = { 0, 19,  0},  /* U+3161 */
    [0x31] = { 0, 20,  0},  /* U+3162 */
    [0x32] = { 0, 21,  0},  /* U+3163 */
};
/*
 * Joins three jamo characters into a single hangul syllable.
 *
 * lead, vowel: code points in 0x3131..0x3163, looked up in columns 0 and 1
 *              of jamo_table respectively.
 * tail:        0 for "no tail"; otherwise a code point in the same range
 *              whose entry in column 2 of jamo_table is non-zero.
 *
 * Returns the composed code point, or 0xfffd when any argument is out of
 * range or cannot be used in the position it was passed in.
 */
ucschar_t hangul_join(ucschar_t lead, ucschar_t vowel, ucschar_t tail)
{
    enum {
        JAMO_FIRST  = 0x3131,   /* first code point covered by jamo_table */
        JAMO_LAST   = 0x3163,   /* last code point covered by jamo_table */
        HANGUL_BASE = 0xAC00,   /* 44032: code point of the first syllable */
        TAIL_SLOTS  = 28,       /* "no tail" plus 27 tail positions */
        VOWEL_SLOTS = 21,       /* 21 * 28 == 588 syllables per lead */
        BAD_CHAR    = 0xfffd    /* returned on any invalid input */
    };
    int lead_idx;
    int vowel_idx;
    int tail_idx = 0;

    if (!(lead >= JAMO_FIRST && lead <= JAMO_LAST))
        return BAD_CHAR;
    if (!(vowel >= JAMO_FIRST && vowel <= JAMO_LAST))
        return BAD_CHAR;

    /* The tail is optional, but if given it must be a valid tail jamo. */
    if (tail != 0) {
        if (!(tail >= JAMO_FIRST && tail <= JAMO_LAST))
            return BAD_CHAR;
        tail_idx = jamo_table[tail - JAMO_FIRST][2];
        if (tail_idx == 0)
            return BAD_CHAR;
    }

    /* A zero table entry means the jamo is not valid in that position. */
    lead_idx  = jamo_table[lead - JAMO_FIRST][0];
    vowel_idx = jamo_table[vowel - JAMO_FIRST][1];
    if (lead_idx == 0 || vowel_idx == 0)
        return BAD_CHAR;

    /* Table positions are 1-based, hence the "- 1" on lead and vowel. */
    return HANGUL_BASE
         + (lead_idx - 1) * (VOWEL_SLOTS * TAIL_SLOTS)
         + (vowel_idx - 1) * TAIL_SLOTS
         + tail_idx;
}