forked from len0rd/rockbox
internals: Support characters beyond the first unicode plane (WIP)
We used 16-bit variables to store the 'character code' everywhere but
this won't let us represent anything beyond U+FFFF.
This patch changes those variables to a custom type that can be 32 or 16
bits depending on the build, and adjusts numerous internal APIs and
datastructures to match. This includes:
* utf8decode() and friends
* on-screen keyboard
* font manipulation, caching, rendering, and generation
* VFAT code parses and generates utf16 dirents
* WIN32 simulator reads and writes utf16 filenames
Note that this patch doesn't _enable_ >16bit unicode support; a followup
patch will turn that on for appropriate targets.
Known bugs:
* Native players in 32-bit unicode mode generate mangled filename
entries if they include UTF16 surrogate codepoints. Root cause
is unclear, and may reside in core dircache code.
Needs testing on:
* windows simulator (16bit+32bit)
Change-Id: I193a00fe2a11a4181ddc82df2d71be52bf00b6e6
This commit is contained in:
parent
94712b34d4
commit
d05c59f35b
44 changed files with 480 additions and 335 deletions
|
|
@ -18,6 +18,7 @@
|
|||
* KIND, either express or implied.
|
||||
*
|
||||
****************************************************************************/
|
||||
#include "config.h"
|
||||
#include "hangul.h"
|
||||
|
||||
const char jamo_table[51][3] = {
|
||||
|
|
@ -75,10 +76,9 @@ const char jamo_table[51][3] = {
|
|||
};
|
||||
|
||||
/* takes three jamo chars and joins them into one hangul */
|
||||
unsigned short hangul_join(unsigned short lead, unsigned short vowel,
|
||||
unsigned short tail)
|
||||
ucschar_t hangul_join(ucschar_t lead, ucschar_t vowel, ucschar_t tail)
|
||||
{
|
||||
unsigned short ch = 0xfffd;
|
||||
ucschar_t ch = 0xfffd;
|
||||
|
||||
if (lead < 0x3131 || lead > 0x3163)
|
||||
return ch;
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue