mirror of
https://github.com/tildearrow/furnace.git
synced 2024-11-05 04:15:05 +00:00
8bcab6e139
may be non-standard compliant (yet) also it crashes foobar2000 for some reason but this will be fixed
93 lines
1.9 KiB
C++
93 lines
1.9 KiB
C++
#include "utfutils.h"
|
|
|
|
int decodeUTF8(const unsigned char* data, char& len) {
|
|
int ret=0xfffd;
|
|
if (data[0]<0x80) {
|
|
ret=data[0];
|
|
len=1;
|
|
} else if (data[0]<0xc0) {
|
|
ret=0xfffd; // invalid
|
|
len=1;
|
|
} else if (data[0]<0xe0) {
|
|
if (data[1]>=0x80 && data[1]<0xc0) {
|
|
len=2;
|
|
ret=((data[0]&31)<<6)|
|
|
(data[1]&63);
|
|
} else len=1;
|
|
} else if (data[0]<0xf0) {
|
|
if (data[1]>=0x80 && data[1]<0xc0) {
|
|
if (data[2]>=0x80 && data[2]<0xc0) {
|
|
len=3;
|
|
ret=((data[0]&15)<<12)|
|
|
((data[1]&63)<<6)|
|
|
(data[2]&63);
|
|
} else len=2;
|
|
} else len=1;
|
|
} else if (data[0]<0xf5) {
|
|
if (data[1]>=0x80 && data[1]<0xc0) {
|
|
if (data[2]>=0x80 && data[2]<0xc0) {
|
|
if (data[3]>=0x80 && data[3]<0xc0) {
|
|
len=4;
|
|
ret=((data[0]&7)<<18)|
|
|
((data[1]&63)<<12)|
|
|
((data[2]&63)<<6)|
|
|
(data[3]&63);
|
|
} else len=3;
|
|
} else len=2;
|
|
} else len=1;
|
|
} else {
|
|
len=1;
|
|
return 0xfffd;
|
|
}
|
|
|
|
if ((ret>=0xd800 && ret<=0xdfff) || ret>=0x110000) return 0xfffd;
|
|
return ret;
|
|
}
|
|
|
|
size_t utf8len(const char* s) {
|
|
size_t p=0;
|
|
size_t r=0;
|
|
char cl;
|
|
while (s[p]!=0) {
|
|
r++;
|
|
decodeUTF8((const unsigned char*)&s[p],cl);
|
|
p+=cl;
|
|
}
|
|
return r;
|
|
}
|
|
|
|
char utf8csize(const unsigned char* c) {
|
|
char ret;
|
|
decodeUTF8(c,ret);
|
|
return ret;
|
|
}
|
|
|
|
WString utf8To16(const char* s) {
|
|
WString ret;
|
|
int ch, p;
|
|
char chs;
|
|
p=0;
|
|
while (s[p]!=0) {
|
|
ch=decodeUTF8((const unsigned char*)&s[p],chs);
|
|
ret+=(unsigned short)ch;
|
|
p+=chs;
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
String utf16To8(const wchar_t* s) {
|
|
String ret;
|
|
for (size_t i=0; i<wcslen(s); i++) {
|
|
if (s[i]<0x80) {
|
|
ret+=s[i];
|
|
} else if (s[i]<0x800) {
|
|
ret+=(0xc0+((s[i]>>6)&31));
|
|
ret+=(0x80+((s[i])&63));
|
|
} else {
|
|
ret+=(0xe0+((s[i]>>12)&15));
|
|
ret+=(0x80+((s[i]>>6)&63));
|
|
ret+=(0x80+((s[i])&63));
|
|
}
|
|
}
|
|
return ret;
|
|
}
|