mirror of
https://github.com/CloverHackyColor/CloverBootloader.git
synced 2025-01-13 19:31:28 +01:00
e37d782aad
Signed-off-by: Sergey Isakov <isakov-sl@bk.ru>
289 lines
15 KiB
C
289 lines
15 KiB
C
//
|
|
// utf8Conversion.hpp
|
|
//
|
|
// Created by jief the 24 Feb 2020.
|
|
//
|
|
|
|
#ifndef __unicode_conversions_h__
|
|
#define __unicode_conversions_h__
|
|
|
|
#include <stddef.h>
|
|
#include <wchar.h>
|
|
#include <string.h>
|
|
|
|
#ifndef __cplusplus
|
|
//typedef uint16_t wchar_t;
|
|
typedef uint32_t char32_t;
|
|
typedef uint16_t char16_t;
|
|
#endif
|
|
|
|
#ifndef __WCHAR_MAX__
|
|
#define __WCHAR_MAX__ 0xFFFFu
|
|
#endif
|
|
|
|
#if __WCHAR_MAX__ <= 0xFFFFu
|
|
#define wchar_cast char16_t
|
|
#else
|
|
#define wchar_cast char32_t
|
|
#endif
|
|
|
|
#ifndef wchar_cast
|
|
#error wchar_cast
|
|
#endif
|
|
|
|
|
|
/*
|
|
* len means nb utf32 char
|
|
* size means nb of underlying native type (nb of char16_t, nb of char32_t, etc.
|
|
*/
|
|
|
|
|
|
|
|
/****** utility *****/
|
|
|
|
|
|
/****** utf8 - utf32 *****/
|
|
|
|
/*
|
|
* Size of an UTF32 char when represented in UTF8
|
|
* Return value : size
|
|
*/
|
|
size_t utf8_size_of_utf32_char(char32_t c);
|
|
|
|
/*
|
|
* Increment size and return a pointer to the next char
|
|
* Return value : pointer to the end of string or at the error
|
|
*/
|
|
const char32_t* utf8_size_of_utf32_char_ptr(const char32_t *s, size_t* size);
|
|
|
|
/*
|
|
* Store an utf32 char in dst, if there is enough room (dst_max_len is >= size of utf32 char)
|
|
* If there is enough room, dst_max_len is decrement and dst is increment and returned
|
|
* If there isn't enough room, dst_max_len is set to 0 and dst is returned
|
|
*/
|
|
char* get_utf8_from_char32(char* dst, size_t* dst_max_len, char32_t utf32_char);
|
|
|
|
/*
|
|
* char32 will be set to 0 at the end of string or at error
|
|
* Return value : pointer to the end of string or at the error
|
|
*/
|
|
const char* get_char32_from_utf8_string(const char* s, char32_t* char32);
|
|
|
|
|
|
|
|
/*
|
|
* Size in bytes of an utf32 string if it were converted to utf8
|
|
* Return value : pointer to the end of string or at the error
|
|
*/
|
|
size_t utf8_size_of_utf32_string(const char32_t* s);
|
|
/*
|
|
* Size in bytes of an utf32 string of len char if it were converted to utf8
|
|
* Return value : pointer to the end of string or at the error
|
|
*/
|
|
size_t utf8_size_of_utf32_string_len(const char32_t* s, size_t len);
|
|
|
|
size_t utf32_size_of_utf8_string(const char* s);
|
|
size_t utf32_size_of_utf8_string_len(const char* s, size_t len);
|
|
|
|
size_t utf32_string_from_utf8_string(char32_t* dst, size_t dst_max_len, const char* s);
|
|
size_t utf8_string_from_utf32_string(char* dst, size_t dst_max_len, const char32_t *s);
|
|
|
|
|
|
/****** utf8 - utf16 *****/
|
|
|
|
/*
|
|
* Increment size
|
|
* Return value : pointer to the end of string or at the error
|
|
*/
|
|
const char16_t* utf8_size_of_utf16_char_ptr(const char16_t *s, size_t* size);
|
|
|
|
size_t utf8_size_of_utf16_string(const char16_t* s);
|
|
size_t utf8_size_of_utf16_string_len(const char16_t* s, size_t len);
|
|
|
|
size_t utf16_size_of_utf8_string(const char* s);
|
|
size_t utf16_size_of_utf8_string_len(const char* s, size_t len);
|
|
|
|
size_t utf8_string_from_utf16_string(char* dst, size_t dst_max_len, const char16_t *s);
|
|
size_t utf16_string_from_utf8_string(char16_t* dst, size_t dst_max_len, const char* s);
|
|
|
|
|
|
/****** utf16 - utf32 *****/
|
|
|
|
size_t utf16_size_of_utf32_char(char32_t c);
|
|
void get_char16_from_char32(char32_t char32, char16_t* char16_1, char16_t* char16_2);
|
|
char32_t get_char32_from_char16(char16_t char16_1, char16_t char16_2);
|
|
const char16_t* get_char32_from_utf16_string(const char16_t* s, char32_t* char32);
|
|
|
|
|
|
size_t utf16_size_of_utf32_string(const char32_t *s);
|
|
size_t utf16_size_of_utf32_string_len(const char32_t *s, size_t len);
|
|
size_t utf32_size_of_utf16_string(const char16_t *s);
|
|
size_t utf32_size_of_utf16_string_len(const char16_t *s, size_t len);
|
|
|
|
size_t utf16_string_from_utf32_string(char16_t* dst, size_t dst_max_len, const char32_t *s);
|
|
size_t utf32_string_from_utf16_string(char32_t* dst, size_t dst_max_len, const char16_t *s);
|
|
|
|
|
|
/****** utf8 - wchar_t *****/
|
|
|
|
size_t utf8_size_of_wchar_string(const wchar_t* s);
|
|
size_t utf8_size_of_wchar_string_len(const wchar_t* s, size_t len);
|
|
size_t wchar_size_of_utf8_string(const char* s);
|
|
size_t wchar_size_of_utf8_string_len(const char* s, size_t len);
|
|
|
|
size_t utf8_string_from_wchar_string(char* dst, size_t dst_max_len, const wchar_t* s);
|
|
size_t wchar_string_from_utf8_string(wchar_t* dst, size_t dst_max_len, const char* s);
|
|
|
|
|
|
/****** utf16 - wchar_t *****/
|
|
size_t utf16_size_of_wchar_string(const wchar_t* s);
|
|
size_t utf16_size_of_wchar_string_len(const wchar_t* s, size_t len);
|
|
size_t wchar_size_of_utf16_string(const char16_t *s);
|
|
size_t wchar_size_of_utf16_string_len(const char16_t *s, size_t len);
|
|
|
|
size_t utf16_string_from_wchar_string(char16_t* dst, size_t dst_max_len, const wchar_t* s);
|
|
size_t wchar_string_from_utf16_string(wchar_t* dst, size_t dst_max_len, const char16_t* s);
|
|
|
|
|
|
/****** utf32 - wchar_t *****/
|
|
size_t utf32_size_of_wchar_string(const wchar_t* s);
|
|
size_t utf32_size_of_wchar_string_len(const wchar_t* s, size_t len);
|
|
size_t wchar_size_of_utf32_string(const char32_t *s);
|
|
size_t wchar_size_of_utf32_string_len(const char32_t *s, size_t len);
|
|
|
|
size_t utf32_string_from_wchar_string(char32_t* dst, size_t dst_max_len, const wchar_t* s);
|
|
size_t wchar_string_from_utf32_string(wchar_t* dst, size_t dst_max_len, const char32_t* s);
|
|
|
|
|
|
/****** no conversion *****/
|
|
|
|
size_t utf8_size_of_utf8_string(const char* s);
|
|
size_t utf8_size_of_utf8_string_len(const char* s, size_t len);
|
|
size_t utf16_size_of_utf16_string(const char16_t* s);
|
|
size_t utf16_size_of_utf16_string_len(const char16_t* s, size_t len);
|
|
size_t utf32_size_of_utf32_string(const char32_t* s);
|
|
size_t utf32_size_of_utf32_string_len(const char32_t* s, size_t len);
|
|
size_t wchar_size_of_wchar_string(const wchar_t* s);
|
|
size_t wchar_size_of_wchar_string_len(const wchar_t* s, size_t len);
|
|
|
|
size_t utf8_string_from_utf8_string(char* dst, size_t dst_max_len, const char *s);
|
|
size_t utf16_string_from_utf16_string(char16_t* dst, size_t dst_max_len, const char16_t *s);
|
|
size_t utf32_string_from_utf32_string(char32_t* dst, size_t dst_max_len, const char32_t *s);
|
|
size_t wchar_string_from_wchar_string(wchar_t* dst, size_t dst_max_len, const wchar_t *s);
|
|
|
|
/****** convenience *****/
|
|
|
|
inline size_t length_of_utf8_string(const char* s) {return utf32_size_of_utf8_string(s); }
|
|
inline size_t length_of_utf16_string(const char16_t* s) {return utf32_size_of_utf16_string(s); }
|
|
inline size_t length_of_utf32_string(const char32_t* s) {return utf32_size_of_utf32_string(s); } // UTF32 length == size
|
|
size_t length_of_wchar_string(const wchar_t* s);
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
inline const char* get_char32_from_string(const char* s, char32_t* char32) { return get_char32_from_utf8_string(s, char32); }
|
|
inline const char16_t* get_char32_from_string(const char16_t* s, char32_t* char32) { return get_char32_from_utf16_string(s, char32); }
|
|
inline const char32_t* get_char32_from_string(const char32_t* s, char32_t* char32) { *char32 = *s; return s+1; }
|
|
inline const wchar_t* get_char32_from_string(const wchar_t* s, char32_t* char32) { return (wchar_t*)get_char32_from_string((wchar_cast*)s, char32); }
|
|
|
|
|
|
inline size_t length_of_utf_string(const char* s) { return utf32_size_of_utf8_string(s); };
|
|
inline size_t length_of_utf_string(const char16_t* s) { return utf32_size_of_utf16_string(s); };
|
|
inline size_t length_of_utf_string(const char32_t* s) { return utf32_size_of_utf32_string(s); };
|
|
inline size_t length_of_utf_string(const wchar_t* s) { return length_of_utf_string((wchar_cast*)s); };
|
|
|
|
|
|
|
|
inline size_t size_of_utf_string(const char* s) { return utf8_size_of_utf8_string(s); }
|
|
inline size_t size_of_utf_string(const char16_t* s) { return utf16_size_of_utf16_string(s); }
|
|
inline size_t size_of_utf_string(const char32_t* s) { return utf32_size_of_utf32_string(s); } // for UTF32 size and length are equal
|
|
inline size_t size_of_utf_string(const wchar_t* s) { return size_of_utf_string((wchar_cast*)s); }
|
|
|
|
inline size_t utf_size_of_utf_string(const char*, const char* s) { return utf8_size_of_utf8_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char16_t*, const char* s) { return utf16_size_of_utf8_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char32_t*, const char* s) { return utf32_size_of_utf8_string(s); }
|
|
inline size_t utf_size_of_utf_string(const wchar_t* t, const char* s) { return utf_size_of_utf_string((wchar_cast*)t, s); }
|
|
|
|
inline size_t utf_size_of_utf_string(const char*, const char16_t* s) { return utf8_size_of_utf16_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char16_t*, const char16_t* s) { return utf16_size_of_utf16_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char32_t*, const char16_t* s) { return utf32_size_of_utf16_string(s); }
|
|
inline size_t utf_size_of_utf_string(const wchar_t* t, const char16_t* s) { return utf_size_of_utf_string((wchar_cast*)t, s); }
|
|
|
|
inline size_t utf_size_of_utf_string(const char*, const char32_t* s) { return utf8_size_of_utf32_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char16_t*, const char32_t* s) { return utf16_size_of_utf32_string(s); }
|
|
inline size_t utf_size_of_utf_string(const char32_t*, const char32_t* s) { return utf32_size_of_utf32_string(s); }
|
|
inline size_t utf_size_of_utf_string(const wchar_t* t, const char32_t* s) { return utf_size_of_utf_string((wchar_cast*)t, s); }
|
|
|
|
inline size_t utf_size_of_utf_string(const char* t, const wchar_t* s) { return utf_size_of_utf_string(t, (wchar_cast*)s); }
|
|
inline size_t utf_size_of_utf_string(const char16_t* t, const wchar_t* s) { return utf_size_of_utf_string(t, (wchar_cast*)s); }
|
|
inline size_t utf_size_of_utf_string(const char32_t* t, const wchar_t* s) { return utf_size_of_utf_string(t, (wchar_cast*)s); }
|
|
inline size_t utf_size_of_utf_string(const wchar_t* t, const wchar_t* s) { return utf_size_of_utf_string(t, (wchar_cast*)s); }
|
|
|
|
|
|
inline size_t size_of_utf_string_len(const char* s, size_t len) { return utf8_size_of_utf8_string_len(s, len); }
|
|
inline size_t size_of_utf_string_len(const char16_t* s, size_t len) { return utf16_size_of_utf16_string_len(s, len); }
|
|
inline size_t size_of_utf_string_len(const char32_t* s, size_t len) { return utf32_size_of_utf32_string_len(s, len); } // for UTF32 size and length are equal
|
|
inline size_t size_of_utf_string_len(const wchar_t* s, size_t len) { return size_of_utf_string_len((wchar_cast*)s, len); }
|
|
|
|
inline size_t utf_size_of_utf_string_len(const char*, const char* s, size_t len) { return utf8_size_of_utf8_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char16_t*, const char* s, size_t len) { return utf16_size_of_utf8_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char32_t*, const char* s, size_t len) { return utf32_size_of_utf8_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const wchar_t* t, const char* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, s, len); }
|
|
|
|
inline size_t utf_size_of_utf_string_len(const char*, const char16_t* s, size_t len) { return utf8_size_of_utf16_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char16_t*, const char16_t* s, size_t len) { return utf16_size_of_utf16_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char32_t*, const char16_t* s, size_t len) { return utf32_size_of_utf16_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const wchar_t* t, const char16_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, s, len); }
|
|
|
|
inline size_t utf_size_of_utf_string_len(const char*, const char32_t* s, size_t len) { return utf8_size_of_utf32_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char16_t*, const char32_t* s, size_t len) { return utf16_size_of_utf32_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char32_t*, const char32_t* s, size_t len) { return utf32_size_of_utf32_string_len(s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const wchar_t* t, const char32_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, s, len); }
|
|
|
|
inline size_t utf_size_of_utf_string_len(const char* t, const wchar_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, (wchar_cast*)s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char16_t* t, const wchar_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, (wchar_cast*)s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const char32_t* t, const wchar_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, (wchar_cast*)s, len); }
|
|
inline size_t utf_size_of_utf_string_len(const wchar_t* t, const wchar_t* s, size_t len) { return utf_size_of_utf_string_len((wchar_cast*)t, (wchar_cast*)s, len); }
|
|
|
|
|
|
|
|
|
|
|
|
inline size_t utf_string_from_utf_string(char* dst, size_t dst_max_len, const char* s) { return utf8_string_from_utf8_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char16_t* dst, size_t dst_max_len, const char* s) { return utf16_string_from_utf8_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char32_t* dst, size_t dst_max_len, const char* s) { return utf32_string_from_utf8_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(wchar_t* dst, size_t dst_max_len, const char* s) { return utf_string_from_utf_string((wchar_cast*)dst, dst_max_len, s); }
|
|
|
|
inline size_t utf_string_from_utf_string(char* dst, size_t dst_max_len, const char16_t *s) { return utf8_string_from_utf16_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char16_t* dst, size_t dst_max_len, const char16_t *s) { return utf16_string_from_utf16_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char32_t* dst, size_t dst_max_len, const char16_t *s) { return utf32_string_from_utf16_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(wchar_t* dst, size_t dst_max_len, const char16_t *s) { return utf_string_from_utf_string((wchar_cast*)dst, dst_max_len, s); }
|
|
|
|
inline size_t utf_string_from_utf_string(char* dst, size_t dst_max_len, const char32_t *s) { return utf8_string_from_utf32_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char16_t* dst, size_t dst_max_len, const char32_t *s) { return utf16_string_from_utf32_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(char32_t* dst, size_t dst_max_len, const char32_t *s) { return utf32_string_from_utf32_string(dst, dst_max_len, s); }
|
|
inline size_t utf_string_from_utf_string(wchar_t* dst, size_t dst_max_len, const char32_t *s) { return utf_string_from_utf_string((wchar_cast*)dst, dst_max_len, s); }
|
|
|
|
inline size_t utf_string_from_utf_string(char* dst, size_t dst_max_len, const wchar_t *s) { return utf_string_from_utf_string(dst, dst_max_len, (wchar_cast*)s); }
|
|
inline size_t utf_string_from_utf_string(char16_t* dst, size_t dst_max_len, const wchar_t *s) { return utf_string_from_utf_string(dst, dst_max_len, (wchar_cast*)s); }
|
|
inline size_t utf_string_from_utf_string(char32_t* dst, size_t dst_max_len, const wchar_t *s) { return utf_string_from_utf_string(dst, dst_max_len, (wchar_cast*)s); }
|
|
inline size_t utf_string_from_utf_string(wchar_t* dst, size_t dst_max_len, const wchar_t *s) { return utf_string_from_utf_string(dst, dst_max_len, (wchar_cast*)s); }
|
|
|
|
#endif // __cplusplus
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#undef wchar_cast
|
|
|
|
#endif /* utf816Conversion_hpp */
|