/* Mirror of https://github.com/ddevault/scdoc */
/*
 * Declarations for UTF-8 decoding/encoding helpers operating on in-memory
 * strings and on stdio streams.
 *
 * The include guard deliberately avoids a leading underscore followed by an
 * uppercase letter: such identifiers are reserved for the implementation.
 */
#ifndef SCDOC_UNICODE_H
#define SCDOC_UNICODE_H

#include <stddef.h>
#include <stdint.h>
#include <stdio.h>

// The original UTF-8 design allowed sequences of up to 6 bytes, but Unicode
// itself never needs more than 4 (RFC 3629 limits UTF-8 to 4 bytes).
#define UTF8_MAX_SIZE 4

// NOTE(review): presumably the sentinel reported when a byte sequence is not
// valid UTF-8 -- confirm against the implementation.
#define UTF8_INVALID 0x80

/**
 * Grabs the next UTF-8 character and advances the string pointer.
 *
 * @param str  Address of the read cursor; it is moved past the character
 *             that was consumed.
 * @return     The decoded character.
 *             NOTE(review): presumably UTF8_INVALID on malformed input --
 *             confirm against the implementation.
 */
uint32_t utf8_decode(const char **str);

/**
 * Encodes a character as UTF-8 and returns the length of that character.
 *
 * @param str  Destination buffer for the encoded bytes.
 *             NOTE(review): presumably must have room for UTF8_MAX_SIZE
 *             bytes; whether a NUL terminator is written is not visible
 *             here -- confirm against the implementation.
 * @param ch   Character to encode.
 * @return     Length of the encoded character.
 */
size_t utf8_encode(char *str, uint32_t ch);

/**
 * Returns the size of the next UTF-8 character.
 *
 * @param str  String positioned at the start of the character to measure.
 * @return     Size of that character.
 *             NOTE(review): the signed return type suggests a negative value
 *             may flag an invalid lead byte -- confirm against the
 *             implementation.
 */
int utf8_size(const char *str);

/**
 * Returns the size of a UTF-8 character.
 *
 * @param ch  Character to measure.
 * @return    Size of the character once encoded as UTF-8.
 */
size_t utf8_chsize(uint32_t ch);

/**
 * Reads and returns the next character from the file.
 *
 * @param f  Stream to read from.
 * @return   The character that was read.
 *           NOTE(review): end-of-file and malformed-input results are not
 *           visible here -- confirm against the implementation.
 */
uint32_t utf8_fgetch(FILE *f);

/**
 * Writes this character to the file and returns the number of bytes written.
 *
 * @param f   Stream to write to.
 * @param ch  Character to write.
 * @return    Number of bytes written.
 */
size_t utf8_fputch(FILE *f, uint32_t ch);

#endif