1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94
|
#include <utf8proc.h>
#include <string.h>
int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size)
{
if(size < 1) return 0;
/* Avoid timeout with long inputs */
if(size > (64 * 1024)) return 0;
if(data[size-1] != '\0') return 0;
const uint8_t* ptr = data;
utf8proc_int32_t c = 0, c_prev = 0, state = 0;
utf8proc_option_t options;
utf8proc_ssize_t ret, bytes = 0;
utf8proc_uint8_t *str = NULL;
size_t len = strlen((const char*)data);
while(bytes != len)
{
ret = utf8proc_iterate(ptr, -1, &c);
if(ret < 0 || ret == 0) break;
bytes += ret;
ptr += ret;
utf8proc_tolower(c);
utf8proc_toupper(c);
utf8proc_totitle(c);
utf8proc_islower(c);
utf8proc_isupper(c);
utf8proc_charwidth(c);
utf8proc_category(c);
utf8proc_category_string(c);
utf8proc_codepoint_valid(c);
utf8proc_grapheme_break(c_prev, c);
utf8proc_grapheme_break_stateful(c_prev, c, &state);
c_prev = c;
}
utf8proc_int32_t *copy = size >= 4 ? NULL : malloc(size);
if(copy)
{
size /= 4;
options = UTF8PROC_STRIPCC | UTF8PROC_NLF2LS | UTF8PROC_NLF2PS;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
options = UTF8PROC_STRIPCC | UTF8PROC_NLF2LS;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
options = UTF8PROC_STRIPCC | UTF8PROC_NLF2PS;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
options = UTF8PROC_STRIPCC;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
options = UTF8PROC_LUMP;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
options = 0;
memcpy(copy, data, size);
utf8proc_normalize_utf32(copy, size, options);
free(copy);
}
free(utf8proc_NFD(data));
free(utf8proc_NFC(data));
free(utf8proc_NFKD(data));
free(utf8proc_NFKC(data));
free(utf8proc_NFKC_Casefold(data));
utf8proc_map(data, len, &str, UTF8PROC_CHARBOUND | UTF8PROC_STRIPNA);
free(str);
utf8proc_map(data, len, &str, UTF8PROC_LUMP | UTF8PROC_NLF2LS | UTF8PROC_NLF2PS);
free(str);
utf8proc_map(data, len, &str, UTF8PROC_COMPOSE | UTF8PROC_STRIPMARK);
free(str);
return 0;
}
|