forked from AFLplusplus/AFLplusplus
-
Notifications
You must be signed in to change notification settings - Fork 0
/
utf8.dict
73 lines (52 loc) · 1.53 KB
/
utf8.dict
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
# https://www.cl.cam.ac.uk/~mgk25/ucs/examples/UTF-8-test.txt
# Tokens below are written as big-endian UTF-16 code units unless noted otherwise.
# Byte order mark (U+FEFF): defines byte order and endianness
byte_order="\xFE\xFF"
# Right-to-left override (U+202E): reorders the display of text for RTL reading
right_to_left="\x20\x2E"
# Mongolian Vowel Separator (U+180E): invisible, historically classified as whitespace
invisible_separator="\x18\x0E"
# Word joiner (U+2060): invisible zero-width character.
word_join="\x20\x60"
# Reserved code point (U+FEFE)
reserved="\xfe\xfe"
# Invalid code points (noncharacters U+FFFF, U+1FFFF and U+FDD0).
# Every byte needs its own \x escape: "\xfdd0" would yield byte 0xFD
# followed by the literal text "d0".
invalid1="\xff\xff"
invalid2="\x01\xff\xff"
invalid3="\xfd\xd0"
# unassigned code point (U+0FED)
unassigned="\x0f\xed"
# illegal low half-surrogate
illegal_low="\xde\xad"
# illegal high half-surrogate
illegal_high="\xda\xad"
# private use area code point used by Apple for its logo
apple="\xf8\xff"
# hostname normalization
fullwidth_solidus="\xff\x0f"
# numerical mapping and a value
bold_eight="\x01\xd7\xd6"
# U+00DF normalizes to "ss" during IDNA2003's mapping phase,
# different from its IDNA2008 mapping. See http://www.unicode.org/reports/tr46/
weird="\x00\xdf"
# Worst-case normalization expansion factors.
# U+FDFA expands by 11x (UTF-8) and 18x (UTF-16) under NFKC/NFKD
expansion="\xfd\xfa"
# U+0390 expands by 3x (UTF-8) under NFD
expansion2="\x03\x90"
# U+1F82 expands by 4x (UTF-16) under NFD
expansion3="\x1F\x82"
# U+FB2C expands by 3x (UTF-16) under NFC
expansion4="\xFB\x2C"
# Lowercase expansion: https://twitter.com/jifa/status/625776454479970304
low_exp1="\x02\x3a"
low_exp2="\x02\x3e"
low_exp3="\x00\xdf"
low_exp4="\x1e\x9e"
# Null byte
null="\x00\x00"
# Overlong 6-byte UTF-8 encodings of U+0000 and U+002F ('/').
# Raw UTF-8 bytes, so each one must be written as a \x escape.
"\xfc\x80\x80\x80\x80\x80"
"\xfc\x80\x80\x80\x80\xaf"
# Confusing new lines
# NOTE(review): U+001B is ESC, not a line break; U+000B (vertical tab) may
# have been intended. Value left unchanged until confirmed.
"\x00\x1b"
# U+0085 next line (NEL)
"\x00\x85"
# U+2028 line separator
"\x20\x28"
# U+2029 paragraph separator
"\x20\x29"