Charsets used for validation
[3099257 urls; 243 unique values]
Popularity | Value | Frequency |
1 | iso-8859-1 | 1510827 |
2 | utf-8 | 943326 |
3 | windows-1252 | 293595 |
4 | shift_jis | 87593 |
5 | iso-8859-2 | 60663 |
6 | windows-1251 | 51336 |
7 | windows-1250 | 30353 |
8 | gb2312 | 19412 |
9 | iso-8859-15 | 12276 |
10 | big5 | 11395 |
11 | windows-1254 | 9756 |
12 | iso-8859-9 | 9091 |
13 | us-ascii | 8134 |
14 | euc-jp | 7174 |
15 | x-sjis | 5564 |
16 | euc-kr | 4768 |
17 | windows-1257 | 4023 |
18 | windows-1255 | 4022 |
19 | windows-1256 | 3981 |
20 | koi8-r | 3353 |
21 | iso-8859-7 | 2346 |
22 | iso8859-1 | 2281 |
23 | windows-1253 | 2272 |
24 | windows-874 | 1277 |
25 | gbk | 924 |
26 | iso-2022-jp | 711 |
27 | tis-620 | 665 |
28 | utf-16le | 630 |
29 | cp1251 | 617 |
30 | shift-jis | 564 |
31 | latin1 | 515 |
32 | iso-8859-8 | 379 |
33 | utf-16 | 369 |
34 | cp1252 | 361 |
35 | x-mac-roman | 354 |
36 | utf8 | 347 |
37 | ks_c_5601-1987 | 330 |
38 | macintosh | 316 |
39 | unicode | 278 |
40 | iso-8859-8-i | 202 |
41 | windows-31j | 181 |
42 | iso-8859-5 | 170 |
43 | iso8859-2 | 165 |
44 | cp-1251 | 159 |
45 | x-euc-jp | 147 |
46 | euc_kr | 146 |
47 | iso8859_1 | 96 |
48 | iso8859-15 | 96 |
49 | charset=iso-8859-1 | 93 |
50 | iso_8859-1 | 93 |
51 | iso-8859-13 | 88 |
52 | iso-8859-4 | 88 |
53 | sjis | 80 |
54 | koi8-u | 71 |
55 | latin-1 | 64 |
56 | cp1250 | 64 |
57 | x-x-big5 | 63 |
58 | iso8859-9 | 41 |
59 | euc_jp | 41 |
60 | ascii | 38 |
61 | latin2 | 36 |
62 | gb_2312-80 | 34 |
63 | big-5 | 32 |
64 | cp1254 | 31 |
65 | utf-16be | 28 |
66 | ms932 | 28 |
67 | iso-8859-6 | 24 |
68 | iso-8859-3 | 24 |
69 | iso_8859_1 | 23 |
70 | windows-1258 | 21 |
71 | iso-latin-1 | 19 |
72 | .latin1 | 18 |
73 | charset=iso-8859-2 | 16 |
74 | tis620 | 16 |
75 | euckr | 16 |
76 | es_es.iso-8859-1 | 16 |
77 | iso-8859-16 | 15 |
78 | gb18030 | 14 |
79 | cp-1250 | 13 |
80 | big5-hkscs | 13 |
81 | iso-8859-10 | 11 |
82 | latin2-iso-8859-2 | 11 |
83 | .iso8859-1 | 11 |
84 | iso-8859-11 | 11 |
85 | windows_1258 | 10 |
86 | gb-2312 | 9 |
87 | iso 8859-1 | 9 |
88 | cp866 | 9 |
89 | iso-8859-14 | 8 |
90 | x-windows-949 | 7 |
91 | ms949 | 7 |
92 | jis | 7 |
93 | iso88591 | 7 |
94 | iso-2022-kr | 7 |
95 | charset=windows-1251 | 7 |
96 | sift_jis | 7 |
97 | s-jis | 7 |
98 | en-iso-8859-1 | 6 |
99 | ibm866 | 6 |
100 | ibm852 | 6 |
101 | en_us.iso8859-1 | 6 |
102 | cp-1252 | 6 |
103 | windows1250 | 6 |
104 | ibm437 | 6 |
105 | iso8859-8 | 6 |
106 | charset=windows-1252 | 5 |
107 | shif_jis | 5 |
108 | charset=windows-1250 | 5 |
109 | de_de.iso-8859-15@euro | 5 |
110 | x-jis | 5 |
111 | koi8r | 5 |
112 | latin5 | 5 |
113 | cp850 | 5 |
114 | hz-gb-2312 | 4 |
115 | fr-iso-8859-1 | 4 |
116 | x_sjis | 4 |
117 | iso-8859-15@euro | 4 |
118 | greek | 4 |
119 | cp437 | 4 |
120 | iso_8859-2 | 4 |
121 | ru_ru.cp1251 | 4 |
122 | utf-7 | 4 |
123 | fr_fr.iso8859-1 | 4 |
124 | iso_8859-9 | 4 |
125 | ibm850 | 4 |