Charsets used for validation
[3099257 urls; 243 unique values]
| Popularity | Value | Frequency |
| 1 | iso-8859-1 | 1510827 |
| 2 | utf-8 | 943326 |
| 3 | windows-1252 | 293595 |
| 4 | shift_jis | 87593 |
| 5 | iso-8859-2 | 60663 |
| 6 | windows-1251 | 51336 |
| 7 | windows-1250 | 30353 |
| 8 | gb2312 | 19412 |
| 9 | iso-8859-15 | 12276 |
| 10 | big5 | 11395 |
| 11 | windows-1254 | 9756 |
| 12 | iso-8859-9 | 9091 |
| 13 | us-ascii | 8134 |
| 14 | euc-jp | 7174 |
| 15 | x-sjis | 5564 |
| 16 | euc-kr | 4768 |
| 17 | windows-1257 | 4023 |
| 18 | windows-1255 | 4022 |
| 19 | windows-1256 | 3981 |
| 20 | koi8-r | 3353 |
| 21 | iso-8859-7 | 2346 |
| 22 | iso8859-1 | 2281 |
| 23 | windows-1253 | 2272 |
| 24 | windows-874 | 1277 |
| 25 | gbk | 924 |
| 26 | iso-2022-jp | 711 |
| 27 | tis-620 | 665 |
| 28 | utf-16le | 630 |
| 29 | cp1251 | 617 |
| 30 | shift-jis | 564 |
| 31 | latin1 | 515 |
| 32 | iso-8859-8 | 379 |
| 33 | utf-16 | 369 |
| 34 | cp1252 | 361 |
| 35 | x-mac-roman | 354 |
| 36 | utf8 | 347 |
| 37 | ks_c_5601-1987 | 330 |
| 38 | macintosh | 316 |
| 39 | unicode | 278 |
| 40 | iso-8859-8-i | 202 |
| 41 | windows-31j | 181 |
| 42 | iso-8859-5 | 170 |
| 43 | iso8859-2 | 165 |
| 44 | cp-1251 | 159 |
| 45 | x-euc-jp | 147 |
| 46 | euc_kr | 146 |
| 47 | iso8859_1 | 96 |
| 48 | iso8859-15 | 96 |
| 49 | charset=iso-8859-1 | 93 |
| 50 | iso_8859-1 | 93 |
| 51 | iso-8859-13 | 88 |
| 52 | iso-8859-4 | 88 |
| 53 | sjis | 80 |
| 54 | koi8-u | 71 |
| 55 | latin-1 | 64 |
| 56 | cp1250 | 64 |
| 57 | x-x-big5 | 63 |
| 58 | iso8859-9 | 41 |
| 59 | euc_jp | 41 |
| 60 | ascii | 38 |
| 61 | latin2 | 36 |
| 62 | gb_2312-80 | 34 |
| 63 | big-5 | 32 |
| 64 | cp1254 | 31 |
| 65 | utf-16be | 28 |
| 66 | ms932 | 28 |
| 67 | iso-8859-6 | 24 |
| 68 | iso-8859-3 | 24 |
| 69 | iso_8859_1 | 23 |
| 70 | windows-1258 | 21 |
| 71 | iso-latin-1 | 19 |
| 72 | .latin1 | 18 |
| 73 | charset=iso-8859-2 | 16 |
| 74 | tis620 | 16 |
| 75 | euckr | 16 |
| 76 | es_es.iso-8859-1 | 16 |
| 77 | iso-8859-16 | 15 |
| 78 | gb18030 | 14 |
| 79 | cp-1250 | 13 |
| 80 | big5-hkscs | 13 |
| 81 | iso-8859-10 | 11 |
| 82 | latin2-iso-8859-2 | 11 |
| 83 | .iso8859-1 | 11 |
| 84 | iso-8859-11 | 11 |
| 85 | windows_1258 | 10 |
| 86 | gb-2312 | 9 |
| 87 | iso 8859-1 | 9 |
| 88 | cp866 | 9 |
| 89 | iso-8859-14 | 8 |
| 90 | x-windows-949 | 7 |
| 91 | ms949 | 7 |
| 92 | jis | 7 |
| 93 | iso88591 | 7 |
| 94 | iso-2022-kr | 7 |
| 95 | charset=windows-1251 | 7 |
| 96 | sift_jis | 7 |
| 97 | s-jis | 7 |
| 98 | en-iso-8859-1 | 6 |
| 99 | ibm866 | 6 |
| 100 | ibm852 | 6 |
| 101 | en_us.iso8859-1 | 6 |
| 102 | cp-1252 | 6 |
| 103 | windows1250 | 6 |
| 104 | ibm437 | 6 |
| 105 | iso8859-8 | 6 |
| 106 | charset=windows-1252 | 5 |
| 107 | shif_jis | 5 |
| 108 | charset=windows-1250 | 5 |
| 109 | de_de.iso-8859-15@euro | 5 |
| 110 | x-jis | 5 |
| 111 | koi8r | 5 |
| 112 | latin5 | 5 |
| 113 | cp850 | 5 |
| 114 | hz-gb-2312 | 4 |
| 115 | fr-iso-8859-1 | 4 |
| 116 | x_sjis | 4 |
| 117 | iso-8859-15@euro | 4 |
| 118 | greek | 4 |
| 119 | cp437 | 4 |
| 120 | iso_8859-2 | 4 |
| 121 | ru_ru.cp1251 | 4 |
| 122 | utf-7 | 4 |
| 123 | fr_fr.iso8859-1 | 4 |
| 124 | iso_8859-9 | 4 |
| 125 | ibm850 | 4 |