PHP Classes

File: charsets.php

Recommend this page to a friend!
  Classes of Jill Lingoff   Sweeper   charsets.php   Download  
File: charsets.php
Role: Auxiliary script
Content type: text/plain
Description: Auxiliary script
Class: Sweeper
Clean HTML to remove unwanted tags and attributes
Author: By
Last change:
Date: 5 years ago
Size: 30,743 bytes
 

Contents

Class file image Download
<?php
/*
 * Charset lookup tables: HTML charset label => tidy encoding name.
 *
 * Defines two variables in the including scope:
 *   $tidy_charsets        keyed by the preferred charset label as spelled in
 *                         the reference table below (mixed case).
 *   $tidy_charsets_lower  the same map with every key lower-cased.
 *
 * An empty-string value is what the original author stored for every label
 * that was not given a tidy encoding name.
 *
 * ---------------------------------------------------------------------------
 * Reference table
 *
 * This replaces a commented-out HTML <table> that used to sit here. Its
 * heading was truncated to "...rnet Explorer 5" (presumably a character-set
 * reference for Internet Explorer 5 -- TODO confirm the source). A second,
 * also truncated heading ("Internal Charsets Not for Gen...") followed the
 * table without any rows.
 *
 * Columns: CharsetFriendlyName | Preferred Charset Label | Aliases | IE Ver |
 *          Min OS | CodePage | FamilyCodePage        ("-" = empty cell)
 *
 * Arabic (ASMO 708) | ASMO-708 | - | IE5 | Win95 | 708 | 1256
 * Arabic (DOS) | DOS-720 | - | IE5 | Win95 | 720 | 1256
 * Arabic (ISO) | iso-8859-6 | arabic, csISOLatinArabic, ECMA-114, ISO_8859-6, ISO_8859-6:1987, iso-ir-127 | IE5, IE4 | Win95 | 28596 | 1256
 * Arabic (Mac) | x-mac-arabic | - | IE5 | Win2000 | 10004 | 1256
 * Arabic (Windows) | windows-1256 | cp1256 | IE5 | Win95 | 1256 | 1256
 * Baltic (DOS) | ibm775 | CP500 | IE5 | Win2000 | 775 | 1257
 * Baltic (ISO) | iso-8859-4 | csISOLatin4, ISO_8859-4, ISO_8859-4:1988, iso-ir-110, l4, latin4 | IE5 | Win95 | 28594 | 1257
 * Baltic (Windows) | windows-1257 | - | IE5 | Win95 | 1257 | 1257
 * Central European (DOS) | ibm852 | cp852 | IE5, IE4 | Win95 | 852 | 1250
 * Central European (ISO) | iso-8859-2 | csISOLatin2, iso_8859-2, iso_8859-2:1987, iso8859-2, iso-ir-101, l2, latin2 | IE5, IE4 | Win95 | 28592 | 1250
 * Central European (Mac) | x-mac-ce | - | IE5 | Win2000 | 10029 | 1250
 * Central European (Windows) | windows-1250 | x-cp1250 | IE5 | Win95 | 1250 | 1250
 * Chinese Simplified (EUC) | EUC-CN | x-euc-cn | IE5 | Win2000 | 51936 | 936
 * Chinese Simplified (GB2312) | gb2312 | chinese, CN-GB, csGB2312, csGB231280, csISO58GB231280, GB_2312-80, GB231280, GB2312-80, GBK, iso-ir-58 | IE5, IE4 | Win95 | 936 | 936
 * Chinese Simplified (HZ) | hz-gb-2312 | - | IE5, IE4 | Win95 | 52936 | 936
 * Chinese Simplified (Mac) | x-mac-chinesesimp | - | IE5 | Win2000 | 10008 | 936
 * Chinese Traditional (Big5) | big5 | cn-big5, csbig5, x-x-big5 | IE5, IE4 | Win95 | 950 | 950
 * Chinese Traditional (CNS) | x-Chinese-CNS | - | IE5 | Win2000 | 20000 | 950
 * Chinese Traditional (Eten) | x-Chinese-Eten | - | IE5 | Win2000 | 20002 | 950
 * Chinese Traditional (Mac) | x-mac-chinesetrad | - | IE5 | Win2000 | 10002 | 950
 * Cyrillic (DOS) | cp866 | ibm866 | IE5, IE4 | Win95 | 866 | 1251
 * Cyrillic (ISO) | iso-8859-5 | csISOLatin5, csISOLatinCyrillic, cyrillic, ISO_8859-5, ISO_8859-5:1988, iso-ir-144, l5 | IE5, IE4 | Win95 | 28595 | 1251
 * Cyrillic (KOI8-R) | koi8-r | csKOI8R, koi, koi8, koi8r | IE5, IE4 | Win95 | 20866 | 1251
 * Cyrillic (KOI8-U) | koi8-u | koi8-ru | IE5 | Win95 | 21866 | 1251
 * Cyrillic (Mac) | x-mac-cyrillic | - | IE5 | Win2000 | 10007 | 1251
 * Cyrillic (Windows) | windows-1251 | x-cp1251 | IE5 | Win95 | 1251 | 1251
 * Europa | x-Europa | - | IE5 | n.a. | 29001 | 1252
 * German (IA5) | x-IA5-German | - | IE5 | Win2000 | 20106 | 1252
 * Greek (DOS) | ibm737 | - | IE5 | Win2000 | 737 | 1253
 * Greek (ISO) | iso-8859-7 | csISOLatinGreek, ECMA-118, ELOT_928, greek, greek8, ISO_8859-7, ISO_8859-7:1987, iso-ir-126 | IE5, IE4 | Win95 | 28597 | 1253
 * Greek (Mac) | x-mac-greek | - | IE5 | Win2000 | 10006 | 1253
 * Greek (Windows) | windows-1253 | - | IE5 | Win95 | 1253 | 1253
 * Greek, Modern (DOS) | ibm869 | - | IE5 | Win2000 | 869 | 1253
 * Hebrew (DOS) | DOS-862 | - | IE5 | Win95 | 862 | 1255
 * Hebrew (ISO-Logical) | iso-8859-8-i | logical | IE5, IE4 | Win95 | 38598 | 1255
 * Hebrew (ISO-Visual) | iso-8859-8 | csISOLatinHebrew, hebrew, ISO_8859-8, ISO_8859-8:1988, ISO-8859-8, iso-ir-138, visual | IE5, IE4 | Win95 | 28598 | 1255
 * Hebrew (Mac) | x-mac-hebrew | - | IE5 | Win2000 | 10005 | 1255
 * Hebrew (Windows) | windows-1255 | ISO_8859-8-I, ISO-8859-8, visual | IE5 | Win95 | 1255 | 1255
 * IBM EBCDIC (Arabic) | x-EBCDIC-Arabic | - | IE5 | Win2000 | 20420 | 1256
 * IBM EBCDIC (Cyrillic Russian) | x-EBCDIC-CyrillicRussian | - | IE5 | Win2000 | 20880 | 1251
 * IBM EBCDIC (Cyrillic Serbian-Bulgarian) | x-EBCDIC-CyrillicSerbianBulgarian | - | IE5 | Win2000 | 21025 | 1251
 * IBM EBCDIC (Denmark-Norway) | x-EBCDIC-DenmarkNorway | - | IE5 | Win2000 | 20277 | 1252
 * IBM EBCDIC (Denmark-Norway-Euro) | x-ebcdic-denmarknorway-euro | - | IE5 | Win2000 | 1142 | 1252
 * IBM EBCDIC (Finland-Sweden) | x-EBCDIC-FinlandSweden | - | IE5 | Win2000 | 20278 | 1252
 * IBM EBCDIC (Finland-Sweden-Euro) | x-ebcdic-finlandsweden-euro | - | IE5 | Win2000 | 1143 | 1252
 * IBM EBCDIC (Finland-Sweden-Euro) | x-ebcdic-finlandsweden-euro | X-EBCDIC-France | IE5 | Win2000 | 1143 | 1252
 *     NOTE(review): the row above repeats the previous one except for the
 *     alias; it looks garbled in the source (possibly meant to be a separate
 *     "France" entry) -- verify against the upstream table.
 * IBM EBCDIC (France-Euro) | x-ebcdic-france-euro | - | IE5 | Win2000 | 1147 | 1252
 * IBM EBCDIC (Germany) | x-EBCDIC-Germany | - | IE5 | Win2000 | 20273 | 1252
 * IBM EBCDIC (Germany-Euro) | x-ebcdic-germany-euro | - | IE5 | Win2000 | 1141 | 1252
 * IBM EBCDIC (Greek Modern) | x-EBCDIC-GreekModern | - | IE5 | Win2000 | 875 | 1253
 * IBM EBCDIC (Greek) | x-EBCDIC-Greek | - | IE5 | Win2000 | 20423 | 1253
 * IBM EBCDIC (Hebrew) | x-EBCDIC-Hebrew | - | IE5 | Win2000 | 20424 | 1255
 * IBM EBCDIC (Icelandic) | x-EBCDIC-Icelandic | - | IE5 | Win2000 | 20871 | 1252
 * IBM EBCDIC (Icelandic-Euro) | x-ebcdic-icelandic-euro | - | IE5 | Win2000 | 1149 | 1252
 * IBM EBCDIC (International-Euro) | x-ebcdic-international-euro | - | IE5 | Win2000 | 1148 | 1252
 * IBM EBCDIC (Italy) | x-EBCDIC-Italy | - | IE5 | Win2000 | 20280 | 1252
 * IBM EBCDIC (Italy-Euro) | x-ebcdic-italy-euro | - | IE5 | Win2000 | 1144 | 1252
 * IBM EBCDIC (Japanese and Japanese Katakana) | x-EBCDIC-JapaneseAndKana | - | IE5 | Win2000 | 50930 | 932
 * IBM EBCDIC (Japanese and Japanese-Latin) | x-EBCDIC-JapaneseAndJapaneseLatin | - | IE5 | Win2000 | 50939 | 932
 * IBM EBCDIC (Japanese and US-Canada) | x-EBCDIC-JapaneseAndUSCanada | - | IE5 | Win2000 | 50931 | 932
 * IBM EBCDIC (Japanese katakana) | x-EBCDIC-JapaneseKatakana | - | IE5 | Win2000 | 20290 | 932
 * IBM EBCDIC (Korean and Korean Extended) | x-EBCDIC-KoreanAndKoreanExtended | - | IE5 | Win2000 | 50933 | 949
 * IBM EBCDIC (Korean Extended) | x-EBCDIC-KoreanExtended | - | IE5 | Win2000 | 20833 | 949
 * IBM EBCDIC (Multilingual Latin-2) | CP870 | - | IE5 | Win2000 | 870 | 1250
 * IBM EBCDIC (Simplified Chinese) | x-EBCDIC-SimplifiedChinese | - | IE5 | Win2000 | 50935 | 936
 * IBM EBCDIC (Spain) | X-EBCDIC-Spain | - | IE5 | Win2000 | 20284 | 1252
 * IBM EBCDIC (Spain-Euro) | x-ebcdic-spain-euro | - | IE5 | Win2000 | 1145 | 1252
 * IBM EBCDIC (Thai) | x-EBCDIC-Thai | - | IE5 | Win2000 | 20838 | 874
 * IBM EBCDIC (Traditional Chinese) | x-EBCDIC-TraditionalChinese | - | IE5 | Win2000 | 50937 | 950
 * IBM EBCDIC (Turkish Latin-5) | CP1026 | - | IE5 | Win2000 | 1026 | 1254
 * IBM EBCDIC (Turkish) | x-EBCDIC-Turkish | - | IE5 | Win2000 | 20905 | 1254
 * IBM EBCDIC (UK) | x-EBCDIC-UK | - | IE5 | Win2000 | 20285 | 1252
 * IBM EBCDIC (UK-Euro) | x-ebcdic-uk-euro | - | IE5 | Win2000 | 1146 | 1252
 * IBM EBCDIC (US-Canada) | ebcdic-cp-us | - | IE5 | Win2000 | 37 | 1252
 * IBM EBCDIC (US-Canada-Euro) | x-ebcdic-cp-us-euro | - | IE5 | Win2000 | 1140 | 1252
 * Icelandic (DOS) | ibm861 | - | IE5 | Win2000 | 861 | 1252
 * Icelandic (Mac) | x-mac-icelandic | - | IE5 | Win2000 | 10079 | 1252
 * ISCII Assamese | x-iscii-as | - | IE5 | Win2000 | 57006 | 57006
 * ISCII Bengali | x-iscii-be | - | IE5 | Win2000 | 57003 | 57003
 * ISCII Devanagari | x-iscii-de | - | IE5 | Win2000 | 57002 | 57002
 * ISCII Gujarathi | x-iscii-gu | - | IE5 | Win2000 | 57010 | 57010
 * ISCII Kannada | x-iscii-ka | - | IE5 | Win2000 | 57008 | 57008
 * ISCII Malayalam | x-iscii-ma | - | IE5 | Win2000 | 57009 | 57009
 * ISCII Oriya | x-iscii-or | - | IE5 | Win2000 | 57007 | 57007
 * ISCII Panjabi | x-iscii-pa | - | IE5 | Win2000 | 57011 | 57011
 * ISCII Tamil | x-iscii-ta | - | IE5 | Win2000 | 57004 | 57004
 * ISCII Telugu | x-iscii-te | - | IE5 | Win2000 | 57005 | 57005
 * Japanese (EUC) | euc-jp | csEUCPkdFmtJapanese, Extended_UNIX_Code_Packed_Format_for_Japanese, x-euc, x-euc-jp | IE5, IE4 | Win95 | 51932 | 932
 * Japanese (JIS) | iso-2022-jp | - | IE5, IE4 | Win95 | 50220 | 932
 * Japanese (JIS-Allow 1 byte Kana - SO/SI) | iso-2022-jp | _iso-2022-jp$SIO | IE5 | Win95 | 50222 | 932
 * Japanese (JIS-Allow 1 byte Kana) | csISO2022JP | _iso-2022-jp | IE5 | Win95 | 50221 | 932
 * Japanese (Mac) | x-mac-japanese | - | IE5 | Win2000 | 10001 | 932
 * Japanese (Shift-JIS) | shift_jis | csShiftJIS, csWindows31J, ms_Kanji, shift-jis, x-ms-cp932, x-sjis | IE5, IE4 | Win95 | 932 | 932
 * Korean | ks_c_5601-1987 | csKSC56011987, euc-kr, iso-ir-149, korean, ks_c_5601, ks_c_5601_1987, ks_c_5601-1989, KSC_5601, KSC5601 | IE5 | Win95 | 949 | 949
 * Korean (EUC) | euc-kr | csEUCKR | IE5 | Win95 | 51949 | 949
 * Korean (ISO) | iso-2022-kr | csISO2022KR | IE5 | Win95 | 50225 | 949
 * Korean (Johab) | Johab | - | IE5 | Win2000 | 1361 | 1361
 * Korean (Mac) | x-mac-korean | - | IE5 | Win2000 | 10003 | 949
 * Latin 3 (ISO) | iso-8859-3 | csISOLatin3, ISO_8859-3, ISO_8859-3:1988, iso-ir-109, l3, latin3 | IE5, IE4 | Win95 | 28593 | 1254
 * Latin 9 (ISO) | iso-8859-15 | csISOLatin9, ISO_8859-15, l9, latin9 | IE5 | Win95 | 28605 | 1252
 * Norwegian (IA5) | x-IA5-Norwegian | - | IE5 | Win2000 | 20108 | 1252
 * OEM United States | IBM437 | 437, cp437, csPC8, CodePage437 | IE5 | Win2000 | 437 | 1252
 * Swedish (IA5) | x-IA5-Swedish | - | IE5 | Win2000 | 20107 | 1252
 * Thai (Windows) | windows-874 | DOS-874, iso-8859-11, TIS-620 | IE5, IE4 | Win95 | 874 | 874
 * Turkish (DOS) | ibm857 | - | IE5 | Win2000 | 857 | 1254
 * Turkish (ISO) | iso-8859-9 | csISOLatin5, ISO_8859-9, ISO_8859-9:1989, iso-ir-148, l5, latin5 | IE5 | Win95 | 28599 | 1254
 * Turkish (Mac) | x-mac-turkish | - | IE5 | Win2000 | 10081 | 1254
 * Turkish (Windows) | windows-1254 | ISO_8859-9, ISO_8859-9:1989, iso-8859-9, iso-ir-148, latin5 | IE5 | Win95 | 1254 | 1254
 * Unicode | unicode | utf-16 | IE5, IE4 | Win95 | 1200 | 1200
 * Unicode (Big-Endian) | unicodeFFFE | - | IE5, IE4 | Win95 | 1201 | 1200
 * Unicode (UTF-7) | utf-7 | csUnicode11UTF7, unicode-1-1-utf-7, x-unicode-2-0-utf-7 | IE5, IE4 | Win95 | 65000 | 1200
 * Unicode (UTF-8) | utf-8 | unicode-1-1-utf-8, unicode-2-0-utf-8, x-unicode-2-0-utf-8 | IE5, IE4 | Win95 | 65001 | 1200
 * US-ASCII | us-ascii | ANSI_X3.4-1968, ANSI_X3.4-1986, ascii, cp367, csASCII, IBM367, ISO_646.irv:1991, ISO646-US, iso-ir-6us | IE5 | Win95 | 20127 | 1252
 * Vietnamese (Windows) | windows-1258 | - | IE5, IE4 | Win95 | 1258 | 1258
 * Western European (DOS) | ibm850 | - | IE5 | Win2000 | 850 | 1252
 * Western European (IA5) | x-IA5 | - | IE5 | Win2000 | 20105 | 1252
 * Western European (ISO) | iso-8859-1 | cp819, csISOLatin1, ibm819, iso_8859-1, iso_8859-1:1987, iso8859-1, iso-ir-100, l1, latin1 | IE5 | Win95 | 28591 | 1252
 * Western European (Mac) | macintosh | - | IE5 | Win2000 | 10000 | 1252
 * Western European (Windows) | Windows-1252 | ANSI_X3.4-1968, ANSI_X3.4-1986, ascii, cp367, cp819, csASCII, IBM367, ibm819, ISO_646.irv:1991, iso_8859-1, iso_8859-1:1987, ISO646-US, iso8859-1, iso-8859-1, iso-ir-100, iso-ir-6, latin1, us, us-ascii, x-ansi | IE5 | Win95 | 1252 | 1252
 * ---------------------------------------------------------------------------
 */

/*
 * Encoding names listed by the original author for the tidy side of the map:
 *   raw, ascii, latin0, latin1, utf8, iso2022, mac, win1252, ibm858,
 *   utf16le, utf16be, utf16, big5, shiftjis
 *
 * Author's caution (kept from the original): some of these mappings are pure
 * guesses, and while some weird character sets are unlikely to be used, the
 * guesses could be wrong and cause problems.
 */

/*
 * HTML charset label => tidy encoding name.
 *
 * Keys follow the "Preferred Charset Label" column above, in table order.
 * The labels 'x-ebcdic-finlandsweden-euro' and 'iso-2022-jp' each occur on
 * two table rows; they are listed once here because a repeated key in a PHP
 * array literal just overwrites the earlier entry (both copies carried the
 * same value).
 */
$tidy_charsets = array(
    'ASMO-708' => '',
    'DOS-720' => '',
    'iso-8859-6' => '',
    'x-mac-arabic' => 'mac',
    'windows-1256' => '',
    'ibm775' => '',
    'iso-8859-4' => '',
    'windows-1257' => '',
    'ibm852' => '',
    'iso-8859-2' => '',
    'x-mac-ce' => 'mac',
    'windows-1250' => '',
    'EUC-CN' => '',
    'gb2312' => '',
    'hz-gb-2312' => '',
    'x-mac-chinesesimp' => 'mac',
    'big5' => 'big5',
    'x-Chinese-CNS' => '',
    'x-Chinese-Eten' => '',
    'x-mac-chinesetrad' => 'mac',
    'cp866' => '',
    'iso-8859-5' => '',
    'koi8-r' => '',
    'koi8-u' => '',
    'x-mac-cyrillic' => 'mac',
    'windows-1251' => '',
    'x-Europa' => '',
    'x-IA5-German' => '',
    'ibm737' => '',
    'iso-8859-7' => '',
    'x-mac-greek' => 'mac',
    'windows-1253' => '',
    'ibm869' => '',
    'DOS-862' => '',
    'iso-8859-8-i' => '',
    'iso-8859-8' => '',
    'x-mac-hebrew' => 'mac',
    'windows-1255' => '',
    'x-EBCDIC-Arabic' => '',
    'x-EBCDIC-CyrillicRussian' => '',
    'x-EBCDIC-CyrillicSerbianBulgarian' => '',
    'x-EBCDIC-DenmarkNorway' => '',
    'x-ebcdic-denmarknorway-euro' => '',
    'x-EBCDIC-FinlandSweden' => '',
    'x-ebcdic-finlandsweden-euro' => '',
    'x-ebcdic-france-euro' => '',
    'x-EBCDIC-Germany' => '',
    'x-ebcdic-germany-euro' => '',
    'x-EBCDIC-GreekModern' => '',
    'x-EBCDIC-Greek' => '',
    'x-EBCDIC-Hebrew' => '',
    'x-EBCDIC-Icelandic' => '',
    'x-ebcdic-icelandic-euro' => '',
    'x-ebcdic-international-euro' => '',
    'x-EBCDIC-Italy' => '',
    'x-ebcdic-italy-euro' => '',
    'x-EBCDIC-JapaneseAndKana' => '',
    'x-EBCDIC-JapaneseAndJapaneseLatin' => '',
    'x-EBCDIC-JapaneseAndUSCanada' => '',
    'x-EBCDIC-JapaneseKatakana' => '',
    'x-EBCDIC-KoreanAndKoreanExtended' => '',
    'x-EBCDIC-KoreanExtended' => '',
    'CP870' => '',
    'x-EBCDIC-SimplifiedChinese' => '',
    'X-EBCDIC-Spain' => '',
    'x-ebcdic-spain-euro' => '',
    'x-EBCDIC-Thai' => '',
    'x-EBCDIC-TraditionalChinese' => '',
    'CP1026' => '',
    'x-EBCDIC-Turkish' => '',
    'x-EBCDIC-UK' => '',
    'x-ebcdic-uk-euro' => '',
    'ebcdic-cp-us' => '',
    'x-ebcdic-cp-us-euro' => '',
    'ibm861' => '',
    'x-mac-icelandic' => 'mac',
    'x-iscii-as' => '',
    'x-iscii-be' => '',
    'x-iscii-de' => '',
    'x-iscii-gu' => '',
    'x-iscii-ka' => '',
    'x-iscii-ma' => '',
    'x-iscii-or' => '',
    'x-iscii-pa' => '',
    'x-iscii-ta' => '',
    'x-iscii-te' => '',
    'euc-jp' => '',
    'iso-2022-jp' => 'iso2022',
    'csISO2022JP' => 'iso2022',
    'x-mac-japanese' => 'mac',
    'shift_jis' => 'shiftjis',
    'ks_c_5601-1987' => '',
    'euc-kr' => '',
    'iso-2022-kr' => 'iso2022',
    'Johab' => '',
    'x-mac-korean' => 'mac',
    'iso-8859-3' => '',
    'iso-8859-15' => '',
    'x-IA5-Norwegian' => '',
    'IBM437' => '',
    'x-IA5-Swedish' => '',
    'windows-874' => '',
    'ibm857' => '',
    'iso-8859-9' => '',
    'x-mac-turkish' => 'mac',
    'windows-1254' => '',
    'unicode' => '',
    'unicodeFFFE' => '',
    'utf-7' => '',
    'utf-8' => 'utf8',
    'us-ascii' => 'ascii',
    'windows-1258' => '',
    'ibm850' => '',
    'x-IA5' => '',
    'iso-8859-1' => 'latin1',
    'macintosh' => 'mac',
    'Windows-1252' => 'win1252',
);

/*
 * Same map with lower-cased keys.
 *
 * Derived from $tidy_charsets rather than maintained as a second literal:
 * no two keys above differ only by case, so lower-casing yields exactly the
 * entries (and order) the former hand-written copy contained, and the two
 * tables can no longer drift apart.
 */
$tidy_charsets_lower = array_change_key_case($tidy_charsets, CASE_LOWER);