summaryrefslogtreecommitdiffstats
path: root/htdocs
diff options
context:
space:
mode:
authorot <ot@localhost>2007-07-19 03:59:24 +0000
committerot <ot@localhost>2007-07-19 03:59:24 +0000
commit901f132d79f2beb50feff0c0aca3b2045bdb0316 (patch)
tree7f7b9345309a550435de9ab8442f49d8295d2ca3 /htdocs
parent3d8de8e5e8a8ec95d120a8b054dbbd4afe30890f (diff)
downloadmarkup-validator-901f132d79f2beb50feff0c0aca3b2045bdb0316.zip
markup-validator-901f132d79f2beb50feff0c0aca3b2045bdb0316.tar.gz
markup-validator-901f132d79f2beb50feff0c0aca3b2045bdb0316.tar.bz2
Removing the list of supported character encodings,
as we now have a better and more reliable technical way to do this. Replacing it with a mechanism to: * suggest a better alias if a "bad" encoding alias is used; * refuse to transcode if the encoding used is forbidden by policy (I don't know of any, but the mechanism is here...). More details: http://lists.w3.org/Archives/Public/public-qa-dev/2007Jul/0009.html and the surrounding thread.
Diffstat (limited to 'htdocs')
-rw-r--r--htdocs/config/charset.cfg73
1 files changed, 18 insertions, 55 deletions
diff --git a/htdocs/config/charset.cfg b/htdocs/config/charset.cfg
index 69ef847..aed81a6 100644
--- a/htdocs/config/charset.cfg
+++ b/htdocs/config/charset.cfg
@@ -1,60 +1,23 @@
#
-# List of accepted encodings.
+# List of encoding aliases and forbidden encodings
#
-# $Id: charset.cfg,v 1.13 2006-10-12 01:15:50 ot Exp $
-#
-# The Validator will refuse to decode documents in an encoding
-# other than those listed here. The list is independent of what
+# $Id: charset.cfg,v 1.14 2007-07-19 03:59:23 ot Exp $
+
+# This list indicates character encoding aliases that are
+# not recommended, along with a recommended equivalent, e.g.:
+# encoding-obscure = encoding-well-known
+
+# It also lists encoding names that the validator will refuse to process:
+# bogus_encoding = Encoding Forbidden (Reason why)
+
+# The list is independent of what
# is supported on a specific system but subject to the Validator
# policy for acceptable encodings.
-#
-utf-8 = 1
-utf-16 = 1
-utf-16be = 1
-utf-16le = 1
-iso-8859-1 = 1
-iso-8859-2 = 1
-iso-8859-3 = 1
-iso-8859-4 = 1
-iso-8859-5 = 1
-iso-8859-6 = 1
-iso-8859-6-i = 1
-iso-8859-7 = 1
-iso-8859-8 = 1
-iso-8859-8-i = 1
-iso-8859-9 = 1
-iso-8859-10 = 1
-iso-8859-11 = 1
-iso-8859-13 = 1
-iso-8859-14 = 1
-iso-8859-15 = 1
-iso-8859-16 = 1
-us-ascii = 1
-iso-2022-jp = 1
-shift_jis = 1
-euc-jp = 1
-gb2312 = 1
-big5 = 1
-iso-2022-kr = 1
-euc-kr = 1
-gb18030 = 1
-tis-620 = 1
-koi8-r = 1
-koi8-u = 1
-windows-1250 = 1
-windows-1251 = 1
-windows-1252 = 1
-windows-1253 = 1
-windows-1254 = 1
-windows-1255 = 1
-windows-1256 = 1
-windows-1257 = 1
-macintosh = 1
-x-mac-roman = 1
-x-sjis = 1
-iso8859-1 = 1
-ascii = 1
-iso-8859-1-Windows-3.1-Latin-1 = 1
-ks_c_5601-1987 = 1
-ksc_5601 = 1
+
+x-mac-roman = macintosh
+x-sjis = shift_jis
+iso8859-1 = iso-8859-1
+ascii = us-ascii
# This name is in the IANA registry, but it is better to use only windows-1252.
+iso-8859-1-Windows-3.1-Latin-1 = windows-1252