changeset 194:e5a931733a98

Added the character encoding category parameters. git-svn-id: svn://svn.code.sf.net/p/universalindent/code/trunk@398 59b1889a-e5ac-428c-b0c7-476e01d41282
author thomas_-_s <thomas_-_s@59b1889a-e5ac-428c-b0c7-476e01d41282>
date Thu, 07 Jun 2007 13:04:38 +0000
parents 7d66d89cbcd2
children 7aa4bdbdda35
files data/uigui_htmltidy.ini
diffstat 1 files changed, 55 insertions(+), 1 deletions(-) [+]
line wrap: on
line diff
--- a/data/uigui_htmltidy.ini	Thu Jun 07 13:03:44 2007 +0000
+++ b/data/uigui_htmltidy.ini	Thu Jun 07 13:04:38 2007 +0000
@@ -1,5 +1,5 @@
 [%20header]
-categories="HTML, XHTML, XML|Diagnostics|Pretty Print|Character Encoding|Miscellaneous"
+categories="HTML, XHTML, XML|Diagnostics|Pretty Print|Character Encoding"
 cfgFileParameterEnding=cr
 configFilename=tidy.cfg
 fileTypes=*.html|*.htm
@@ -617,3 +617,57 @@
 TrueFalse=wrap-sections:yes|wrap-sections:no
 Value=0
 ValueDefault=0
+
+[ascii-chars]
+Category=3
+Description="<html>Can be used to modify behavior of -c (--clean yes) option. If set to 'yes' when using -c, &mdash;, &rdquo;, and other named character entities are downgraded to their closest ascii equivalents.</html>"
+EditorType=boolean
+Enabled=false
+TrueFalse=ascii-chars:yes|ascii-chars:no
+Value=0
+ValueDefault=0
+
+[char-encoding]
+Category=3
+Choices=char-encoding:raw|char-encoding:ascii|char-encoding:latin0|char-encoding:latin1|char-encoding:utf8|char-encoding:iso2022|char-encoding:mac|char-encoding:win1252|char-encoding:ibm858|char-encoding:utf16le|char-encoding:utf16be|char-encoding:utf16|char-encoding:big5|char-encoding:shiftjis
+Description="<html>This option specifies the character encoding Tidy uses for both the input and output. For ascii, Tidy will accept Latin-1 (ISO-8859-1) character values, but will use entities for all characters whose value > 127. For raw, Tidy will output values above 127 without translating them into entities. For latin1, characters above 255 will be written as entities. For utf8, Tidy assumes that both input and output are encoded as UTF-8. You can use iso2022 for files encoded using the ISO-2022 family of encodings e.g. ISO-2022-JP. For mac and win1252, Tidy will accept vendor specific character values, but will use entities for all characters whose value > 127.</html>"
+EditorType=multiple
+Enabled=false
+Value=1
+ValueDefault=1
+
+[input-encoding]
+Category=3
+Choices=input-encoding:raw|input-encoding:ascii|input-encoding:latin0|input-encoding:latin1|input-encoding:utf8|input-encoding:iso2022|input-encoding:mac|input-encoding:win1252|input-encoding:ibm858|input-encoding:utf16le|input-encoding:utf16be|input-encoding:utf16|input-encoding:big5|input-encoding:shiftjis
+Description="<html>This option specifies the character encoding Tidy uses for the input. See char-encoding for more info.</html>"
+EditorType=multiple
+Enabled=false
+Value=4
+ValueDefault=4
+
+[newline]
+Category=3
+Choices=newline:LF|newline:CRLF|newline:CR
+Description="<html>The default is appropriate to the current platform: CRLF on PC-DOS, MS-Windows and OS/2, CR on Classic Mac OS, and LF everywhere else (Unix and Linux).</html>"
+EditorType=multiple
+Enabled=false
+Value=1
+ValueDefault=1
+
+[output-bom]
+Category=3
+Choices=output-bom:auto|output-bom:yes|output-bom:no
+Description="<html>This option specifies if Tidy should write a Unicode Byte Order Mark character (BOM; also known as Zero Width No-Break Space; has value of U+FEFF) to the beginning of the output; only for UTF-8 and UTF-16 output encodings. If set to 'auto', this option causes Tidy to write a BOM to the output only if a BOM was present at the beginning of the input. A BOM is always written for XML/XHTML output using UTF-16 output encodings.</html>"
+EditorType=multiple
+Enabled=false
+Value=0
+ValueDefault=0
+
+[output-encoding]
+Category=3
+Choices=output-encoding:raw|output-encoding:ascii|output-encoding:latin0|output-encoding:latin1|output-encoding:utf8|output-encoding:iso2022|output-encoding:mac|output-encoding:win1252|output-encoding:ibm858|output-encoding:utf16le|output-encoding:utf16be|output-encoding:utf16|output-encoding:big5|output-encoding:shiftjis
+Description="<html>This option specifies the character encoding Tidy uses for the output. See char-encoding for more info. May only be different from input-encoding for Latin encodings (ascii, latin0, latin1, mac, win1252, ibm858).</html>"
+EditorType=multiple
+Enabled=false
+Value=1
+ValueDefault=1