From c305220ceb5576952f611bf1ca547a363276b3ca Mon Sep 17 00:00:00 2001 From: Neil Date: Sun, 28 Aug 2016 12:35:29 +1000 Subject: SC_CHARSET_DEFAULT now means code page 1252 on Windows unless code page set. Improved documentation for character sets. --- doc/ScintillaDoc.html | 68 ++++++++++++++++++++++++++++++++++++++--------- doc/ScintillaHistory.html | 6 +++++ 2 files changed, 61 insertions(+), 13 deletions(-) (limited to 'doc') diff --git a/doc/ScintillaDoc.html b/doc/ScintillaDoc.html index 6e94e52e3..36eb6ad15 100644 --- a/doc/ScintillaDoc.html +++ b/doc/ScintillaDoc.html @@ -2723,24 +2723,66 @@ struct Sci_TextToFind { SCI_STYLESETCHARACTERSET(SCE_C_STRING, SC_CHARSET_RUSSIAN) would ensure that strings in Russian would display correctly in C and C++ (SCE_C_STRING is the style number used by the C and C++ lexer to display literal strings; it has the value 6). This - feature works differently on Windows and GTK+.

+ feature works differently on Windows and GTK+.
+ The default character set is SC_CHARSET_DEFAULT.

The character sets supported on Windows are:
- SC_CHARSET_ANSI, SC_CHARSET_ARABIC, SC_CHARSET_BALTIC, - SC_CHARSET_CHINESEBIG5, SC_CHARSET_DEFAULT, - SC_CHARSET_EASTEUROPE, SC_CHARSET_GB2312, - SC_CHARSET_GREEK, SC_CHARSET_HANGUL, SC_CHARSET_HEBREW, - SC_CHARSET_JOHAB, SC_CHARSET_MAC, SC_CHARSET_OEM, - SC_CHARSET_RUSSIAN (code page 1251), - SC_CHARSET_SHIFTJIS, SC_CHARSET_SYMBOL, SC_CHARSET_THAI, - SC_CHARSET_TURKISH, and SC_CHARSET_VIETNAMESE.

+ SC_CHARSET_ANSI, + SC_CHARSET_ARABIC, + SC_CHARSET_BALTIC, + SC_CHARSET_CHINESEBIG5, + SC_CHARSET_DEFAULT, + SC_CHARSET_EASTEUROPE, + SC_CHARSET_GB2312, + SC_CHARSET_GREEK, + SC_CHARSET_HANGUL, + SC_CHARSET_HEBREW, + SC_CHARSET_JOHAB, + SC_CHARSET_MAC, + SC_CHARSET_OEM, + SC_CHARSET_RUSSIAN (code page 1251), + SC_CHARSET_SHIFTJIS, + SC_CHARSET_SYMBOL, + SC_CHARSET_THAI, + SC_CHARSET_TURKISH, and + SC_CHARSET_VIETNAMESE.
+ SC_CHARSET_ANSI and SC_CHARSET_DEFAULT specify European Windows + code page 1252 unless a code page is explicitly set.

The character sets supported on GTK+ are:
- SC_CHARSET_ANSI, SC_CHARSET_OEM866 (code page 866), SC_CHARSET_CYRILLIC (code page 1251), + SC_CHARSET_ANSI, + SC_CHARSET_DEFAULT (8859-1), + SC_CHARSET_OEM866 (code page 866), + SC_CHARSET_CYRILLIC (code page 1251), + SC_CHARSET_EASTEUROPE, + SC_CHARSET_GB2312, + SC_CHARSET_HANGUL, + SC_CHARSET_RUSSIAN (KOI8-R), + SC_CHARSET_SHIFTJIS, and + SC_CHARSET_8859_15.

+ +

The character sets supported on Cocoa are:
+ SC_CHARSET_8859_15, + SC_CHARSET_ANSI (8859-1), + SC_CHARSET_ARABIC, + SC_CHARSET_BALTIC, + SC_CHARSET_CHINESEBIG5, + SC_CHARSET_CYRILLIC (code page 1251), + SC_CHARSET_DEFAULT (8859-1), SC_CHARSET_EASTEUROPE, - SC_CHARSET_GB2312, SC_CHARSET_HANGUL, - SC_CHARSET_RUSSIAN (KOI8-R), SC_CHARSET_SHIFTJIS, and - SC_CHARSET_8859_15.

+ SC_CHARSET_GB2312, + SC_CHARSET_GREEK, + SC_CHARSET_HANGUL, + SC_CHARSET_HEBREW, + SC_CHARSET_JOHAB, + SC_CHARSET_MAC, + SC_CHARSET_OEM, + SC_CHARSET_RUSSIAN (code page 1251), + SC_CHARSET_SHIFTJIS, + SC_CHARSET_SYMBOL, + SC_CHARSET_THAI, + SC_CHARSET_TURKISH, and + SC_CHARSET_VIETNAMESE.

SCI_STYLESETCASE(int styleNumber, int caseMode)
SCI_STYLEGETCASE(int styleNumber)
diff --git a/doc/ScintillaHistory.html b/doc/ScintillaHistory.html index 1ebddebc5..64197c744 100644 --- a/doc/ScintillaHistory.html +++ b/doc/ScintillaHistory.html @@ -520,6 +520,12 @@ Bug #1648.

  • + SC_CHARSET_DEFAULT now means code page 1252 on Windows unless a code page is set. + This prevents unexpected behaviour and crashes on East Asian systems where default locales are commonly DBCS. + Projects which want to default to DBCS code pages in East Asian locales should set the code page and + character set explicitly. +
  • +
  • The HTML lexer no longer treats "<?" inside a string in a script as potentially starting an XML document. Bug #767.
  • -- cgit v1.2.3