aboutsummaryrefslogtreecommitdiffhomepage
path: root/lexers/LexHollywood.cxx
diff options
context:
space:
mode:
Diffstat (limited to 'lexers/LexHollywood.cxx')
-rw-r--r--lexers/LexHollywood.cxx512
1 files changed, 512 insertions, 0 deletions
diff --git a/lexers/LexHollywood.cxx b/lexers/LexHollywood.cxx
new file mode 100644
index 000000000..41c295686
--- /dev/null
+++ b/lexers/LexHollywood.cxx
@@ -0,0 +1,512 @@
+// Scintilla source code edit control
+/** @file LexHollywood.cxx
+ ** Lexer for Hollywood
+ ** Written by Andreas Falkenhahn, based on the BlitzBasic/PureBasic/Lua lexers
+ ** Thanks to Nicholai Benalal
+ ** For more information on Hollywood, see http://www.hollywood-mal.com/
+ ** Mail me (andreas <at> airsoftsoftwair <dot> de) for any bugs.
+ ** This code is subject to the same license terms as the rest of the Scintilla project:
+ ** The License.txt file describes the conditions under which this software may be distributed.
+ **/
+
+#include <stdlib.h>
+#include <string.h>
+#include <stdio.h>
+#include <stdarg.h>
+#include <assert.h>
+#include <ctype.h>
+
+#include <string>
+#include <map>
+
+#include "ILexer.h"
+#include "Scintilla.h"
+#include "SciLexer.h"
+
+#include "WordList.h"
+#include "LexAccessor.h"
+#include "StyleContext.h"
+#include "CharacterSet.h"
+#include "LexerModule.h"
+#include "OptionSet.h"
+#include "DefaultLexer.h"
+
+using namespace Scintilla;
+
+/* Classification flags for the 128 ASCII characters, indexed by character code.
+ * Each table entry is the sum of the bits that apply to that character:
+ * 1 - whitespace
+ * 2 - operator
+ * 4 - identifier
+ * 8 - decimal digit
+ * 16 - hex digit
+ * 32 - bin digit (not set by any entry in this table)
+ * 64 - letter
+ * Values used below: 28 = identifier + decimal digit + hex digit,
+ * 68 = letter + identifier, 84 = letter + hex digit + identifier.
+ */
+static int character_classification[128] =
+{
+ 0, // NUL ($0)
+ 0, // SOH ($1)
+ 0, // STX ($2)
+ 0, // ETX ($3)
+ 0, // EOT ($4)
+ 0, // ENQ ($5)
+ 0, // ACK ($6)
+ 0, // BEL ($7)
+ 0, // BS ($8)
+ 1, // HT ($9)
+ 1, // LF ($A)
+ 0, // VT ($B)
+ 0, // FF ($C)
+ 1, // CR ($D)
+ 0, // SO ($E)
+ 0, // SI ($F)
+ 0, // DLE ($10)
+ 0, // DC1 ($11)
+ 0, // DC2 ($12)
+ 0, // DC3 ($13)
+ 0, // DC4 ($14)
+ 0, // NAK ($15)
+ 0, // SYN ($16)
+ 0, // ETB ($17)
+ 0, // CAN ($18)
+ 0, // EM ($19)
+ 0, // SUB ($1A)
+ 0, // ESC ($1B)
+ 0, // FS ($1C)
+ 0, // GS ($1D)
+ 0, // RS ($1E)
+ 0, // US ($1F)
+ 1, // space ($20)
+ 4, // ! ($21)
+ 0, // " ($22)
+ 0, // # ($23)
+ 4, // $ ($24)
+ 2, // % ($25)
+ 2, // & ($26)
+ 2, // ' ($27)
+ 2, // ( ($28)
+ 2, // ) ($29)
+ 2, // * ($2A)
+ 2, // + ($2B)
+ 2, // , ($2C)
+ 2, // - ($2D)
+ // NB: "." is classified as an identifier character although it is also an operator
+ // and part of decimal numbers. The reason is to support syntax highlighting for
+ // plugin commands, which always use a "." in their names, e.g. pdf.OpenDocument();
+ // the decimal case is handled manually in the lexer so that 3.1415 and .123 are
+ // styled correctly. The collateral damage of treating "." as an identifier is that
+ // "." is never styled SCE_HOLLYWOOD_OPERATOR.
+ 4, // . ($2E)
+ 2, // / ($2F)
+ 28, // 0 ($30)
+ 28, // 1 ($31)
+ 28, // 2 ($32)
+ 28, // 3 ($33)
+ 28, // 4 ($34)
+ 28, // 5 ($35)
+ 28, // 6 ($36)
+ 28, // 7 ($37)
+ 28, // 8 ($38)
+ 28, // 9 ($39)
+ 2, // : ($3A)
+ 2, // ; ($3B)
+ 2, // < ($3C)
+ 2, // = ($3D)
+ 2, // > ($3E)
+ 2, // ? ($3F)
+ 0, // @ ($40)
+ 84, // A ($41)
+ 84, // B ($42)
+ 84, // C ($43)
+ 84, // D ($44)
+ 84, // E ($45)
+ 84, // F ($46)
+ 68, // G ($47)
+ 68, // H ($48)
+ 68, // I ($49)
+ 68, // J ($4A)
+ 68, // K ($4B)
+ 68, // L ($4C)
+ 68, // M ($4D)
+ 68, // N ($4E)
+ 68, // O ($4F)
+ 68, // P ($50)
+ 68, // Q ($51)
+ 68, // R ($52)
+ 68, // S ($53)
+ 68, // T ($54)
+ 68, // U ($55)
+ 68, // V ($56)
+ 68, // W ($57)
+ 68, // X ($58)
+ 68, // Y ($59)
+ 68, // Z ($5A)
+ 2, // [ ($5B)
+ 2, // \ ($5C)
+ 2, // ] ($5D)
+ 2, // ^ ($5E)
+ 68, // _ ($5F)
+ 2, // ` ($60)
+ 84, // a ($61)
+ 84, // b ($62)
+ 84, // c ($63)
+ 84, // d ($64)
+ 84, // e ($65)
+ 84, // f ($66)
+ 68, // g ($67)
+ 68, // h ($68)
+ 68, // i ($69)
+ 68, // j ($6A)
+ 68, // k ($6B)
+ 68, // l ($6C)
+ 68, // m ($6D)
+ 68, // n ($6E)
+ 68, // o ($6F)
+ 68, // p ($70)
+ 68, // q ($71)
+ 68, // r ($72)
+ 68, // s ($73)
+ 68, // t ($74)
+ 68, // u ($75)
+ 68, // v ($76)
+ 68, // w ($77)
+ 68, // x ($78)
+ 68, // y ($79)
+ 68, // z ($7A)
+ 2, // { ($7B)
+ 2, // | ($7C)
+ 2, // } ($7D)
+ 2, // ~ ($7E)
+ 0, // DEL ($7F)
+};
+
+// Returns true when c is an ASCII character carrying the whitespace flag (bit 1)
+// in character_classification. Values outside 0..127 are never whitespace.
+// The lower bound is checked explicitly: a plain char holding a byte >= 0x80 is
+// negative where char is signed and must not be used as a table index.
+static bool IsSpace(int c) {
+	return c >= 0 && c < 128 && (character_classification[c] & 1);
+}
+
+// Returns true when c is an ASCII character carrying the operator flag (bit 2)
+// in character_classification. Values outside 0..127 are never operators.
+// The lower bound is checked explicitly so that a negative value (for example a
+// sign-extended char) can never index before the start of the table.
+static bool IsOperator(int c) {
+	return c >= 0 && c < 128 && (character_classification[c] & 2);
+}
+
+// Returns true when c is an ASCII character carrying the identifier flag (bit 4)
+// in character_classification. Values outside 0..127 are never identifier
+// characters. The lower bound is checked explicitly so that a negative value
+// (for example a sign-extended char) can never index before the start of the table.
+static bool IsIdentifier(int c) {
+	return c >= 0 && c < 128 && (character_classification[c] & 4);
+}
+
+// Returns true when c is an ASCII character carrying the decimal digit flag
+// (bit 8) in character_classification. Values outside 0..127 are never digits.
+// The lower bound is checked explicitly so that a negative value (for example a
+// sign-extended char) can never index before the start of the table.
+static bool IsDigit(int c) {
+	return c >= 0 && c < 128 && (character_classification[c] & 8);
+}
+
+// Returns true when c is an ASCII character carrying the hex digit flag (bit 16)
+// in character_classification. Values outside 0..127 are never hex digits.
+// The lower bound is checked explicitly so that a negative value (for example a
+// sign-extended char) can never index before the start of the table.
+static bool IsHexDigit(int c) {
+	return c >= 0 && c < 128 && (character_classification[c] & 16);
+}
+
+// Converts the ASCII upper-case letters 'A'..'Z' to lower case.
+// Any other value, including values outside the ASCII range, is returned unchanged.
+static int LowerCase(int c)
+{
+	const bool isUpperAscii = ('A' <= c) && (c <= 'Z');
+	return isUpperAscii ? c + ('a' - 'A') : c;
+}
+
+// Maps a token to the change in fold level it causes:
+// +1 for "function", -1 for "endfunction", 0 for any other token.
+// The comparison is case-sensitive, so the token must already be lower-cased.
+static int CheckHollywoodFoldPoint(char const *token) {
+	if (strcmp(token, "function") == 0)
+		return 1;
+	return (strcmp(token, "endfunction") == 0) ? -1 : 0;
+}
+
+// An individual named option for use in an OptionSet
+
+// Options used for LexerHollywood. Both options start out disabled.
+struct OptionsHollywood {
+	// Bound to the "fold" property; Fold() does nothing while this is false.
+	bool fold;
+	// Bound to the "fold.compact" property; when set, Fold() flags lines
+	// without visible characters with SC_FOLDLEVELWHITEFLAG.
+	bool foldCompact;
+	OptionsHollywood() : fold(false), foldCompact(false) {
+	}
+};
+
+// Descriptions of the four word lists understood by the lexer, in word list
+// index order (0..3). The array is terminated by a null pointer.
+static const char * const hollywoodWordListDesc[] = {
+	"Hollywood keywords",                 // word list 0
+	"Hollywood standard API functions",   // word list 1
+	"Hollywood plugin API functions",     // word list 2
+	"Hollywood plugin methods",           // word list 3
+	nullptr
+};
+
+// Option set for the Hollywood lexer: binds the "fold" and "fold.compact"
+// properties to the matching OptionsHollywood members and registers the
+// word list descriptions passed in by the caller.
+struct OptionSetHollywood : public OptionSet<OptionsHollywood> {
+	OptionSetHollywood(const char * const descriptions[]) {
+		// Properties are defined in this order: "fold" first, then "fold.compact".
+		this->DefineProperty("fold", &OptionsHollywood::fold);
+		this->DefineProperty("fold.compact", &OptionsHollywood::foldCompact);
+
+		this->DefineWordListSets(descriptions);
+	}
+};
+
+// Lexer object for Hollywood source code, built on DefaultLexer.
+// It owns four word lists (see hollywoodWordListDesc), the fold options and
+// the option set that exposes those options as properties.
+// All interface methods are marked 'override' so that a signature mismatch
+// with the lexer interface is reported by the compiler instead of silently
+// declaring an unrelated function.
+class LexerHollywood : public DefaultLexer {
+	// Returns the fold level change (+1 / -1 / 0) for the first token of a line.
+	int (*CheckFoldPoint)(char const *);
+	// Word lists 0..3; Lex() maps them to the KEYWORD, STDAPI, PLUGINAPI and
+	// PLUGINMETHOD styles respectively.
+	WordList keywordlists[4];
+	OptionsHollywood options;
+	OptionSetHollywood osHollywood;
+public:
+	// CheckFoldPoint_: fold callback used by Fold().
+	// wordListDescriptions: null-terminated array of word list descriptions.
+	LexerHollywood(int (*CheckFoldPoint_)(char const *), const char * const wordListDescriptions[]) :
+		CheckFoldPoint(CheckFoldPoint_),
+		osHollywood(wordListDescriptions) {
+	}
+	virtual ~LexerHollywood() {
+	}
+	// Destroys this lexer; the object must not be used afterwards.
+	void SCI_METHOD Release() override {
+		delete this;
+	}
+	int SCI_METHOD Version() const override {
+		return lvRelease4;
+	}
+	const char * SCI_METHOD PropertyNames() override {
+		return osHollywood.PropertyNames();
+	}
+	int SCI_METHOD PropertyType(const char *name) override {
+		return osHollywood.PropertyType(name);
+	}
+	const char * SCI_METHOD DescribeProperty(const char *name) override {
+		return osHollywood.DescribeProperty(name);
+	}
+	Sci_Position SCI_METHOD PropertySet(const char *key, const char *val) override;
+	const char * SCI_METHOD DescribeWordListSets() override {
+		return osHollywood.DescribeWordListSets();
+	}
+	Sci_Position SCI_METHOD WordListSet(int n, const char *wl) override;
+	void SCI_METHOD Lex(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) override;
+	void SCI_METHOD Fold(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) override;
+
+	// No private calls are supported; always returns a null pointer.
+	void * SCI_METHOD PrivateCall(int, void *) override {
+		return nullptr;
+	}
+	// Factory handed to LexerModule: creates a lexer that folds on the
+	// tokens recognised by CheckHollywoodFoldPoint.
+	static ILexer4 *LexerFactoryHollywood() {
+		return new LexerHollywood(CheckHollywoodFoldPoint, hollywoodWordListDesc);
+	}
+};
+
+// Forwards a property assignment to the option set, which updates 'options'.
+// Returns 0 when the option set's PropertySet() returns true, otherwise -1.
+Sci_Position SCI_METHOD LexerHollywood::PropertySet(const char *key, const char *val) {
+	const bool accepted = osHollywood.PropertySet(&options, key, val);
+	return accepted ? 0 : -1;
+}
+
+// Replaces word list n (0..3) with the words in wl.
+// Returns 0 when the list content changed, and -1 when n does not name a
+// word list or the new content equals the current content.
+Sci_Position SCI_METHOD LexerHollywood::WordListSet(int n, const char *wl) {
+	// Only indices 0..3 address one of the four word lists.
+	if (n < 0 || n > 3)
+		return -1;
+
+	WordList &target = keywordlists[n];
+
+	// Build the candidate list first so that an identical list is left untouched.
+	WordList candidate;
+	candidate.Set(wl);
+	if (!(target != candidate))
+		return -1;
+
+	target.Set(wl);
+	return 0;
+}
+
+// Styles the range [startPos, startPos + length) of the document behind pAccess,
+// starting in style initStyle.
+// Each loop iteration has two phases: first the current state is checked for
+// termination (possibly falling back to SCE_HOLLYWOOD_DEFAULT), then, if the state
+// is SCE_HOLLYWOOD_DEFAULT, the current character decides which state starts here.
+void SCI_METHOD LexerHollywood::Lex(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) {
+ LexAccessor styler(pAccess);
+
+ styler.StartAt(startPos);
+ // Toggled by every double quote not preceded by a backslash and reset at each
+ // line start; used below to ignore "*/" and "]]" that appear between quotes.
+ bool inString = false;
+
+ StyleContext sc(startPos, length, initStyle, styler);
+
+ // Can't use sc.More() here else we miss the last character
+ for (; ; sc.Forward())
+ {
+ if (sc.atLineStart) inString = false;
+
+ if (sc.ch == '\"' && sc.chPrev != '\\') inString = !inString;
+
+ // Phase 1: decide whether the current state ends at this character.
+ if (sc.state == SCE_HOLLYWOOD_IDENTIFIER) {
+ if (!IsIdentifier(sc.ch)) {
+ char s[100];
+ // Style for a match in word list i; same order as keywordlists.
+ int kstates[4] = {
+ SCE_HOLLYWOOD_KEYWORD,
+ SCE_HOLLYWOOD_STDAPI,
+ SCE_HOLLYWOOD_PLUGINAPI,
+ SCE_HOLLYWOOD_PLUGINMETHOD,
+ };
+ sc.GetCurrentLowered(s, sizeof(s));
+ // No break: when the word is in several lists the last matching list wins.
+ for (int i = 0; i < 4; i++) {
+ if (keywordlists[i].InList(s)) {
+ sc.ChangeState(kstates[i]);
+ }
+ }
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ } else if (sc.state == SCE_HOLLYWOOD_OPERATOR) {
+
+ // always reset to default on operators because otherwise
+ // comments won't be recognized in sequences like "+/* Hello*/"
+ // --> "+/*" would be recognized as a sequence of operators
+
+ // if (!IsOperator(sc.ch)) sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+
+ } else if (sc.state == SCE_HOLLYWOOD_PREPROCESSOR) {
+ if (!IsIdentifier(sc.ch))
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ } else if (sc.state == SCE_HOLLYWOOD_CONSTANT) {
+ if (!IsIdentifier(sc.ch))
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ } else if (sc.state == SCE_HOLLYWOOD_NUMBER) {
+ // A decimal number continues over digits and "." characters.
+ if (!IsDigit(sc.ch) && sc.ch != '.')
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ } else if (sc.state == SCE_HOLLYWOOD_HEXNUMBER) {
+ if (!IsHexDigit(sc.ch))
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ } else if (sc.state == SCE_HOLLYWOOD_STRING) {
+ // A string ends at the next double quote or, failing that, at the line end.
+ if (sc.ch == '"') {
+ sc.ForwardSetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ if (sc.atLineEnd) {
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ } else if (sc.state == SCE_HOLLYWOOD_COMMENT) {
+ // Line comments run to the end of the line.
+ if (sc.atLineEnd) {
+ sc.SetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ } else if (sc.state == SCE_HOLLYWOOD_COMMENTBLOCK) {
+ // "*/" closes the block comment unless it appears between quotes.
+ if (sc.Match("*/") && !inString) {
+ sc.Forward();
+ sc.ForwardSetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ } else if (sc.state == SCE_HOLLYWOOD_STRINGBLOCK) {
+ // "]]" closes the string block unless it appears between quotes.
+ if (sc.Match("]]") && !inString) {
+ sc.Forward();
+ sc.ForwardSetState(SCE_HOLLYWOOD_DEFAULT);
+ }
+ }
+
+ // Phase 2: in the default state, the current character selects the next state.
+ // The order of the tests matters (see the note on "0x" below).
+ if (sc.state == SCE_HOLLYWOOD_DEFAULT) {
+ if (sc.Match(';')) {
+ sc.SetState(SCE_HOLLYWOOD_COMMENT);
+ } else if (sc.Match("/*")) {
+ sc.SetState(SCE_HOLLYWOOD_COMMENTBLOCK);
+ sc.Forward();
+ } else if (sc.Match("[[")) {
+ sc.SetState(SCE_HOLLYWOOD_STRINGBLOCK);
+ sc.Forward();
+ } else if (sc.Match('"')) {
+ sc.SetState(SCE_HOLLYWOOD_STRING);
+ } else if (sc.Match('$')) {
+ sc.SetState(SCE_HOLLYWOOD_HEXNUMBER);
+ } else if (sc.Match("0x") || sc.Match("0X")) { // must be before IsDigit() because of 0x
+ sc.SetState(SCE_HOLLYWOOD_HEXNUMBER);
+ sc.Forward();
+ } else if (sc.ch == '.' && (sc.chNext >= '0' && sc.chNext <= '9')) { // ".1234" style numbers
+ sc.SetState(SCE_HOLLYWOOD_NUMBER);
+ sc.Forward();
+ } else if (IsDigit(sc.ch)) {
+ sc.SetState(SCE_HOLLYWOOD_NUMBER);
+ } else if (sc.Match('#')) {
+ sc.SetState(SCE_HOLLYWOOD_CONSTANT);
+ } else if (sc.Match('@')) {
+ sc.SetState(SCE_HOLLYWOOD_PREPROCESSOR);
+ } else if (IsOperator(sc.ch)) {
+ sc.SetState(SCE_HOLLYWOOD_OPERATOR);
+ } else if (IsIdentifier(sc.ch)) {
+ sc.SetState(SCE_HOLLYWOOD_IDENTIFIER);
+ }
+ }
+
+ // Checked at the end of the body (instead of in the loop header) so that
+ // the final character is still processed above.
+ if (!sc.More())
+ break;
+ }
+ sc.Complete();
+}
+
+// Computes fold levels for the range [startPos, startPos + length).
+// Does nothing unless the "fold" option is enabled.
+// Only the first token of each line is examined: it is lower-cased and passed
+// to CheckFoldPoint, whose result is added to the running fold level. A line
+// that raises the level becomes a fold header; with "fold.compact" enabled,
+// lines without visible characters get SC_FOLDLEVELWHITEFLAG.
+void SCI_METHOD LexerHollywood::Fold(Sci_PositionU startPos, Sci_Position length, int /* initStyle */, IDocument *pAccess) {
+
+	if (!options.fold)
+		return;
+
+	LexAccessor styler(pAccess);
+
+	Sci_PositionU lengthDoc = startPos + length;
+	int visibleChars = 0;
+	Sci_Position lineCurrent = styler.GetLine(startPos);
+	int levelPrev = styler.LevelAt(lineCurrent) & SC_FOLDLEVELNUMBERMASK;
+	int levelCurrent = levelPrev;
+	char chNext = styler[startPos];
+	int styleNext = styler.StyleAt(startPos);
+	int done = 0;       // non-zero once the first token of the line has been handled
+	char word[256];     // first token of the current line, lower-cased
+	int wordlen = 0;
+
+	for (Sci_PositionU i = startPos; i < lengthDoc; i++) {
+		char ch = chNext;
+		chNext = styler.SafeGetCharAt(i + 1);
+		int style = styleNext;
+		styleNext = styler.StyleAt(i + 1);
+		bool atEOL = (ch == '\r' && chNext != '\n') || (ch == '\n');
+
+		// Classify through the unsigned byte value: a plain char holding a
+		// byte >= 0x80 is negative where char is signed, and a negative value
+		// must never reach the table-indexing classification helpers.
+		const int chValue = static_cast<unsigned char>(ch);
+
+		if (!done) {
+			if (wordlen) { // are we scanning a token already?
+				word[wordlen] = static_cast<char>(LowerCase(chValue));
+				if (!IsIdentifier(chValue)) { // done with token
+					word[wordlen] = '\0';
+					levelCurrent += CheckFoldPoint(word);
+					done = 1;
+				} else if (wordlen < 255) {
+					// Longer tokens are truncated; the last slot stays free for the terminator.
+					wordlen++;
+				}
+			} else { // start scanning at first non-whitespace character
+				if (!IsSpace(chValue)) {
+					// Text inside block comments and [[ ]] string blocks is not code,
+					// so a keyword at the start of such a line must not change the fold level.
+					if (style != SCE_HOLLYWOOD_COMMENTBLOCK && style != SCE_HOLLYWOOD_STRINGBLOCK && IsIdentifier(chValue)) {
+						word[0] = static_cast<char>(LowerCase(chValue));
+						wordlen = 1;
+					} else // done with this line
+						done = 1;
+				}
+			}
+		}
+
+		if (atEOL) {
+			int lev = levelPrev;
+			if (visibleChars == 0 && options.foldCompact) {
+				lev |= SC_FOLDLEVELWHITEFLAG;
+			}
+			if ((levelCurrent > levelPrev) && (visibleChars > 0)) {
+				lev |= SC_FOLDLEVELHEADERFLAG;
+			}
+			if (lev != styler.LevelAt(lineCurrent)) {
+				styler.SetLevel(lineCurrent, lev);
+			}
+			// Reset the per-line state for the next line.
+			lineCurrent++;
+			levelPrev = levelCurrent;
+			visibleChars = 0;
+			done = 0;
+			wordlen = 0;
+		}
+		if (!IsSpace(chValue)) {
+			visibleChars++;
+		}
+	}
+	// Fill in the real level of the next line, keeping the current flags as they will be filled in later
+
+	int flagsNext = styler.LevelAt(lineCurrent) & ~SC_FOLDLEVELNUMBERMASK;
+	styler.SetLevel(lineCurrent, levelPrev | flagsNext);
+}
+
+// Lexer module object for Hollywood: ties the SCLEX_HOLLYWOOD identifier and the
+// language name "hollywood" to the lexer factory and the word list descriptions.
+LexerModule lmHollywood(SCLEX_HOLLYWOOD, LexerHollywood::LexerFactoryHollywood, "hollywood", hollywoodWordListDesc);