aboutsummaryrefslogtreecommitdiffhomepage
path: root/lexlua/elixir.lua
blob: 6dc0bfff4c61fa36b489d005a28b298138264e0b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
-- Copyright 2015-2020 Mitchell mitchell.att.foicica.com. See License.txt.
-- Contributed by Richard Philips.
-- Elixir LPeg lexer.

local lexer = require('lexer')
local token, word_match = lexer.token, lexer.word_match
local B, P, S, R = lpeg.B, lpeg.P, lpeg.S, lpeg.R

local lex = lexer.new('elixir', {fold_by_indentation = true})

-- Whitespace.
lex:add_rule('whitespace', token(lexer.WHITESPACE, lexer.space^1))

-- Sigils.
local sigil11 = P("~") * S("CRSW") * lexer.range('<', '>', false)
local sigil12 = P("~") * S("CRSW") * lexer.range('{', '}', false)
local sigil13 = P("~") * S("CRSW") * lexer.range('[', ']', false)
local sigil14 = P("~") * S("CRSW") * lexer.range('(', ')', false)
local sigil15 = P("~") * S("CRSW") * lexer.range('|', false, false)
local sigil16 = P("~") * S("CRSW") * lexer.range('/', false, false)
local sigil17 = P("~") * S("CRSW") * lexer.range('"', false, false)
local sigil18 = P("~") * S("CRSW") * lexer.range("'", false, false)
local sigil19 = P("~") * S("CRSW") * lexer.range('"""')
local sigil10 = P("~") * S("CRSW") * lexer.range("'''")
local sigil21 = P("~") * S("crsw") * lexer.range('<', '>', false, true)
local sigil22 = P("~") * S("crsw") * lexer.range('{', '}', false, true)
local sigil23 = P("~") * S("crsw") * lexer.range('[', ']', false, true)
local sigil24 = P("~") * S("crsw") * lexer.range('(', ')', false, true)
local sigil25 = P("~") * S("crsw") * lexer.range('|', false)
local sigil26 = P("~") * S("crsw") * lexer.range('/', false)
local sigil27 = P("~") * S("crsw") * lexer.range('"', false)
local sigil28 = P("~") * S("crsw") * lexer.range("'", false)
local sigil29 = P("~") * S("crsw") * lexer.range('"""')
local sigil20 = P("~") * S("crsw") * lexer.range("'''")
local sigil_token = token(lexer.REGEX, sigil10 + sigil19 + sigil11 + sigil12 +
  sigil13 + sigil14 + sigil15 + sigil16 + sigil17 + sigil18 + sigil20 +
  sigil29 + sigil21 + sigil22 + sigil23 + sigil24 + sigil25 + sigil26 +
  sigil27 + sigil28)
local sigiladdon_token = token(lexer.EMBEDDED, R('az', 'AZ')^0)
lex:add_rule('sigil', sigil_token * sigiladdon_token)

-- Atoms.
local atom1 = B(1 - P(':')) * P(':') * lexer.range('"', false)
local atom2 = B(1 - P(':')) * P(':') * R('az', 'AZ') *
  R('az', 'AZ', '__', '@@', '09')^0 * S('?!')^-1
local atom3 = B(1 - R('az', 'AZ', '__', '09', '::')) *
  R('AZ') * R('az', 'AZ', '__', '@@', '09')^0 * S('?!')^-1
lex:add_rule('atom', token(lexer.CONSTANT, atom1 + atom2 + atom3))

-- Strings.
local dq_str = lexer.range('"')
local triple_dq_str = lexer.range('"""')
lex:add_rule('string', token(lexer.STRING, triple_dq_str + dq_str))

-- Comments.
lex:add_rule('comment', token(lexer.COMMENT, lexer.to_eol('#', true)))

-- Attributes.
lex:add_rule('attribute', token(lexer.LABEL, B(1 - R('az', 'AZ', '__')) *
  P('@') * R('az','AZ') * R('az','AZ','09','__')^0))

-- Booleans.
lex:add_rule('boolean', token(lexer.NUMBER, P(':')^-1 *
  word_match[[true false nil]]))

-- Functions.
lex:add_rule('function', token(lexer.FUNCTION, word_match[[
  defstruct defrecordp defrecord defprotocol defp defoverridable defmodule
  defmacrop defmacro defimpl defexception defdelegate defcallback def
]]))

-- Keywords.
lex:add_rule('keyword', token(lexer.KEYWORD, word_match[[
  is_atom is_binary is_bitstring is_boolean is_float is_function is_integer
  is_list is_map is_number is_pid is_port is_record is_reference is_tuple
  is_exception case when cond for if unless try receive send exit raise throw
  after rescue catch else do end quote unquote super import require alias use
  self with fn
]]))

-- Operators
local operator1 = word_match[[and or not when xor in]]
local operator2 = P('!==') + '!=' + '!' + '=~' + '===' + '==' + '=' + '<<<' +
  '<<' + '<=' + '<-' + '<' + '>>>' + '>>' + '>=' + '>' + '->' + '--' + '-' +
  '++' + '+' + '&&&' + '&&' + '&' + '|||' + '||' + '|>' + '|' + '..' + '.' +
  '^^^' + '^' + '\\\\' + '::' + '*' + '/' + '~~~' + '@'
lex:add_rule('operator', token(lexer.OPERATOR, operator1 + operator2))

-- Identifiers
lex:add_rule('identifier', token(lexer.IDENTIFIER, R('az', '__') *
  R('az', 'AZ', '__', '09')^0 * S('?!')^-1))

-- Numbers
local dec = lexer.digit * (lexer.digit + P("_"))^0
local bin = '0b' * S('01')^1
local oct = '0o' * R('07')^1
local integer = bin + lexer.hex_num + oct + dec
local float = lexer.digit^1 * P(".") * lexer.digit^1 * S("eE") *
  (S('+-')^-1 * lexer.digit^1)^-1
lex:add_rule('number', B(1 - R('az', 'AZ', '__')) * S('+-')^-1 *
  token(lexer.NUMBER, float + integer))

return lex