aboutsummaryrefslogtreecommitdiffhomepage
path: root/lexlua/mediawiki.lua
blob: f3d7efff70a24e80bea1bdbecaea251a02452883 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
-- Copyright 2006-2019 Mitchell mitchell.att.foicica.com. See License.txt.
-- MediaWiki LPeg lexer.
-- Contributed by Alexander Misel.

local lexer = require('lexer')
local token, word_match = lexer.token, lexer.word_match
local P, R, S, B = lpeg.P, lpeg.R, lpeg.S, lpeg.B

local lex = lexer.new('mediawiki')

-- Comments.
lex:add_rule('comment', token(lexer.COMMENT, '<!--' * (lexer.any - '-->')^0 *
                                             P('-->')^-1))

-- HTML-like tags
local tag_start = token('tag_start', '<' * P('/')^-1 * lexer.alnum^1 *
                                     lexer.space^0)
local tag_attr = token('tag_attr', lexer.alpha^1 * lexer.space^0 *
                                   ('=' * lexer.space^0 *
                                    ('"' * ((lexer.any - S('>"\\')) +
                                     ('\\' * lexer.any))^0 * '"' +
                                     (lexer.any - lexer.space - '>')^0)^-1)^0 *
                                   lexer.space^0)
local tag_end = token('tag_end', P('/')^-1 * '>')
lex:add_rule('tag', tag_start * tag_attr^0 * tag_end)
lex:add_style('tag_start', lexer.STYLE_KEYWORD)
lex:add_style('tag_attr', lexer.STYLE_TYPE)
lex:add_style('tag_end', lexer.STYLE_KEYWORD)

-- Link
lex:add_rule('link', token(lexer.STRING, S('[]')))
lex:add_rule('internal_link', B('[[') *
                              token('link_article', (lexer.any - '|' - ']]')^1))
lex:add_style('link_article', lexer.STYLE_STRING..',underlined')

-- Templates and parser functions.
lex:add_rule('template', token(lexer.OPERATOR, S('{}')))
lex:add_rule('parser_func', B('{{') *
                            token('parser_func', P('#') * lexer.alpha^1 +
                                                 lexer.upper^1 * ':'))
lex:add_rule('template_name', B('{{') *
                              token('template_name', (lexer.any - S('{}|'))^1))
lex:add_style('parser_func', lexer.STYLE_FUNCTION)
lex:add_style('template_name', lexer.STYLE_OPERATOR..',underlined')

-- Operators.
lex:add_rule('operator', token(lexer.OPERATOR, S('-=|#~!')))

-- Behavior switches
local start_pat = P(function(_, pos) return pos == 1 end)
lex:add_rule('behavior_switch', (B(lexer.space) + start_pat) *
                                token('behavior_switch',
                                      '__' * (P('TOC') + 'FORCETOC' + 'NOTOC' +
                                              'NOEDITSECTION' + 'NOCC' +
                                              'NOINDEX') * '__') * #lexer.space)
lex:add_style('behavior_switch', lexer.STYLE_KEYWORD)

return lex