-- Copyright 2006-2017 Mitchell mitchell.att.foicica.com. See LICENSE.
-- IDL LPeg lexer.
local l = require('lexer')
local token, word_match = l.token, l.word_match
local P, R, S = lpeg.P, lpeg.R, lpeg.S
-- Module table for this lexer; its `_NAME` field carries the name 'idl'.
local M = {}
M._NAME = 'idl'
-- Whitespace.
-- A run of one or more consecutive `l.space` matches becomes one token.
local space_run = l.space^1
local ws = token(l.WHITESPACE, space_run)
-- Comments.
-- Line form: '//' followed by any number of `l.nonnewline_esc` matches.
-- Block form: '/*', then `l.any` matches up to (not including) the first
-- '*/', then the closer itself. The closer is optional (`^-1`), so a block
-- comment that is never terminated is still matched as a comment.
local comment
do
  local to_line_end = P('//') * l.nonnewline_esc^0
  local not_closer = l.any - P('*/')
  local delimited = P('/*') * not_closer^0 * P('*/')^-1
  comment = token(l.COMMENT, to_line_end + delimited)
end
-- Strings.
-- Either a single-quoted or a double-quoted range, both built with
-- `l.delimited_range(delimiter, true)`.
-- NOTE(review): the `true` flag presumably restricts the range to a single
-- line -- confirm against lexer.lua.
-- NOTE: the local `string` shadows Lua's built-in `string` library for the
-- remainder of this file.
local string
do
  local single_quoted = l.delimited_range("'", true)
  local double_quoted = l.delimited_range('"', true)
  string = token(l.STRING, single_quoted + double_quoted)
end
-- Numbers.
-- Ordered choice: `l.float` is tried first, then `l.integer`.
local numeric = l.float + l.integer
local number = token(l.NUMBER, numeric)
-- Preprocessor.
-- A directive is a '#' accepted by `l.starts_line`, optional spaces/tabs, a
-- directive name, and then the rest of the line (`l.nonnewline^0`).
-- Blanks between '#' and the name are allowed (e.g. `#  include`), and the
-- standard `error` and `line` directives are recognized alongside the others.
local preproc_word = word_match{
  'define', 'undef', 'ifdef', 'ifndef', 'if', 'elif', 'else', 'endif',
  'include', 'warning', 'pragma', 'error', 'line'
}
local preproc = token(l.PREPROCESSOR,
                      l.starts_line('#') * S('\t ')^0 * preproc_word *
                      l.nonnewline^0)
-- Keywords.
-- Words tagged as `l.KEYWORD`. The list uses 'supports' (as in
-- `valuetype V supports I`); the previously listed 'support' is not an IDL
-- keyword and would have mis-highlighted an ordinary identifier.
local keyword = token(l.KEYWORD, word_match{
  'abstract', 'attribute', 'case', 'const', 'context', 'custom', 'default',
  'exception', 'enum', 'factory', 'FALSE', 'in', 'inout', 'interface', 'local',
  'module', 'native', 'oneway', 'out', 'private', 'public', 'raises',
  'readonly', 'struct', 'supports', 'switch', 'TRUE', 'truncatable', 'typedef',
  'union', 'valuetype'
})
-- Types.
-- Words tagged as `l.TYPE`.
-- NOTE: the local `type` shadows Lua's built-in `type` function for the
-- remainder of this file.
local type_names = {
  'any', 'boolean', 'char', 'double', 'fixed', 'float',
  'long', 'Object', 'octet', 'sequence', 'short', 'string',
  'unsigned', 'ValueBase', 'void', 'wchar', 'wstring',
}
local type = token(l.TYPE, word_match(type_names))
-- Identifiers.
-- An identifier is whatever `l.word` matches.
local word_patt = l.word
local identifier = token(l.IDENTIFIER, word_patt)
-- Operators.
-- Any single character from the set below is one operator token.
local operator_chars = '!<>=+-/*%&|^~.,:;?()[]{}'
local operator = token(l.OPERATOR, S(operator_chars))
-- Rule table: each entry pairs a rule name with the token pattern built above.
-- NOTE(review): the lexer framework presumably tries the rules in the order
-- listed (so 'keyword' and 'type' win over 'identifier') -- confirm against
-- lexer.lua before reordering.
M._rules = {
  {'whitespace', ws},
  {'keyword', keyword},
  {'type', type},
  {'identifier', identifier},
  {'string', string},
  {'comment', comment},
  {'number', number},
  {'preprocessor', preproc},
  {'operator', operator},
}

-- `return` must be the final statement of the chunk; nothing may follow it.
return M