From a834016170048cf746dcbbbe5755d4ca989c03c0 Mon Sep 17 00:00:00 2001 From: "David B. Lamkins" Date: Sat, 28 May 2016 13:59:55 +0200 Subject: lexer: add lexer for Google protocol buffer IDL Close #326 --- lexers/protobuf.lua | 57 +++++++++++++++++++++++++++++++++++++++++++++++++++++ vis.lua | 1 + 2 files changed, 58 insertions(+) create mode 100644 lexers/protobuf.lua diff --git a/lexers/protobuf.lua b/lexers/protobuf.lua new file mode 100644 index 0000000..fdf0a73 --- /dev/null +++ b/lexers/protobuf.lua @@ -0,0 +1,57 @@ +-- Copyright 2016 David B. Lamkins +-- Protocol Buffer IDL + +local l = require('lexer') +local token, word_match = l.token, l.word_match +local P, R, S = lpeg.P, lpeg.R, lpeg.S + +local M = {_NAME = 'protobuf'} + +-- Whitespace. +local ws = token(l.WHITESPACE, l.space^1) + +-- Comments. +local line_comment = '//' * l.nonnewline_esc^0 +local block_comment = '/*' * (l.any - '*/')^0 * P('*/')^-1 +local comment = token(l.COMMENT, line_comment + block_comment) + +-- Strings. +local sq_str = P('L')^-1 * l.delimited_range("'", true) +local dq_str = P('L')^-1 * l.delimited_range('"', true) +local string = token(l.STRING, sq_str + dq_str) + +-- Numbers. +local number = token(l.NUMBER, l.float + l.integer) + +-- Keywords. +local keyword = token(l.KEYWORD, word_match{ + 'contained', 'syntax', 'import', 'option', 'package', 'message', 'group', + 'oneof', 'optional', 'required', 'repeated', 'default', 'extend', + 'extensions', 'to', 'max', 'reserved', 'service', 'rpc', 'returns' +}) + +-- Types. +local type = token(l.TYPE, word_match{ + 'int32', 'int64', 'uint32', 'uint64', 'sint32', 'sint64', 'fixed32', + 'fixed64', 'sfixed32', 'sfixed64', 'float', 'double', 'bool', 'string', + 'bytes', 'enum', 'true', 'false' +}) + +-- Identifiers. +local identifier = token(l.IDENTIFIER, l.word) + +-- Operators. +local operator = token(l.OPERATOR, S('<>=|;,.()[]{}')) + +M._rules = { + {'whitespace', ws}, + {'keyword', keyword}, + {'type', type}, + {'identifier', identifier}, + {'string', string}, + {'comment', comment}, + {'number', number}, + {'operator', operator}, +} + +return M diff --git a/vis.lua b/vis.lua index ee3ba41..5804c20 100644 --- a/vis.lua +++ b/vis.lua @@ -161,6 +161,7 @@ vis.filetypes = { [".po|.pot"] = "gettext", [".prolog"] = "prolog", [".props|.properties"] = "props", + [".proto"] = "protobuf", [".ps1"] = "powershell", [".pure"] = "pure", [".Rakefile|.rake|.rb|.rbw"] = "ruby", -- cgit v1.2.3