moonscript/moonscript/parse.lua
2011-05-20 01:08:36 -07:00

219 lines
4.1 KiB
Lua

module("moonscript.parse", package.seeall)
require"util"
require"lpeg"
local compile = require"moonscript.compile"
local dump = require"moonscript.dump"
local data = require"moonscript.data"
local Stack = data.Stack
local function count_indent(str)
local sum = 0
for v in str:gmatch("[\t ]") do
if v == ' ' then sum = sum + 1 end
if v == '\t' then sum = sum + 4 end
end
return sum
end
local R, S, V, P = lpeg.R, lpeg.S, lpeg.V, lpeg.P
local C, Ct, Cmt = lpeg.C, lpeg.Ct, lpeg.Cmt
local White = S" \t\n"^0
local Space = S" \t"^0
local Break = S"\n"
local Stop = Break + -1
local Indent = C(S"\t "^0) / count_indent
local Name = C(R("az", "AZ", "__") * R("az", "AZ", "__")^0) * Space
local Num = C(R("09")^1) / tonumber * Space
local FactorOp = lpeg.C(S"+-") * Space
local TermOp = lpeg.C(S"*/%") * Space
local function wrap(fn)
local env = getfenv(fi)
return setfenv(fn, setmetatable({}, {
__index = function(self, name)
local value = env[name]
if value ~= nil then return value end
if name:match"^[A-Z][A-Za-z0-9]*$" then
local v = V(name)
rawset(self, name, v)
return v
end
error("unknown variable referenced: "..name)
end
}))
end
local function mark(name)
return function(...)
return name, ...
end
end
local function got(what)
return Cmt("", function(...)
print("++ got "..what)
return true
end)
end
local function flatten(tbl)
if #tbl == 1 then
return tbl[1]
end
return tbl
end
local build_grammar = wrap(function()
local err_msg = "Failed to compile, line:\n [%d] >> %s (%d)"
local line = 1
local function line_count(subject, pos, str)
for _ in str:gmatch("\n") do
line = line + 1
end
-- print(line, util.dump(str))
return true
end
local Space = Cmt(Space, line_count)
local Break = Cmt(Break, line_count)
local _indent = Stack(0) -- current indent
local function check_indent(str, pos, indent)
return _indent:top() == indent
end
local function advance_indent(str, pos, indent)
if indent > _indent:top() then
_indent:push(indent)
return true
end
end
local function pop_indent(str, pos)
if not _indent:pop() then error("unexpected outdent") end
return true
end
local keywords = {}
local function key(word)
keywords[word] = true
return word * Space
end
local function sym(chars)
return chars * Space
end
-- make sure name is not a keyword
local Name = Cmt(Name, function(str, pos, name)
if keywords[name] then return false end
return true, name
end)
local g = lpeg.P{
File,
File = Block^-1,
Block = Ct(Line * (Break^0 * Line)^0),
Line = Cmt(Indent, check_indent) * (Ct(If) + Exp),
Body = Break * InBlock + Ct(Line),
InBlock = #Cmt(Indent, advance_indent) * Block * OutBlock,
OutBlock = Cmt(P(""), pop_indent),
FunCall = Name * Ct(ExpList) / mark"fncall",
If = key"if" * Exp * Body / mark"if",
Assign = Ct(NameList) * sym"=" * Ct(ExpList) / mark"assign",
Exp = Ct(Value * (FactorOp * Value)^0) / flatten,
Value = Assign + FunLit + FunCall + Num + Name + TableLit,
TableLit = sym"{" * Ct(ExpList^-1) * sym"}" / mark"list",
FunLit = (sym"(" * Ct(NameList^-1) * sym")")^-1 * sym"->" * Body / mark"fndef",
NameList = Name * (sym"," * Name)^0,
ExpList = Exp * (sym"," * Exp)^0
}
return {
_g = White * g * White * -1,
match = function(self, str, ...)
local function get_line(num)
for line in str:gmatch("(.-)[\n$]") do
if num == 1 then return line end
num = num - 1
end
end
local tree = self._g:match(str, ...)
if not tree then
local line_str = get_line(line) or ""
return nil, err_msg:format(line, line_str, _indent:top())
end
return tree
end
}
end)
local grammar = build_grammar()
-- parse a string
-- returns tree, or nil and error message
function string(str)
local g = build_grammar()
return grammar:match(str)
end
local program = [[
if two_dads
do something
if yum
heckyes 23
print 2
print dadas
{1,2,3,4}
(a,b) ->
throw nuts
print 100
]]
local program = [[
hi = (a) -> print a
if true
hi 100
]]
local program3 = [[
-- hello
class Hello
@something = 2323
hello: () ->
print 200
]]