-- PEG grammar for Lua source code, written in `relabel` syntax and compiled
-- with LPegLabel.
--
-- The module returns a function `(lua, mode, parser_)` that matches the text
-- `lua` against the grammar registered under `mode` (falling back to 'Lua')
-- and forwards every semantic action to the callback table `parser_`.
local re = require 'parser.relabel'
local m = require 'lpeglabel'

-- Accumulated grammar text. Every `grammar` call prepends its rules, so a
-- grammar compiled later also contains all rules registered before it.
local scriptBuf = ''
-- Compiled patterns, keyed by the tag passed to `grammar`.
local compiled = {}
-- Callback table of the current parse; set by the exported function.
local parser

-- Lua keywords that `NotReserved` refuses to accept as a name.
local RESERVED = {
    ['and']      = true,
    ['break']    = true,
    ['do']       = true,
    ['else']     = true,
    ['elseif']   = true,
    ['end']      = true,
    ['false']    = true,
    ['for']      = true,
    ['function'] = true,
    ['goto']     = true,
    ['if']       = true,
    ['in']       = true,
    ['local']    = true,
    ['nil']      = true,
    ['not']      = true,
    ['or']       = true,
    ['repeat']   = true,
    ['return']   = true,
    ['then']     = true,
    ['true']     = true,
    ['until']    = true,
    ['while']    = true,
}

-- Definitions table handed to `re.compile`. Any name that is not set
-- explicitly below is created lazily as a wrapper that calls `parser[name]`
-- when that callback exists and otherwise returns nothing. The lookup of
-- `parser` happens at call time, so the same compiled grammar can be reused
-- with a different callback table on every parse.
local defs = setmetatable({}, {__index = function (self, key)
    self[key] = function (...)
        if parser[key] then
            return parser[key](...)
        end
    end
    return self[key]
end})

-- Line break: "\r\n" is tried first so that it counts as a single break.
-- The optional `parser.nl` callback is invoked for each one.
defs.nl = (m.P'\r\n' + m.S'\r\n') / function ()
    if parser.nl then
        return parser.nl()
    end
end
-- Blank character (space or tab) and its negative lookahead.
defs.s  = m.S' \t'
defs.S  = - defs.s
-- Replacement strings for the single-letter escapes used by `EChar`.
defs.ea = '\a'
defs.eb = '\b'
defs.ef = '\f'
defs.en = '\n'
defs.er = '\r'
defs.et = '\t'
defs.ev = '\v'
-- Matches the empty string and produces a single `nil` value.
defs['nil'] = m.Cp() / function ()
    return nil
end
-- Match-time check used by `NameBody`: fails on reserved words, otherwise
-- succeeds and yields the matched text as the capture.
defs.NotReserved = function (_, _, str)
    if RESERVED[str] then
        return false
    end
    return true, str
end
-- Position capture shifted by one.
defs.np = m.Cp() / function (n)
    return n+1
end

-- Succeeds only at end of input; otherwise throws the label SYNTAX_ERROR.
local eof = re.compile '!. / %{SYNTAX_ERROR}'

-- Returns a function that registers a grammar section under `tag`.
-- The section text is prepended to `scriptBuf` and the whole buffer is
-- compiled, followed by the `eof` check, into `compiled[tag]`.
-- NOTE(review): this relies on the first rule of the newest section being
-- the start rule, as in the standard `re` module - confirm for `relabel`.
local function grammar(tag)
    return function (script)
        scriptBuf = script .. '\r\n' .. scriptBuf
        compiled[tag] = re.compile(scriptBuf, defs) * eof
    end
end

-- Builds the error record returned when matching fails.
-- `pos` is used for both `start` and `finish`; `err` is the failure label.
local function errorpos(pos, err)
    return {
        type = 'UNKNOWN',
        start = pos,
        finish = pos,
        err = err,
    }
end

grammar 'Comment' [[
Comment         <-  '--' (LongComment / ShortComment)
LongComment     <-  '[' {:eq: '='* :} '[' CommentClose
CommentClose    <-  ']' =eq ']' / . CommentClose
ShortComment    <-  (!%nl .)*
]]

grammar 'Sp' [[
Sp  <-  (Comment / %nl / %s)*
Sps <-  (Comment / %nl / %s)+
]]

grammar 'Common' [[
Word        <-  [a-zA-Z0-9_]
Cut         <-  !Word
X16         <-  [a-fA-F0-9]
Rest        <-  (!%nl .)*

AND         <-  Sp {'and'}    Cut
BREAK       <-  Sp 'break'    Cut
DO          <-  Sp 'do'       Cut
ELSE        <-  Sp 'else'     Cut
ELSEIF      <-  Sp 'elseif'   Cut
END         <-  Sp 'end'      Cut
FALSE       <-  Sp 'false'    Cut
FOR         <-  Sp 'for'      Cut
FUNCTION    <-  Sp 'function' Cut
GOTO        <-  Sp 'goto'     Cut
IF          <-  Sp 'if'       Cut
IN          <-  Sp 'in'       Cut
LOCAL       <-  Sp 'local'    Cut
NIL         <-  Sp 'nil'      Cut
NOT         <-  Sp 'not'      Cut
OR          <-  Sp {'or'}     Cut
REPEAT      <-  Sp 'repeat'   Cut
RETURN      <-  Sp 'return'   Cut
THEN        <-  Sp 'then'     Cut
TRUE        <-  Sp 'true'     Cut
UNTIL       <-  Sp 'until'    Cut
WHILE       <-  Sp 'while'    Cut

Esc         <-  '\' -> ''
                EChar
EChar       <-  'a' -> ea
            /   'b' -> eb
            /   'f' -> ef
            /   'n' -> en
            /   'r' -> er
            /   't' -> et
            /   'v' -> ev
            /   '\'
            /   '"'
            /   "'"
            /   %nl
            /   ('z' (%nl / %s)*)       -> ''
            /   ('x' {X16 X16})         -> Char16
            /   ([0-9] [0-9]? [0-9]?)   -> Char10
            /   ('u{' {} {Word*} '}')   -> CharUtf8
            -- error handling
            /   'x' {}                  -> MissEscX
            /   'u' !'{' {}             -> MissTL
            /   'u{' Word* !'}' {}      -> MissTR
            /   {}                      -> ErrEsc

Comp        <-  Sp {CompList}
CompList    <-  '<='
            /   '>='
            /   '<'
            /   '>'
            /   '~='
            /   '=='
BOR         <-  Sp {'|'}
BXOR        <-  Sp {'~'}
BAND        <-  Sp {'&'}
Bshift      <-  Sp {BshiftList}
BshiftList  <-  '<<'
            /   '>>'
Concat      <-  Sp {'..'}
Adds        <-  Sp {AddsList}
AddsList    <-  '+'
            /   '-'
Muls        <-  Sp {MulsList}
MulsList    <-  '*'
            /   '//'
            /   '/'
            /   '%'
Unary       <-  Sp {} {UnaryList}
UnaryList   <-  NOT
            /   '#'
            /   '-'
            /   '~'
POWER       <-  Sp {'^'}

PL          <-  Sp '('
PR          <-  Sp ')'
BL          <-  Sp '['
BR          <-  Sp ']'
TL          <-  Sp '{'
TR          <-  Sp '}'
COMMA       <-  Sp ','
SEMICOLON   <-  Sp ';'
DOTS        <-  Sp ({} '...') -> DOTS
DOT         <-  Sp '.' !'.'
COLON       <-  Sp ({} ':' !':') -> COLON
LABEL       <-  Sp '::'
ASSIGN      <-  Sp '='

Nothing     <-  {} -> Nothing

TOCLOSE     <-  Sp '*toclose'

DirtyAssign <-  ASSIGN / {} -> MissAssign
DirtyBR     <-  BR {} / {} -> MissBR
DirtyTR     <-  TR {} / {} -> MissTR
DirtyPR     <-  PR {} / {} -> MissPR
]]

grammar 'Nil' [[
Nil         <-  Sp ({} -> Nil) NIL
]]

grammar 'Boolean' [[
Boolean     <-  Sp ({} -> True)  TRUE
            /   Sp ({} -> False) FALSE
]]

grammar 'String' [[
String      <-  Sp ({} StringDef {})
            ->  String
StringDef   <-  '"'
                {~(Esc / !%nl !'"' .)*~} -> 1
                ('"' / {} -> MissQuote1)
            /   "'"
                {~(Esc / !%nl !"'" .)*~} -> 1
                ("'" / {} -> MissQuote2)
            /   ('[' {} {:eq: '='* :} {} '['
                {(!StringClose .)*} -> 1
                (StringClose / {}))
            ->  LongString
StringClose <-  ']' =eq ']'
]]

-- Numerals. Decimal integer parts and exponents accept any run of digits,
-- including leading zeros, so that valid Lua numerals such as `007`, `0.`,
-- `1e0`, `1e-05` and `0x1p0` are consumed whole instead of being split into
-- a number followed by an UnknownSymbol / MissExponent report.
grammar 'Number' [[
Number      <-  Sp ({} {NumberDef} {}) -> Number
                ErrNumber?
NumberDef   <-  Number16 / Number10
ErrNumber   <-  ({} {([0-9a-zA-Z] / '.')+})
            ->  UnknownSymbol

Number10    <-  Float10 Float10Exp?
            /   Integer10 Float10? Float10Exp?
Integer10   <-  [0-9]+ '.'? [0-9]*
Float10     <-  '.' [0-9]+
Float10Exp  <-  [eE] [+-]? [0-9]+
            /   ({} [eE] [+-]? {}) -> MissExponent

Number16    <-  '0' [xX] Float16 Float16Exp?
            /   '0' [xX] Integer16 Float16? Float16Exp?
Integer16   <-  X16+ '.'? X16*
            /   ({} {Word*}) -> MustX16
Float16     <-  '.' X16+
            /   '.' ({} {Word*}) -> MustX16
Float16Exp  <-  [pP] [+-]? [0-9]+
            /   ({} [pP] [+-]? {}) -> MissExponent
]]

grammar 'Name' [[
Name        <-  Sp ({} NameBody {})
            ->  Name
NameBody    <-  ([a-zA-Z_] [a-zA-Z0-9_]*)
            =>  NotReserved
MustName    <-  Name / DirtyName
DirtyName   <-  {} -> DirtyName
]]

grammar 'Exp' [[
Exp         <-  Sp ExpOr
ExpOr       <-  (ExpAnd     (OR     ExpAnd)*)     -> Binary
ExpAnd      <-  (ExpCompare (AND    ExpCompare)*) -> Binary
ExpCompare  <-  (ExpBor     (Comp   ExpBor)*)     -> Binary
ExpBor      <-  (ExpBxor    (BOR    ExpBxor)*)    -> Binary
ExpBxor     <-  (ExpBand    (BXOR   ExpBand)*)    -> Binary
ExpBand     <-  (ExpBshift  (BAND   ExpBshift)*)  -> Binary
ExpBshift   <-  (ExpConcat  (Bshift ExpConcat)*)  -> Binary
ExpConcat   <-  (ExpAdds    (Concat ExpConcat)*)  -> Binary
ExpAdds     <-  (ExpMuls    (Adds   ExpMuls)*)    -> Binary
ExpMuls     <-  (ExpUnary   (Muls   ExpUnary)*)   -> Binary
ExpUnary    <-  (           (Unary+ (ExpPower / DirtyName))) -> Unary
            /   ExpPower
ExpPower    <-  (ExpUnit    (POWER  ExpUnary)*)   -> Binary
ExpUnit     <-  Nil
            /   Boolean
            /   String
            /   Number
            /   DOTS
            /   Table
            /   Function
            /   Simple

Simple      <-  (Prefix (Suffix)*)
            ->  Simple
Prefix      <-  PL Exp PR
            /   Name
Suffix      <-  DOT MustName
            /   COLON MustName
            /   Sp ({} Table {}) -> Call
            /   Sp ({} String {}) -> Call
            /   Sp ({} BL DirtyExp (BR / Sp) {}) -> Index
            /   Sp ({} PL CallArgList DirtyPR) -> Call

DirtyExp    <-  Exp / {} -> DirtyExp
ExpList     <-  (COMMA Exp)+
            ->  List
            /   (Exp (COMMA Exp)*)
            ->  List
CallArgList <-  Sp ({} (COMMA {} / Exp / DirtyCallArg)+ {})
            ->  CallArgList
            /   %nil
DirtyCallArg<-  Sp ({} {(!PR !PL !COMMA !Word .)+})
            ->  UnknownSymbol
NameList    <-  (COMMA MustName)+
            ->  List
            /   (Name (COMMA MustName)*)
            ->  List
            /   DirtyName
            ->  List
ArgList     <-  (COMMA AfterArg)+
            ->  List
            /   (FirstArg (COMMA AfterArg)*)?
            ->  List
FirstArg    <-  DOTS
            /   Name
AfterArg    <-  DOTS
            /   MustName

Table       <-  Sp ({} TL TableFields? DirtyTR)
            ->  Table
TableFields <-  (TableSep {} / TableField / DirtyField)+
DirtyField  <-  Sp ({} {(!TR !BL !COMMA !SEMICOLON !Word .)+})
            ->  UnknownSymbol
TableSep    <-  COMMA / SEMICOLON
TableField  <-  NewIndex / NewField / Exp
NewIndex    <-  Sp ({} BL DirtyExp DirtyBR DirtyAssign DirtyExp)
            ->  NewIndex
NewField    <-  (MustName ASSIGN DirtyExp)
            ->  NewField

Function    <-  Sp ({} FunctionBody {})
            ->  Function
FunctionBody<-  FUNCTION FuncName PL ArgList PR
                    (!END Action)*
                END?
            /   FUNCTION FuncName PL ArgList PR?
                    (!END Action)*
                END?
            /   FUNCTION FuncName Nothing
                    (!END Action)*
                END?
FuncName    <-  (Name? (FuncSuffix)*)
            ->  Simple
FuncSuffix  <-  DOT MustName
            /   COLON MustName

-- Pure placeholders; `relabel.lua` was modified so that duplicate definitions do not raise an error
Action      <-  !END .
Set         <-  END
]]

grammar 'Action' [[
Action      <-  Sp (CrtAction / UnkAction)
CrtAction   <-  SEMICOLON
            /   Do
            /   Break
            /   Return
            /   Label
            /   GoTo
            /   If
            /   For
            /   While
            /   Repeat
            /   Function
            /   LocalFunction
            /   Local
            /   Set
            /   Call
            /   Exp
UnkAction   <-  ({} {. (!Sps !CrtAction .)*})
            ->  UnknownSymbol

SimpleList  <-  (Simple (COMMA Simple)*)
            ->  List

Do          <-  Sp ({} DO DoBody END? {})
            ->  Do
DoBody      <-  (!END Action)*
            ->  DoBody

Break       <-  BREAK
            ->  Break

Return      <-  RETURN ExpList?
            ->  Return

Label       <-  LABEL MustName -> Label LABEL

GoTo        <-  GOTO MustName -> GoTo

If          <-  Sp ({} IfBody {})
            ->  If
IfHead      <-  (IfPart     -> IfBlock)
            /   (ElseIfPart -> ElseIfBlock)
            /   (ElsePart   -> ElseBlock)
IfBody      <-  IfHead
                (ElseIfPart -> ElseIfBlock)*
                (ElsePart   -> ElseBlock)?
                END?
IfPart      <-  IF Exp THEN
                    {} (!ELSEIF !ELSE !END Action)* {}
            /   IF DirtyExp THEN
                    {} (!ELSEIF !ELSE !END Action)* {}
            /   IF DirtyExp
                    {} {}
ElseIfPart  <-  ELSEIF Exp THEN
                    {} (!ELSE !ELSEIF !END Action)* {}
            /   ELSEIF DirtyExp THEN
                    {} (!ELSE !ELSEIF !END Action)* {}
            /   ELSEIF DirtyExp
                    {} {}
ElsePart    <-  ELSE
                    {} (!END Action)* {}

For         <-  Loop / In
            /   FOR

Loop        <-  Sp ({} LoopBody {})
            ->  Loop
LoopBody    <-  FOR LoopStart LoopFinish LoopStep
                DO?
                    (!END Action)*
                END?
LoopStart   <-  MustName ASSIGN DirtyExp
LoopFinish  <-  COMMA? Exp
            /   COMMA? DirtyName
LoopStep    <-  COMMA  DirtyExp
            /   COMMA? Exp
            /   Nothing

In          <-  Sp ({} InBody {})
            ->  In
InBody      <-  FOR NameList IN? ExpList
                DO?
                    (!END Action)*
                END?

While       <-  Sp ({} WhileBody {})
            ->  While
WhileBody   <-  WHILE Exp DO
                    (!END Action)*
                END?

Repeat      <-  Sp ({} RepeatBody {})
            ->  Repeat
RepeatBody  <-  REPEAT
                    (!UNTIL Action)*
                UNTIL Exp

Local       <-  (LOCAL TOCLOSE? NameList (ASSIGN ExpList)?)
            ->  Local
Set         <-  (SimpleList ASSIGN ExpList?)
            ->  Set

Call        <-  Simple

LocalFunction <-  Sp ({} LOCAL FunctionBody {})
            ->  LocalFunction
]]

grammar 'Lua' [[
Lua         <-  Head? Action* -> Lua Sp
Head        <-  '#' (!%nl .)*
]]

--- Parses `lua` with the grammar registered under `mode`.
-- @param lua      source text to match
-- @param mode     grammar tag (e.g. 'Lua', 'Exp', 'Number'); unknown or
--                 missing tags fall back to 'Lua'
-- @param parser_  optional table of callbacks invoked by the grammar's
--                 semantic actions; defaults to an empty table
-- @return the first value produced by the match on success, or
--         `nil, errinfo` on failure, where `errinfo` is the table built by
--         `errorpos` (failure label in `err`, position in `start`/`finish`)
return function (lua, mode, parser_)
    parser = parser_ or {}
    local gram = compiled[mode] or compiled['Lua']
    -- On failure LPegLabel returns nil, the failure label and the error
    -- position; keep the label so that it reaches the caller.
    local r, label, pos = gram:match(lua)
    if not r then
        return nil, errorpos(pos, label)
    end
    return r
end