v4k-git-backup/tools/luajit_lcpp.lua

1961 lines
65 KiB
Lua

----------------------------------------------------------------------------
--## lcpp - a C-PreProcessor for Lua 5.1 and LuaJIT ffi integration
--
-- Copyright (C) 2012-2014 Michael Schmoock <michael@schmoock.net>
--
--### Links
-- * GitHub page: [http://github.com/willsteel/lcpp](http://github.com/willsteel/lcpp)
-- * Project page: [http://lcpp.schmoock.net](http://lcpp.schmoock.net)
-- * Lua: [http://www.lua.org](http://www.lua.org)
-- * LuaJIT: [http://luajit.org](http://luajit.org)
-- * Sponsored by: [http://mmbbq.org](http://mmbbq.org)
--
-- It can be used to pre-process LuaJIT ffi C header file input.
-- It can also be used to preprocess any other code (i.e. Lua itself)
--
-- git clone https://github.com/willsteel/lcpp.git
----------------------------------------------------------------------------
--## USAGE
-- -- load lcpp
-- local lcpp = require("lcpp")
--
-- -- use LuaJIT ffi and lcpp to parse cpp code
-- local ffi = require("ffi")
-- ffi.cdef("#include <your_header.h>")
--
-- -- use lcpp manually but add some predefines
-- local lcpp = require("lcpp");
-- local out = lcpp.compileFile("your_header.h", {UNICODE=1});
-- print(out);
--
-- -- compile some input manually
-- local out = lcpp.compile([[
-- #include "myheader.h"
-- #define MAXPATH 260
-- typedef struct somestruct_t {
-- void* base;
-- size_t size;
-- wchar_t path[MAXPATH];
-- } t_exe;
-- ]])
-- -- the result should be like this
-- out == [[
-- // <preprocessed content of file "myheader.h">
-- typedef struct somestruct_t {
-- void* base;
-- size_t size;
-- wchar_t path[260];
-- } t_exe;
-- ]]
--
-- -- access lcpp defines dynamically (i.e. if used with ffi)
-- local ffi = require("ffi")
-- local lcpp = require("lcpp")
-- ffi.cdef("#include <your_header.h>")
-- =ffi.lcpp_defs.YOUR_DEFINE
--
--
--## This CPPs BNF:
-- RULES:
-- CODE := {LINE}
-- LINE := {STUFF NEWML} STUFF NEWL
-- STUFF := DIRECTIVE | IGNORED_CONTENT
-- DIRECTIVE := OPTSPACES CMD OPTSPACES DIRECTIVE_NAME WHITESPACES DIRECTIVE_CONTENT WHITESPACES NEWL
--
-- LEAVES:
-- NEWL := "\n"
-- NEWL_ESC := "\\n"
-- WHITESPACES := "[ \t]+"
-- OPTSPACES := "[ \t]*"
-- COMMENT := "//(.-)$"
-- MLCOMMENT := "/[*](.-)[*]/"
-- IGNORED_CONTENT := "[^#].*"
-- CMD := "#"
-- DIRECTIVE_NAME := "include"|"define"|"undef"|"if"|"else"|"elif"|"else if"|"endif"|"ifdef"|"ifndef"|"pragma"
-- DIRECTIVE_CONTENT := ".*?"
--
--## TODOs:
-- - lcpp.LCPP_LUA for: load, loadfile
--
--## License (MIT)
-- -----------------------------------------------------------------------------
-- Permission is hereby granted, free of charge, to any person obtaining a copy
-- of this software and associated documentation files (the "Software"), to deal
-- in the Software without restriction, including without limitation the rights
-- to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-- copies of the Software, and to permit persons to whom the Software is
-- furnished to do so, subject to the following conditions:
--
-- The above copyright notice and this permission notice shall be included in
-- all copies or substantial portions of the Software.
--
-- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-- IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-- FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-- AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-- LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-- OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-- THE SOFTWARE.
--
-- MIT license: http://www.opensource.org/licenses/mit-license.php
-- -----------------------------------------------------------------------------
--
-- @module lcpp
local lcpp = {}
-- check bit is avail or not
local ok, bit = pcall(require, 'bit')
if not ok then
bit = {
lshift = function (x, y)
if y < 0 then return bit.rshift(x,-y) end
return (x * 2^y) % (2^32)
end,
rshift = function (x, y)
if y < 0 then return bit.lshift(x,-y) end
return math.floor(x % (2^32) / (2^y))
end,
bxor = function (x, y)
-- from http://lua-users.org/wiki/BitUtils
local z = 0
for i = 0, 31 do
if (x % 2 == 0) then -- x had a '0' in bit i
if ( y % 2 == 1) then -- y had a '1' in bit i
y = y - 1
z = z + 2 ^ i -- set bit i of z to '1'
end
else -- x had a '1' in bit i
x = x - 1
if (y % 2 == 0) then -- y had a '0' in bit i
z = z + 2 ^ i -- set bit i of z to '1'
else
y = y - 1
end
end
y = y / 2
x = x / 2
end
return z
end,
bnot = function (x)
-- if word size is not defined, I think it better than 0xFFFFFFFF - x.
return -1 - x
end,
band = function (x, y)
return ((x + y) - bit.bxor(x, y)) / 2
end,
bor = function (x, y)
return bit.bnot(bit.band(bit.bnot(x), bit.bnot(y)))
end,
}
end
-- CONFIG
lcpp.LCPP_LUA = false -- whether to use lcpp to preprocess Lua code (load, loadfile, loadstring...)
lcpp.LCPP_FFI = true -- whether to use lcpp as LuaJIT ffi PreProcessor (if used in luaJIT)
lcpp.LCPP_TEST = false -- whether to run lcpp unit tests when loading lcpp module
lcpp.ENV = {} -- static predefines (env-like)
lcpp.FAST = false -- perf. tweaks when enabled. con: breaks minor stuff like __LINE__ macros
lcpp.DEBUG = false
-- PREDEFINES
local __FILE__ = "__FILE__"
local __LINE__ = "__LINE__"
local __DATE__ = "__DATE__"
local __TIME__ = "__TIME__"
local __LCPP_INDENT__ = "__LCPP_INDENT__"
-- BNF LEAVES
local ENDL = "$"
local STARTL = "^"
local NEWL = "\n"
local NEWL_BYTE = NEWL:byte(1)
local NEWL_ESC = "\\"
local NEWML = "\\\n"
local CMD = "#"
local CMD_BYTE = CMD:byte(1)
local COMMENT = "^(.-)//.-$"
local MLCOMMENT = "/[*].-[*]/"
local WHITESPACES = "%s+"
local OPTSPACES = "%s*"
local IDENTIFIER = "[_%a][_%w]*"
local NOIDENTIFIER = "[^%w_]+"
local FILENAME = "[0-9a-zA-Z.%-_/\\]+"
local TEXT = ".+"
local STRINGIFY = "#"
local STRINGIFY_BYTE = STRINGIFY:byte(1)
local STRING_LITERAL = ".*"
-- BNF WORDS
local _INCLUDE = "include"
local _INCLUDE_NEXT = "include_next"
local _DEFINE = "define"
local _IFDEF = "ifdef"
local _IFNDEF = "ifndef"
local _ENDIF = "endif"
local _UNDEF = "undef"
local _IF = "if"
local _ELSE = "else"
local _ELIF = "elif"
local _NOT = "!"
local _ERROR = "error"
local _WARNING = "warning"
local _PRAGMA = "pragma"
-- BNF RULES
local INCLUDE = STARTL.._INCLUDE..WHITESPACES.."[<]("..FILENAME..")[>]"..OPTSPACES..ENDL
local LOCAL_INCLUDE = STARTL.._INCLUDE..WHITESPACES.."[\"]("..FILENAME..")[\"]"..OPTSPACES..ENDL
local INCLUDE_NEXT = STARTL.._INCLUDE_NEXT..WHITESPACES.."[\"<]("..FILENAME..")[\">]"..OPTSPACES..ENDL
local DEFINE = STARTL.._DEFINE
local IFDEF = STARTL.._IFDEF..WHITESPACES.."("..IDENTIFIER..")"..OPTSPACES..ENDL
local IFNDEF = STARTL.._IFNDEF..WHITESPACES.."("..IDENTIFIER..")"..OPTSPACES..ENDL
local ENDIF = STARTL.._ENDIF..OPTSPACES..ENDL
local UNDEF = STARTL.._UNDEF..WHITESPACES.."("..IDENTIFIER..")"..OPTSPACES..ENDL
local IF = STARTL.._IF..WHITESPACES.."(.*)"..ENDL
local ELSE = STARTL.._ELSE..OPTSPACES..ENDL
local ELIF = STARTL.._ELIF..WHITESPACES.."(.*)"..ENDL
local ELSEIF = STARTL.._ELSE..WHITESPACES.._IF..WHITESPACES.."(.*)"..ENDL
local ERROR = STARTL.._ERROR..WHITESPACES.."("..TEXT..")"..OPTSPACES..ENDL
local WARNING = STARTL.._WARNING..WHITESPACES.."("..TEXT..")"..OPTSPACES..ENDL
local ERROR_NOTEXT = STARTL.._ERROR..OPTSPACES..ENDL --> not required when we have POSIX regex
local PRAGMA = STARTL.._PRAGMA
-- speedups
local TRUEMACRO = STARTL.."("..IDENTIFIER..")%s*$"
local REPLMACRO = STARTL.."("..IDENTIFIER..")"..WHITESPACES.."(.+)$"
local FUNCMACRO = STARTL.."("..IDENTIFIER..")%(([_%s%w,]*)%)%s*(.*)"
-- ------------
-- LOCAL UTILS
-- ------------
lcpp.STATE = {lineno = 0} -- current state for debugging the last operation
local function error(msg) _G.print(debug.traceback()); _G.error(string.format("lcpp ERR [%04i] %s", lcpp.STATE.lineno, msg)) end
local function print(msg) _G.print(string.format("//lcpp INF [%04i] %s", lcpp.STATE.lineno, msg)) end
-- splits a string using a pattern into a table of substrings
local function gsplit(str, pat)
local function _split(str, pat)
local t = {} -- NOTE: use {n = 0} in Lua-5.0
local fpat = "(.-)"..pat
local last_end = 1
local s, e, cap = str:find(fpat, 1)
while s do
if s ~= 1 or cap ~= "" then
coroutine.yield(cap)
end
last_end = e + 1
s, e, cap = str:find(fpat, last_end)
end
if last_end <= #str then
cap = str:sub(last_end)
coroutine.yield(cap)
end
end
return coroutine.wrap(function() _split(str, pat) end)
end
local function split(str, pat)
local t = {}
for str in gsplit(str, pat) do table.insert(t, str) end
return t
end
-- Checks whether a string starts with a given substring
-- offset is optional
local function strsw(str, pat, offset)
if not str then return false end
if not offset then offset = 0 end
return string.sub(str, 1+offset, string.len(pat)+offset) == pat
end
-- Checks whether a string ends with a given substring
local function strew(str, pat)
if not str then return false end
return pat=='' or string.sub(str,-string.len(pat)) == pat
end
-- string trim12 from lua wiki
local function trim(str)
local from = str:match"^%s*()"
return from > #str and "" or str:match(".*%S", from)
end
-- returns the number of string occurrences
local function findn(input, what)
local count = 0
local offset = 0
local _
while true do
_, offset = string.find(input, what, offset+1, true)
if not offset then return count end
count = count + 1
end
end
-- C literal string concatenation
local function concatStringLiteral(input)
-- screener does remove multiline definition, so just check ".*"%s*".*" pattern
return input:gsub("\"("..STRING_LITERAL..")\""..OPTSPACES.."\"("..STRING_LITERAL..")\"", "\"%1%2\"")
end
-- c style boolean check (thus, 0 will be false)
local function CBoolean(value)
return value and (value ~= 0)
end
-- eval with c style number parse (UL, LL, L)
local function CEval(expr)
local ok, r = pcall(loadstring, "return " .. parseCInteger(expr))
if ok and r then
return r()
else
error(r)
end
end
-- a lightweight and flexible tokenizer
local function _tokenizer(str, setup)
local defsetup = {
-- EXAMPLE patterns have to be pretended with "^" for the tokenizer
["identifier"] = '^[_%a][_%w]*',
["number"] = '^[%+%-]?%d+[%.]?%d*[UL]*',
["ignore"] = '^%s+',
["string"] = true,
["keywords"] = {
-- ["NAME"] = '^pattern',
-- ...
},
}
if not setup then
setup = defsetup
end
setup.identifier = setup.identifier or defsetup.identifier
setup.number = setup.number or defsetup.number
setup.ignore = setup.ignore or defsetup.ignore
if nil == setup.string then setup.string = true end
setup.keywords = setup.keywords or {}
local strlen = #str
local i = 1
local i1, i2
local keyword
local function find(pat)
i1, i2 = str:find(pat,i)
return i1 ~= nil
end
local function cut()
return str:sub(i, i2)
end
local findKeyword
if setup.keywords_order then
findKeyword = function ()
for _, name in ipairs(setup.keywords_order) do
assert(setup.keywords[name])
local pat = setup.keywords[name]
local result = find(pat)
if result then
keyword = name
return true
end
end
end
else
findKeyword = function ()
for name, pat in pairs(setup.keywords) do
local result = find(pat)
if result then
keyword = name
return true
end
end
end
end
while true do
if i > strlen then return 'eof', nil, strlen, strlen end
if findKeyword() then
coroutine.yield(keyword, cut(), i1, i2)
elseif find(setup.ignore) then
coroutine.yield("ignore", cut(), i1, i2)
elseif find(setup.number) then
coroutine.yield('number', tonumber(cut()), i1, i2)
elseif find(setup.identifier) then
coroutine.yield('identifier', cut(), i1, i2)
elseif setup.string and (find('^"[^"]*"') or find("^'[^']*'")) then
-- strip the quotes
coroutine.yield('string', cut():sub(2,-2), i1, i2)
else -- any other unknown character
i1 = i
i2 = i
coroutine.yield('unknown', cut(), i1, i2)
end
i = i2+1
end
end
local function tokenizer(str, setup)
return coroutine.wrap(function() _tokenizer(str, setup) end)
end
-- ------------
-- PARSER
-- ------------
local LCPP_TOKENIZE_COMMENT = {
string = false,
keywords = {
MLCOMMENT = "^/%*.-%*/",
SLCOMMENT = "^//.-\n",
STRING_LITERAL = '^"[^"]*"',
},
}
-- hint: LuaJIT ffi does not rely on us to remove the comments, but maybe other usecases
local function removeComments(input)
local out = {}
for k, v, start, end_ in tokenizer(input, LCPP_TOKENIZE_COMMENT) do
if k == "MLCOMMENT" then
local newlineCount = findn(input:sub(start, end_), "\n")
local newlines = string.rep("\n", newlineCount)
table.insert(out, newlines)
elseif k == "SLCOMMENT" then
table.insert(out, "\n")
else
table.insert(out, input:sub(start, end_))
end
end
return table.concat(out)
end
-- C style number parse (UL, LL, L) and (octet, hex, binary)
local LCPP_TOKENIZE_INTEGER = {
string = false,
keywords_order = {
"STRING_LITERAL",
"CHAR_LITERAL",
"HEX_LITERAL",
"BIN_LITERAL",
"OCT_LITERAL",
"FPNUM_LITERAL",
"NUMBER_LITERAL",
},
keywords = {
STRING_LITERAL = '^"[^"]*"',
CHAR_LITERAL = "^L'.*'",
HEX_LITERAL = '^[%+%-]?%s*0x[a-fA-F%d]+[UL]*',
BIN_LITERAL = '^[%+%-]?%s*0b%d+[UL]*',
OCT_LITERAL = '^[%+%-]?%s*0%d+[UL]*',
FPNUM_LITERAL = '^[%+%-]?%s*%d+[%.]?%d*e[%+%-]%d*',
NUMBER_LITERAL = '^[%+%-]?%s*%d+[%.]?%d*[UL]+',
},
}
local function parseCInteger(input)
-- print('parseCInteger:input:' .. input)
local out = {}
local unary
for k, v, start, end_ in tokenizer(input, LCPP_TOKENIZE_INTEGER) do
-- print('parseCInteger:' .. k .. "|" .. v)
if k == "CHAR_LITERAL" then
table.insert(out, tostring(string.byte(loadstring("return \"" .. v:gsub("^L%'(.+)%'", "%1") .. "\"")())))
elseif k == "HEX_LITERAL" then
unary, v = v:match('([%+%-]?)0x([a-fA-F%d]+)[UL]*')
local n = tonumber(v, 16)
table.insert(out, unary..tostring(n))
elseif k == "NUMBER_LITERAL" then
v = v:match('([^UL]+)[UL]+')
table.insert(out, v)
elseif k == "BIN_LITERAL" then
unary, v = v:match('([%+%-]?)0b([01]+)[UL]*')
local n = tonumber(v, 2)
table.insert(out, unary..tostring(n))
elseif k == "OCT_LITERAL" then
unary, v = v:match('([%+%-]?)(0%d+)[UL]*')
local n = tonumber(v, 8)
table.insert(out, unary..tostring(n))
else
table.insert(out, input:sub(start, end_))
end
end
local str = table.concat(out)
-- print('parseCInteger:result:'..str)
return str
end
-- screener: revmoce comments, trim, ml concat...
-- it only splits to cpp input lines and removes comments. it does not tokenize.
local function screener(input)
local function _screener(input)
input = removeComments(input)
-- concat mulit-line input.
local count = 1
while count > 0 do input, count = string.gsub(input, "^(.-)\\\n(.-)$", "%1 %2\n") end
-- trim and join blocks not starting with "#"
local buffer = {}
for line in gsplit(input, NEWL) do
--print('newline:'..line)
line = trim(line)
if #line > 0 then
if line:byte(1) == CMD_BYTE then
line = line:gsub("#%s*(.*)", "#%1") -- remove optinal whitespaces after "#". reduce triming later.
if #buffer > 0 then
coroutine.yield(table.concat(buffer, NEWL))
buffer = {}
end
coroutine.yield(line)
else
if lcpp.FAST then
table.insert(buffer, line)
else
coroutine.yield(line)
end
end
elseif not lcpp.FAST then
coroutine.yield(line)
end
end
if #buffer > 0 then
coroutine.yield(table.concat(buffer, NEWL))
end
end
return coroutine.wrap(function() _screener(input) end)
end
-- apply currently known macros to input (and returns it)
local LCPP_TOKENIZE_APPLY_MACRO = {
keywords = {
DEFINED = "^defined%s*%(%s*"..IDENTIFIER.."%s*%)" ,
},
}
local function apply(state, input)
while true do
local out = {}
local functions = {}
local expand
for k, v, start, end_ in tokenizer(input, LCPP_TOKENIZE_APPLY_MACRO) do
-- print('tokenize:'..tostring(k).."|"..tostring(v))
if k == "identifier" then
local repl = v
local macro = state.defines[v]
if macro then
if type(macro) == "boolean" then
repl = ""
expand = true
elseif type(macro) == "string" then
repl = macro
expand = (repl ~= v)
elseif type(macro) == "number" then
repl = tostring(macro)
expand = (repl ~= v)
elseif type(macro) == "function" then
local decl,cnt = input:sub(start):gsub("^[_%a][_%w]*%s*%b()", "%1")
-- print('matching:'..input.."|"..decl.."|"..cnt)
if cnt > 0 then
repl = macro(decl)
-- print("d&r:"..decl.."|"..repl)
expand = true
table.insert(out, repl)
table.insert(out, input:sub(end_ + #decl))
break
else
if input:sub(start):find("^[_%a][_%w]*%s*%(") then
-- that is part of functional macro declaration.
-- print(v ..': cannot replace:<'..input..'> read more line')
return input,true
else
-- on macro name is also used as the symbol of some C declaration
-- (e.g. /usr/include/spawn.h, /usr/include/sys/select.h on centos 6.4)
-- no need to preprocess.
print(v .. ': macro name but used as C declaration in:' .. input)
end
end
end
end
table.insert(out, repl)
elseif k == "DEFINED" then
table.insert(out, input:sub(start, end_))
else
table.insert(out, input:sub(start, end_))
end
end
input = table.concat(out)
if not expand then
break
end
end
-- C liberal string concatenation, processing U,L,UL,LL
return parseCInteger(concatStringLiteral(input)),false
end
-- processes an input line. called from lcpp doWork loop
local function processLine(state, line)
if not line or #line == 0 then return line end
local cmd = nil
if line:byte(1) == CMD_BYTE then cmd = line:sub(2) end
-- print("process:"..line)--.."|"..tostring(state:skip()))
--[[ IF/THEN/ELSE STRUCTURAL BLOCKS ]]--
if cmd then
local ifdef = cmd:match(IFDEF)
local ifexp = cmd:match(IF)
local ifndef = cmd:match(IFNDEF)
local elif = cmd:match(ELIF)
local elseif_ = cmd:match(ELSEIF)
local else_ = cmd:match(ELSE)
local endif = cmd:match(ENDIF)
local struct = ifdef or ifexp or ifndef or elif or elseif_ or else_ or endif
if struct then
local skip = state:skip()
if ifdef then state:openBlock(state:defined(ifdef)) end
-- if skipped, it may have undefined expression. so not parse them
if ifexp then state:openBlock(skip and true or CBoolean(state:parseExpr(ifexp))) end
if ifndef then state:openBlock(not state:defined(ifndef)) end
if elif then state:elseBlock((skip and skip < #state.stack) and true or CBoolean(state:parseExpr(elif))) end
if elseif_ then state:elseBlock((skip and skip < #state.stack) and true or CBoolean(state:parseExpr(elseif_))) end
if else_ then state:elseBlock(true) end
if endif then state:closeBlock() end
return -- remove structural directives
end
end
--[[ SKIPPING ]]--
if state:skip() then
-- print('skip:' .. line)
return
end
--[[ READ NEW DIRECTIVES ]]--
if cmd then
-- handle #undef ...
local key = cmd:match(UNDEF)
if type(key) == "string" then
state:undefine(key)
return
end
-- read "#define >FooBar...<" directives
if cmd:match(DEFINE) then
local define = trim(cmd:sub(DEFINE:len()+1))
local macroname, replacement
-- simple "true" defines
macroname = define:match(TRUEMACRO)
if macroname then
state:define(macroname, true)
else
-- replace macro defines
macroname, replacement = define:match(REPLMACRO)
if macroname and replacement then
state:define(macroname, replacement)
else
-- read functional macros
macroname, replacement, source = state:parseFunction(define)
if macroname and replacement then
-- add original text for definition to check identify
state:define(macroname, replacement, false, source)
end
end
end
return
end
-- handle #include ...
local filename = cmd:match(INCLUDE)
if filename then
return state:includeFile(filename)
end
local filename = cmd:match(LOCAL_INCLUDE)
if filename then
return state:includeFile(filename, false, true)
end
local filename = cmd:match(INCLUDE_NEXT)
if filename then
--print("include_next:"..filename)
return state:includeFile(filename, true)
end
-- ignore, because we dont have any pragma directives yet
if cmd:match(PRAGMA) then return end
-- handle #error
local errMsg = cmd:match(ERROR)
local errNoTxt = cmd:match(ERROR_NOTEXT)
local warnMsg = cmd:match(WARNING)
if errMsg then error(errMsg) end
if errNoTxt then error("<ERROR MESSAGE NOT SET>") end
if warnMsg then
print(warnMsg)
return
end
-- abort on unknown keywords
error("unknown directive: "..line)
end
if state.incompleteLine then
--print('merge with incompleteLine:'..state.incompleteLine)
line = (state.incompleteLine .. line)
state.incompleteLine = nil
end
--[[ APPLY MACROS ]]--
-- print(line)
local _line,more = state:apply(line);
-- print('endprocess:'.._line)
if more then
state.incompleteLine = line
return ""
else
return _line
end
return line
end
local function doWork(state)
local function _doWork(state)
if not state:defined(__FILE__) then state:define(__FILE__, "<USER_CHUNK>", true) end
local oldIndent = state:getIndent()
while true do
local input = state:getLine()
if not input then break end
local output = processLine(state, input)
if not lcpp.FAST and not output then output = "" end -- output empty skipped lines
if lcpp.DEBUG then output = output.." -- "..input end -- input as comment when DEBUG
if output then coroutine.yield(output) end
end
if (oldIndent ~= state:getIndent()) then error("indentation level must be balanced within a file. was:"..oldIndent.." is:"..state:getIndent()) end
end
return coroutine.wrap(function() _doWork(state) end)
end
local function includeFile(state, filename, next, _local)
local result, result_state = lcpp.compileFile(filename, state.defines, state.macro_sources, next, _local)
-- now, we take the define table of the sub file for further processing
state.defines = result_state.defines
-- and return the compiled result
return result
end
-- sets a global define
local function define(state, key, value, override, macro_source)
--print("define:"..key.." type:"..tostring(value).." value:"..tostring(pval))
if value and not override then
if type(value) == 'function' then
assert(macro_source, "macro source should specify to check identity")
local pval = state.macro_sources[key]
if pval and (pval ~= macro_source) then error("already defined: "..key) end
state.macro_sources[key] = macro_source
else
local pval = state.defines[key]
if pval and (pval ~= value) then error("already defined: "..key) end
end
end
state.defines[key] = state:prepareMacro(value)
end
-- parses CPP exressions
-- i.e.: #if !defined(_UNICODE) && !defined(UNICODE)
--
--BNF:
-- EXPR -> (BRACKET_OPEN)(EXPR)(BRACKET_CLOSE)
-- EXPR -> (EXPR)(OR)(EXPR)
-- EXPR -> (EXPR)(AND)(EXPR)
-- EXPR -> (NOT)(EXPR)
-- EXPR -> (FUNCTION)
-- FUNCTION -> (IDENTIFIER)(BRACKET_OPEN)(ARGS)(BRACKET_CLOSE)
-- ARGS -> ((IDENTIFIER)[(COMMA)(IDENTIFIER)])?
--LEAVES:
-- IGNORE -> " \t"
-- BRACKET_OPEN -> "("
-- BRACKET_CLOSE -> ")"
-- OR -> "||"
-- AND -> "&&"
-- NOT -> "!"
-- IDENTIFIER -> "[0-9a-zA-Z_]"
--
local LCPP_TOKENIZE_MACRO = {
string = true,
keywords_order = {
"CONCAT",
"SPACE",
},
keywords = {
CONCAT = "^%s*##%s*",
SPACE = "^%s",
},
}
local LCPP_TOKENIZE_MACRO_ARGS = {
string = true,
keywords_order = {
"STRING_LITERAL",
"PARENTHESE",
"FUNCTIONAL",
"ARGS",
"SINGLE_CHARACTER_ARGS",
"COMMA",
},
keywords = {
PARENTHESE = "^%s*%b()",
FUNCTIONAL = "^".. IDENTIFIER .. "%s*%b()",
STRING_LITERAL = '^"[^"]*"',
ARGS = "^[^,%s][^,]*[^,%s]",
SINGLE_CHARACTER_ARGS = "^[^,%s]",
COMMA = "^,",
},
}
local LCPP_TOKENIZE_EXPR = {
string = false,
keywords_order = {
"DEFINED",
"FUNCTIONAL_MACRO",
"BROPEN",
"BRCLOSE",
"TENARY_START",
"TENARY_MIDDLE",
-- binary operators
"EQUAL",
"NOT_EQUAL",
"AND",
"OR",
"BAND",
"BOR",
"BXOR",
"PLUS",
"MINUS",
"MULTIPLY",
"DIV",
"MOD",
"LTE",
"MTE",
"LSHIFT",
"RSHIFT",
"LT",
"MT",
-- unary operator
"NOT",
"BNOT",
-- literal
"STRING_LITERAL",
"CHAR_LITERAL",
"HEX_LITERAL",
"FPNUM_LITERAL",
"NUMBER_LITERAL",
},
keywords = {
DEFINED = '^defined',
FUNCTIONAL_MACRO = '^' .. IDENTIFIER .. "%s*%b()",
BROPEN = '^[(]',
BRCLOSE = '^[)]',
TENARY_START = '^%?',
TENARY_MIDDLE = '^%:',
EQUAL = '^==',
NOT_EQUAL = '^!=',
AND = '^&&',
OR = '^||',
BAND = '^&',
BOR = '^|',
BXOR = '^%^',
PLUS = '^%+',
MINUS = '^%-',
MULTIPLY = '^%*',
DIV = '^%/',
MOD = '^%%',
LTE = '^<=',
MTE = '^>=',
LSHIFT = '^<<',
RSHIFT = '^>>',
LT = '^<',
MT = '^>',
NOT = '^!',
BNOT = '^~',
STRING_LITERAL = '^L?"[^"]*"',
CHAR_LITERAL = "^L?'.*'",
HEX_LITERAL = '^[%+%-]?0?x[a-fA-F%d]+[UL]*',
FPNUM_LITERAL = '^[%+%-]?%d+[%.]?%d*e[%+%-]%d*',
NUMBER_LITERAL = '^[%+%-]?0?b?%d+[%.]?%d*[UL]*',
},
}
local function parseDefined(state, input)
local result = false
local bropen = false
local brclose = false
local ident = nil
for key, value in input do
if key == "BROPEN" then
bropen = true
end
if key == "identifier" then
ident = value
if not bropen then break end
end
if key == "BRCLOSE" and ident then
brclose = true
break
end
end
-- wiht and w/o brackets allowed
if ident and ((bropen and brclose) or (not bropen and not brclose)) then
return state:defined(ident)
end
error("expression parse error: defined(ident)")
end
--[[
order : smaller is higher priority
1 () [] -> .
2 ! ~ - + * & sizeof type cast ++ --
3 * / %
4 + -
5 << >>
6 < <= > >=
7 == !=
8 &
9 ^
10 |
11 &&
12 ||
13 ?: = += -= *= /= %= &= |= ^= <<= >>=
14 ,
]]
local combination_order = function (op, unary)
if unary then
if op == '-' or op == '!' or op == '~' then
return 2
else
assert(false, 'unsupported unary operator:' .. op)
end
else
if op == '*' or op == '/' or op == '%' then
return 3
elseif op == '+' or op == '-' then
return 4
elseif op == '>>' or op == '<<' then
return 5
elseif op == '<' or op == '>' or op == '<=' or op == '>=' then
return 6
elseif op == '==' or op == '!=' then
return 7
elseif op == '&' then
return 8
elseif op == '^' then
return 9
elseif op == '|' then
return 10
elseif op == '&&' then
return 11
elseif op == '||' then
return 12
elseif op == '?' or op == ':' then
return 13
else
assert(false, 'unsupported operator:' .. op)
end
end
end
local evaluate
evaluate = function (node)
if not node.op then -- leaf node or leaf node with unary operators
local v = node.v
if node.uops then
for _, uop in ipairs(node.uops) do
-- print('apply uop:'..uop.."|"..tostring(v))
if uop == '-' then
v = -v
elseif uop == '!' then
v = (not v)
elseif uop == '~' then
v = bit.bnot(v)
else
assert(false, 'invalid uop:' .. tostring(uop))
end
end
end
-- print('after apply:'..tostring(v))
return v
end
-- print(node.op..':'..tostring(node.l.v or node.l.op).."("..type(node.l.v)..")|"..tostring(node.r.v or node.r.op).."("..type(node.r.v)..")")
if node.op == '+' then -- binary operators
return (evaluate(node.l) + evaluate(node.r))
elseif node.op == '-' then
return (evaluate(node.l) - evaluate(node.r))
elseif node.op == '*' then
return (evaluate(node.l) * evaluate(node.r))
elseif node.op == '/' then
return (evaluate(node.l) / evaluate(node.r))
elseif node.op == '%' then
return (evaluate(node.l) % evaluate(node.r))
elseif node.op == '==' then
return (evaluate(node.l) == evaluate(node.r))
elseif node.op == '!=' then
return (evaluate(node.l) ~= evaluate(node.r))
elseif node.op == '<<' then
return bit.lshift(evaluate(node.l), evaluate(node.r))
elseif node.op == '>>' then
return bit.rshift(evaluate(node.l), evaluate(node.r))
elseif node.op == '&&' then
return (CBoolean(evaluate(node.l)) and CBoolean(evaluate(node.r)))
elseif node.op == '||' then
return (CBoolean(evaluate(node.l)) or CBoolean(evaluate(node.r)))
elseif node.op == '&' then
return bit.band(evaluate(node.l), evaluate(node.r))
elseif node.op == '|' then
return bit.bor(evaluate(node.l), evaluate(node.r))
elseif node.op == '^' then
return bit.bxor(evaluate(node.l), evaluate(node.r))
elseif node.op == '<=' then
return (evaluate(node.l) <= evaluate(node.r))
elseif node.op == '>=' then
return (evaluate(node.l) >= evaluate(node.r))
elseif node.op == '<' then
return (evaluate(node.l) < evaluate(node.r))
elseif node.op == '>' then
return (evaluate(node.l) > evaluate(node.r))
else
assert(false, 'invalid op:' .. tostring(node.op))
end
end
local function setValue(node, v)
-- print('setValue:' .. tostring(v).."|"..tostring(node.uops))-- .. "\t" .. debug.traceback())
if not node.op then
assert(not node.v, debug.traceback())
node.v = v
else
assert(node.l and (not node.r))
node.r = {v = v, uops = node.uops}
end
end
local function setUnaryOp(node, uop)
-- print('setUnaryOp:' .. tostring(uop))-- .. "\t" .. debug.traceback())
if not node.uops then node.uops = {} end
table.insert(node.uops, 1, uop)
end
local function parseExpr(state, input)
local node = {}
local root = node
-- first call gets string input. rest uses tokenizer
if type(input) == "string" then
-- print('parse:' .. input)
input = tokenizer(input, LCPP_TOKENIZE_EXPR)
end
for type, value in input do
-- print("type:"..type.." value:"..value)
-- unary operator
if type == "NOT" or
type == "BNOT" then
setUnaryOp(node, value)
end
if type == "BROPEN" then
setValue(node, state:parseExpr(input))
end
if type == "BRCLOSE" then
--print('BRCLOSE:' .. tostring(result))
break
end
if type == "STRING_LITERAL" then
setValue(node, value:sub(value[1] == 'L' and 3 or 2,-2))
end
if type == "NUMBER_LITERAL" or type == "HEX_LITERAL" or type == "FPNUM_LITERAL" or type == "CHAR_LITERAL" then
setValue(node, tonumber(parseCInteger(value)))
end
-- tenary operator
-- tenary has lowest priority, so any other operation can be calculate now.
if type == "TENARY_START" then
local l = state:parseExpr(input)
local r = state:parseExpr(input)
if evaluate(root) then
return l
else
return r
end
end
if type == "TENARY_MIDDLE" then
break
end
-- binary operator
if type == "EQUAL" or
type == "NOT_EQUAL" or
type == "AND" or
type == "OR" or
type == "BAND" or
type == "BOR" or
type == "BXOR" or
type == "PLUS" or
type == "MINUS" or
type == "MULTIPLY" or
type == "DIV" or
type == "MOD" or
type == "LTE" or
type == "MTE" or
type == "LSHIFT" or
type == "RSHIFT" or
type == "LT" or
type == "MT" then
if node.op then
if not node.r then -- during parse right operand : uop1 uop2 ... uopN operand1 op1 uop(N+1) uop(N+2) ... [uop(N+K)]
assert(type == "MINUS", "error: operators come consequently: " .. tostring(node.op) .. " and " .. tostring(value))
-- unary operater after binary operator
setUnaryOp(node, value)
else -- uop1 uop2 ... uopN operand1 op1 uop(N+1) uop(N+2) ... uop(N+M) operand2 [op2]
-- print("operator processing:" .. tostring(node.op) .. "|" .. value .. "|" .. tostring(node.l) .. "|" .. tostring(node.r))
local tmp = node
while tmp do
-- print('compare ' .. value..' and ' .. tmp.op)
if combination_order(tmp.op) > combination_order(value) then
-- print(value..' is stronger than ' .. tmp.op)
break
end
tmp = tmp.parent
end
if tmp then
node = {
op = value,
l = tmp.r,
parent = tmp
}
tmp.r.parent = node
tmp.r = node
else
node = {
op = value,
l = root,
}
root.parent = node
root = node
end
end
elseif node.v ~= nil then -- uop1 uop2 ... uopN operand1 [op]
local devided
if node.uops then
for _, uop in ipairs(node.uops) do
if combination_order(uop, true) > combination_order(value) then
-- there is a binary operator which has stronger than any of the unary
devided = uop
end
end
end
if devided then
assert(false, "TODO: can we do something about this case??:"..value.." is stronger than "..devided)
else
node.l = { v = node.v, uops = node.uops }
node.v = nil
node.uops = nil
node.op = value
end
else -- unary operator : uop1 uop2 ... [uopN]
assert(type == "MINUS", "error: invalid unary operator:" .. value)
setUnaryOp(node, value)
end
end
if type == "DEFINED" then
setValue(node, parseDefined(state, input))
elseif type == "identifier" or type == "FUNCTIONAL_MACRO" then
-- print('ident:' .. value)
local eval = state:apply(value)
-- print('apply result ' .. eval .. "|" .. tostring(unprocessed))
if eval ~= value then
eval = state:parseExpr(eval)
-- print('re-evaluate expr ' .. tostring(eval))
setValue(node, eval)
else
-- undefined macro symbol is always treated as 0.
-- http://gcc.gnu.org/onlinedocs/cpp/If.html#If
setValue(node, 0)
end
end
end
local r = evaluate(root)
-- print('evaluate:' .. tostring(r))
return r
end
-- apply string ops "##"
local function prepareMacro(state, input)
if type(input) ~= "string" then return input end
repeat
local out = {}
local concat
for k, v, start, end_ in tokenizer(input, LCPP_TOKENIZE_MACRO) do
if k == "CONCAT" then
-- remove concat op "##"
concat = true
else
table.insert(out, input:sub(start, end_))
end
end
input = table.concat(out)
until not concat
return input
end
-- macro args replacement function slower but more torelant for pathological case
local function replaceArgs(argsstr, repl)
local args = {}
argsstr = argsstr:sub(2,-2)
-- print('argsstr:'..argsstr)
local comma
for k, v, start, end_ in tokenizer(argsstr, LCPP_TOKENIZE_MACRO_ARGS) do
-- print("replaceArgs:" .. k .. "|" .. v)
if k == "ARGS" or k == "PARENTHESE" or k == "STRING_LITERAL" or
k == "FUNCTIONAL" or k == "SINGLE_CHARACTER_ARGS" then
table.insert(args, v)
comma = false
elseif k == "COMMA" then
if comma then
-- continued comma means empty parameter
table.insert(args, "")
end
comma = true
end
end
local v = repl:gsub("%$(%d+)", function (m) return args[tonumber(m)] or "" end)
-- print("replaceArgs:" .. repl .. "|" .. tostring(#args) .. "|" .. v)
return v
end
-- i.e.: "MAX(x, y) (((x) > (y)) ? (x) : (y))"
local function parseFunction(state, input)
if not input then return end
local concat
local name, argsstr, repl = input:match(FUNCMACRO)
if not name or not argsstr or not repl then return end
-- rename args to $1,$2... for later gsub
local noargs = 0
for argname in argsstr:gmatch(IDENTIFIER) do
noargs = noargs + 1
-- avoid matching substring of another identifier (eg. attrib matches __attribute__ and replace it)
repl = repl:gsub("(#*)(%s*)("..argname..")([_%w]?)", function (s1, s2, s3, s4)
if #s4 <= 0 then
return (#s1 == 1) and ("\"$"..noargs.."\"") or (s1..s2.."$"..noargs)
else
return s1..s2..s3..s4
end
end)
end
-- remove concat (after replace matching argument name to $1, $2, ...)
repl = repl:gsub("%s*##%s*", "")
-- build macro funcion
local func = function(input)
return input:gsub(name.."%s*(%b())", function (match)
return replaceArgs(match, repl)
end)
end
return name, func, repl
end
-- ------------
-- LCPP INTERFACE
-- ------------
--- initialies a lcpp state. not needed manually. handy for testing
function lcpp.init(input, predefines, macro_sources)
-- create sate var
local state = {} -- init the state object
state.defines = {} -- the table of known defines and replacements
state.screener = screener(input)
state.lineno = 0 -- the current line number
state.stack = {} -- stores wether the current stack level is to be included
state.once = {} -- stack level was once true (first if that evals to true)
state.macro_sources = macro_sources or {} -- original replacement text for functional macro
-- funcs
state.define = define
state.undefine = function(state, key)
state:define(key, nil)
state.macro_sources[key] = nil
end
state.defined = function(state, key)
return state.defines[key] ~= nil
end
state.apply = apply
state.includeFile = includeFile
state.doWork = doWork
state.getIndent = function(state)
return #state.stack
end
state.openBlock = function(state, bool)
state.stack[#state.stack+1] = bool
state.once [#state.once+1] = bool
state:define(__LCPP_INDENT__, state:getIndent(), true)
end
state.elseBlock = function(state, bool)
if state.once[#state.once] then
state.stack[#state.stack] = false
else
state.stack[#state.stack] = bool
if bool then state.once[#state.once] = true end
end
end
state.closeBlock = function(state)
state.stack[#state.stack] = nil
state.once [#state.once] = nil
state:define(__LCPP_INDENT__, state:getIndent(), true)
if state:getIndent() < 0 then error("Unopened block detected. Indentaion problem.") end
end
state.skip = function(state)
for i = 1, #state.stack do
if not state.stack[i] then return i end
end
return false
end
state.getLine = function(state)
state.lineno = state.lineno + 1
state:define(__LINE__, state.lineno, true)
return state.screener()
end
state.prepareMacro = prepareMacro
state.parseExpr = parseExpr
state.parseFunction = parseFunction
-- predefines
state:define(__DATE__, os.date("%B %d %Y"), true)
state:define(__TIME__, os.date("%H:%M:%S"), true)
state:define(__LINE__, state.lineno, true)
state:define(__LCPP_INDENT__, state:getIndent(), true)
predefines = predefines or {}
for k,v in pairs(lcpp.ENV) do state:define(k, v, true) end -- static ones
for k,v in pairs(predefines) do state:define(k, v, true) end
if lcpp.LCPP_TEST then lcpp.STATE = state end -- activate static state debugging
return state
end
--- the preprocessors main function.
-- returns the preprocessed output as a string.
-- @param code data as string
-- @param predefines OPTIONAL a table of predefined variables
-- @usage lcpp.compile("#define bar 0x1337\nstatic const int foo = bar;")
-- @usage lcpp.compile("#define bar 0x1337\nstatic const int foo = bar;", {["bar"] = "0x1338"})
function lcpp.compile(code, predefines, macro_sources)
local state = lcpp.init(code, predefines, macro_sources)
local buf = {}
for output in state:doWork() do
table.insert(buf, output)
end
local output = table.concat(buf, NEWL)
if lcpp.DEBUG then print(output) end
return output, state
end
--- preprocesses a file
-- @param filename the file to read
-- @param predefines OPTIONAL a table of predefined variables
-- @usage out, state = lcpp.compileFile("../odbg/plugin.h", {["MAX_PAH"]=260, ["UNICODE"]=true})
function lcpp.compileFile(filename, predefines, macro_sources, next, _local)
if not filename then error("processFile() arg1 has to be a string") end
local file = io.open(filename, 'r')
if not file then error("file not found: "..filename) end
local code = file:read('*a')
predefines = predefines or {}
predefines[__FILE__] = filename
return lcpp.compile(code, predefines, macro_sources)
end
-- ------------
-- SATIC UNIT TESTS
-- ------------
function lcpp.test(suppressMsg)
local testLabelCount = 0
local function getTestLabel()
testLabelCount = testLabelCount + 1
return " lcpp_assert_"..testLabelCount
end
-- this ugly global is required so our testcode can find it
_G.lcpp_test = {
assertTrueCalls = 0;
assertTrueCount = 0;
assertTrue = function()
lcpp_test.assertTrueCount = lcpp_test.assertTrueCount + 1;
end
}
local testlcpp = [[
assert(__LINE__ == 1, "_LINE_ macro test 1: __LINE__")
// This test uses LCPP with lua code (uncommon but possible)
assert(__LINE__ == 3, "_LINE_ macro test 3: __LINE__")
/*
* It therefore asserts any if/else/macro functions and various syntaxes
* (including this comment, that would cause errors if not filtered)
*/
assert(__LINE__ == 8, "_LINE_ macro test 8: __LINE__")
/*
assert(false, "multi-line comment not removed")
*/
/* pathological case which contains single line comment start in multiline comments.
* e.g. this multiline comment should be finish next line.
* http://foobar.com */ // comment
/* if singleline comment processes first, sometimes indicator of end of multiline loss */ #define THIS_SHOULD_ENABLE 111 /*
continuous multiline comment after macro definition
//*/
///* this removed.
assert(THIS_SHOULD_ENABLE == 111, "pathological multiline comment test")
#define TRUE
#define ONE (1)
#define TWO (2)
#define THREE_FUNC(x) (3)
#define LEET 0x1337
#define CLONG 123456789L
#define CLONGLONG 123456789123456789LL
#define CULONG 12345678UL
#define CUINT 123456U
#define BINARY -0b1001 /* -9 */
#define OCTET 075 /* 61 */
#define NON_OCTET 75
#define HEX 0xffffU
#define __P(x) x
#define WCHAR_ZERO L'\0'
# define NCURSES_IMPEXP
# define NCURSES_API
# define NCURSES_EXPORT(type) NCURSES_IMPEXP type NCURSES_API
#define MACRO_TO_ITSELF MACRO_TO_ITSELF
local MACRO_TO_ITSELF = 111
assert(MACRO_TO_ITSELF == 111, "can process macro to itself")
assert(WCHAR_ZERO == 0, "wchar evaluate fails")
assert(CLONG == 123456789, "read *L fails")
assert(CLONGLONG == 123456789123456789, "read *LL fails")
assert(CULONG == 12345678, "read *UL fails")
assert(HEX == 65535, "read hex fails")
#if CUINT != 123456U
assert(false, "cannot evaluate number which contains Unsinged postfix correctly")
#else
assert(CUINT == 123456, "read *U fails")
#endif
#pragma ignored
assert __P((BINARY == -9, "parse, binary literal fails"))
assert(OCTET == 61 and NON_OCTET == 75, "parse octet literal fails")
lcpp_test.assertTrue()
assert(LEET == 0x1337, "simple #define replacement")
local msg
/* function to check macro expand to empty */
local function check_argnum(...)
return select('#', ...)
end
NCURSES_EXPORT(function) test_export(a)
return a + 1
end
assert(test_export(2) == 3, "EXPORT style macro")
local macrofunc = function __P((
a, b))
return a + b
end
assert(macrofunc(1, 2) == 3, "macro arg contains parenthese")
msg = "tenary operator test"
#if (HEX % 2 == 1 ? CUINT : CULONG) == 123456
lcpp_test.assertTrue()
#else
assert(false, msg.."1")
#endif
#if (OCTET % 2 == 0 ? CUINT : CULONG) == 123456
assert(false, msg.."1")
#else
lcpp_test.assertTrue()
#endif
# if defined TRUE
lcpp_test.assertTrue() -- valid strange syntax test (spaces and missing brackets)
# endif
msg = "#define if/else test"
#ifdef TRUE
lcpp_test.assertTrue()
#else
assert(false, msg.."1")
#endif
#ifdef NOTDEFINED
assert(false, msg.."2")
#else
lcpp_test.assertTrue()
#endif
#ifndef NOTDEFINED
lcpp_test.assertTrue()
#else
assert(false, msg.."3")
#endif
msg = "#if defined statement test"
#if defined(TRUE)
lcpp_test.assertTrue()
#else
assert(false, msg.."1")
#endif
#if !defined(LEET) && !defined(TRUE)
assert(false, msg.."2")
#endif
#if !defined(NOTLEET) && !defined(NOTDEFINED)
lcpp_test.assertTrue()
#else
assert(false, msg.."3")
#endif
#if !(defined(LEET) && defined(TRUE))
assert(false, msg.."4")
#else
lcpp_test.assertTrue()
#endif
#if !defined(LEET) && !defined(TRUE)
assert(false, msg.."5")
#endif
#if defined(LEET) && defined(TRUE) && defined(NOTDEFINED)
assert(false, msg.."6")
#endif
#if ONE + TWO * TWO == 5
lcpp_test.assertTrue()
#else
assert(false, msg.."7")
#endif
#if (ONE + TWO) * TWO == 0x6
lcpp_test.assertTrue()
#else
assert(false, msg.."8")
#endif
#if ONE * TWO + ONE / TWO == 2.5
lcpp_test.assertTrue()
#else
assert(false, msg.."9")
#endif
#if ONE + ONE * TWO / TWO == 2
lcpp_test.assertTrue()
#else
assert(false, msg.."10")
#endif
#if TWO - - TWO == 4
lcpp_test.assertTrue()
#else
assert(false, msg.."11")
#endif
#if (TWO - - TWO) % (ONE + TWO) == 1
lcpp_test.assertTrue()
#else
assert(false, msg.."12")
#endif
#if ONE << TWO + TWO >> ONE == 8
lcpp_test.assertTrue()
#else
assert(false, msg.."13")
#endif
#if (ONE << TWO) + (TWO >> ONE) == 5
lcpp_test.assertTrue()
#else
assert(false, msg.."14")
#endif
#if (ONE << TWO) + TWO >> ONE == 3
lcpp_test.assertTrue()
#else
assert(false, msg.."15")
#endif
#if (THREE_FUNC(0xfffffU) & 4) == 0
lcpp_test.assertTrue()
#else
assert(false, msg.."16")
#endif
#if (0x3 & THREE_FUNC("foobar")) == 0b11
lcpp_test.assertTrue()
#else
assert(false, msg.."17")
#endif
#if defined(TWO) && ((TWO-0) < 3)
lcpp_test.assertTrue()
#else
assert(false, msg.."17")
#endif
#if TWO == 1--1
lcpp_test.assertTrue()
#else
assert(false, msg.."18")
#endif
#if HEX > 0xfFfFU
assert(false, msg.."18")
#else
lcpp_test.assertTrue()
#endif
#define TRUE_DEFINED defined(TRUE)
#if TRUE_DEFINED
lcpp_test.assertTrue()
#else
assert(false, msg.."19")
#endif
#define NOTDEFINED_DEFINED defined(TRUE) && defined(NOTDEFINED)
#if NOTDEFINED_DEFINED
assert(false, msg.."20")
#else
lcpp_test.assertTrue()
#endif
#if LEET && LEET > 0x1336
lcpp_test.assertTrue()
#else
assert(false, msg.."20")
#endif
#if NOTLEET && NOTLEET > 0x1336
assert(false, msg.."21")
#else
lcpp_test.assertTrue()
#endif
#if defined(NOTLEET) || BINARY + 0 >= 10L || !defined(TRUE)
assert(false, msg.."22")
#else
lcpp_test.assertTrue()
#endif
msg = "macro chaining"
#define FOO 0x7B
#define BAR (FOO+0x7B)
assert(-BAR == -0x7B*2, msg)
#define BAZ 456
#define BLUR BA##Z
assert(BLUR == 456, msg)
local testfunc = function (x) return "["..tostring(x).."]" end
#define FOOBAR(x) testfunc(x)
assert(FOOBAR(1) == "[1]", msg)
#define testfunc(x)
#define FOOBAZ(x) testfunc(x)
assert(check_argnum(FOOBAR(1)) == 0, msg)
assert(check_argnum(FOOBAZ(1)) == 0, msg)
#undef testfunc
assert(FOOBAR(1) == "[1]", msg)
assert(FOOBAZ(1) == "[1]", msg)
msg = "indentation test"
assert(__LCPP_INDENT__ == 0, msg.."1")
#if defined(TRUE)
assert(__LCPP_INDENT__ == 1, msg.."2")
#endif
assert(__LCPP_INDENT__ == 0, msg.."3")
#define LCPP_FUNCTION_1(x, y) (x and not y)
assert(LCPP_FUNCTION_1(true, false), "function macro")
#define LCPP_FUNCTION_2(x, y) \
(not x \
and y)
assert(LCPP_FUNCTION_2(false, true), "multiline function macro")
#define LCPP_FUNCTION_3(_x, _y) LCPP_FUNCTION_2(_x, _y)
assert(LCPP_FUNCTION_3(false, true), "function macro with argname contains _")
#define LCPP_FUNCTION_4_CHILD() false
#define LCPP_FUNCTION_4(_x)
assert(check_argnum(LCPP_FUNCTION_4(LCPP_FUNCTION_4_CHILD())) == 0, "functional macro which receives functional macro as argument")
assert(check_argnum(LCPP_FUNCTION_4(LCPP_FUNCTION_3(true, true))) == 0, "functional macro which receives functional macro as argument2")
#define LCPP_FUNCTION_5(x, y) (x) + (x) + (y) + (y)
assert(LCPP_FUNCTION_5(10, 20) == 60, "macro argument multiple usage")
#define LCPP_NOT_FUNCTION (BLUR)
assert(LCPP_NOT_FUNCTION == 456, "if space between macro name and argument definition exists, it is regarded as replacement macro")
#define __CONCAT(x, y, z, w) x ## y ## z (w)
local __fncall = function (x) return x + 111 end
assert(111 == __CONCAT( __ , fnc , all, 0 ), "funcall fails")
assert(222 == __CONCAT( __ ,, fncall, 111 ), "funcall fails2")
#define __ATTRIB_CALL(x, y, attrib) __attribute__(x, y, attrib)
local __attribute__ = function (x, y, attr)
return attr * (x + y)
end
assert(__ATTRIB_CALL( 1, 2 , 100 ) == 300, "funcall fails3")
msg = "#elif test"
#if defined(NOTDEFINED)
-- it should not be processed
#if NOTDEFINED
#else
assert(false, msg.."1")
#endif
#elif defined(NOTDEFINED)
assert(false, msg.."2")
#elif defined(TRUE)
lcpp_test.assertTrue()
#else
assert(false, msg.."3")
#endif
msg = "#else if test"
#if defined(NOTDEFINED)
assert(false, msg.."1")
#else if defined(NOTDEFINED)
assert(false, msg.."2")
#else if defined(TRUE)
lcpp_test.assertTrue()
#else
assert(false, msg.."3")
#endif
msg = "bock stack tree test"
#ifdef TRUE
#ifdef NOTDEFINED
assert(false, msg.."1")
#elif defined(TRUE)
lcpp_test.assertTrue()
#else
assert(false, msg.."2")
#endif
#else
assert(false, msg.."3")
#endif
#ifdef NOTDEFINED
#ifdef TRUE
assert(false, msg.."4")
#endif
#endif
msg = "test concat ## operator"
#define CONCAT_TEST1 foo##bar
local CONCAT_TEST1 = "blubb"
assert(foobar == "blubb", msg)
#define CONCAT_TEST2() bar##foo
local CONCAT_TEST2() = "blubb"
assert(barfoo == "blubb", msg)
-- dont process ## within strings
#define CONCAT_TEST3 "foo##bar"
assert(CONCAT_TEST3 == "foo##bar", msg)
msg = "test concat inside func type macro"
#define CONCAT_TEST4(baz) CONCAT_TEST##baz
local CONCAT_TEST4(1) = "bazbaz"
assert(foobar == "bazbaz", msg)
msg = "#undef test"
#define UNDEF_TEST
#undef UNDEF_TEST
#ifdef UNDEF_TEST
assert(false, msg)
#endif
msg = "stringify operator(#) test"
#define STRINGIFY(str) #str
assert(STRINGIFY(abcde) == "abcde", msg)
#define STRINGIFY_AND_CONCAT(str1, str2) #str1 ## \
#str2
assert(STRINGIFY_AND_CONCAT(fgh, ij) == "fghij", msg)
#define msg_concat(msg1, msg2) msg1 ## msg2
assert("I, am, lcpp" == msg_concat("I, am", ", lcpp"), "processing macro argument which includes ,")
#define FUNC__ARG 500
#define __ARG 100
#define FUNC(x) FUNC##x
assert(FUNC(__ARG) == 500, "create new macro symbol by concat")
msg = "same macro definition which has exactly same value allows. (checked with gcc 4.4.7 __WORDSIZE)"
#define DUP_MACRO_DEF (111)
#define DUP_MACRO_DEF (111)
#define DUP_FUNC_MACRO(x, y) x + y
#define DUP_FUNC_MACRO(x, y) x + y
msg = "check #if conditional check"
#define VALUE1 (123)
#if VALUE1 != 123
assert(false, msg .." #if " .. tostring(VALUE1) .. " != 123")
#endif
#if 123 != VALUE1
assert(false, msg .." #if " .. tostring(VALUE1) .. " != 123 (2)")
#endif
#define VALUE2 ("hoge")
#if VALUE2 == "hoge"
#define VALUE3 (true)
#endif
assert(VALUE3 == true, msg .. " #if " .. tostring(VALUE3) .. " == true")
#define VALUE4 (VALUE1 + VALUE1)
#if VALUE4 != 246
assert(false, msg .." #if check for nested definition:" .. tostring(VALUE4))
#endif
msg = "+-*/<> in #if expression:"
#define CALC_VALUE_A (1)
#define CALC_VALUE_B (2)
#if (CALC_VALUE_A + CALC_VALUE_B) != 3
assert(false, msg .. " + not work:")
#endif
#if (CALC_VALUE_A * CALC_VALUE_B) != 2
assert(false, msg .. " * not work:")
#endif
#if (CALC_VALUE_A - CALC_VALUE_B) != -1
assert(false, msg .. " - not work:")
#endif
#if (CALC_VALUE_A / CALC_VALUE_B) != 0.5
assert(false, msg .. " / not work:")
#endif
#if (CALC_VALUE_A >= CALC_VALUE_A)
#else
assert(false, msg .. " >= not work1")
#endif
#if (CALC_VALUE_B >= CALC_VALUE_A)
#else
assert(false, msg .. " >= not work2")
#endif
#if (CALC_VALUE_B <= CALC_VALUE_B)
#else
assert(false, msg .. " <= not work1")
#endif
#if (CALC_VALUE_A <= CALC_VALUE_B)
#else
assert(false, msg .. " <= not work2")
#endif
#if (CALC_VALUE_B > CALC_VALUE_A)
#else
assert(false, msg .. " > not work1")
#endif
#if (CALC_VALUE_A > CALC_VALUE_A)
assert(false, msg .. " > not work2")
#endif
#if (CALC_VALUE_A < CALC_VALUE_B)
#else
assert(false, msg .. " < not work1")
#endif
#if (CALC_VALUE_B < CALC_VALUE_B)
assert(false, msg .. " < not work2")
#endif
#if (CALC_VALUE_B | CALC_VALUE_A) != 3
assert(false, msg .. " | not work")
#endif
#if (CALC_VALUE_B & CALC_VALUE_A) != 0
assert(false, msg .. " & not work")
#endif
#if (CALC_VALUE_B ^ CALC_VALUE_A) != 3
assert(false, msg .. " ^ not work")
#endif
#if -CALC_VALUE_B != -2
assert(false, msg .. " unary - not work")
#endif
#if ~CALC_VALUE_B != -3
assert(false, msg .. " unary ~ not work")
#endif
]]
lcpp.FAST = false -- enable full valid output for testing
lcpp.SELF_TEST = true
local testlua = lcpp.compile(testlcpp)
lcpp.SELF_TEST = nil
-- print(testlua)
assert(loadstring(testlua, "testlua"))()
lcpp_test.assertTrueCalls = findn(testlcpp, "lcpp_test.assertTrue()")
assert(lcpp_test.assertTrueCount == lcpp_test.assertTrueCalls, "assertTrue calls:"..lcpp_test.assertTrueCalls.." count:"..lcpp_test.assertTrueCount)
_G.lcpp_test = nil -- delete ugly global hack
if not suppressMsg then print("Test run suscessully") end
end
if lcpp.LCPP_TEST then lcpp.test(true) end
-- ------------
-- REGISTER LCPP
-- ------------
--- disable lcpp processing for ffi, loadstring and such
lcpp.disable = function()
if lcpp.LCPP_LUA then
-- activate LCPP_LUA actually does anything useful
-- _G.loadstring = _G.loadstring_lcpp_backup
end
if lcpp.LCPP_FFI and pcall(require, "ffi") then
ffi = require("ffi")
if ffi.lcpp_cdef_backup then
ffi.cdef = ffi.lcpp_cdef_backup
ffi.lcpp_cdef_backup = nil
end
end
end
--- (re)enable lcpp processing for ffi, loadstring and such
lcpp.enable = function()
-- Use LCPP to process Lua code (load, loadfile, loadstring...)
if lcpp.LCPP_LUA then
-- TODO: make it properly work on all functions
error("lcpp.LCPP_LUA = true -- not properly implemented yet");
_G.loadstring_lcpp_backup = _G.loadstring
_G.loadstring = function(str, chunk)
return loadstring_lcpp_backup(lcpp.compile(str), chunk)
end
end
-- Use LCPP as LuaJIT PreProcessor if used inside LuaJIT. i.e. Hook ffi.cdef
if lcpp.LCPP_FFI and pcall(require, "ffi") then
ffi = require("ffi")
if not ffi.lcpp_cdef_backup then
if not ffi.lcpp_defs then ffi.lcpp_defs = {} end -- defs are stored and reused
ffi.lcpp = function(input)
local output, state = lcpp.compile(input, ffi.lcpp_defs, ffi.lcpp_macro_sources)
ffi.lcpp_defs = state.defines
ffi.lcpp_macro_sources = state.macro_sources
return output
end
ffi.lcpp_cdef_backup = ffi.cdef
ffi.cdef = function(input)
if true then
return ffi.lcpp_cdef_backup(ffi.lcpp(input))
else
local fn,cnt = input:gsub('#include ["<].-([^/]+%.h)[">]', '%1')
input = ffi.lcpp(input)
if cnt > 0 then
local f = io.open("./tmp/"..fn, 'w')
if f then
f:write(input)
f:close()
else
assert(fn:find('/'), 'cannot open: ./tmp/'..fn)
end
end
return ffi.lcpp_cdef_backup(input)
end
end
end
end
end
lcpp.enable()
return lcpp