Retro68/Rez/RezLexer.cc
2015-08-27 20:49:55 +02:00

191 lines
4.1 KiB
C++

#include "RezLexer.h"
#include <boost/wave.hpp>
#include <boost/wave/cpplexer/cpp_lex_iterator.hpp>
#include <boost/wave/token_ids.hpp>
#include <boost/regex.hpp>
#include "RezLexerWaveToken.h"
#include "RezWorld.h"
#include "Diagnostic.h"
namespace wave = boost::wave;
using namespace boost::wave;
static std::string readContents(std::istream&& instream)
{
instream.unsetf(std::ios::skipws);
return std::string(std::istreambuf_iterator<char>(instream.rdbuf()),
std::istreambuf_iterator<char>());
}
static std::string preFilter(std::string str)
{
boost::regex endif("#endif[^\r\n]*");
str = boost::regex_replace(str, endif, "#endif");
boost::regex dollar_escape("\\\\\\$([a-zA-Z0-9][a-zA-Z0-9])");
str = boost::regex_replace(str, dollar_escape, "\\\\0x$1");
if(str.size() == 0 || str[str.size()-1] != '\n')
str += "\n";
return str;
}
struct load_file_to_string_filtered
{
template <typename IterContextT>
class inner
{
public:
template <typename PositionT>
static void init_iterators(IterContextT &iter_ctx,
PositionT const &act_pos, language_support language)
{
typedef typename IterContextT::iterator_type iterator_type;
// read in the file
std::ifstream instream(iter_ctx.filename.c_str());
if (!instream.is_open()) {
BOOST_WAVE_THROW_CTX(iter_ctx.ctx, preprocess_exception,
bad_include_file, iter_ctx.filename.c_str(), act_pos);
return;
}
iter_ctx.instring = preFilter(readContents(std::move(instream)));
iter_ctx.first = iterator_type(
iter_ctx.instring.begin(), iter_ctx.instring.end(),
PositionT(iter_ctx.filename), language);
iter_ctx.last = iterator_type();
}
private:
std::string instring;
};
};
typedef wave::cpplexer::lex_iterator<
wave::cpplexer::lex_token<> >
lex_iterator_type;
typedef wave::context<
std::string::iterator, lex_iterator_type,
load_file_to_string_filtered>
context_type;
typedef context_type::iterator_type pp_iterator_type;
struct RezLexer::Priv
{
std::string input;
context_type ctx;
pp_iterator_type iter;
Priv(std::string data, std::string name)
: input(data), ctx(input.begin(), input.end(), name.c_str())
{
}
};
static std::string readInitial(RezWorld& world, std::string filename)
{
std::ifstream in(filename);
if(!in.is_open())
{
world.problem(Diagnostic(Diagnostic::error,
"could not open " + filename, yy::location()));
}
return readContents(std::move(in));
}
RezLexer::RezLexer(RezWorld& world, std::string filename)
: RezLexer(world, filename, readInitial(world,filename))
{
}
RezLexer::RezLexer(RezWorld& world, std::string filename, const std::string &data)
: world(world), curFile(filename), lastLocation(&curFile)
{
pImpl.reset(new Priv(preFilter(data), filename));
pImpl->ctx.add_macro_definition("DeRez=0");
pImpl->ctx.add_macro_definition("Rez=1");
pImpl->ctx.add_macro_definition("true=1");
pImpl->ctx.add_macro_definition("false=0");
pImpl->iter = pImpl->ctx.begin();
}
RezLexer::~RezLexer()
{
}
void RezLexer::addDefine(std::string str)
{
pImpl->ctx.add_macro_definition(str);
}
void RezLexer::addIncludePath(std::string path)
{
std::size_t pos = path.find(':');
if(pos == std::string::npos)
{
pImpl->ctx.add_include_path(path.c_str());
}
else
{
addIncludePath(path.substr(0,pos));
addIncludePath(path.substr(pos + 1));
}
}
bool RezLexer::atEnd()
{
return pImpl->iter == pImpl->ctx.end();
}
RezLexer::WaveToken RezLexer::nextWave()
{
try
{
if(pImpl->iter == pImpl->ctx.end())
return WaveToken();
else
{
WaveToken tok = *pImpl->iter++;
return tok;
}
}
catch(preprocess_exception e)
{
curFile = e.file_name();
auto yypos = yy::position(&curFile, e.line_no(), e.column_no());
yy::location loc(yypos);
lastLocation = loc;
world.problem(Diagnostic(
e.severity_level(e.get_errorcode()) >= util::severity_error
? Diagnostic::error
: Diagnostic::warning,
preprocess_exception::error_text(e.get_errorcode()), loc));
if(e.is_recoverable())
return nextWave();
else
return WaveToken();
}
}
RezLexer::WaveToken RezLexer::peekWave()
{
return pImpl->iter == pImpl->ctx.end() ? WaveToken() : *pImpl->iter;
}