qasm/eval.cpp

704 lines
20 KiB
C++
Raw Normal View History

2019-11-11 15:56:03 -08:00
#include "asm.h"
#include "eval.h"
#include <string.h>
#include <stdio.h>
#define CLASS TEvaluator
2019-11-12 10:13:15 -08:00
#define DEF_VAL 0
2019-11-11 15:56:03 -08:00
/// Writes a token to an output stream by emitting its `str` member.
/// Returns the same stream so insertions can be chained.
std::ostream& operator<<(std::ostream& os, const Token& token)
{
    return os << token.str;
}
/// Constructs the evaluator, initialising its `assembler` member from `_asm`.
/// That member is later used for symbol lookup and the current program
/// counter while evaluating expressions.
CLASS::CLASS(T65816Asm &_asm)
    : assembler(_asm)
{
    // nothing else to set up
}
/// Destructor. The body is intentionally empty: no explicit cleanup is
/// performed here.
CLASS::~CLASS()
{
    // intentionally empty
}
std::deque<Token> CLASS::exprToTokens(const std::string& expr)
{
std::deque<Token> tokens;
int state = 0;
char c;
2019-11-13 15:05:12 -08:00
char delim = 0;
2019-11-11 15:56:03 -08:00
std::string ident, asc;
std::string ops = "+-*//^!.&()";
std::string c1;
char *tokptr;
char *tptr;
bool numexpect;
Token::Type t;
numexpect = true;
for (const auto* p = expr.c_str(); *p; ++p)
{
c = *p;
c1 = c;
tptr = (char *)c1.c_str();
tokptr = strpbrk(tptr, (const char *)ops.c_str());
// printf("state=%d %c %p\n", state, c,tokptr);
switch (state)
{
default:
printf("bad token state\n");
state = 0;
break;
case 11:
if ((c < ' ') || (c == delim))
{
// SGQ - convert ascii to a number here
asc = "0";
//printf("ident=|%s|\n",ident.c_str());
if (ident.length() > 0)
{
// SGQ - convert ascii to a number here
}
t = Token::Type::Number;
int pr = 1; // precedence
bool ra = false; // rightAssociative
tokens.push_back(Token
{
t, asc, pr, ra
});
ident = "";
state = 0;
if (c != delim)
{
p--;
}
}
else
{
ident += c;
}
break;
case 10:
case 20:
if ((c <= ' ') || (tokptr != NULL))
{
if (ident.length() > 0)
{
if (state == 20)
{
t = Token::Type::Symbol;
}
else
{
t = Token::Type::Number;
}
int pr = 1; // precedence
bool ra = false; // rightAssociative
tokens.push_back(Token
{
t, ident, pr, ra
});
ident = "";
}
state = 0;
p--;
}
else
{
ident += c;
}
break;
case 0:
if ((c == '$') && (numexpect))
{
state = 10;
ident += c;
numexpect = false;
}
else if ((numexpect) && ( (c == '^') || (c == '<') || (c == '>') || (c == '|')))
{
ident = c;
tokens.push_back(Token{Token::Type::Shift, ident, 1, true});
ident = "";
}
2019-11-11 15:56:03 -08:00
else if ((c == '*') && (numexpect))
{
numexpect = false;
state = 0;
2019-11-11 15:56:03 -08:00
ident += c;
tokens.push_back(Token{Token::Type::Symbol, ident, 1, false});
ident = "";
2019-11-11 15:56:03 -08:00
}
else if ((c == '%') && (numexpect))
{
state = 10;
ident += c;
numexpect = false;
}
else if ((c == '\'') && (numexpect))
{
delim = c;
state = 11;
numexpect = false;
}
else if ((c == '"') && (numexpect))
{
delim = c;
state = 11;
numexpect = false;
}
else if (((c == '-') || (c == '+')) && (numexpect))
{
state = 10;
ident += c;
}
else if (isdigit(c))
{
state = 10;
ident += c;
numexpect = false;
}
else if (c >= ':')
2019-11-11 15:56:03 -08:00
{
state = 20;
ident += c;
numexpect = false;
}
else if ((tokptr != NULL) && (!numexpect))
{
t = Token::Type::Unknown;
int pr = -1; // precedence
bool ra = false; // rightAssociative
switch (c)
{
default: break;
case '(': t = Token::Type::LeftParen; break;
case ')': t = Token::Type::RightParen; break;
case '!': t = Token::Type::Operator; pr = 5; break;
case '.': t = Token::Type::Operator; pr = 5; break;
case '&': t = Token::Type::Operator; pr = 5; break;
case '^': t = Token::Type::Operator; pr = 4; ra = true; break;
case '*': t = Token::Type::Operator; pr = 3; break;
case '/': t = Token::Type::Operator; pr = 3; break;
case '+': t = Token::Type::Operator; pr = 2; break;
case '-': t = Token::Type::Operator; pr = 2; break;
}
tokens.push_back(Token
{
t, std::string(1, c), pr, ra
});
numexpect = true;
}
}
}
return tokens;
}
std::deque<Token> CLASS::shuntingYard(const std::deque<Token>& tokens)
{
std::deque<Token> queue;
std::vector<Token> stack;
TSymbol *sym;
char buff[128];
// While there are tokens to be read:
for (auto token : tokens)
{
// Read a token
switch (token.type)
{
case Token::Type::Symbol:
token.type = Token::Type::Number;
if (token.str == "*")
{
2019-11-12 20:32:10 -08:00
sprintf(buff, "%u", assembler.PC.currentpc);
2019-11-11 15:56:03 -08:00
token.str = buff;
}
else
{
2019-11-12 00:15:47 -08:00
//printf("symbol find |%s|\n",token.str.c_str());
2019-11-11 15:56:03 -08:00
sym = assembler.findSymbol(token.str);
if (sym != NULL)
{
2019-11-12 10:13:15 -08:00
sym->used = true;
2019-11-12 00:15:47 -08:00
sprintf(buff, "%d", sym->value);
2019-11-11 15:56:03 -08:00
token.str = buff;
}
else
{
2019-11-12 10:13:15 -08:00
setError(Token::unknownSymbolErr);
badsymbol = token.str;
token.str = "0";
2019-11-11 15:56:03 -08:00
}
}
queue.push_back(token);
break;
case Token::Type::Number:
// If the token is a number, then add it to the output queue
queue.push_back(token);
break;
case Token::Type::Shift:
stack.push_back(token);
break;
2019-11-11 15:56:03 -08:00
case Token::Type::Operator:
{
// If the token is operator, o1, then:
const auto o1 = token;
// while there is an operator token,
while (!stack.empty())
{
// o2, at the top of stack, and
const auto o2 = stack.back();
// either o1 is left-associative and its precedence is
// *less than or equal* to that of o2,
// or o1 if right associative, and has precedence
// *less than* that of o2,
if (
(! o1.rightAssociative && o1.precedence <= o2.precedence)
|| ( o1.rightAssociative && o1.precedence < o2.precedence)
)
{
// then pop o2 off the stack,
stack.pop_back();
// onto the output queue;
queue.push_back(o2);
continue;
}
// @@ otherwise, exit.
break;
}
// push o1 onto the stack.
stack.push_back(o1);
}
break;
case Token::Type::LeftParen:
// If token is left parenthesis, then push it onto the stack
stack.push_back(token);
break;
case Token::Type::RightParen:
// If token is right parenthesis:
{
bool match = false;
while (! stack.empty())
{
// Until the token at the top of the stack
// is a left parenthesis,
const auto tos = stack.back();
if (tos.type != Token::Type::LeftParen)
{
// pop operators off the stack
stack.pop_back();
// onto the output queue.
queue.push_back(tos);
}
// Pop the left parenthesis from the stack,
// but not onto the output queue.
stack.pop_back();
match = true;
break;
}
if (!match && stack.empty())
{
// If the stack runs out without finding a left parenthesis,
// then there are mismatched parentheses.
//printf("RightParen error (%s)\n", token.str.c_str());
2019-11-12 10:13:15 -08:00
setError(Token::operatorErr);
2019-11-11 15:56:03 -08:00
return queue;
}
}
break;
default:
2019-11-12 10:13:15 -08:00
setError(Token::syntaxErr);
//printf("error (%s)\n", token.str.c_str());
2019-11-11 15:56:03 -08:00
return queue;
break;
}
//debugReport(token, queue, stack);
}
// When there are no more tokens to read:
// While there are still operator tokens in the stack:
while (! stack.empty())
{
// If the operator token on the top of the stack is a parenthesis,
// then there are mismatched parentheses.
if (stack.back().type == Token::Type::LeftParen)
{
2019-11-12 10:13:15 -08:00
setError(Token::parenErr);
//printf("Mismatched parentheses error\n");
2019-11-11 15:56:03 -08:00
return queue;
}
// Pop the operator onto the output queue.
queue.push_back(std::move(stack.back()));
stack.pop_back();
}
//debugReport(Token { Token::Type::Unknown, "End" }, queue, stack);
//Exit.
return queue;
}
int CLASS::parseNumber(std::string n, int64_t &val)
{
2019-11-12 10:13:15 -08:00
int res = DEF_VAL;
2019-11-11 15:56:03 -08:00
int state = 0;
char c;
std::string s;
uint32_t i, l;
bool valid = false;
bool err = false;
bool neg = false;
int64_t tval = 0;
val = 0;
i = 0;
2019-11-13 15:05:12 -08:00
l = (int)n.length();
2019-11-11 15:56:03 -08:00
s = "";
for (i = 0; i < l; i++)
{
c = n[i];
switch (state)
{
case 0:
if (c == '$')
{
state = 10;
}
else if (c == '%')
{
state = 20;
}
else if (c == '-')
2019-11-11 15:56:03 -08:00
{
if (!valid)
{
neg = !neg;
}
else
{
state = 99;
}
2019-11-11 15:56:03 -08:00
}
else if (isdigit(c))
{
s += c;
valid = true;
state = 1;
tval = c - '0';
}
else
{
state = 99;
}
break;
case 1:
if (isdigit(c))
{
valid = true;
2019-11-11 15:56:03 -08:00
s += c;
tval *= 10;
tval += c - '0';
}
else
{
state = 99;
}
break;
case 10:
if ((c >= 'a') && (c <= 'f'))
{
c = c - 0x20; // make it uppercase
s += c;
tval <<= 4;
tval |= (c - 'A') + 10;
valid = true;
}
else if ((c >= 'A') && (c <= 'F'))
{
s += c;
tval <<= 4;
tval |= (c - 'A') + 10;
valid = true;
}
else if ((c >= '0') && (c <= '9'))
{
s += c;
tval <<= 4;;
tval += c - '0';
valid = true;
}
else { state = 99; }
break;
case 20:
if ((c >= '0') && (c <= '1'))
{
s += c;
tval <<= 1;
if (c == '1')
{
tval |= 1;
}
valid = true;
}
else if (c == '_')
{
// allow these in binary
}
else { state = 99; }
break;
case 99:
err = true;
2019-11-11 15:56:03 -08:00
// if you get into this state there is an error
break;
}
}
if (tval > (int64_t)0xFFFFFFFF)
{
2019-11-12 10:13:15 -08:00
setError(Token::overflowErr);
2019-11-11 15:56:03 -08:00
}
//printf("parsenumber: |%s|\n",s.c_str());
2019-11-11 15:56:03 -08:00
if ((state == 99) || (err))
{
setError(Token::syntaxErr);
valid = false;
2019-11-12 10:13:15 -08:00
val = DEF_VAL;
2019-11-11 15:56:03 -08:00
}
if ((valid) && (!err))
{
if (neg)
{
tval = -tval;
}
val = tval;
//printf("value=%08lX\n", val);
2019-11-11 15:56:03 -08:00
res = 0;
}
return (res);
}
2019-11-12 10:13:15 -08:00
/// Records an evaluation error code in `evalerror`.
///
/// Only the first error sticks: a new code is stored when no error is
/// currently recorded, or when the caller passes `Token::noError` to reset.
/// Whenever the resulting state is "no error", `badsymbol` is cleared too.
///
/// @param ecode  error code to record, or Token::noError to reset
void CLASS::setError(int ecode)
{
    const bool resetting = (ecode == Token::noError);
    const bool nothingRecorded = (evalerror == Token::noError);

    if (nothingRecorded || resetting)
    {
        evalerror = ecode;
    }

    if (evalerror == Token::noError)
    {
        badsymbol = "";
    }
}
int CLASS::evaluate(std::string & e, int64_t &res, uint8_t &_shiftmode)
2019-11-11 15:56:03 -08:00
{
// const std::string expr = "3+4*2/(1-5)^2^3"; // Wikipedia's example
// const std::string expr = "20-30/3+4*2^3";
_shiftmode=shiftmode=0;
2019-11-12 10:13:15 -08:00
res = DEF_VAL;
setError(Token::noError);
2019-11-11 15:56:03 -08:00
int u;
int64_t val;
std::string expr = Poco::trim(e);
expr += " "; // add a space at end to make parsing easier
if (isDebug() >= 4)
{
printf("eval: expression: |%s|\n", expr.c_str());
}
2019-11-11 15:56:03 -08:00
const auto tokens = exprToTokens(expr);
auto queue = shuntingYard(tokens);
std::vector<int64_t> stack;
// printf("\nCalculation\n");
//printf("|%-3s|%-32s|%-10s|\n", "Tkn", "Queue", "Stack");
while (! queue.empty())
{
2019-11-12 10:13:15 -08:00
//std::string op;
2019-11-11 15:56:03 -08:00
const auto token = queue.front();
queue.pop_front();
switch (token.type)
{
case Token::Type::Symbol:
stack.push_back(std::stoi((char *)"0"));
2019-11-12 10:13:15 -08:00
//op = "Push " + token.str;
2019-11-12 00:15:47 -08:00
//printf("shouldn't get this kind of token\n");
2019-11-11 15:56:03 -08:00
break;
case Token::Type::Number:
val = 0;
u = parseNumber(token.str, val);
if (u < 0)
{
2019-11-12 10:13:15 -08:00
setError(Token::numberErr);
val = DEF_VAL;
2019-11-11 15:56:03 -08:00
}
stack.push_back(val);
2019-11-12 10:13:15 -08:00
//op = "Push " + token.str;
2019-11-11 15:56:03 -08:00
break;
case Token::Type::Shift:
{
auto rhs = DEF_VAL;
if (stack.size() > 0)
{
rhs = stack.back();
stack.pop_back();
shiftmode=token.str[0];
if (token.str=="^")
{
//rhs = (rhs >> 16) &0xFFFF ;
}
else if (token.str=="|")
{
//rhs = (rhs >> 16) & 0xFFFF;
}
else if (token.str=="<")
{
//rhs = (rhs << 8 ) & 0xFFFF;
}
else if (token.str==">")
{
//rhs=(rhs>>8) & 0xFFFF;
}
stack.push_back(rhs);
}
else
{
//printf("nothing on stack\n");
}
}
break;
2019-11-11 15:56:03 -08:00
case Token::Type::Operator:
{
2019-11-12 10:13:15 -08:00
auto rhs = DEF_VAL;
auto lhs = DEF_VAL;
2019-11-11 15:56:03 -08:00
2019-11-12 10:13:15 -08:00
bool v = true;
if (stack.size() > 0)
2019-11-11 15:56:03 -08:00
{
rhs = stack.back();
stack.pop_back();
2019-11-12 10:13:15 -08:00
}
else
{
v = false;
}
if (stack.size() > 0)
{
2019-11-11 15:56:03 -08:00
lhs = stack.back();
stack.pop_back();
}
2019-11-12 00:15:47 -08:00
else
{
2019-11-12 10:13:15 -08:00
v = false;
}
if (!v)
{
setError(Token::badParamErr);
//printf("not enough parameters for the operator\n");
2019-11-12 00:15:47 -08:00
}
2019-11-11 15:56:03 -08:00
switch (token.str[0])
{
default:
2019-11-12 10:13:15 -08:00
setError(Token::operatorErr);
//printf("Operator error [%s]\n", token.str.c_str());
2019-11-11 15:56:03 -08:00
return (-1);
break;
case '^':
stack.push_back(static_cast<int>(pow(lhs, rhs)));
break;
case '*':
stack.push_back(lhs * rhs);
break;
case '/':
if (rhs != 0)
{
stack.push_back(lhs / rhs);
}
else
{
stack.push_back(0);
}
break;
case '+':
stack.push_back(lhs + rhs);
break;
case '-':
stack.push_back(lhs - rhs);
break;
case '!':
stack.push_back(lhs ^ rhs);
break;
case '&':
stack.push_back(lhs & rhs);
2019-11-12 00:15:47 -08:00
break;
2019-11-11 15:56:03 -08:00
break; case '.':
stack.push_back(lhs | rhs);
break;
}
}
break;
default:
//printf("Token error\n");
2019-11-12 10:13:15 -08:00
setError(Token::syntaxErr);
goto out;
2019-11-11 15:56:03 -08:00
}
}
2019-11-12 10:13:15 -08:00
out:
int64_t v = DEF_VAL;
2019-11-11 15:56:03 -08:00
if (stack.size() > 0)
{
v = stack.back();
}
2019-11-12 10:13:15 -08:00
else
2019-11-11 15:56:03 -08:00
{
2019-11-12 10:13:15 -08:00
setError(Token::syntaxErr);
2019-11-11 15:56:03 -08:00
}
_shiftmode=shiftmode;
2019-11-12 10:13:15 -08:00
res = v;
return (evalerror);
2019-11-11 15:56:03 -08:00
}