mirror of
https://github.com/ksherlock/mpw-shell.git
synced 2025-01-19 13:32:07 +00:00
180 lines
2.9 KiB
C++
180 lines
2.9 KiB
C++
|
#include "phase1.h"
|
||
|
#include <cassert>
|
||
|
|
||
|
enum {
|
||
|
st_text,
|
||
|
st_text_esc,
|
||
|
|
||
|
st_comment,
|
||
|
|
||
|
st_vstring,
|
||
|
st_vstring_esc,
|
||
|
|
||
|
st_dstring,
|
||
|
st_dstring_esc,
|
||
|
|
||
|
st_sstring,
|
||
|
st_sstring_esc,
|
||
|
|
||
|
st_estring,
|
||
|
st_estring1,
|
||
|
st_estring1_esc,
|
||
|
|
||
|
st_estring2,
|
||
|
st_estring2_esc,
|
||
|
|
||
|
st_estring3,
|
||
|
};
|
||
|
|
||
|
|
||
|
int phase1::process(unsigned char c, int st) {
|
||
|
|
||
|
const unsigned char esc = 0xb6;
|
||
|
|
||
|
|
||
|
if (c == '\r' || c == '\n') {
|
||
|
switch (st) {
|
||
|
case st_text:
|
||
|
case st_comment:
|
||
|
default: // will error later.
|
||
|
flush();
|
||
|
multiline = false;
|
||
|
line++;
|
||
|
return st_text;
|
||
|
|
||
|
case st_text_esc:
|
||
|
case st_vstring_esc:
|
||
|
case st_dstring_esc:
|
||
|
case st_sstring_esc:
|
||
|
case st_estring1_esc:
|
||
|
case st_estring2_esc:
|
||
|
multiline = true;
|
||
|
scratch.pop_back();
|
||
|
line++;
|
||
|
return st - 1;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if (st != st_comment) scratch.push_back(c);
|
||
|
|
||
|
switch(st) {
|
||
|
|
||
|
case st_text:
|
||
|
text:
|
||
|
switch(c) {
|
||
|
case '#':
|
||
|
scratch.pop_back();
|
||
|
return st_comment;
|
||
|
case esc:
|
||
|
return st_text_esc;
|
||
|
case '{':
|
||
|
return st_vstring;
|
||
|
case '"':
|
||
|
return st_dstring;
|
||
|
case '\'':
|
||
|
return st_sstring;
|
||
|
case '`':
|
||
|
return st_estring;
|
||
|
|
||
|
default:
|
||
|
return st_text;
|
||
|
}
|
||
|
break;
|
||
|
|
||
|
case st_comment:
|
||
|
return st;
|
||
|
break;
|
||
|
|
||
|
case st_text_esc:
|
||
|
case st_dstring_esc:
|
||
|
case st_estring1_esc:
|
||
|
case st_estring2_esc:
|
||
|
return st-1;
|
||
|
break;
|
||
|
|
||
|
|
||
|
case st_sstring_esc:
|
||
|
// fall through
|
||
|
case st_sstring:
|
||
|
if (c == '\'') return st_text;
|
||
|
if (c == esc) return st_sstring_esc;
|
||
|
return st_sstring;
|
||
|
break;
|
||
|
|
||
|
case st_dstring:
|
||
|
if (c == '\"') return st_text;
|
||
|
if (c == esc) return st_dstring_esc;
|
||
|
return st_dstring;
|
||
|
break;
|
||
|
|
||
|
case st_vstring_esc:
|
||
|
// fall through
|
||
|
case st_vstring:
|
||
|
// '{' var '}' or '{{' var '}}'
|
||
|
// don't care if {{ or { at this point. A single } terminates.
|
||
|
if (c == '}') return st_text;
|
||
|
if (c == esc) return st_vstring_esc;
|
||
|
return st_vstring;
|
||
|
|
||
|
case st_estring:
|
||
|
// ``...`` or `...`
|
||
|
if (c == '`') return st_estring2;
|
||
|
// fall through.
|
||
|
case st_estring1:
|
||
|
if (c == '`') return st_text;
|
||
|
if (c == esc) return st_estring1_esc;
|
||
|
return st_estring1;
|
||
|
|
||
|
case st_estring2:
|
||
|
if (c == '`') return st_estring3;
|
||
|
if (c == esc) return st_estring2_esc;
|
||
|
return st_estring2;
|
||
|
|
||
|
case st_estring3:
|
||
|
if (c == '`') return st_text;
|
||
|
// error! handled later.
|
||
|
goto text;
|
||
|
|
||
|
break;
|
||
|
|
||
|
}
|
||
|
assert(!"unknown state");
|
||
|
}
|
||
|
|
||
|
|
||
|
void phase1::process(const std::string &s, bool final) {
|
||
|
|
||
|
for (auto c : s) {
|
||
|
cs = process(c, cs);
|
||
|
}
|
||
|
if (final) finish();
|
||
|
}
|
||
|
|
||
|
void phase1::process(const unsigned char *begin, const unsigned char *end, bool final) {
|
||
|
while (begin != end) {
|
||
|
cs = process(*begin++, cs);
|
||
|
}
|
||
|
if (final) finish();
|
||
|
}
|
||
|
|
||
|
void phase1::finish() {
|
||
|
|
||
|
cs = process('\n', cs);
|
||
|
flush();
|
||
|
}
|
||
|
|
||
|
void phase1::reset() {
|
||
|
cs = st_text;
|
||
|
multiline = false;
|
||
|
line = 1;
|
||
|
scratch.clear();
|
||
|
}
|
||
|
|
||
|
void phase1::flush() {
|
||
|
multiline = false;
|
||
|
if (scratch.empty()) return;
|
||
|
// strip trailing whitespace?
|
||
|
if (pipe_to) pipe_to(std::move(scratch));
|
||
|
scratch.clear();
|
||
|
}
|