aboutsummaryrefslogtreecommitdiff
path: root/src/interp.c
diff options
context:
space:
mode:
authorFranklin Wei <git@fwei.tk>2015-11-08 12:45:58 -0500
committerFranklin Wei <git@fwei.tk>2015-11-08 12:45:58 -0500
commit768628ea1767b966418f21dced0572e222a6208b (patch)
tree74395ea195bddb3ec876febd52d025e06ec410e4 /src/interp.c
parent89e35bddfb92c6c37177d9830bf0664e9abb29d9 (diff)
downloadducky-768628ea1767b966418f21dced0572e222a6208b.zip
ducky-768628ea1767b966418f21dced0572e222a6208b.tar.gz
ducky-768628ea1767b966418f21dced0572e222a6208b.tar.bz2
ducky-768628ea1767b966418f21dced0572e222a6208b.tar.xz
rename to interpreter
Diffstat (limited to 'src/interp.c')
-rw-r--r--src/interp.c1336
1 files changed, 1336 insertions, 0 deletions
diff --git a/src/interp.c b/src/interp.c
new file mode 100644
index 0000000..e3b00b6
--- /dev/null
+++ b/src/interp.c
@@ -0,0 +1,1336 @@
+#include <platform.h>
+
+/*******************************************************************************
+ * The scripting language implemented here is an extension of DuckyScript.
+ * DuckyScript as it is now is limited to simple tasks, as it lacks good flow
+ * control or variable support.
+ *
+ * These following extensions to DuckyScript are (to be) implemented.
+ *
+ * Variables: variable names consist of all characters that are not operators
+ * or digits. The limit on variable names is 24 characters.
+ *
+ * NOTE: to have a command on a line following a command using an expression, a
+ * semicolon (;) is needed to separate them.
+ *
+ * "JUMP <EXPR>;" - jumps to line <EXPR> in the file
+ *
+ * "IF <CONDITION>;" - if <CONDITION> equals zero, skip the rest of the line
+ *
+ * "LET X=<EXPR>;" - loads the value of <EXPR> into variable X. Greedy.
+ *
+ * "LOG ..." - outputs any remaining text to the device's screen.
+ * "LOGVAR <EXPR>;" - outputs variable <EXPR> in decimal to the device's screen
+ * "NEWLINE" - outputs a newline
+ * "LOGCHAR <EXPR>;" - outputs <EXPR> as an ASCII character
+ ******************************************************************************/
+
+/*** Defines ***/
+
+#define DEFAULT_DELAY 0
+#define STRING_DELAY 0
+#define TOKEN_IS(str) (strcmp(tok, str) == 0)
+#define MAX_LINE_LEN 512
+
+#define MAXOPSTACK 64
+#define MAXNUMSTACK 64
+#define CALL_STACK_SZ 64
+#define VARMAP_SIZE 256
+
+#define VARFORMAT "%lld"
+#define VARNAME_MAX 24
+
+#define ARRAYLEN(x) (sizeof(x)/sizeof(x[0]))
+
+#define MIN(x,y) ((x<y)?(x):(y))
+
+typedef long long int vartype;
+
+/*** Globals ***/
+
+off_t *line_offset = NULL;
+
+unsigned lines_executed = 0, current_line = 0, num_lines;
+
+unsigned call_stack[CALL_STACK_SZ];
+unsigned stack_frame = 0;
+
+int log_fd = -1, file_des = -1;
+
+struct varnode_t {
+ char name[VARNAME_MAX + 1];
+ vartype val;
+ bool constant; /* used by setVariable */
+ struct varnode_t *next;
+};
+
+void error(const char *fmt, ...) __attribute__((noreturn,format(print,1,2)));
+void vid_write(const char *str);
+void vid_writef(const char *fmt, ...) __attribute__((format(printf,1,2)));
+void debug(const char *fmt, ...) __attribute__((format(printf,1,2)));
+bool isValidVariable(const char *c);
+
+/* variables are stored in a chained hash map */
+/* collisions are manageable, but should be minimized */
+
+struct varnode_t *var_map[VARMAP_SIZE];
+
+/* simple DJB hash */
+uint32_t var_hash(const char *str)
+{
+ uint32_t hash = 5381;
+ char c;
+ while((c = *str++))
+ {
+ hash = ((hash << 5) + hash) ^ c;
+ }
+
+ return hash;
+}
+
+struct varnode_t *lookup_var(const char *name)
+{
+ uint32_t hash = var_hash(name) % VARMAP_SIZE;
+
+ struct varnode_t *iter = var_map[hash];
+ struct varnode_t *last = NULL;
+
+ while(iter)
+ {
+ if(strcmp(iter->name, name) == 0)
+ return iter;
+ last = iter;
+ iter = iter->next;
+ }
+
+ /* not found in this bucket, so add it to the linked list */
+ struct varnode_t *new = malloc(sizeof(struct varnode_t));
+
+ memset(new, 0, sizeof(struct varnode_t));
+ strlcpy(new->name, name, sizeof(new->name));
+ new->val = 0;
+ new->constant = false;
+ new->next = NULL;
+
+ if(!last)
+ var_map[hash] = new;
+ else
+ last->next = new;
+
+ return new;
+}
+
+vartype getVariable(const char *name)
+{
+ return lookup_var(name)->val;
+}
+
+void setVariable(const char *name, vartype val)
+{
+ struct varnode_t *node = lookup_var(name);
+ if(!node->constant)
+ node->val = val;
+ else
+ error("attempted to modify a constant variable");
+}
+
+void setConst(const char *name, bool c)
+{
+ lookup_var(name)->constant = c;
+}
+
+void incVar(const char *name)
+{
+ struct varnode_t *node = lookup_var(name);
+ if(!node->constant)
+ ++lookup_var(name)->val;
+ else
+ error("attempted to modify a constant variable");
+}
+
+void decVar(const char *name)
+{
+ struct varnode_t *node = lookup_var(name);
+ if(!node->constant)
+ --lookup_var(name)->val;
+ else
+ error("attempted to modify a constant variable");
+}
+
+/*** Utility functions ***/
+
+void exit_handler(void)
+{
+ if(file_des >= 0)
+ close(file_des);
+ if(log_fd >= 0)
+ close(log_fd);
+ if(line_offset)
+ free(line_offset);
+ /* free all our variables */
+ for(int i = 0; i < VARMAP_SIZE; ++i)
+ {
+ struct varnode_t *iter = var_map[i], *next;
+ while(iter)
+ {
+ next = iter->next;
+ free(iter);
+ iter = next;
+ }
+ }
+}
+
+void vid_write(const char *str)
+{
+ printf("%s", str);
+}
+
+void __attribute__((format(printf,1,2))) vid_writef(const char *fmt, ...)
+{
+ char fmtbuf[256];
+
+ va_list ap;
+ va_start(ap, fmt);
+ vsnprintf(fmtbuf, sizeof(fmtbuf), fmt, ap);
+ vid_write(fmtbuf);
+ va_end(ap);
+}
+
+void __attribute__((noreturn,format(printf,1,2))) error(const char *fmt, ...)
+{
+ char fmtbuf[256];
+
+ va_list ap;
+ va_start(ap, fmt);
+ vsnprintf(fmtbuf, sizeof(fmtbuf), fmt, ap);
+ if(current_line)
+ vid_writef("Line %d: ", current_line);
+ vid_writef("ERROR: %s\n", fmtbuf);
+ va_end(ap);
+
+ exit(EXIT_FAILURE);
+}
+
+void __attribute__((format(printf,1,2))) warning(const char *fmt, ...)
+{
+ char fmtbuf[256];
+
+ va_list ap;
+ va_start(ap, fmt);
+ vsnprintf(fmtbuf, sizeof(fmtbuf), fmt, ap);
+ vid_writef("Line %d: WARNING: %s\n", current_line, fmtbuf);
+ va_end(ap);
+}
+
+/* grabs a line from a file, -1 on error, returns # bytes read otherwise */
+int read_line(int fd, char *buf, size_t sz)
+{
+ unsigned i = 0;
+ int bytes_read = 0;
+ int status = 1;
+ while(i < sz)
+ {
+ char c;
+ status = read(fd, &c, 1);
+ if(status != 1)
+ break;
+
+ ++bytes_read;
+
+ if(c == '\r')
+ continue;
+ if(c == '\n' || c == EOF)
+ {
+ break;
+ }
+
+ buf[i++] = c;
+ }
+ buf[MIN(i, sz - 1)] = '\0';
+
+ return (status <= 0)?-1:bytes_read;
+}
+
+/* index_lines() precalculates the offset of each line for faster jumping */
+/* also it does a quick pass to index all the labels */
+
+off_t *index_lines(int fd, unsigned *numlines)
+{
+ size_t sz = sizeof(off_t);
+ off_t *data = malloc(sz);
+
+ /* this uses 1-indexed line numbers, so the first indice is wasted */
+ unsigned idx = 1;
+
+ while(1)
+ {
+ sz += sizeof(off_t);
+ data = realloc(data, sz);
+ data[idx] = lseek(fd, 0, SEEK_CUR);
+
+ char buf[MAX_LINE_LEN];
+
+ if(read_line(fd, buf, sizeof(buf)) < 0)
+ break;
+
+ char *save = NULL;
+ char *tok = strtok_r(buf, " \t", &save);
+ if(tok && (strcmp(tok, "LABEL") == 0 || strcmp("LBL", tok) == 0))
+ {
+ tok = strtok_r(NULL, " \t", &save);
+ if(tok && isValidVariable(tok))
+ {
+ setVariable(tok, idx);
+ lookup_var(tok)->constant = true;
+ }
+ }
+
+ ++idx;
+ }
+
+ lseek(fd, 0, SEEK_SET);
+
+ *numlines = idx - 1;
+
+ return data;
+}
+
+void jump_line(int fd, unsigned where)
+{
+ if(1 <= where && where <= num_lines)
+ {
+ lseek(fd, line_offset[where], SEEK_SET);
+ }
+ else
+ error("JUMP target out of range (%u)", where);
+ current_line = where - 1;
+}
+
+void sub_call(int fd, unsigned where)
+{
+ if(stack_frame < ARRAYLEN(call_stack))
+ {
+ call_stack[stack_frame] = current_line + 1;
+ ++stack_frame;
+ jump_line(fd, where);
+ }
+ else
+ error("call stack overflow");
+}
+
+void sub_return(int fd)
+{
+ if(stack_frame > 0)
+ {
+ --stack_frame;
+ jump_line(fd, call_stack[stack_frame]);
+ }
+}
+
+/** Expression Parsing **/
+
+/* based on http://en.literateprograms.org/Shunting_yard_algorithm_%28C%29 */
+
+vartype eval_uminus(vartype a1, vartype a2)
+{
+ (void) a2;
+ return -a1;
+}
+vartype eval_exp(vartype a1, vartype a2)
+{
+ return a2<0 ? 0 : (a2==0?1:a1*eval_exp(a1, a2-1));
+}
+vartype eval_mul(vartype a1, vartype a2)
+{
+ return a1*a2;
+}
+vartype eval_div(vartype a1, vartype a2)
+{
+ if(!a2) {
+ error("division by zero");
+ }
+ return a1/a2;
+}
+vartype eval_mod(vartype a1, vartype a2)
+{
+ if(!a2) {
+ error("division by zero");
+ }
+ return a1%a2;
+}
+vartype eval_add(vartype a1, vartype a2)
+{
+ return a1+a2;
+}
+vartype eval_sub(vartype a1, vartype a2)
+{
+ return a1-a2;
+}
+vartype eval_eq(vartype a1, vartype a2)
+{
+ return a1 == a2;
+}
+vartype eval_neq(vartype a1, vartype a2)
+{
+ return a1 != a2;
+}
+vartype eval_leq(vartype a1, vartype a2)
+{
+ return a1 <= a2;
+}
+vartype eval_geq(vartype a1, vartype a2)
+{
+ return a1 >= a2;
+}
+vartype eval_lt(vartype a1, vartype a2)
+{
+ return a1 < a2;
+}
+vartype eval_gt(vartype a1, vartype a2)
+{
+ return a1 > a2;
+}
+vartype eval_log_neg(vartype a1, vartype a2)
+{
+ (void) a2;
+ return !a1;
+}
+vartype eval_log_and(vartype a1, vartype a2)
+{
+ return a1 && a2;
+}
+vartype eval_log_or(vartype a1, vartype a2)
+{
+ return a1 || a2;
+}
+vartype eval_bit_and(vartype a1, vartype a2)
+{
+ return a1 & a2;
+}
+vartype eval_bit_xor(vartype a1, vartype a2)
+{
+ return a1 ^ a2;
+}
+vartype eval_bit_or(vartype a1, vartype a2)
+{
+ return a1 | a2;
+}
+vartype eval_bit_comp(vartype a1, vartype a2)
+{
+ (void) a2;
+ return ~a1;
+}
+vartype eval_lsh(vartype a1, vartype a2)
+{
+ return a1 << a2;
+}
+vartype eval_rsh(vartype a1, vartype a2)
+{
+ return a1 >> a2;
+}
+vartype eval_sqrt(vartype a1, vartype a2)
+{
+ (void) a2;
+ return sqrt(a1);
+}
+
+enum {ASSOC_NONE=0, ASSOC_LEFT, ASSOC_RIGHT};
+
+/* order matters in this table, because operators can share prefixes */
+/* apart from that, they should be ordered by frequency of use */
+/* operator precedence is based on that of C */
+/* frequency is based off a crude analysis of the rockbox source tree: */
+
+/* 99639 * */
+/* 48282 - */
+/* 46639 + */
+/* 27678 & */
+/* 24542 < */
+/* 21862 / */
+/* 20000 | */
+/* 19138 == */
+/* 12694 % */
+/* 11619 > */
+/* 11087 ! */
+/* 8230 << */
+/* 7339 && */
+/* 7180 != */
+/* 6010 >> */
+/* 5575 || */
+/* 3121 ~ */
+/* 1311 ^ */
+
+/* arrays are implemented as UNARY OPERATORS */
+
+struct op_s {
+ const char *op;
+ int prec;
+ int assoc;
+ int unary;
+ vartype (*eval)(vartype a1, vartype a2);
+ unsigned int len;
+} ops[] = {
+ {"+", 20, ASSOC_LEFT, 0, eval_add, -1},
+ {"-", 20, ASSOC_LEFT, 0, eval_sub, -1},
+ {"**", 40, ASSOC_RIGHT, 0, eval_exp, -1},
+ {"*", 30, ASSOC_LEFT, 0, eval_mul, -1},
+ {"&&", 8, ASSOC_LEFT, 0, eval_log_and, -1},
+ {"&", 11, ASSOC_LEFT, 0, eval_bit_and, -1},
+ {"<<", 15, ASSOC_LEFT, 0, eval_lsh, -1},
+ {">>", 15, ASSOC_LEFT, 0, eval_rsh, -1},
+ {"<=", 14, ASSOC_LEFT, 0, eval_leq, -1},
+ {">=", 14, ASSOC_LEFT, 0, eval_geq, -1},
+ {"<", 14, ASSOC_LEFT, 0, eval_lt, -1},
+ {">", 14, ASSOC_LEFT, 0, eval_gt, -1},
+ {"/", 30, ASSOC_LEFT, 0, eval_div, -1},
+ {"||", 7, ASSOC_LEFT, 0, eval_log_or, -1},
+ {"|", 9, ASSOC_LEFT, 0, eval_bit_or, -1},
+ {"==", 12, ASSOC_LEFT, 0, eval_eq, -1},
+ {"!=", 12, ASSOC_LEFT, 0, eval_neq, -1},
+ {"%", 30, ASSOC_LEFT, 0, eval_mod, -1},
+ {"!", 50, ASSOC_LEFT, 1, eval_log_neg, -1},
+ {"~", 50, ASSOC_LEFT, 1, eval_bit_comp, -1},
+ {"^", 10, ASSOC_LEFT, 0, eval_bit_xor, -1},
+ {"(", 0, ASSOC_NONE, 0, NULL, -1},
+ {")", 0, ASSOC_NONE, 0, NULL, -1},
+ {"sqrt", 1, ASSOC_LEFT, 1, eval_sqrt, -1},
+};
+
+#define OPMAP_SIZE 25
+
+void op_hash_round(char c, uint32_t *hash)
+{
+ *hash *= 70;
+ *hash ^= c;
+}
+
+uint32_t op_hash(const char *c)
+{
+ uint32_t hash = 4412;
+ while(1)
+ {
+ if(!*c)
+ return hash;
+ op_hash_round(*c, &hash);
+ ++c;
+ }
+}
+
+/* optimized hash map for fast lookup of operators */
+struct op_s op_map[OPMAP_SIZE];
+size_t longest_op = 0;
+
+void opmap_insert(struct op_s *op)
+{
+ if(op->len > longest_op)
+ longest_op = op->len;
+
+ uint32_t hash = op_hash(op->op) % OPMAP_SIZE;
+
+ if(op_map[hash].op)
+ error("hash map collision %lu: %s VS %s", hash, op->op, op_map[hash].op);
+ memcpy(op_map+hash, op, sizeof(*op));
+}
+
+void init_optable(void)
+{
+ memset(op_map, 0, sizeof(op_map));
+ for(unsigned int i = 0; i < ARRAYLEN(ops); ++i)
+ {
+ ops[i].len = strlen(ops[i].op);
+ opmap_insert(ops+i);
+ }
+}
+
+const struct op_s *getop(const char *ch, int *len)
+{
+ unsigned int i = 0;
+ uint32_t hash = 4412;
+ const struct op_s *poss = NULL;
+ do {
+ op_hash_round(ch[i], &hash);
+ uint32_t modhash = hash % OPMAP_SIZE;
+
+ if(op_map[modhash].op && strncmp(ch, op_map[modhash].op, op_map[modhash].len) == 0)
+ {
+ *len = op_map[modhash].len;
+ poss = op_map + modhash;
+ }
+ } while(ch[i++] && i < longest_op);
+ return poss;
+}
+
+const struct op_s *opstack[MAXOPSTACK];
+int nopstack;
+
+vartype numstack[MAXNUMSTACK];
+int nnumstack;
+
+void push_opstack(const struct op_s *op)
+{
+ if(nopstack>MAXOPSTACK - 1) {
+ error("operator stack overflow");
+ }
+ opstack[nopstack++] = op;
+}
+
+const struct op_s *pop_opstack(void)
+{
+ if(!nopstack) {
+ error("operator stack empty");
+ }
+ return opstack[--nopstack];
+}
+
+void push_numstack(vartype num)
+{
+ if(nnumstack>MAXNUMSTACK - 1) {
+ error("number stack overflow");
+ }
+ numstack[nnumstack++] = num;
+}
+
+vartype pop_numstack(void)
+{
+ if(!nnumstack) {
+ error("number stack empty");
+ }
+ return numstack[--nnumstack];
+}
+
+bool isDigit(char c)
+{
+ return '0' <= c && c <= '9';
+}
+
+bool isValidNumber(char *str)
+{
+ //vid_writef("isValidNumber %s", str);
+ if(str && (isDigit(*str) || *str == '-'))
+ {
+ while(1)
+ {
+ char c = *str++;
+ if(!c)
+ break;
+ if(!isDigit(c))
+ return false;
+ }
+ return true;
+ }
+ return false;
+}
+
+bool isSpace(char c)
+{
+ //vid_writef("isSpace '%c'", c);
+ return (c == ' ') || (c == '\t');
+}
+
+bool isValidVariable(const char *c)
+{
+ //vid_writef("isValidVariable %s", c);
+ if(!isDigit(*c) && !getop(c, NULL) && !isSpace(*c))
+ {
+ return true;
+ }
+ return false;
+}
+
+vartype getValue(char *str, char *cur)
+{
+ //vid_writef("getValue %s", str);
+ if(str && isValidVariable(str))
+ {
+ /* isolate the variable name into a buffer */
+ char varname[VARNAME_MAX + 1] = { 0 };
+ memcpy(varname, str, cur - str);
+ return getVariable(varname);
+ }
+ return strtol(str, NULL, 0);
+}
+
+bool isValidNumberOrVariable(const char *c)
+{
+ //vid_writef("isValidNumberOrVariable %s", c);
+ if(isDigit(*c) || isValidVariable(c))
+ {
+ return true;
+ }
+ return false;
+}
+
+void shunt_op(const struct op_s *op)
+{
+ const struct op_s *pop;
+ vartype n1, n2;
+ if(strcmp(op->op, "(") == 0)
+ {
+ push_opstack(op);
+ return;
+ }
+ else if(strcmp(op->op, ")") == 0)
+ {
+ while(nopstack > 0 && strcmp(opstack[nopstack-1]->op, "(") != 0)
+ {
+ pop = pop_opstack();
+ n1 = pop_numstack();
+
+ if(pop->unary)
+ push_numstack(pop->eval(n1, 0));
+ else
+ {
+ n2 = pop_numstack();
+ push_numstack(pop->eval(n2, n1));
+ }
+ }
+
+ if(!(pop = pop_opstack()) || strcmp(pop->op,"(") != 0)
+ {
+ error("mismatched parentheses");
+ }
+ return;
+ }
+
+ if(op->assoc == ASSOC_LEFT)
+ {
+ while(nopstack && op->prec <= opstack[nopstack - 1]->prec)
+ {
+ pop = pop_opstack();
+ n1 = pop_numstack();
+ if(pop->unary)
+ push_numstack(pop->eval(n1, 0));
+ else
+ {
+ n2 = pop_numstack();
+ push_numstack(pop->eval(n2, n1));
+ }
+ }
+ }
+ else
+ {
+ while(nopstack && op->prec<opstack[nopstack - 1]->prec)
+ {
+ pop = pop_opstack();
+ n1 = pop_numstack();
+ if(pop->unary)
+ push_numstack(pop->eval(n1, 0));
+ else
+ {
+ n2 = pop_numstack();
+ push_numstack(pop->eval(n2, n1));
+ }
+ }
+ }
+
+ push_opstack(op);
+}
+
+vartype eval_expr(char *str)
+{
+ //vid_write("**************** EVAL EXPR ***************");
+
+ /* token start */
+ char *tstart = NULL;
+
+ /* hard-code some operators that are for internal use only */
+ const struct op_s startop = {"startop_", 0, ASSOC_NONE, 0, NULL, strlen("startop_")};
+ const struct op_s unaryminus = {"-", 50, ASSOC_RIGHT, 1, eval_uminus, strlen("-")};
+
+ const struct op_s *op = NULL;
+ vartype n1, n2;
+ const struct op_s *lastop = &startop;
+
+ nopstack = 0;
+ nnumstack = 0;
+
+ int len;
+ char *expr;
+ for(expr = str; *expr; expr += len)
+ {
+ //vid_write("****** PARSING A CHARACTER ******");
+ len = 1;
+ if(!tstart)
+ {
+ if((op = getop(expr, &len)))
+ {
+ if(lastop && (lastop == &startop || strcmp(lastop->op, ")") != 0))
+ {
+ if(strcmp(op->op, "-") == 0)
+ {
+ op = &unaryminus;
+ len = 1;
+ }
+ else if(strcmp(op->op, "(") != 0 && !op->unary)
+ {
+ error("illegal use of binary operator (%s)", op->op);
+ }
+ }
+ shunt_op(op);
+ lastop = op;
+ }
+ else if(isValidNumberOrVariable(expr))
+ tstart = expr;
+ else if(!isSpace(*expr))
+ {
+ error("syntax error");
+ }
+ }
+ else
+ {
+ if(isSpace(*expr))
+ {
+ push_numstack(getValue(tstart, expr));
+ tstart = NULL;
+ lastop = NULL;
+ }
+ else if((op = getop(expr, &len)))
+ {
+ push_numstack(getValue(tstart, expr));
+ tstart = NULL;
+ shunt_op(op);
+ lastop = op;
+ }
+ else if(!isValidNumberOrVariable(expr))
+ {
+ error("syntax error");
+ }
+ }
+ }
+
+ if(tstart)
+ push_numstack(getValue(tstart, expr));
+
+ while(nopstack) {
+ op = pop_opstack();
+ n1 = pop_numstack();
+ if(!op->unary)
+ {
+ n2 = pop_numstack();
+ push_numstack(op->eval(n2, n1));
+ }
+ else
+ push_numstack(op->eval(n1, 0));
+ }
+
+ if(nnumstack != 1) {
+ error("invalid expression");
+ }
+
+ return numstack[0];
+}
+
+#define OK 0
+#define DONE 1
+#define NEXT 2
+#define BREAK 3
+
+int let_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *varname = strtok_r(NULL, "= \t", save);
+
+ if(varname && isValidVariable(varname))
+ {
+ struct varnode_t *node = lookup_var(varname);
+ if(node->constant)
+ error("attempted to modify a constant variable");
+
+ char *tok = strtok_r(NULL, "=;", save);
+ if(tok)
+ node->val = eval_expr(tok);
+ else
+ error("exprected valid expression after LET");
+ }
+ else
+ {
+ error("invalid variable name for LET");
+ }
+ return OK;
+}
+
+int repeat_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, ";", save);
+ if(tok)
+ {
+ if(current_line == 1)
+ error("REPEAT without a previous instruction");
+ *repeats_left = eval_expr(tok) - 1;
+ jump_line(file_des, current_line - 1);
+ return NEXT;
+ }
+ else
+ error("expected valid expression after REPEAT");
+}
+
+int goto_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, ";", save);
+ if(tok)
+ {
+ jump_line(file_des, eval_expr(tok));
+ return NEXT;
+ }
+ else
+ error("expected valid expression after GOTO");
+}
+
+int call_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, "", save);
+ if(tok)
+ {
+ sub_call(file_des, eval_expr(tok));
+ return NEXT;
+ }
+ else
+ error("expected destination for CALL");
+}
+
+int ret_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ sub_return(file_des);
+ return NEXT;
+}
+
+int inc_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, " \t", save);
+ if(isValidVariable(tok))
+ incVar(tok);
+ return OK;
+}
+
+int dec_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, " \t", save);
+ if(isValidVariable(tok))
+ decVar(tok);
+ return OK;
+}
+
+int if_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, ";", save);
+
+ if(!tok)
+ error("expected conditional after IF");
+
+ /* break out of the do-while if the condition is false */
+ if(!eval_expr(tok))
+ {
+ return BREAK;
+ }
+ return OK;
+}
+
+int delay_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ /* delay N 1000ths of a sec */
+ char *tok = strtok_r(NULL, ";", save);
+ if(tok)
+ {
+ int ms = eval_expr(tok);
+ struct timespec t;
+ t.tv_sec = ms / 1000;
+ t.tv_nsec = (ms % 1000) * 1000000;
+ nanosleep(&t, NULL);
+ }
+ else
+ error("expected valid expression after DELAY");
+
+ return OK;
+}
+
+int log_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, "", save);
+
+ vid_write(tok);
+ return OK;
+}
+
+int logvar_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ char *tok = strtok_r(NULL, ";", save);
+ if(tok)
+ {
+ vid_writef(VARFORMAT, eval_expr(tok));
+ return OK;
+ }
+ else
+ error("expected expression after LOGVAR");
+}
+
+int rem_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ return BREAK;
+}
+
+int quit_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ return DONE;
+}
+
+int newline_handler(char **save, int *repeats_left)
+{
+ (void) save; (void) repeats_left;
+ vid_write("\n");
+ return OK;
+}
+
+int logchar_handler(char **save, int *repeats_left)
+{
+ (void) repeats_left;
+ char *tok = strtok_r(NULL, ";", save);
+ if(tok)
+ {
+ vid_writef("%c", eval_expr(tok));
+ return OK;
+ }
+ else
+ error("expected expression after LOGCHAR");
+
+}
+
+struct token_t {
+ const char *tok;
+ int (*func)(char **save, int *repeats_left);
+} tokens[] = {
+ { "LET", let_handler, },
+ { "REPEAT", repeat_handler, },
+ { "JUMP", goto_handler, },
+ { "GOTO", goto_handler, },
+ { "CALL", call_handler, },
+ { "GOSUB", call_handler, },
+ { "RET", ret_handler, },
+ { "RETURN", ret_handler, },
+ { "INC", inc_handler, },
+ { "DEC", dec_handler, },
+ { "IF", if_handler, },
+ { "DELAY", delay_handler, },
+ { "LOG", log_handler, },
+ { "LOGVAR", logvar_handler, },
+ { "LOGCHAR", logchar_handler },
+ { "NEWLINE", newline_handler, },
+ { "REM", rem_handler, },
+ { "//", rem_handler, },
+ { "LABEL", rem_handler, },
+ { "LBL", rem_handler, },
+ { "QUIT", quit_handler, },
+ { "EXIT", quit_handler, },
+};
+
+/* once again, this lookup table is implemented with a perfect hash map */
+
+#define TOKMAP_SIZE ARRAYLEN(tokens)
+struct token_t tokmap[TOKMAP_SIZE];
+
+/* auto-generated with mph-1.2 */
+/*
+ * d=3
+ * n=28
+ * m=22
+ * c=1.23
+ * maxlen=7
+ * minklen=2
+ * maxklen=7
+ * minchar=47
+ * maxchar=89
+ * loop=0
+ * numiter=200
+ * seed=
+ */
+
+static int g[] = {
+ 19, 12, -1, 15, 17, 1, 4, 4, 0, 13,
+ 10, 19, 18, -1, 14, 19, 19, 21, 19, 0,
+ 7, 0, 15, 18, 4, 0, 4, 3,
+};
+
+static int T0[] = {
+ 0x15, 0x0c, 0x1a, 0x17, 0x16, 0x02, 0x16, 0x07, 0x17, 0x09,
+ 0x0f, 0x0f, 0x0f, 0x17, 0x07, 0x0c, 0x1a, 0x08, 0x17, 0x04,
+ 0x14, 0x07, 0x06, 0x07, 0x10, 0x0e, 0x0e, 0x18, 0x01, 0x08,
+ 0x1b, 0x17, 0x14, 0x19, 0x12, 0x1a, 0x0b, 0x0c, 0x12, 0x07,
+ 0x05, 0x05, 0x06, 0x13, 0x06, 0x19, 0x07, 0x0d, 0x01, 0x0c,
+ 0x1a, 0x09, 0x15, 0x1b, 0x16, 0x03, 0x15, 0x19, 0x12, 0x07,
+ 0x1b, 0x05, 0x08, 0x0a, 0x15, 0x05, 0x16, 0x0b, 0x0a, 0x00,
+ 0x0e, 0x0d, 0x08, 0x0a, 0x04, 0x1b, 0x07, 0x17, 0x0c, 0x15,
+ 0x07, 0x0a, 0x02, 0x0c, 0x15, 0x08, 0x0d, 0x12, 0x10, 0x00,
+ 0x07, 0x13, 0x15, 0x10, 0x17, 0x0a, 0x0e, 0x01, 0x14, 0x14,
+ 0x1a, 0x06, 0x15, 0x05, 0x0a, 0x14, 0x03, 0x12, 0x04, 0x0c,
+ 0x11, 0x1b, 0x0e, 0x1b, 0x17, 0x03, 0x08, 0x09, 0x15, 0x08,
+ 0x15, 0x0c, 0x1b, 0x0e, 0x00, 0x16, 0x08, 0x1b, 0x08, 0x10,
+ 0x0a, 0x00, 0x09, 0x01, 0x00, 0x09, 0x13, 0x03, 0x19, 0x03,
+ 0x05, 0x15, 0x10, 0x06, 0x13, 0x02, 0x19, 0x15, 0x13, 0x12,
+ 0x18, 0x16, 0x02, 0x0b, 0x0a, 0x1b, 0x0a, 0x15, 0x08, 0x06,
+ 0x09, 0x12, 0x06, 0x12, 0x14, 0x12, 0x0c, 0x17, 0x15, 0x09,
+ 0x1a, 0x0b, 0x05, 0x00, 0x1b, 0x0c, 0x10, 0x09, 0x02, 0x17,
+ 0x11, 0x0a, 0x15, 0x11, 0x18, 0x12, 0x16, 0x00, 0x0e, 0x10,
+ 0x18, 0x11, 0x0b, 0x07, 0x0b, 0x1a, 0x1b, 0x07, 0x07, 0x15,
+ 0x0a, 0x16, 0x1a, 0x0f, 0x06, 0x19, 0x0c, 0x17, 0x06, 0x0e,
+ 0x12, 0x08, 0x18, 0x17, 0x09, 0x0c, 0x03, 0x1b, 0x15, 0x0e,
+ 0x06, 0x01, 0x11, 0x0e, 0x04, 0x08, 0x05, 0x1b, 0x05, 0x03,
+ 0x15, 0x04, 0x17, 0x10, 0x0e, 0x07, 0x0e, 0x14, 0x13, 0x17,
+ 0x14, 0x1b, 0x0a, 0x07, 0x18, 0x04, 0x03, 0x00, 0x10, 0x19,
+ 0x1a, 0x16, 0x0a, 0x0f, 0x14, 0x1a, 0x18, 0x19, 0x0c, 0x1b,
+ 0x06, 0x0a, 0x03, 0x0b, 0x0e, 0x1b, 0x1b, 0x0d, 0x03, 0x0d,
+ 0x19, 0x0a, 0x0f, 0x14, 0x14, 0x06, 0x00, 0x01, 0x10, 0x0d,
+ 0x19, 0x18, 0x09, 0x1b, 0x17, 0x16, 0x14, 0x15, 0x0b, 0x10,
+ 0x14, 0x02, 0x1b, 0x08, 0x0d, 0x0d, 0x13, 0x0c, 0x0a, 0x16,
+ 0x09,
+};
+
+static int T1[] = {
+ 0x13, 0x0e, 0x17, 0x12, 0x13, 0x12, 0x08, 0x19, 0x05, 0x0d,
+ 0x0b, 0x07, 0x06, 0x05, 0x0b, 0x0f, 0x06, 0x07, 0x12, 0x06,
+ 0x11, 0x0d, 0x08, 0x10, 0x18, 0x1b, 0x18, 0x12, 0x03, 0x00,
+ 0x00, 0x16, 0x1a, 0x07, 0x18, 0x11, 0x19, 0x10, 0x1a, 0x0e,
+ 0x0e, 0x16, 0x16, 0x02, 0x10, 0x0d, 0x11, 0x0a, 0x02, 0x14,
+ 0x00, 0x0c, 0x1a, 0x1a, 0x08, 0x02, 0x01, 0x06, 0x0b, 0x0b,
+ 0x06, 0x02, 0x13, 0x15, 0x0f, 0x11, 0x0d, 0x01, 0x04, 0x0c,
+ 0x0b, 0x13, 0x02, 0x11, 0x06, 0x12, 0x0e, 0x07, 0x01, 0x10,
+ 0x1b, 0x01, 0x01, 0x0a, 0x0b, 0x09, 0x0c, 0x13, 0x11, 0x0a,
+ 0x03, 0x11, 0x02, 0x13, 0x01, 0x08, 0x0c, 0x0a, 0x06, 0x0e,
+ 0x00, 0x13, 0x1b, 0x03, 0x12, 0x01, 0x01, 0x0e, 0x0d, 0x09,
+ 0x11, 0x1b, 0x08, 0x05, 0x0b, 0x0c, 0x02, 0x08, 0x10, 0x13,
+ 0x02, 0x13, 0x14, 0x04, 0x16, 0x15, 0x18, 0x06, 0x10, 0x13,
+ 0x1a, 0x01, 0x03, 0x16, 0x17, 0x12, 0x1b, 0x10, 0x0f, 0x0f,
+ 0x06, 0x0f, 0x0f, 0x1a, 0x10, 0x17, 0x18, 0x09, 0x06, 0x10,
+ 0x01, 0x03, 0x06, 0x0d, 0x03, 0x0d, 0x0d, 0x0f, 0x16, 0x09,
+ 0x13, 0x14, 0x0b, 0x16, 0x1a, 0x12, 0x0d, 0x1a, 0x06, 0x00,
+ 0x19, 0x18, 0x17, 0x18, 0x1b, 0x10, 0x0d, 0x14, 0x17, 0x16,
+ 0x0a, 0x04, 0x0e, 0x03, 0x10, 0x1a, 0x01, 0x10, 0x19, 0x04,
+ 0x09, 0x0f, 0x08, 0x0b, 0x1a, 0x0f, 0x0f, 0x09, 0x09, 0x1b,
+ 0x18, 0x08, 0x16, 0x03, 0x10, 0x05, 0x14, 0x02, 0x19, 0x0f,
+ 0x18, 0x13, 0x03, 0x16, 0x06, 0x1b, 0x01, 0x0f, 0x19, 0x0d,
+ 0x00, 0x0a, 0x11, 0x0f, 0x0d, 0x0e, 0x08, 0x10, 0x1b, 0x0c,
+ 0x1b, 0x19, 0x08, 0x17, 0x0c, 0x1b, 0x0a, 0x12, 0x0d, 0x0f,
+ 0x0a, 0x14, 0x04, 0x0f, 0x0b, 0x05, 0x0f, 0x18, 0x04, 0x18,
+ 0x09, 0x05, 0x06, 0x1b, 0x04, 0x13, 0x19, 0x0c, 0x1b, 0x0c,
+ 0x18, 0x19, 0x08, 0x0e, 0x11, 0x0b, 0x03, 0x16, 0x1b, 0x15,
+ 0x11, 0x14, 0x09, 0x09, 0x17, 0x0e, 0x12, 0x1a, 0x14, 0x12,
+ 0x19, 0x08, 0x16, 0x07, 0x12, 0x0a, 0x17, 0x14, 0x13, 0x06,
+ 0x10, 0x0f, 0x03, 0x18, 0x0d, 0x04, 0x13, 0x10, 0x1b, 0x03,
+ 0x09,
+};
+
+static int T2[] = {
+ 0x16, 0x04, 0x18, 0x10, 0x13, 0x0f, 0x08, 0x19, 0x19, 0x17,
+ 0x13, 0x0b, 0x0b, 0x08, 0x0a, 0x08, 0x01, 0x05, 0x15, 0x1a,
+ 0x11, 0x02, 0x16, 0x0f, 0x0d, 0x09, 0x16, 0x13, 0x17, 0x0d,
+ 0x05, 0x11, 0x11, 0x0d, 0x05, 0x14, 0x01, 0x19, 0x12, 0x0a,
+ 0x15, 0x15, 0x15, 0x17, 0x13, 0x15, 0x0e, 0x18, 0x11, 0x0f,
+ 0x03, 0x04, 0x03, 0x09, 0x1a, 0x13, 0x04, 0x08, 0x09, 0x07,
+ 0x15, 0x16, 0x05, 0x11, 0x02, 0x00, 0x15, 0x10, 0x1b, 0x0d,
+ 0x14, 0x18, 0x10, 0x0f, 0x13, 0x13, 0x14, 0x11, 0x10, 0x0a,
+ 0x05, 0x03, 0x1a, 0x14, 0x0d, 0x19, 0x05, 0x1a, 0x1a, 0x00,
+ 0x06, 0x0c, 0x07, 0x11, 0x01, 0x18, 0x12, 0x06, 0x02, 0x06,
+ 0x1a, 0x17, 0x03, 0x0d, 0x09, 0x02, 0x09, 0x19, 0x03, 0x01,
+ 0x16, 0x0d, 0x17, 0x10, 0x01, 0x06, 0x18, 0x06, 0x10, 0x16,
+ 0x07, 0x06, 0x12, 0x1a, 0x17, 0x04, 0x16, 0x19, 0x0a, 0x1b,
+ 0x15, 0x16, 0x13, 0x11, 0x09, 0x1b, 0x02, 0x05, 0x12, 0x0c,
+ 0x10, 0x11, 0x08, 0x0f, 0x0c, 0x05, 0x0d, 0x0f, 0x19, 0x01,
+ 0x1b, 0x17, 0x03, 0x08, 0x00, 0x1a, 0x0d, 0x0c, 0x07, 0x19,
+ 0x17, 0x01, 0x03, 0x0e, 0x02, 0x18, 0x19, 0x10, 0x02, 0x00,
+ 0x0c, 0x02, 0x0a, 0x0b, 0x1a, 0x11, 0x19, 0x01, 0x16, 0x02,
+ 0x09, 0x01, 0x10, 0x1a, 0x0c, 0x0c, 0x12, 0x10, 0x18, 0x1b,
+ 0x14, 0x17, 0x17, 0x12, 0x1b, 0x08, 0x0d, 0x0c, 0x07, 0x1a,
+ 0x04, 0x03, 0x0b, 0x0e, 0x1b, 0x16, 0x10, 0x08, 0x17, 0x16,
+ 0x16, 0x10, 0x17, 0x0a, 0x1a, 0x0c, 0x17, 0x0f, 0x0a, 0x19,
+ 0x00, 0x0c, 0x08, 0x11, 0x17, 0x09, 0x17, 0x0f, 0x00, 0x05,
+ 0x17, 0x05, 0x05, 0x17, 0x17, 0x15, 0x0f, 0x00, 0x00, 0x19,
+ 0x0c, 0x19, 0x0f, 0x11, 0x08, 0x18, 0x01, 0x10, 0x17, 0x17,
+ 0x0d, 0x18, 0x13, 0x15, 0x0d, 0x0e, 0x0e, 0x09, 0x05, 0x17,
+ 0x14, 0x17, 0x16, 0x16, 0x1b, 0x10, 0x10, 0x0c, 0x06, 0x02,
+ 0x17, 0x12, 0x05, 0x08, 0x12, 0x00, 0x0b, 0x17, 0x07, 0x12,
+ 0x08, 0x01, 0x18, 0x0a, 0x19, 0x16, 0x01, 0x0b, 0x12, 0x12,
+ 0x06, 0x0a, 0x0e, 0x0c, 0x10, 0x0d, 0x00, 0x04, 0x19, 0x12,
+ 0x06,
+};
+
+#define uchar unsigned char
+
+int
+tok_hash(const uchar *key)
+{
+ int i;
+ unsigned f0, f1, f2;
+ const uchar *kp = key;
+
+ for (i=-47, f0=f1=f2=0; *kp; ++kp) {
+ if (*kp < 47 || *kp > 89)
+ return -1;
+ if (kp-key > 6)
+ return -1;
+ f0 += T0[i + *kp];
+ f1 += T1[i + *kp];
+ f2 += T2[i + *kp];
+ i += 43;
+ }
+
+ if (kp-key < 2)
+ return -1;
+
+ f0 %= 28;
+ f1 %= 28;
+ f2 %= 28;
+
+ return (g[f0] + g[f1] + g[f2]) % 22;
+}
+
+void tokmap_insert(struct token_t *tok)
+{
+ uint32_t hash = tok_hash(tok->tok) % TOKMAP_SIZE;
+ if(hash < 0 || tokmap[hash].tok)
+ error("FIXME: hash map collision");
+ memcpy(tokmap+hash, tok, sizeof(*tok));
+}
+
+void init_tokmap(void)
+{
+ memset(tokmap, 0, sizeof(tokmap));
+ for(unsigned int i = 0; i < ARRAYLEN(tokens); ++i)
+ {
+ tokmap_insert(tokens+i);
+ }
+}
+
+void init_globals(void)
+{
+ line_offset = NULL;
+ log_fd = -1;
+ file_des = -1;
+ stack_frame = 0;
+ lines_executed = 0;
+ current_line = 0;
+ memset(var_map, 0, sizeof(var_map));
+}
+
+void ducky_main(int fd, bool verbose)
+{
+ init_globals();
+
+ if(verbose)
+ {
+ vid_write("*** DS-2 INIT ***");
+ vid_write("QUACK AT YOUR OWN RISK!");
+ vid_write("The author assumes no liability for any damages caused by this program.");
+ }
+
+ file_des = fd;
+
+ atexit(exit_handler);
+
+ if(file_des < 0)
+ error("invalid file");
+
+ init_optable();
+ init_tokmap();
+
+ /* initialize the "." variable, which is the line counter */
+ setVariable(".", 0);
+ setConst(".", true);
+
+ struct varnode_t *dot_var = lookup_var(".");
+
+ /* initialize some other constants */
+ setVariable("true", 1);
+ setConst("true", true);
+
+ setVariable("false", 0);
+ setConst("false", true);
+
+ line_offset = index_lines(file_des, &num_lines);
+ if(verbose)
+ {
+ vid_writef("Indexing complete (%u lines).", num_lines);
+
+ vid_write("Executing...");
+ }
+ int repeats_left = 0;
+
+ while(1)
+ {
+ char instr_buf[MAX_LINE_LEN];
+ memset(instr_buf, 0, sizeof(instr_buf));
+ if(read_line(file_des, instr_buf, sizeof(instr_buf)) <= 0)
+ {
+ if(verbose)
+ vid_writef("end of file");
+ goto done;
+ }
+ char *tok = NULL, *save = NULL;
+
+ ++current_line;
+ dot_var->val = current_line;
+ ++lines_executed;
+
+ char *buf = instr_buf;
+
+ /* execute all the commands on this line/instruction */
+ do {
+ tok = strtok_r(buf, " -\t", &save);
+ buf = NULL;
+
+ if(!tok)
+ break;
+
+ int hash = tok_hash(tok) % TOKMAP_SIZE;
+ struct token_t *t = tokmap+hash;
+ if(hash >= 0 && strcmp(t->tok, tok) == 0)
+ switch(tokmap[hash].func(&save, &repeats_left))
+ {
+ case OK:
+ break;
+ case BREAK:
+ goto break_out;
+ case DONE:
+ goto done;
+ case NEXT:
+ goto next_line;
+ default:
+ error("FIXME: invalid return value");
+ }
+ else if(tok[0] != '#')
+ {
+ error("unknown token `%s` on line %d %d", tok, current_line);
+ goto done;
+ }
+ } while(tok);
+ break_out:
+
+ if(repeats_left > 0)
+ {
+ --repeats_left;
+ if(repeats_left)
+ jump_line(file_des, current_line);
+ else
+ {
+ if(current_line + 2 > num_lines)
+ goto done;
+ jump_line(file_des, current_line + 2);
+ }
+ }
+ next_line:
+ ;
+ }
+
+done:
+
+ return;
+}