#include #include #include #include /* simple tagging * ends in 00: pointer * 01: fixnum * 011: symbol * 111: immediate symbol * 0110: char * 1110: other immediate object (NULL, TRUE, FALSE) */ #define SEXP_FIXNUM_BITS 2 #define SEXP_IMMEDIATE_BITS 3 #define SEXP_EXTENDED_BITS 4 #define SEXP_FIXNUM_MASK 3 #define SEXP_IMMEDIATE_MASK 7 #define SEXP_EXTENDED_MASK 15 #define SEXP_POINTER_TAG 0 #define SEXP_FIXNUM_TAG 1 #define SEXP_LSYMBOL_TAG 3 #define SEXP_ISYMBOL_TAG 7 #define SEXP_CHAR_TAG 6 enum sexp_types { SEXP_FIXNUM, SEXP_CHAR, SEXP_BOOLEAN, SEXP_PAIR, SEXP_SYMBOL, SEXP_STRING, SEXP_VECTOR, SEXP_PROCEDURE, SEXP_ENV, SEXP_BYTECODE, SEXP_CORE, SEXP_OPCODE, }; typedef struct sexp_struct { char tag; void *data1; void *data2; } *sexp; #include "sexp-hufftabs.c" static int initialized_p = 0; /* static sexp the_dot_symbol; */ static sexp the_quote_symbol; static sexp the_quasiquote_symbol; static sexp the_unquote_symbol; static sexp the_unquote_splicing_symbol; static sexp the_lambda_symbol; static sexp the_begin_symbol; static sexp the_define_symbol; static sexp the_set_x_symbol; static sexp the_if_symbol; #define MAKE_IMMEDIATE(n) ((sexp) ((n<<4) + 14)) #define SEXP_NULL MAKE_IMMEDIATE(0) #define SEXP_FALSE MAKE_IMMEDIATE(1) #define SEXP_TRUE MAKE_IMMEDIATE(2) #define SEXP_EOF MAKE_IMMEDIATE(3) #define SEXP_UNDEF MAKE_IMMEDIATE(4) #define SEXP_ERROR MAKE_IMMEDIATE(5) #define SEXP_CLOSE MAKE_IMMEDIATE(6) /* internal use */ #define SEXP_RAWDOT MAKE_IMMEDIATE(7) /* internal use */ #define SEXP_NULLP(x) ((x) == SEXP_NULL) #define SEXP_POINTERP(x) (((unsigned long)(x) & SEXP_FIXNUM_MASK) == SEXP_POINTER_TAG) #define SEXP_INTEGERP(x) (((unsigned long)(x) & SEXP_FIXNUM_MASK) == SEXP_FIXNUM_TAG) #define SEXP_ISYMBOLP(x) (((unsigned long)(x) & SEXP_IMMEDIATE_MASK) == SEXP_ISYMBOL_TAG) #define SEXP_CHARP(x) (((unsigned long)(x) & SEXP_EXTENDED_MASK) == SEXP_CHAR_TAG) #define SEXP_BOOLEANP(x) (((x) == SEXP_TRUE) || ((x) == SEXP_FALSE)) #define SEXP_PAIRP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_PAIR) #define SEXP_STRINGP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_STRING) #define SEXP_LSYMBOLP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_SYMBOL) #define SEXP_VECTORP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_VECTOR) #define SEXP_PROCEDUREP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_PROCEDURE) #define SEXP_ENVP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_ENV) #define SEXP_BYTECODEP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag ==SEXP_BYTECODE) #define SEXP_COREP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_CORE) #define SEXP_OPCODEP(x) (SEXP_POINTERP(x) && ((sexp)(x))->tag == SEXP_OPCODE) #define SEXP_SYMBOLP(x) (SEXP_ISYMBOLP(x) || SEXP_LSYMBOLP(x)) /* #define SEXP_DOTP(x) (SEXP_SYMBOLP(x) && (strncmp(string_data(x), ".", 2) == 0)) */ /* #define SEXP_DOTP(x) (x==the_dot_symbol) */ #define SEXP_DOTP(x) (((unsigned long)(x))==((0x5D00<>SEXP_FIXNUM_BITS) #define make_character(n) ((sexp) (((long) n<>SEXP_EXTENDED_BITS) #define vector_length(x) ((unsigned long) x->data1) #define vector_data(x) ((sexp*) x->data2) #define procedure_code(x) ((bytecode) ((sexp)x)->data1) #define procedure_vars(x) ((sexp) ((sexp)x)->data2) #define string_length(x) ((unsigned long) x->data1) #define string_data(x) ((char*) x->data2) #define symbol_pointer(x) ((sexp) (((unsigned long)x)-SEXP_LSYMBOL_TAG)) #define symbol_length(x) ((unsigned long) (symbol_pointer(x)->data1)) #define symbol_data(x) ((char*) (symbol_pointer(x)->data2)) #define sexp_add(a, b) ((sexp)(((unsigned long)a)+((unsigned long)b)-SEXP_FIXNUM_TAG)) #define sexp_sub(a, b) ((sexp)(((unsigned long)a)-((unsigned long)b)+SEXP_FIXNUM_TAG)) #define sexp_mul(a, b) ((sexp)((((((unsigned long)a)-SEXP_FIXNUM_TAG)*(((unsigned long)b)>>SEXP_FIXNUM_BITS))+SEXP_FIXNUM_TAG))) #define sexp_div(a, b) ((sexp)(((((unsigned long)a)>>SEXP_FIXNUM_BITS)/(((unsigned long)b)>>SEXP_FIXNUM_BITS))<>SEXP_FIXNUM_BITS)%(((unsigned long)b)>>SEXP_FIXNUM_BITS))<tag = SEXP_PAIR; pair->data1 = (void*) head; pair->data2 = (void*) tail; return pair; } #define list2(a, b) cons(a, cons(b, SEXP_NULL)) #define list3(a, b, c) cons(a, cons(b, cons(c, SEXP_NULL))) #define list4(a, b, c, d) cons(a, cons(b, cons(c, cons(d, SEXP_NULL)))) #define SEXP_CAR(x) (((sexp)x)->data1) #define SEXP_CDR(x) (((sexp)x)->data2) #define SEXP_CAAR(x) (SEXP_CAR(SEXP_CAR(x))) #define SEXP_CADR(x) (SEXP_CAR(SEXP_CDR(x))) #define SEXP_CDAR(x) (SEXP_CDR(SEXP_CAR(x))) #define SEXP_CDDR(x) (SEXP_CDR(SEXP_CDR(x))) #define SEXP_CADDR(x) (SEXP_CAR(SEXP_CDDR(x))) #define SEXP_CDDDR(x) (SEXP_CDR(SEXP_CDDR(x))) #define SEXP_CADDDR(x) (SEXP_CADR(SEXP_CDDR(x))) #define SEXP_CDDDDR(x) (SEXP_CDDR(SEXP_CDDR(x))) sexp read_sexp (FILE *in); /* separators: space, tab, newline, ; () [] , ' " */ /* 9 10 11 12 13 32 34 39 40 41 44 59 91 93 */ /* 0 1 2 3 4 23 25 30 31 32 35 50 82 84 */ /* 0000000 */ /* 0000001 */ /* 0000010 */ /* 0000011 */ /* 0000100 */ /* 0010111 */ /* 0011001 */ /* 0011110 */ /* 0011111 */ /* 0100000 */ /* 0100011 */ /* 0110010 */ /* 1010010 */ /* 1010100 */ static char separators[] = { /* 1 2 3 4 5 6 7 8 9 a b c d e f */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, /* x0_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* x1_ */ 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, /* x2_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, /* x3_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* x4_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, /* x5_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* x6_ */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* x7_ */ }; static int is_separator (int c) { /* return (!((c-9)&(~3))) | (~(c^4)); */ return 0tag = SEXP_STRING; s->data1 = (void*) len; s->data2 = (void*) mystr; return s; } struct huff_entry { unsigned char len; unsigned short bits; }; static struct huff_entry huff_table[] = { #include "sexp-huff.c" }; /* http://planetmath.org/encyclopedia/GoodHashTablePrimes.html */ static sexp* symbol_table = NULL; static unsigned long symbol_table_primes[] = { 97, 389, 1543, 6151, 12289, 24593, 49157, 98317, 196613, 393241, 786433, 1572869, 3145739, 6291469, 12582917, 25165843, 50331653, 100663319, 201326611, 402653189, 805306457, 1610612741}; static int symbol_table_prime_index = 0; static int symbol_table_count = 0; #define FNV_PRIME 16777619 #define FNV_OFFSET_BASIS 2166136261uL int string_hash(char *str, int acc) { while (*str) {acc *= FNV_PRIME; acc ^= *str++;} return acc; } sexp intern(char *str) { struct huff_entry he; unsigned long len, res=FNV_OFFSET_BASIS, space=3, newbits, i, d, cell; char c, *mystr, *p=str; sexp sym, *newtable; res = 0; for (p=str; c=*p; p++) { he = huff_table[c]; newbits = he.len; if ((space+newbits) > (sizeof(sexp)*8)) { goto normal_intern; } res |= (((unsigned long) he.bits) << space); space += newbits; } /* fprintf(stderr, "immediate symbol: %x\n", res); */ return (sexp) (res + SEXP_ISYMBOL_TAG); normal_intern: /* fprintf(stderr, "normal intern\n"); */ res = string_hash(p, res); d = symbol_table_primes[symbol_table_prime_index]; cell = res % d; for (i=0; i d*4) { fprintf(stderr, "resizing symbol table\n"); newtable = malloc(symbol_table_primes[symbol_table_prime_index++] * sizeof(sexp)); free(symbol_table); symbol_table = newtable; } new_entry: sym = SEXP_NEW(); if (! sym) return SEXP_ERROR; len = strlen(str); mystr = SEXP_ALLOC(len+1); if (! mystr) { SEXP_FREE(sym); return SEXP_ERROR; } memcpy(mystr, str, len+1); sym->tag = SEXP_SYMBOL; sym->data1 = (void*) len; sym->data2 = (void*) mystr; symbol_table[cell] = (sexp) (((unsigned long)sym) + 3); return symbol_table[cell]; } sexp make_vector(unsigned long len, sexp dflt) { int i; sexp v = SEXP_NEW(); if (v == NULL) return SEXP_ERROR; sexp *x = (void*) SEXP_ALLOC(len*sizeof(sexp)); if (x == NULL) return SEXP_ERROR; for (i=0; itag = SEXP_VECTOR; v->data1 = (void*) len; v->data2 = (void*) x; return v; } sexp list_to_vector(sexp ls) { sexp vec = make_vector(length(ls), SEXP_FALSE); if (vec == SEXP_ERROR) return vec; sexp x; sexp *elts = vector_data(vec); int i; for (i=0, x=ls; SEXP_PAIRP(x); i++, x=cdr(x)) { elts[i] = car(x); } return vec; } sexp vector(int count, ...) { sexp vec = make_vector(count, SEXP_FALSE); if (vec == SEXP_ERROR) return vec; sexp *elts = vector_data(vec); va_list ap; int i; va_start(ap, count); for (i=0; i"); } else if (SEXP_POINTERP(obj)) { switch (obj->tag) { case SEXP_PAIR: fprintf(out, "("); write_sexp(out, car(obj)); for (x=cdr(obj); SEXP_PAIRP(x); x=cdr(x)) { fprintf(out, " "); write_sexp(out, car(x)); } if (! SEXP_NULLP(x)) { fprintf(out, " . "); write_sexp(out, x); } fprintf(out, ")"); break; case SEXP_VECTOR: len = vector_length(obj); sexp *elts = vector_data(obj); if (len == 0) { fprintf(out, "#()"); } else { fprintf(out, "#("); write_sexp(out, elts[0]); for (i=1; i"); break; case SEXP_STRING: fprintf(out, "\""); /* FALLTHROUGH */ case SEXP_SYMBOL: fprintf(out, "%s", string_data(obj)); if (obj->tag == SEXP_STRING) { fprintf(out, "\""); } break; } } else if (SEXP_INTEGERP(obj)) { fprintf(out, "%d", unbox_integer(obj)); } else if (SEXP_CHARP(obj)) { if (33 <= unbox_character(obj) < 127) { fprintf(out, "#\\%c", unbox_character(obj)); } else { fprintf(out, "#\\x%02d", unbox_character(obj)); } } else if (SEXP_SYMBOLP(obj)) { if (((unsigned long)obj&7)==7) { c = ((unsigned long)obj)>>3; while (c) { #include "sexp-unhuff.c" putc(res, out); } } else { fprintf(out, "%s", symbol_data(obj)); } } else { switch ((unsigned long) obj) { case (int) SEXP_NULL: fprintf(out, "()"); break; case (int) SEXP_TRUE: fprintf(out, "#t"); break; case (int) SEXP_FALSE: fprintf(out, "#f"); break; case (int) SEXP_EOF: fprintf(out, "#"); break; case (int) SEXP_UNDEF: fprintf(out, "#"); break; default: fprintf(out, "#"); } } } void* free_sexp (sexp obj) { int len, i; sexp *elts; if (SEXP_POINTERP(obj)) { switch (obj->tag) { case SEXP_PAIR: free_sexp(car(obj)); free_sexp(cdr(obj)); break; case SEXP_VECTOR: len = vector_length(obj); elts = vector_data(obj); for (i=0; i #else #define errx(code, msg, ...) (fprintf(stderr,msg"\n",__VA_ARGS__), exit(code)) #endif #define INIT_BCODE_SIZE 128 #define INIT_STACK_SIZE 1024 typedef struct bytecode { char tag; unsigned int len; unsigned char data[]; } *bytecode; /* env binding: #(id chain offset flags) */ /* chain is the index into the closure parent list (0 for current lambda) */ /* macros/constants have a value instead of chain */ typedef struct env { char tag; struct env *parent; sexp bindings; } *env; enum core_form_names { CORE_DEFINE, CORE_SET, CORE_LAMBDA, CORE_IF, CORE_BEGIN, CORE_QUOTE, CORE_DEFINE_SYNTAX, CORE_LET_SYNTAX, CORE_LETREC_SYNTAX, }; typedef struct core_form { char tag; char* name; char code; } *core_form; static struct core_form core_forms[] = { {SEXP_CORE, "define", CORE_DEFINE}, {SEXP_CORE, "set!", CORE_SET}, {SEXP_CORE, "lambda", CORE_LAMBDA}, {SEXP_CORE, "if", CORE_IF}, {SEXP_CORE, "begin", CORE_BEGIN}, {SEXP_CORE, "quote", CORE_QUOTE}, {SEXP_CORE, "define-syntax", CORE_DEFINE_SYNTAX}, {SEXP_CORE, "let-syntax", CORE_LET_SYNTAX}, {SEXP_CORE, "letrec-syntax", CORE_LETREC_SYNTAX}, }; enum opcode_classes { OPC_GENERIC, OPC_TYPE_PREDICATE, OPC_PREDICATE, OPC_ARITHMETIC, OPC_ARITHMETIC_INV, OPC_ARITHMETIC_CMP, OPC_CONSTRUCTOR, }; /* #define OP_UNSAFE(op) ((op)+128) */ enum opcode_names { OP_NOOP, OP_STACK_REF, OP_STACK_SET, OP_GLOBAL_REF, OP_GLOBAL_SET, OP_CLOSURE_REF, OP_CLOSURE_SET, OP_PUSH, OP_DUP, OP_DROP, OP_SWAP, OP_CAR, OP_CDR, OP_CONS, OP_ADD, OP_SUB, OP_MUL, OP_DIV, OP_MOD, OP_NEG, OP_INV, OP_LT, OP_CALL, OP_JUMP_UNLESS, OP_JUMP, OP_RET, OP_DONE, }; typedef struct opcode { char tag; char op_class; char op_name; char num_args; char var_args_p; char arg1_type; char arg2_type; char* name; sexp proc; } *opcode; static struct opcode opcodes[] = { {SEXP_OPCODE, OPC_TYPE_PREDICATE, OP_CAR, 1, 0, SEXP_PAIR, 0, "car", NULL}, {SEXP_OPCODE, OPC_TYPE_PREDICATE, OP_CDR, 1, 0, SEXP_PAIR, 0, "cdr", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC, OP_ADD, 0, 1, SEXP_FIXNUM, 0, "+", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC_INV, OP_SUB, 0, 1, SEXP_FIXNUM, 0, "-", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC, OP_MUL, 0, 1, SEXP_FIXNUM, 0, "*", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC_INV, OP_DIV, 0, 1, SEXP_FIXNUM, 0, "/", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC, OP_MOD, 2, 0, SEXP_FIXNUM, SEXP_FIXNUM, "%", NULL}, {SEXP_OPCODE, OPC_ARITHMETIC_CMP, OP_LT, 0, 1, SEXP_FIXNUM, 0, "<", NULL}, }; sexp env_cell(env e, sexp key) { sexp ls, res=NULL; do { for (ls=e->bindings; SEXP_PAIRP(ls); ls=SEXP_CDR(ls)) { if (SEXP_CAAR(ls) == key) { res = SEXP_CAR(ls); break; } } e = e->parent; } while (e && ! res); return res; } sexp make_procedure(sexp bc, sexp vars) { sexp proc = SEXP_NEW(); if (! proc) return SEXP_ERROR; proc->tag = SEXP_PROCEDURE; proc->data1 = (void*) bc; proc->data2 = (void*) vars; return proc; } void env_define(env e, sexp key, sexp value) { sexp cell = env_cell(e, key); if (cell) { SEXP_CDR(cell) = value; } else { e->bindings = cons(cons(key, value), e->bindings); } } env make_standard_env() { int i; env e = (env) malloc(sizeof(struct env)); e->tag = SEXP_ENV; e->parent = NULL; e->bindings = SEXP_NULL; for (i=0; i<(sizeof(core_forms)/sizeof(struct core_form)); i++) { env_define(e, intern(core_forms[i].name), (sexp)(&core_forms[i])); } for (i=0; i<(sizeof(opcodes)/sizeof(struct opcode)); i++) { env_define(e, intern(opcodes[i].name), (sexp)(&opcodes[i])); } return e; } /* ******************************************************************** */ /* char *buffncpy(char *buf, unsigned int n, unsigned int len) { */ /* char *res; */ /* if (n==len) { */ /* res = buf; */ /* } else { */ /* res = (char*) malloc(n); */ /* strncpy(res, buf, n); */ /* free(buf); */ /* } */ /* return res; */ /* } */ /* char *buffngrow(char *buf, unsigned int newlen) { */ /* char *tmp = (char*) malloc(newlen); */ /* strncpy(tmp, buf, newlen/2); */ /* free(buf); */ /* return tmp; */ /* } */ void print_bytecode (bytecode bc) { int i; fprintf(stderr, "bytecode @ %p, data @ %p, length = %d\n", bc, bc->data, bc->len); for (i=0; i+8 < bc->len; i+=8) { fprintf(stderr, "%02x: %02x %02x %02x %02x %02x %02x %02x %02x\n", i, bc->data[i], bc->data[i+1], bc->data[i+2], bc->data[i+3], bc->data[i+4], bc->data[i+5], bc->data[i+6], bc->data[i+7]); } if (i != bc->len) { fprintf(stderr, "%02x:", i); for ( ; i < bc->len; i++) { fprintf(stderr, " %02x", bc->data[i]); } fprintf(stderr, "\n"); } } void print_stack (sexp *stack, int top) { int i; for (i=0; ilen != i) { fprintf(stderr, "shrinking to %d\n", i); tmp = (bytecode) malloc(sizeof(struct bytecode) + i); tmp->tag = SEXP_BYTECODE; tmp->len = i; memcpy(tmp->data, (*bc)->data, i); SEXP_FREE(*bc); *bc = tmp; } } void emit(bytecode *bc, unsigned int *i, char c) { bytecode tmp; if ((*bc)->len < (*i)+1) { fprintf(stderr, "expanding (%d < %d)\n", (*bc)->len, (*i)+1); tmp = (bytecode) malloc(sizeof(unsigned int) + (*bc)->len*2); tmp->len = (*bc)->len*2; memcpy(tmp->data, (*bc)->data, (*bc)->len); SEXP_FREE(*bc); *bc = tmp; } (*bc)->data[(*i)++] = c; } void emit_word(bytecode *bc, unsigned int *i, unsigned long val) { bytecode tmp; if ((*bc)->len < (*i)+4) { tmp = (bytecode) malloc(sizeof(unsigned int) + (*bc)->len*2); tmp->len = (*bc)->len*2; memcpy(tmp->data, (*bc)->data, (*bc)->len); SEXP_FREE(*bc); *bc = tmp; } *((unsigned long*)(&((*bc)->data[*i]))) = val; *i += sizeof(unsigned long); } bytecode compile(sexp params, sexp obj, env e, int done_p); void analyze_app (sexp obj, bytecode *bc, unsigned int *i, env e, sexp params, unsigned int *d); void analyze_lambda (sexp name, sexp formals, sexp body, bytecode *bc, unsigned int *i, env e, sexp params, unsigned int *d); void analyze(sexp obj, bytecode *bc, unsigned int *i, env e, sexp params, unsigned int *d) { int tmp1, tmp2; env e2 = e; sexp o1, o2, cell; if (SEXP_PAIRP(obj)) { /* fprintf(stderr, ":: pair\n"); */ if (SEXP_SYMBOLP(SEXP_CAR(obj))) { fprintf(stderr, ":: symbol application\n"); o1 = env_cell(e, SEXP_CAR(obj)); /* fprintf(stderr, ":: => %p\n", o1); */ if (! o1) errx(1, "unknown operator: %s", SEXP_CAR(obj)); o1 = SEXP_CDR(o1); /* fprintf(stderr, ":: => %p\n", o1); */ if (SEXP_COREP(o1)) { /* core form */ fprintf(stderr, ":: core form\n"); switch (((core_form)o1)->code) { case CORE_LAMBDA: fprintf(stderr, ":: lambda\n"); analyze_lambda(SEXP_FALSE, SEXP_CADR(obj), SEXP_CADDR(obj), bc, i, e, params, d); break; case CORE_DEFINE: case CORE_SET: fprintf(stderr, "compiling global set: %p\n", SEXP_CADR(obj)); if ((((core_form)o1)->code == CORE_DEFINE) && SEXP_PAIRP(SEXP_CADR(obj))) { analyze_lambda(SEXP_CAR(SEXP_CADR(obj)), SEXP_CDR(SEXP_CADR(obj)), SEXP_CADDR(obj), bc, i, e, params, d); } else { analyze(SEXP_CADDR(obj), bc, i, e, params, d); } emit(bc, i, OP_GLOBAL_SET); emit_word(bc, i, (unsigned long) (SEXP_PAIRP(SEXP_CADR(obj)) ? SEXP_CAR(SEXP_CADR(obj)) : SEXP_CADR(obj))); emit(bc, i, OP_PUSH); (*d)++; emit_word(bc, i, (unsigned long) SEXP_UNDEF); break; case CORE_BEGIN: for (o2 = SEXP_CDR(obj); SEXP_PAIRP(o2); o2 = SEXP_CDR(o2)) { analyze(SEXP_CAR(o2), bc, i, e, params, d); } break; case CORE_IF: fprintf(stderr, "test clause: %d\n", *i); analyze(SEXP_CADR(obj), bc, i, e, params, d); emit(bc, i, OP_JUMP_UNLESS); /* jumps if test fails */ tmp1 = *i; emit(bc, i, 0); fprintf(stderr, "pass clause: %d\n", *i); analyze(SEXP_CADDR(obj), bc, i, e, params, d); emit(bc, i, OP_JUMP); tmp2 = *i; emit(bc, i, 0); ((signed char*) (*bc)->data)[tmp1] = (*i)-tmp1-1; /* patch */ fprintf(stderr, "fail clause: %d\n", *i); if (SEXP_PAIRP(SEXP_CDDDR(obj))) { analyze(SEXP_CADDDR(obj), bc, i, e, params, d); } else { emit(bc, i, OP_PUSH); (*d)++; emit_word(bc, i, (unsigned long) SEXP_UNDEF); } ((signed char*) (*bc)->data)[tmp2] = (*i)-tmp2-1; /* patch */ break; case CORE_QUOTE: emit(bc, i, OP_PUSH); (*d)++; emit_word(bc, i, (unsigned long)SEXP_CADR(obj)); break; default: errx(1, "unknown core form: %s", ((core_form)o1)->code); } } else if (SEXP_OPCODEP(o1)) { fprintf(stderr, ":: opcode\n"); /* direct opcode */ /* verify arity */ switch (((opcode)o1)->op_class) { case OPC_TYPE_PREDICATE: case OPC_PREDICATE: case OPC_ARITHMETIC: case OPC_ARITHMETIC_CMP: /* fprintf(stderr, ":: class: %d\n", ((opcode)o1)->op_class); */ for (o2 = reverse(SEXP_CDR(obj)); SEXP_PAIRP(o2); o2 = SEXP_CDR(o2)) { /* fprintf(stderr, ":: arg: %d\n", SEXP_CAR(o2)); */ analyze(SEXP_CAR(o2), bc, i, e, params, d); } fprintf(stderr, ":: name: %d\n", ((opcode)o1)->op_name); emit(bc, i, ((opcode)o1)->op_name); (*d) -= length(SEXP_CDDR(obj)); break; default: errx(1, "unknown opcode class: %d", ((opcode)o1)->op_class); } } else { /* function call */ analyze_app(obj, bc, i, e, params, d); } } else if (SEXP_PAIRP(SEXP_CAR(obj))) { o2 = env_cell(e, SEXP_CAAR(obj)); if (o2 && SEXP_COREP(SEXP_CDR(o2)) && (((core_form)SEXP_CDR(o2))->code == CORE_LAMBDA)) { /* let */ } else { /* computed application */ analyze_app(obj, bc, i, e, params, d); } } else { errx(1, "invalid operator: %s", SEXP_CAR(obj)); } } else if (SEXP_SYMBOLP(obj)) { /* variable reference */ /* cell = env_cell(e, obj); */ fprintf(stderr, "symbol lookup, param length: %d\n", length(params)); if ((tmp1 = list_index(params, obj)) >= 0) { fprintf(stderr, "compiling local ref: %p => %d (d = %d)\n", obj, tmp1, *d); emit(bc, i, OP_STACK_REF); emit_word(bc, i, tmp1 + *d + 3); (*d)++; } else { fprintf(stderr, "compiling global ref: %p\n", obj); emit(bc, i, OP_GLOBAL_REF); emit_word(bc, i, (unsigned long) obj); (*d)++; } } else { fprintf(stderr, "push: %d\n", (unsigned long)obj); emit(bc, i, OP_PUSH); emit_word(bc, i, (unsigned long)obj); (*d)++; } } void analyze_app (sexp obj, bytecode *bc, unsigned int *i, env e, sexp params, unsigned int *d) { sexp o1; unsigned long len = length(SEXP_CDR(obj)); /* push the arguments onto the stack */ for (o1 = reverse(SEXP_CDR(obj)); SEXP_PAIRP(o1); o1 = SEXP_CDR(o1)) { analyze(SEXP_CAR(o1), bc, i, e, params, d); } /* push the operator onto the stack */ analyze(SEXP_CAR(obj), bc, i, e, params, d); /* make the call */ emit(bc, i, OP_CALL); emit_word(bc, i, (unsigned long) make_integer(len)); } void analyze_lambda (sexp name, sexp formals, sexp body, bytecode *bc, unsigned int *i, env e, sexp params, unsigned int *d) { sexp obj = (sexp) compile(formals, body, e, 0); emit(bc, i, OP_PUSH); (*d)++; obj = make_procedure(obj, SEXP_NULL); emit_word(bc, i, (unsigned long) obj); } sexp vm(bytecode bc, env e, sexp* stack, unsigned int top) { unsigned char *ip=bc->data; sexp cp, tmp; int i; loop: /* fprintf(stderr, "opcode: %d, ip: %d\n", *ip, ip); */ /* print_bytecode(bc); */ switch (*ip++) { case OP_NOOP: fprintf(stderr, "noop\n"); break; case OP_GLOBAL_REF: fprintf(stderr, "global ref: ip: %p => %p: ", ip, ((sexp*)ip)[0]); fflush(stderr); write_sexp(stderr, ((sexp*)ip)[0]); fprintf(stderr, "\n"); tmp = env_cell(e, ((sexp*)ip)[0]); stack[top++]=SEXP_CDR(tmp); ip += sizeof(sexp); break; case OP_GLOBAL_SET: fprintf(stderr, "global set: %p: ", ((sexp*)ip)[0]); fflush(stderr); write_sexp(stderr, ((sexp*)ip)[0]); fprintf(stderr, "\n"); env_define(e, ((sexp*)ip)[0], stack[--top]); ip += sizeof(sexp); break; case OP_STACK_REF: fprintf(stderr, "stack ref: ip=%p, %d - %d => ", ip, top, (unsigned long) ((sexp*)ip)[0]); fflush(stderr); write_sexp(stderr, stack[top - (unsigned int) ((sexp*)ip)[0]]); fprintf(stderr, "\n"); stack[top] = stack[top - (unsigned int) ((sexp*)ip)[0]]; ip += sizeof(sexp); top++; break; case OP_CLOSURE_REF: /* stack[top++]=cp[*ip++]; */ break; case OP_CLOSURE_SET: /* cp[*ip++]=stack[top--]; */ break; case OP_PUSH: /* fprintf(stderr, " (push)\n"); */ stack[top++]=((sexp*)ip)[0]; ip += sizeof(sexp); break; case OP_DUP: stack[top]=stack[top-1]; top++; break; case OP_DROP: top--; break; case OP_SWAP: tmp = stack[top-2]; stack[top-2]=stack[top-1]; stack[top-1]=tmp; break; case OP_CAR: stack[top-1]=car(stack[top-1]); break; case OP_CDR: stack[top-1]=cdr(stack[top-1]); break; case OP_CONS: stack[top-2]=cons(stack[top-2], stack[top-1]); top--; break; case OP_ADD: stack[top-2]=sexp_add(stack[top-2],stack[top-1]); top--; break; case OP_SUB: stack[top-2]=sexp_sub(stack[top-2],stack[top-1]); top--; break; case OP_MUL: stack[top-2]=sexp_mul(stack[top-2],stack[top-1]); top--; break; case OP_DIV: stack[top-2]=sexp_div(stack[top-2],stack[top-1]); top--; break; case OP_MOD: stack[top-2]=sexp_mod(stack[top-2],stack[top-1]); top--; break; case OP_LT: stack[top-2]=((stack[top-2] < stack[top-1]) ? SEXP_TRUE : SEXP_FALSE); top--; break; case OP_CALL: fprintf(stderr, "CALL\n"); i = (unsigned long) ((sexp*)ip)[0]; tmp = stack[top-1]; if (! SEXP_PROCEDUREP(tmp)) errx(2, "non-procedure application: %p", tmp); stack[top-1] = (sexp) i; stack[top] = (sexp) (ip+4); top++; bc = procedure_code(tmp); print_bytecode(bc); ip = bc->data; fprintf(stderr, "... jumping to procedure at %p\n", ip); /* print_stack(stack, top); */ break; case OP_JUMP_UNLESS: fprintf(stderr, "JUMP UNLESS, stack top is %d\n", stack[top-1]); if (stack[--top] == SEXP_FALSE) { fprintf(stderr, "test passed, jumping to + %d => %d\n", ((signed char*)ip)[0], ip + ((signed char*)ip)[0]); ip += ((signed char*)ip)[0]; } else { fprintf(stderr, "test failed, not jumping\n"); ip++; } break; case OP_JUMP: fprintf(stderr, "jumping to + %d => %d\n", ((signed char*)ip)[0], ip + ((signed char*)ip)[0]); ip += ((signed char*)ip)[0]; break; case OP_RET: fprintf(stderr, "returning @ %d: ", top-1); fflush(stderr); write_sexp(stderr, stack[top-1]); fprintf(stderr, "\n"); /* print_stack(stack, top); */ /* top-1 */ /* stack: args ... n ip result */ ip = (unsigned char*) stack[top-2]; i = unbox_integer(stack[top-3]); stack[top-i-3] = stack[top-1]; top = top-i-2; break; case OP_DONE: fprintf(stderr, "finally returning @ %d: ", top-1); fflush(stderr); write_sexp(stderr, stack[top-1]); fprintf(stderr, "\n"); goto end_loop; default: fprintf(stderr, "unknown opcode: %d\n", *(ip-1)); stack[top] = SEXP_ERROR; goto end_loop; } goto loop; end_loop: return stack[top-1]; } bytecode compile(sexp params, sexp obj, env e, int done_p) { bytecode bc = (bytecode) malloc(sizeof(struct bytecode)+INIT_BCODE_SIZE); unsigned int i = 0, d = 0; bc->tag = SEXP_BYTECODE; bc->len = INIT_BCODE_SIZE; fprintf(stderr, "analyzing\n"); analyze(obj, &bc, &i, e, params, &d); emit(&bc, &i, done_p ? OP_DONE : OP_RET); /* fprintf(stderr, "shrinking\n"); */ shrink_bcode(&bc, i); fprintf(stderr, "done compiling:\n"); print_bytecode(bc); return bc; } sexp eval_in_stack(sexp obj, env e, sexp* stack, unsigned int top) { bytecode bc = compile(SEXP_NULL, obj, e, 1); fprintf(stderr, "evaling\n"); return vm(bc, e, stack, top); } sexp eval(sexp obj, env e) { sexp* stack = (sexp*) malloc(sizeof(sexp) * INIT_STACK_SIZE); sexp res = eval_in_stack(obj, e, stack, 0); free(stack); return res; } int main (int argc, char **argv) { sexp obj, res, *stack; env e; sexp_init(); e = make_standard_env(); stack = (sexp*) malloc(sizeof(sexp) * INIT_STACK_SIZE); /* repl */ fprintf(stdout, "> "); fflush(stdout); while ((obj = read_sexp(stdin)) != SEXP_EOF) { write_sexp(stdout, obj); fprintf(stdout, "\n => "); res = eval_in_stack(obj, e, stack, 0); /* fprintf(stderr, " (=> %d)\n", res); */ write_sexp(stdout, res); fprintf(stdout, "\n> "); fflush(stdout); } fprintf(stdout, "\n"); return 0; }