/* -*-comment-start: "//";comment-end:""-*- * Mes --- Maxwell Equations of Software * Copyright © 2016 Jan Nieuwenhuizen * * This file is part of Mes. * * Mes is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 3 of the License, or (at * your option) any later version. * * Mes is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Mes. If not, see . */ #define _GNU_SOURCE #include #include #include #include #include #include #include #include #define DEBUG 0 #define QUASIQUOTE 1 #define QUASISYNTAX 0 #define ENV_CACHE 0 #define FIXED_PRIMITIVES 1 #define READER 1 #if READER int ARENA_SIZE = 1000000; #else int ARENA_SIZE = 100000; #endif int MAX_ARENA_SIZE = 20000000; int GC_SAFETY = 100; typedef long SCM; enum type_t {CHAR, FUNCTION, MACRO, NUMBER, PAIR, SPECIAL, STRING, SYMBOL, REF, VALUES, VECTOR, BROKEN_HEART}; typedef SCM (*function0_t) (void); typedef SCM (*function1_t) (SCM); typedef SCM (*function2_t) (SCM, SCM); typedef SCM (*function3_t) (SCM, SCM, SCM); typedef SCM (*functionn_t) (SCM); typedef struct function_t { union { function0_t function0; function1_t function1; function2_t function2; function3_t function3; functionn_t functionn; }; int arity; } function; struct scm_t; typedef struct scm_t { enum type_t type; union { char const *name; SCM string; SCM car; SCM ref; int length; }; union { int value; int function; SCM cdr; SCM macro; SCM vector; int hits; }; } scm; function functions[200]; int g_function = 0; #include "mes.symbols.h" #include "define.h" #include "display.h" #include "lib.h" #include "math.h" #include "mes.h" #include "posix.h" #include "quasiquote.h" #include "reader.h" #include "string.h" #include "type.h" SCM g_symbols = 0; SCM stack = 0; SCM r0 = 0; // a/env SCM r1 = 0; // param 1 SCM r2 = 0; // param 2 SCM r3 = 0; // param 3 SCM tmp; SCM tmp_num; SCM tmp_num2; SCM tmp_num3; SCM tmp_num4; scm scm_nil = {SPECIAL, "()"}; scm scm_f = {SPECIAL, "#f"}; scm scm_t = {SPECIAL, "#t"}; scm scm_dot = {SPECIAL, "."}; scm scm_undefined = {SPECIAL, "*undefined*"}; scm scm_unspecified = {SPECIAL, "*unspecified*"}; scm scm_closure = {SPECIAL, "*closure*"}; scm scm_circular = {SPECIAL, "*circular*"}; #if BOOT scm scm_label = { SPECIAL, "label"}; #endif scm scm_begin = {SPECIAL, "*begin*"}; scm scm_symbol_lambda = {SYMBOL, "lambda"}; scm scm_symbol_begin = {SYMBOL, "begin"}; scm scm_symbol_if = {SYMBOL, "if"}; scm scm_symbol_define = {SYMBOL, "define"}; scm scm_symbol_define_macro = {SYMBOL, "define-macro"}; scm scm_symbol_set_x = {SYMBOL, "set!"}; scm scm_symbol_quote = {SYMBOL, "quote"}; scm scm_symbol_quasiquote = {SYMBOL, "quasiquote"}; scm scm_symbol_unquote = {SYMBOL, "unquote"}; scm scm_symbol_unquote_splicing = {SYMBOL, "unquote-splicing"}; scm scm_symbol_sc_expand = {SYMBOL, "sc-expand"}; scm scm_symbol_expand_macro = {SYMBOL, "expand-macro"}; scm scm_symbol_sc_expander_alist = {SYMBOL, "*sc-expander-alist*"}; scm scm_symbol_noexpand = {SYMBOL, "noexpand"}; scm scm_symbol_syntax = {SYMBOL, "syntax"}; scm scm_symbol_quasisyntax = {SYMBOL, "quasisyntax"}; scm scm_symbol_unsyntax = {SYMBOL, "unsyntax"}; scm scm_symbol_unsyntax_splicing = {SYMBOL, "unsyntax-splicing"}; scm scm_symbol_call_with_values = {SYMBOL, "call-with-values"}; scm scm_symbol_current_module = {SYMBOL, "current-module"}; scm scm_symbol_primitive_load = {SYMBOL, "primitive-load"}; scm scm_symbol_read_input_file = {SYMBOL, "read-input-file"}; scm scm_symbol_the_unquoters = {SYMBOL, "*the-unquoters*"}; scm scm_symbol_car = {SYMBOL, "car"}; scm scm_symbol_cdr = {SYMBOL, "cdr"}; scm scm_symbol_null_p = {SYMBOL, "null?"}; scm scm_symbol_eq_p = {SYMBOL, "eq?"}; scm scm_symbol_cons = {SYMBOL, "cons"}; scm char_eof = {CHAR, .name="*eof*", .value=-1}; scm char_nul = {CHAR, .name="nul", .value=0}; scm char_backspace = {CHAR, .name="backspace", .value=8}; scm char_tab = {CHAR, .name="tab", .value=9}; scm char_newline = {CHAR, .name="newline", .value=10}; scm char_vt = {CHAR, .name="vt", .value=11}; scm char_page = {CHAR, .name="page", .value=12}; scm char_return = {CHAR, .name="return", .value=13}; scm char_space = {CHAR, .name="space", .value=32}; scm g_free = {NUMBER, .value=0}; scm *g_cells; scm *g_news = 0; #define CAR(x) g_cells[x].car #define CDR(x) g_cells[x].cdr #define HITS(x) g_cells[x].hits #define LENGTH(x) g_cells[x].length #define NAME(x) g_cells[x].name #define STRING(x) g_cells[x].string #define TYPE(x) g_cells[x].type #define MACRO(x) g_cells[x].macro #define REF(x) g_cells[x].ref #define VALUE(x) g_cells[x].value #define VECTOR(x) g_cells[x].vector #define FUNCTION(x) functions[g_cells[x].function] #define NCAR(x) g_news[x].car #define NTYPE(x) g_news[x].type #define CAAR(x) CAR (CAR (x)) #define CDAR(x) CDR (CAR (x)) #define CAAR(x) CAR (CAR (x)) #define CADAR(x) CAR (CDR (CAR (x))) #define CADDR(x) CAR (CDR (CDR (x))) #define CDADAR(x) CAR (CDR (CAR (CDR (x)))) #define CADR(x) CAR (CDR (x)) SCM display_ (FILE* f, SCM x); SCM vm_call (function0_t f, SCM p1, SCM p2, SCM a); SCM alloc (int n) { assert (g_free.value + n < ARENA_SIZE); SCM x = g_free.value; g_free.value += n; return x; } SCM make_cell (SCM type, SCM car, SCM cdr) { SCM x = alloc (1); assert (TYPE (type) == NUMBER); TYPE (x) = VALUE (type); if (VALUE (type) == CHAR || VALUE (type) == NUMBER) { if (car) CAR (x) = CAR (car); if (cdr) CDR (x) = CDR (cdr); } else if (VALUE (type) == FUNCTION) { if (car) CAR (x) = car; if (cdr) CDR (x) = CDR (cdr); } else { CAR (x) = car; CDR (x) = cdr; } return x; } SCM cons (SCM x, SCM y) { g_cells[tmp_num].value = PAIR; return make_cell (tmp_num, x, y); } SCM car (SCM x) { assert (TYPE (x) == PAIR); return CAR (x); } SCM cdr (SCM x) { assert (TYPE (x) == PAIR); return CDR (x); } SCM eq_p (SCM x, SCM y) { return (x == y || (TYPE (x) == CHAR && TYPE (y) == CHAR && VALUE (x) == VALUE (y)) || (TYPE (x) == NUMBER && TYPE (y) == NUMBER && VALUE (x) == VALUE (y))) ? cell_t : cell_f; } SCM set_car_x (SCM x, SCM e) { assert (TYPE (x) == PAIR); CAR (x) = e; return cell_unspecified; } SCM set_cdr_x (SCM x, SCM e) { assert (TYPE (x) == PAIR); CDR (x) = e; return cell_unspecified; } SCM set_env_x (SCM x, SCM e, SCM a) { SCM p = assert_defined (x, assq (x, a)); return set_cdr_x (p, e); } SCM quote (SCM x) { return cons (cell_symbol_quote, x); } SCM quasiquote (SCM x) { return cons (cell_symbol_quasiquote, x); } SCM quasisyntax (SCM x) { return cons (cell_symbol_quasisyntax, x); } SCM pairlis (SCM x, SCM y, SCM a) { if (x == cell_nil) return a; if (pair_p (x) == cell_f) return cons (cons (x, y), a); return cons (cons (car (x), car (y)), pairlis (cdr (x), cdr (y), a)); } SCM assq (SCM x, SCM a) { while (a != cell_nil && eq_p (x, CAAR (a)) == cell_f) { if (TYPE (a) == BROKEN_HEART || TYPE (CAR (a)) == BROKEN_HEART) fprintf (stderr, "oops, broken heart\n"); a = CDR (a); } return a != cell_nil ? car (a) : cell_f; } SCM assq_ref_cache (SCM x, SCM a) { x = assq (x, a); if (x == cell_f) return cell_undefined; return cdr (x); } SCM assert_defined (SCM x, SCM e) { if (e == cell_undefined) { fprintf (stderr, "eval: unbound variable:"); display_ (stderr, x); fprintf (stderr, "\n"); assert (!"unbound variable"); } return e; } SCM vm_evlis_env () { if (r1 == cell_nil) return cell_nil; if (TYPE (r1) != PAIR) return eval_env (r1, r0); r2 = eval_env (car (r1), r0); r1 = evlis_env (cdr (r1), r0); return cons (r2, r1); } SCM vm_call_lambda () { return vm_call (vm_begin_env, r1, cell_undefined, r0); } SCM call_lambda (SCM e, SCM x, SCM aa, SCM a) ///((internal)) { SCM cl = cons (cons (cell_closure, x), x); r1 = e; r0 = cl; r2 = a; r3 = aa; return vm_call_lambda (); } SCM vm_apply_env () { if (TYPE (r1) != PAIR) { if (TYPE (r1) == FUNCTION) return call (r1, r2); if (r1 == cell_symbol_call_with_values) return call_with_values_env (car (r2), cadr (r2), r0); if (r1 == cell_symbol_current_module) return r0; } else if (car (r1) == cell_symbol_lambda) { SCM args = cadr (r1); SCM body = cddr (r1); SCM p = pairlis (args, r2, r0); return call_lambda (body, p, p, r0); } else if (car (r1) == cell_closure) { SCM args = caddr (r1); SCM body = cdddr (r1); SCM aa = cdadr (r1); aa = cdr (aa); SCM p = pairlis (args, r2, aa); return call_lambda (body, p, aa, r0); } #if BOOT else if (car (r1) == cell_symbol_label) return apply_env (caddr (r1), r2, cons (cons (cadr (r1), caddr (r1)), r0)); #endif SCM e = eval_env (r1, r0); char const* type = 0; if (e == cell_f || e == cell_t) type = "bool"; if (TYPE (e) == CHAR) type = "char"; if (TYPE (e) == NUMBER) type = "number"; if (TYPE (e) == STRING) type = "string"; if (e == cell_unspecified) type = "*unspecified*"; if (e == cell_undefined) type = "*undefined*"; if (type) { fprintf (stderr, "cannot apply: %s: ", type); display_ (stderr, e); fprintf (stderr, " ["); display_ (stderr, r1); fprintf (stderr, "]\n"); assert (!"cannot apply"); } return apply_env (e, r2, r0); } SCM vm_eval_env () { switch (TYPE (r1)) { case PAIR: { #if FIXED_PRIMITIVES if (car (r1) == cell_symbol_car) return car (eval_env (CADR (r1), r0)); if (car (r1) == cell_symbol_cdr) return cdr (eval_env (CADR (r1), r0)); if (car (r1) == cell_symbol_cons) { SCM m = evlis_env (CDR (r1), r0); return cons (CAR (m), CADR (m)); } if (car (r1) == cell_symbol_null_p) return null_p (eval_env (CADR (r1), r0)); #endif // FIXED_PRIMITIVES if (car (r1) == cell_symbol_quote) return cadr (r1); #if QUASISYNTAX if (car (r1) == cell_symbol_syntax) return r1; #endif if (car (r1) == cell_symbol_begin) return begin_env (r1, r0); if (car (r1) == cell_symbol_lambda) return make_closure (cadr (r1), cddr (r1), assq (cell_closure, r0)); if (car (r1) == cell_closure) return r1; if (car (r1) == cell_symbol_if) return if_env (cdr (r1), r0); #if !BOOT if (car (r1) == cell_symbol_define) return define_env (r1, r0); if (car (r1) == cell_symbol_define_macro) return define_env (r1, r0); if (car (r1) == cell_symbol_primitive_load) return begin_env (read_input_file_env (r0), r0); #else if (car (r1) == cell_symbol_define) { fprintf (stderr, "C DEFINE: "); display_ (stderr, TYPE (cadr (r1)) == SYMBOL ? STRING (cadr (r1)) : STRING (caadr (r1))); fprintf (stderr, "\n"); } assert (car (r1) != cell_symbol_define); assert (car (r1) != cell_symbol_define_macro); #endif #if 1 //!BOOT if (car (r1) == cell_symbol_set_x) { SCM x = eval_env (caddr (r1), r0); return set_env_x (cadr (r1), x, r0); } #else assert (car (r1) != cell_symbol_set_x); #endif #if QUASIQUOTE if (car (r1) == cell_symbol_unquote) return eval_env (cadr (r1), r0); if (car (r1) == cell_symbol_quasiquote) return eval_quasiquote (cadr (r1), add_unquoters (r0)); #endif //QUASIQUOTE #if QUASISYNTAX if (car (r1) == cell_symbol_unsyntax) return eval_env (cadr (r1), r0); if (car (r1) == cell_symbol_quasisyntax) return eval_quasisyntax (cadr (r1), add_unsyntaxers (r0)); #endif //QUASISYNTAX SCM x = expand_macro_env (r1, r0); if (x != r1) return eval_env (x, r0); SCM m = evlis_env (CDR (r1), r0); return apply_env (car (r1), m, r0); } case SYMBOL: return assert_defined (r1, assq_ref_cache (r1, r0)); default: return r1; } } SCM vm_expand_macro_env () { if (TYPE (CAR (r1)) == STRING && string_to_symbol (CAR (r1)) == cell_symbol_noexpand) return cadr (r1); SCM macro; SCM expanders; if (TYPE (r1) == PAIR && (macro = lookup_macro (car (r1), r0)) != cell_f) return apply_env (macro, CDR (r1), r0); else if (TYPE (r1) == PAIR && TYPE (CAR (r1)) == SYMBOL && ((expanders = assq_ref_cache (cell_symbol_sc_expander_alist, r0)) != cell_undefined) && ((macro = assq (CAR (r1), expanders)) != cell_f)) { SCM sc_expand = assq_ref_cache (cell_symbol_expand_macro, r0); if (sc_expand != cell_undefined && sc_expand != cell_f) r1 = apply_env (sc_expand, cons (r1, cell_nil), r0); } return r1; } SCM vm_begin_env () { SCM r = cell_unspecified; while (r1 != cell_nil) { if (TYPE (r1) == PAIR && TYPE (CAR (r1)) == PAIR) { if (caar (r1) == cell_symbol_begin) r1 = append2 (cdar (r1), cdr (r1)); else if (caar (r1) == cell_symbol_primitive_load) { SCM f = read_input_file_env (r0); r1 = append2 (f, cdr (r1)); } } r = eval_env (car (r1), r0); r1 = CDR (r1); } return r; } SCM vm_if_env () { SCM x = eval_env (car (r1), r0); if (x != cell_f) return eval_env (cadr (r1), r0); if (cddr (r1) != cell_nil) return eval_env (caddr (r1), r0); return cell_unspecified; } SCM vm_call_with_values_env () { SCM v = apply_env (r1, cell_nil, r0); if (TYPE (v) == VALUES) v = CDR (v); return apply_env (r2, v, r0); } SCM call (SCM fn, SCM x) { if ((FUNCTION (fn).arity > 0 || FUNCTION (fn).arity == -1) && x != cell_nil && TYPE (CAR (x)) == VALUES) x = cons (CADAR (x), CDR (x)); if ((FUNCTION (fn).arity > 1 || FUNCTION (fn).arity == -1) && x != cell_nil && TYPE (CDR (x)) == PAIR && TYPE (CADR (x)) == VALUES) x = cons (CAR (x), cons (CDADAR (x), CDR (x))); switch (FUNCTION (fn).arity) { case 0: return FUNCTION (fn).function0 (); case 1: return FUNCTION (fn).function1 (car (x)); case 2: return FUNCTION (fn).function2 (car (x), cadr (x)); case 3: return FUNCTION (fn).function3 (car (x), cadr (x), caddr (x)); case -1: return FUNCTION (fn).functionn (x); } return cell_unspecified; } SCM gc_frame (SCM stack) { SCM frame = car (stack); r1 = car (frame); r2 = cadr (frame); r3 = caddr (frame); r0 = cadddr (frame); return frame; } SCM gc_stack (SCM a) { SCM frame = cons (r1, cons (r2, cons (r3, cons (r0, cell_nil)))); stack = cons (frame, stack); stack = gc (stack); gc_frame (stack); stack = cdr (stack); return stack; } SCM vm_call (function0_t f, SCM p1, SCM p2, SCM a) { SCM frame = cons (r1, cons (r2, cons (r3, cons (r0, cell_nil)))); stack = cons (frame, stack); r1 = p1; r2 = p2; r0 = a; if (g_free.value + GC_SAFETY > ARENA_SIZE) gc_stack (stack); SCM r = f (); frame = gc_frame (stack); stack = cdr (stack); return r; } SCM evlis_env (SCM m, SCM a) { return vm_call (vm_evlis_env, m, cell_undefined, a); } SCM apply_env (SCM fn, SCM x, SCM a) { return vm_call (vm_apply_env, fn, x, a); } SCM eval_env (SCM e, SCM a) { return vm_call (vm_eval_env, e, cell_undefined, a); } SCM expand_macro_env (SCM e, SCM a) { return vm_call (vm_expand_macro_env, e, cell_undefined, a); } SCM begin_env (SCM e, SCM a) { return vm_call (vm_begin_env, e, cell_undefined, a); } SCM if_env (SCM e, SCM a) { return vm_call (vm_if_env, e, cell_undefined, a); } SCM call_with_values_env (SCM producer, SCM consumer, SCM a) { return vm_call (vm_call_with_values_env, producer, consumer, a); } SCM append2 (SCM x, SCM y) { if (x == cell_nil) return y; assert (TYPE (x) == PAIR); return cons (car (x), append2 (cdr (x), y)); } SCM append (SCM x) ///((arity . n)) { if (x == cell_nil) return cell_nil; return append2 (car (x), append (cdr (x))); } SCM make_char (int x) { g_cells[tmp_num].value = CHAR; g_cells[tmp_num2].value = x; return make_cell (tmp_num, tmp_num2, tmp_num2); } SCM make_function (SCM name, SCM id, SCM arity) { g_cells[tmp_num3].value = FUNCTION; function *f = (function*)malloc (sizeof (function)); f->arity = VALUE (arity); g_cells[tmp_num4].value = (long)f; return make_cell (tmp_num3, name, tmp_num4); } SCM make_macro (SCM name, SCM x) { g_cells[tmp_num].value = MACRO; return make_cell (tmp_num, STRING (name), x); } SCM make_number (int x) { g_cells[tmp_num].value = NUMBER; g_cells[tmp_num2].value = x; return make_cell (tmp_num, tmp_num2, tmp_num2); } SCM make_ref (SCM x) { g_cells[tmp_num].value = REF; return make_cell (tmp_num, x, x); } SCM make_string (SCM x) { g_cells[tmp_num].value = STRING; return make_cell (tmp_num, x, 0); } SCM cstring_to_list (char const* s) { SCM p = cell_nil; int i = strlen (s); while (i--) p = cons (make_char (s[i]), p); return p; } SCM null_p (SCM x) { return x == cell_nil ? cell_t : cell_f; } SCM internal_make_symbol (SCM s) { g_cells[tmp_num].value = SYMBOL; SCM x = make_cell (tmp_num, s, 0); g_symbols = cons (x, g_symbols); return x; } SCM make_symbol (SCM s) { SCM x = internal_lookup_symbol (s); return x ? x : internal_make_symbol (s); } SCM make_vector (SCM n) { int k = VALUE (n); g_cells[tmp_num].value = VECTOR; SCM v = alloc (k); SCM x = make_cell (tmp_num, k, v); for (int i=0; i jam[%d]\n", g_free.value); return stack; } SCM gc_show () { fprintf (stderr, "cells: "); scm *t = g_cells; display_ (stderr, -1); fprintf (stderr, "\n"); if (g_news) { fprintf (stderr, "news: "); g_cells = g_news; display_ (stderr, -1); fprintf (stderr, "\n"); } g_cells = t; return cell_unspecified; } // Environment setup SCM acons (SCM key, SCM value, SCM alist) { return cons (cons (key, value), alist); } SCM add_environment (SCM a, char const *name, SCM x) { return acons (make_symbol (cstring_to_list (name)), x, a); } SCM gc_init_cells () { g_cells = (scm *)malloc (2*ARENA_SIZE*sizeof(scm)); g_cells[0].type = VECTOR; g_cells[0].length = 1000; g_cells[0].vector = 0; g_cells++; g_cells[0].type = CHAR; g_cells[0].value = 'c'; g_free.value = 1; // 0 is tricky } SCM gc_init_news () { g_news = g_cells-1 + ARENA_SIZE; g_news[0].type = VECTOR; g_news[0].length = 1000; g_news[0].vector = 0; g_news++; g_news[0].type = CHAR; g_news[0].value = 'n'; } SCM mes_symbols () ///((internal)) { gc_init_cells (); gc_init_news (); #include "mes.symbols.i" g_symbol_max = g_free.value; make_tmps (g_cells); g_symbols = 0; for (int i=1; i> 8, stdout); fputc (stack % 256, stdout); for (int i=0; i 1 && !strcmp (argv[1], "--help")) return puts ("Usage: mes < FILE\n"); if (argc > 1 && !strcmp (argv[1], "--version")) return puts ("Mes 0.3\n"); g_stdin = stdin; r0 = mes_environment (); SCM program = (argc > 1 && !strcmp (argv[1], "--load")) ? bload_env (r0) : load_env (r0); if (argc > 1 && !strcmp (argv[1], "--dump")) return dump (); display_ (stderr, begin_env (program, r0)); fputs ("", stderr); gc (stack); if (g_debug) fprintf (stderr, "\nstats: [%d]\n", g_free.value); return 0; }