2024-04-04 12:04:27 -04:00
|
|
|
#include <stdio.h>
|
|
|
|
|
2024-04-04 12:29:36 -04:00
|
|
|
/* One rewrite rule: text matching `a` is replaced by `b`. */
typedef struct {
	unsigned int id;   /* number printed in front of trace lines */
	unsigned int refs; /* bumped each time the rule is applied with tracing on */
	char *a;           /* left-hand side (pattern), NUL-terminated */
	char *b;           /* right-hand side (replacement), NUL-terminated */
} Rule;
|
|
|
|
|
2024-04-27 17:47:06 -04:00
|
|
|
static unsigned char rmin = 0xff, rmax = 0x00;
|
2024-04-23 22:36:49 -04:00
|
|
|
static int flip, quiet, cycles = 0x10000;
|
2024-04-25 15:17:31 -04:00
|
|
|
static Rule rules[0x1000], *rules_ = rules, lambda;
|
2024-04-24 18:17:57 -04:00
|
|
|
static char dict[0x8000], *dict_ = dict, empty;
|
2024-04-14 22:36:16 -04:00
|
|
|
static char bank_a[0x4000], *src_ = bank_a;
|
|
|
|
static char bank_b[0x4000], *dst_ = bank_b;
|
2024-04-27 17:47:06 -04:00
|
|
|
static char *regs[0x100];
|
2024-04-23 22:36:49 -04:00
|
|
|
|
2024-04-11 12:26:55 -04:00
|
|
|
/*
 * True when c terminates a token: any character at or below ' ' (space,
 * control characters, the NUL terminator) or a parenthesis.
 * The argument is parenthesised so that an arbitrary expression can be
 * passed; it may still be evaluated up to three times, so it must not have
 * side effects.
 */
#define spacer(c) ((c) <= ' ' || (c) == '(' || (c) == ')')
|
2024-04-04 19:52:09 -04:00
|
|
|
|
2024-04-04 13:59:00 -04:00
|
|
|
/*
 * Return a pointer just past the term that starts at s.
 *
 * A term is either a parenthesised group, in which case the result points
 * right after the matching ')', or a bare token, in which case the result
 * points at the first spacer character (or the NUL terminator).
 *
 * If a group is never closed, the result points at the NUL terminator so
 * that callers never receive a pointer beyond the end of the string.
 */
static char *
walk(char *s)
{
	char c;
	int depth = 0;
	if(*s == '(') {
		while((c = *s++)) {
			if(c == '(') depth++;
			if(c == ')') --depth;
			if(!depth) return s;
		}
		/* unterminated group: s is one past the NUL here, step back onto it
		 * instead of scanning memory that follows the string */
		return s - 1;
	}
	while((c = *s) && !spacer(c)) s++;
	return s;
}
|
|
|
|
|
2024-04-25 21:36:45 -04:00
|
|
|
static void
|
2024-04-22 20:54:17 -04:00
|
|
|
write_reg(char r, char *reg)
|
2024-04-04 15:20:06 -04:00
|
|
|
{
|
2024-04-21 12:13:30 -04:00
|
|
|
char c, *cap = walk(reg);
|
2024-04-22 23:22:54 -04:00
|
|
|
switch(r) {
|
|
|
|
case ':': /* op: output */
|
2024-04-21 12:13:30 -04:00
|
|
|
if(*reg == '(') reg++, --cap;
|
|
|
|
while(reg < cap) {
|
|
|
|
c = *reg++;
|
2024-04-14 20:33:42 -04:00
|
|
|
if(c == '\\') {
|
2024-04-21 12:13:30 -04:00
|
|
|
switch(*reg++) {
|
2024-04-14 20:33:42 -04:00
|
|
|
case 't': putc(0x09, stdout); break;
|
|
|
|
case 'n': putc(0x0a, stdout); break;
|
|
|
|
case 's': putc(0x20, stdout); break;
|
|
|
|
}
|
|
|
|
} else
|
|
|
|
putc(c, stdout);
|
|
|
|
}
|
2024-04-25 21:36:45 -04:00
|
|
|
return;
|
|
|
|
case '~': { /* op: input */
|
2024-04-22 23:22:54 -04:00
|
|
|
while(fread(&c, 1, 1, stdin) && c >= ' ')
|
|
|
|
*dst_++ = c;
|
2024-04-25 21:36:45 -04:00
|
|
|
if(feof(stdin))
|
|
|
|
*dst_++ = 'E', *dst_++ = 'O', *dst_++ = 'F';
|
|
|
|
return;
|
|
|
|
}
|
2024-04-22 23:22:54 -04:00
|
|
|
case '^': /* op: join */
|
|
|
|
if(*reg == '(') reg++, --cap;
|
|
|
|
while(reg < cap && (c = *reg++))
|
|
|
|
if(!spacer(c)) *dst_++ = c;
|
2024-04-25 21:36:45 -04:00
|
|
|
return;
|
2024-04-22 23:22:54 -04:00
|
|
|
case '.': /* op: unwrap */
|
|
|
|
if(*reg == '(') reg++, --cap;
|
2024-04-21 12:13:30 -04:00
|
|
|
while(reg < cap) *dst_++ = *reg++;
|
2024-04-25 21:36:45 -04:00
|
|
|
return;
|
2024-04-22 23:22:54 -04:00
|
|
|
case '*': { /* op: explode */
|
|
|
|
int i, depth = 0;
|
2024-04-23 16:51:25 -04:00
|
|
|
if(*reg == '(' && reg[1] != ')') { /* tuple */
|
2024-04-22 23:22:54 -04:00
|
|
|
reg++;
|
|
|
|
while(reg < cap) {
|
|
|
|
while((c = *reg) && !spacer(c))
|
|
|
|
*dst_++ = c, reg++;
|
|
|
|
*dst_++ = ' ';
|
|
|
|
*dst_++ = '(', reg++, depth++;
|
|
|
|
}
|
2024-04-23 23:20:31 -04:00
|
|
|
} else /* token */
|
2024-04-22 23:22:54 -04:00
|
|
|
while((c = *reg++) && !spacer(c))
|
|
|
|
*dst_++ = c, *dst_++ = ' ', *dst_++ = '(', depth++;
|
|
|
|
for(i = 0; i < depth; i++) *dst_++ = ')';
|
2024-04-25 21:36:45 -04:00
|
|
|
return;
|
2024-04-22 23:22:54 -04:00
|
|
|
}
|
|
|
|
default:
|
|
|
|
while(reg < cap) *dst_++ = *reg++;
|
2024-04-25 21:36:45 -04:00
|
|
|
return;
|
2024-04-22 23:22:54 -04:00
|
|
|
}
|
2024-04-04 15:20:06 -04:00
|
|
|
}
|
|
|
|
|
2024-04-07 17:55:55 -04:00
|
|
|
static int
|
2024-04-27 11:46:31 -04:00
|
|
|
write_tail(char *s)
|
2024-04-04 17:55:51 -04:00
|
|
|
{
|
2024-04-14 22:36:16 -04:00
|
|
|
while((*dst_++ = *s++))
|
2024-04-07 17:55:55 -04:00
|
|
|
;
|
2024-04-24 18:46:27 -04:00
|
|
|
*dst_ = 0;
|
2024-04-14 22:36:16 -04:00
|
|
|
if((flip = !flip))
|
|
|
|
src_ = bank_b, dst_ = bank_a;
|
2024-04-06 11:36:10 -04:00
|
|
|
else
|
2024-04-14 22:36:16 -04:00
|
|
|
src_ = bank_a, dst_ = bank_b;
|
2024-04-07 17:55:55 -04:00
|
|
|
return 1;
|
2024-04-04 17:55:51 -04:00
|
|
|
}
|
|
|
|
|
2024-04-25 15:17:31 -04:00
|
|
|
static int
|
2024-04-25 21:39:17 -04:00
|
|
|
apply_rule(Rule *r, char *s)
|
2024-04-22 20:39:39 -04:00
|
|
|
{
|
2024-04-27 12:24:48 -04:00
|
|
|
unsigned int i, rid;
|
2024-04-27 17:47:06 -04:00
|
|
|
char c, *a = r->a, *b = r->b, *origin = dst_, *reg;
|
2024-04-27 11:46:31 -04:00
|
|
|
/* phase: clean regs */
|
2024-04-27 17:47:06 -04:00
|
|
|
if(rmax) {
|
|
|
|
for(i = 0; i <= rmax; i++)
|
|
|
|
regs[i] = 0;
|
|
|
|
rmin = 0xff, rmax = 0x00;
|
|
|
|
}
|
2024-04-24 14:12:57 -04:00
|
|
|
/* phase: match rule */
|
2024-04-24 23:26:56 -04:00
|
|
|
while((c = *a++)) {
|
2024-04-22 20:43:35 -04:00
|
|
|
if(c == '?') {
|
2024-04-24 14:18:06 -04:00
|
|
|
char *pcap = walk(s);
|
2024-04-27 17:47:06 -04:00
|
|
|
rid = *a++;
|
2024-04-27 12:24:48 -04:00
|
|
|
if((reg = regs[rid])) { /* reg cmp */
|
2024-04-22 23:32:42 -04:00
|
|
|
char *rcap = walk(reg), *pp = s;
|
2024-04-22 20:43:35 -04:00
|
|
|
while(reg < rcap || pp < pcap)
|
2024-04-25 15:17:31 -04:00
|
|
|
if(*reg++ != *pp++) return 0;
|
2024-04-27 17:47:06 -04:00
|
|
|
} else { /* reg set */
|
2024-04-27 12:24:48 -04:00
|
|
|
regs[rid] = s;
|
2024-04-27 17:47:06 -04:00
|
|
|
if(rid < rmin) rmin = rid;
|
|
|
|
if(rid > rmax) rmax = rid;
|
|
|
|
}
|
2024-04-26 14:06:30 -04:00
|
|
|
s = pcap;
|
|
|
|
} else if(c != *s++)
|
|
|
|
return 0;
|
2024-04-22 20:43:35 -04:00
|
|
|
}
|
2024-04-26 01:35:15 -04:00
|
|
|
c = *s;
|
|
|
|
if(!spacer(c)) return 0;
|
2024-04-24 14:12:57 -04:00
|
|
|
/* phase: write rule */
|
2024-04-25 12:48:24 -04:00
|
|
|
while((c = *b++)) {
|
|
|
|
if(c == '?') {
|
2024-04-27 17:47:06 -04:00
|
|
|
rid = *b;
|
|
|
|
if((reg = regs[rid]))
|
|
|
|
b++, write_reg(rid, reg);
|
2024-04-25 12:48:24 -04:00
|
|
|
else
|
2024-04-22 20:54:17 -04:00
|
|
|
*dst_++ = c;
|
2024-04-25 12:48:24 -04:00
|
|
|
} else
|
|
|
|
*dst_++ = c;
|
2024-04-22 20:54:17 -04:00
|
|
|
}
|
2024-04-25 12:48:24 -04:00
|
|
|
if(dst_ == origin) {
|
|
|
|
while(*s == ' ') s++;
|
|
|
|
if(*s == ')' && *(dst_ - 1) == ' ') dst_--;
|
|
|
|
}
|
2024-04-27 12:02:56 -04:00
|
|
|
if(!quiet && r) printf("%02d %s\n", r->id, src_), ++r->refs;
|
2024-04-27 11:46:31 -04:00
|
|
|
return write_tail(s);
|
2024-04-22 20:54:17 -04:00
|
|
|
}
|
|
|
|
|
2024-04-24 16:41:09 -04:00
|
|
|
static char *
|
2024-04-24 16:45:08 -04:00
|
|
|
compile_rule(Rule *r, int id, char *src)
|
2024-04-24 13:31:46 -04:00
|
|
|
{
|
2024-04-24 18:08:09 -04:00
|
|
|
char c, *cap;
|
2024-04-27 17:47:06 -04:00
|
|
|
int wrapped;
|
|
|
|
r->id = id, r->a = &empty, r->b = ∅
|
2024-04-24 18:46:27 -04:00
|
|
|
/* phase: compile left */
|
2024-04-24 18:08:09 -04:00
|
|
|
while((c = *src) && c == ' ') src++;
|
2024-04-24 18:17:57 -04:00
|
|
|
if(c == ')' || (c == '<' && src[1] == '>')) return src;
|
2024-04-24 18:34:11 -04:00
|
|
|
r->a = dict_, cap = walk(src), wrapped = c == '(';
|
2024-04-24 18:08:09 -04:00
|
|
|
if(wrapped) src++, cap--;
|
|
|
|
while(src < cap) {
|
2024-04-24 18:34:11 -04:00
|
|
|
c = *src, *dict_++ = *src++;
|
2024-04-24 17:03:14 -04:00
|
|
|
}
|
2024-04-24 18:34:11 -04:00
|
|
|
src += wrapped, *dict_++ = 0;
|
2024-04-24 18:46:27 -04:00
|
|
|
/* phase: compile right */
|
2024-04-24 18:08:09 -04:00
|
|
|
while((c = *src) && c == ' ') src++;
|
2024-04-24 18:17:57 -04:00
|
|
|
if(c == ')' || (c == '<' && src[1] == '>')) return src;
|
2024-04-24 18:34:11 -04:00
|
|
|
r->b = dict_, cap = walk(src), wrapped = c == '(';
|
2024-04-24 18:08:09 -04:00
|
|
|
if(wrapped) src++, cap--;
|
|
|
|
while(src < cap) {
|
2024-04-24 18:34:11 -04:00
|
|
|
c = *src, *dict_++ = *src++;
|
2024-04-24 17:54:40 -04:00
|
|
|
}
|
2024-04-24 18:34:11 -04:00
|
|
|
src += wrapped, *dict_++ = 0;
|
2024-04-24 16:41:09 -04:00
|
|
|
return src;
|
2024-04-24 13:31:46 -04:00
|
|
|
}
|
|
|
|
|
2024-04-26 23:50:22 -04:00
|
|
|
static Rule *
|
2024-04-27 00:18:02 -04:00
|
|
|
find_rule(char *s, char *cap)
|
2024-04-26 23:50:22 -04:00
|
|
|
{
|
|
|
|
Rule *r = rules;
|
2024-04-27 00:18:02 -04:00
|
|
|
if(*s == '(') s++, cap--;
|
2024-04-26 23:50:22 -04:00
|
|
|
while(r < rules_) {
|
|
|
|
char *ss = s, *a = r->a;
|
2024-04-27 14:24:00 -04:00
|
|
|
if(a)
|
|
|
|
while(*ss++ == *a++)
|
|
|
|
if(!*a && ss == cap) return r;
|
2024-04-26 23:50:22 -04:00
|
|
|
r++;
|
|
|
|
}
|
2024-04-27 00:18:02 -04:00
|
|
|
return r;
|
2024-04-26 23:50:22 -04:00
|
|
|
}
|
|
|
|
|
2024-04-04 13:07:49 -04:00
|
|
|
static int
|
2024-04-07 19:16:33 -04:00
|
|
|
rewrite(void)
|
2024-04-04 13:07:49 -04:00
|
|
|
{
|
2024-04-25 21:39:17 -04:00
|
|
|
char c, last = 0, *cap, *s = src_;
|
2024-04-21 12:13:30 -04:00
|
|
|
while(*s == ' ') s++;
|
2024-04-11 12:40:04 -04:00
|
|
|
while((c = *s)) {
|
2024-04-26 12:02:03 -04:00
|
|
|
if(c == '(' || spacer(last)) {
|
2024-04-24 13:31:46 -04:00
|
|
|
Rule *r = NULL;
|
2024-04-26 23:50:22 -04:00
|
|
|
/* phase: define */
|
2024-04-24 18:55:48 -04:00
|
|
|
if(c == '<' && s[1] == '>') {
|
2024-04-27 15:30:40 -04:00
|
|
|
r = rules_;
|
2024-04-24 16:49:21 -04:00
|
|
|
s = compile_rule(r, rules_ - rules - 1, s + 2);
|
2024-04-27 15:30:40 -04:00
|
|
|
if(*r->a) {
|
|
|
|
if(!quiet && r->a)
|
2024-04-27 17:47:06 -04:00
|
|
|
printf("<> (%s) (%s)\n", r->a, r->b);
|
2024-04-27 15:30:40 -04:00
|
|
|
while(*s == ' ') s++;
|
|
|
|
rules_++;
|
|
|
|
}
|
2024-04-27 11:46:31 -04:00
|
|
|
return write_tail(s);
|
2024-04-10 15:19:44 -04:00
|
|
|
}
|
2024-04-26 23:50:22 -04:00
|
|
|
/* phase: undefine */
|
|
|
|
if(c == '>' && s[1] == '<') {
|
2024-04-27 00:35:31 -04:00
|
|
|
s += 2;
|
2024-04-21 12:13:30 -04:00
|
|
|
while(*s == ' ') s++;
|
2024-04-27 13:04:01 -04:00
|
|
|
cap = walk(s), r = find_rule(s, cap);
|
2024-04-27 12:24:48 -04:00
|
|
|
if(!quiet && r->a)
|
2024-04-27 17:47:06 -04:00
|
|
|
printf(">< (%s) (%s)\n", r->a, r->b);
|
2024-04-27 13:04:01 -04:00
|
|
|
r->a = 0;
|
2024-04-27 00:18:02 -04:00
|
|
|
while(*cap == ' ') cap++;
|
2024-04-27 11:46:31 -04:00
|
|
|
return write_tail(cap);
|
|
|
|
}
|
|
|
|
/* phase: lambda */
|
|
|
|
if(c == '?' && s[1] == '(') {
|
|
|
|
cap = walk(s + 1), compile_rule(&lambda, -1, s + 2), s = cap;
|
|
|
|
while(*s == ' ') s++;
|
|
|
|
if(!apply_rule(&lambda, s)) write_tail(s);
|
|
|
|
return 1;
|
2024-04-22 23:13:19 -04:00
|
|
|
}
|
2024-04-24 18:55:48 -04:00
|
|
|
/* phase: match */
|
2024-04-22 23:15:33 -04:00
|
|
|
for(r = rules; r < rules_; r++)
|
2024-04-26 23:50:22 -04:00
|
|
|
if(r->a && apply_rule(r, s)) return 1;
|
2024-04-04 15:09:47 -04:00
|
|
|
}
|
2024-04-14 22:36:16 -04:00
|
|
|
*dst_++ = last = c;
|
2024-04-11 12:40:04 -04:00
|
|
|
s++;
|
2024-04-04 13:30:31 -04:00
|
|
|
}
|
2024-04-14 22:36:16 -04:00
|
|
|
*dst_++ = 0;
|
2024-04-04 22:55:05 -04:00
|
|
|
return 0;
|
2024-04-04 13:07:49 -04:00
|
|
|
}
|
|
|
|
|
2024-04-07 13:58:39 -04:00
|
|
|
int
|
|
|
|
main(int argc, char **argv)
|
2024-04-07 13:56:43 -04:00
|
|
|
{
|
2024-04-07 13:58:39 -04:00
|
|
|
FILE *f;
|
2024-04-27 11:46:31 -04:00
|
|
|
int i, pl = 0, pr = 0, rw = 0;
|
2024-04-26 14:06:30 -04:00
|
|
|
char c, last = 0, *w = bank_a;
|
2024-04-07 13:58:39 -04:00
|
|
|
if(argc < 2)
|
2024-04-18 14:33:23 -04:00
|
|
|
return !printf("usage: modal [-vqn] source.modal\n");
|
|
|
|
for(i = 1; i < argc && *argv[i] == '-'; i++) {
|
|
|
|
switch(argv[i][1]) {
|
2024-04-27 11:46:31 -04:00
|
|
|
case 'v': /* version */ return !printf("Modal Interpreter, 27 Apr 2024.\n");
|
2024-04-22 18:29:54 -04:00
|
|
|
case 'q': /* quiet */ quiet = 1; break;
|
2024-04-18 14:33:23 -04:00
|
|
|
case 'n': /* infinite */ cycles = 0xffffffff; break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if(!(f = fopen(argv[i], "r")))
|
2024-04-27 12:02:56 -04:00
|
|
|
return !printf("Modal file invalid: %s.\n", argv[i]);
|
2024-04-07 13:56:43 -04:00
|
|
|
while(fread(&c, 1, 1, f)) {
|
2024-04-12 11:54:07 -04:00
|
|
|
c = c <= 0x20 ? 0x20 : c;
|
2024-04-26 14:06:30 -04:00
|
|
|
if(c == ' ' && last == '(') continue;
|
|
|
|
if(c == ')' && last == ' ') w--;
|
|
|
|
if(c == ' ' && last == ' ') w--;
|
2024-04-23 12:35:58 -04:00
|
|
|
if(c == '(') pl++;
|
|
|
|
if(c == ')') pr++;
|
2024-04-26 14:06:30 -04:00
|
|
|
if(c == '(' && last != '?' && !spacer(last)) *w++ = ' ';
|
|
|
|
if(last == ')' && !spacer(c)) *w++ = ' ';
|
|
|
|
*w++ = last = c;
|
2024-04-07 13:56:43 -04:00
|
|
|
}
|
2024-04-08 18:26:53 -04:00
|
|
|
while(*(--w) <= ' ') *w = 0;
|
2024-04-07 13:56:43 -04:00
|
|
|
fclose(f);
|
2024-04-21 12:46:53 -04:00
|
|
|
if(pr != pl)
|
2024-04-27 12:02:56 -04:00
|
|
|
return !printf("Modal program imbalanced.\n");
|
2024-04-27 11:46:31 -04:00
|
|
|
while(rewrite() && ++rw)
|
2024-04-27 12:02:56 -04:00
|
|
|
if(!cycles--) return !printf("Modal rewrites exceeded.\n");
|
|
|
|
if(!quiet) {
|
|
|
|
while(rules_-- > rules)
|
|
|
|
if(!rules_->refs && rules_->a)
|
|
|
|
printf("-- Unused rule: %d <> (%s) (%s)\n", rules_->refs, rules_->a, rules_->b);
|
|
|
|
printf(".. %s\nCompleted in %d rewrites.\n", src_, rw);
|
|
|
|
}
|
2024-04-04 14:54:31 -04:00
|
|
|
return 0;
|
2024-04-04 12:04:27 -04:00
|
|
|
}
|