-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathContcomp.fs
384 lines (321 loc) · 13.7 KB
/
Contcomp.fs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
(* File MicroC/Contcomp.fs
A continuation-based (backwards) compiler from micro-C, a fraction of
the C language, to an abstract machine.
[email protected] * 2011-11-10
The abstract machine code is generated backwards, so that jumps to
jumps can be eliminated, so that tail-calls (calls immediately
followed by return) can be recognized, dead code can be eliminated,
etc.
The compilation of a block, which may contain a mixture of
declarations and statements, proceeds in two passes:
Pass 1: elaborate declarations to find the environment in which
each statement must be compiled; also translate
declarations into allocation instructions, of type
bstmtordec.
Pass 2: compile the statements in the given environments.
*)
module Contcomp
open System.IO
open Absyn
open StackMachine
open System.Diagnostics
open Debug
(* The intermediate representation between passes 1 and 2 above: *)
type bstmtordec =
| BDec of instr list (* Declaration of local variable *)
| BStmt of stmt (* A statement *)
(* ------------------------------------------------------------------- *)
(* Code-generating functions that perform local optimizations *)
let rec addINCSP m1 C : instr list =
match C with
| INCSP m2 :: C1 -> addINCSP (m1+m2) C1
| RET m2 :: C1 -> RET (m2-m1) :: C1
| Label lab :: RET m2 :: _ -> RET (m2-m1) :: C
| _ -> if m1=0 then C else INCSP m1 :: C
let addLabel C : label * instr list = (* Conditional jump to C *)
match C with
| Label lab :: _ -> (lab, C)
| GOTO lab :: _ -> (lab, C)
| _ -> let lab = newLabel()
(lab, Label lab :: C)
let makeJump C : instr * instr list = (* Unconditional jump to C *)
match C with
| RET m :: _ -> (RET m, C)
| Label lab :: RET m :: _ -> (RET m, C)
| Label lab :: _ -> (GOTO lab, C)
| GOTO lab :: _ -> (GOTO lab, C)
| _ -> let lab = newLabel()
(GOTO lab, Label lab :: C)
let makeCall m lab C : instr list =
match C with
| RET n :: C1 -> TCALL(m, n, lab) :: C1
| Label _ :: RET n :: _ -> TCALL(m, n, lab) :: C
| _ -> CALL(m, lab) :: C
let rec deadcode C =
match C with
| [] -> []
| Label lab :: _ -> C
| _ :: C1 -> deadcode C1
let addNOT C =
match C with
| NOT :: C1 -> C1
| IFZERO lab :: C1 -> IFNZRO lab :: C1
| IFNZRO lab :: C1 -> IFZERO lab :: C1
| _ -> NOT :: C
let addJump jump C = (* jump is GOTO or RET *)
let C1 = deadcode C
match (jump, C1) with
| (GOTO lab1, Label lab2 :: _) -> if lab1=lab2 then C1
else GOTO lab1 :: C1
| _ -> jump :: C1
let addGOTO lab C =
addJump (GOTO lab) C
let rec addCST i C =
match (i, C) with
| (0, ADD :: C1) -> C1
| (0, SUB :: C1) -> C1
| (0, NOT :: C1) -> addCST 1 C1
| (_, NOT :: C1) -> addCST 0 C1
| (1, MUL :: C1) -> C1
| (1, DIV :: C1) -> C1
| (0, EQ :: C1) -> addNOT C1
| (_, INCSP m :: C1) -> if m < 0 then addINCSP (m+1) C1
else CSTI i :: C
| (0, IFZERO lab :: C1) -> addGOTO lab C1
| (_, IFZERO lab :: C1) -> C1
| (0, IFNZRO lab :: C1) -> C1
| (_, IFNZRO lab :: C1) -> addGOTO lab C1
| _ -> CSTI i :: C
(* ------------------------------------------------------------------- *)
(* Simple environment operations *)
type 'data Env = (string * 'data) list
let rec lookup env x =
match env with
| [] -> failwith (x + " not found")
| (y, v)::yr -> if x=y then v else lookup yr x
(* A global variable has an absolute address, a local one has an offset: *)
type Var =
| Glovar of int (* absolute address in stack *)
| Locvar of int (* address relative to bottom of frame *)
(* The variable environment keeps track of global and local variables, and
keeps track of next available offset for local variables *)
type VarEnv = (Var * typ) Env * int
(* The function environment maps a function name to the function's label,
its return type, and its parameter declarations *)
type Paramdecs = (typ * string) list
type FunEnv = (label * typ option * Paramdecs) Env
(* Bind declared variable in varEnv and generate code to allocate it: *)
let allocate (kind : int -> Var) (typ, x) (varEnv : VarEnv) : VarEnv * instr list =
let (env, fdepth) = varEnv
match typ with
| TypA (TypA _, _) -> failwith "allocate: arrays of arrays not permitted"
| TypA (t, Some i) ->
let newEnv = ((x, (kind (fdepth+i), typ)) :: env, fdepth+i+1)
let code = [INCSP i; GETSP; CSTI (i-1); SUB]
(newEnv, code)
| _ ->
let newEnv = ((x, (kind (fdepth), typ)) :: env, fdepth+1)
let code = [INCSP 1]
(newEnv, code)
(* Bind declared parameter in env: *)
let bindParam (env, fdepth) (typ, x) : VarEnv =
((x, (Locvar fdepth, typ)) :: env, fdepth+1);
let bindParams paras (env, fdepth) : VarEnv =
List.fold bindParam (env, fdepth) paras;
(* ------------------------------------------------------------------- *)
(* Build environments for global variables and global functions *)
let makeGlobalEnvs(topdecs : topdec list) : VarEnv * FunEnv * instr list =
let rec addv decs varEnv funEnv =
match decs with
| [] -> (varEnv, funEnv, [])
| dec::decr ->
match dec with
| Vardec (typ, x) ->
let (varEnv1, code1) = allocate Glovar (typ, x) varEnv
let (varEnvr, funEnvr, coder) = addv decr varEnv1 funEnv
(varEnvr, funEnvr, code1 @ coder)
| Fundec (tyOpt, f, xs, body) ->
addv decr varEnv ((f, (newLabel(), tyOpt, xs)) :: funEnv)
addv topdecs ([], 0) []
(* ------------------------------------------------------------------- *)
(* Compiling micro-C statements:
* stmt is the statement to compile
* varenv is the local and global variable environment
* funEnv is the global function environment
* C is the code that follows the code for stmt
*)
let rec cStmt stmt (varEnv : VarEnv) (funEnv : FunEnv) (C : instr list) : instr list =
match stmt with
| If(e, stmt1, stmt2) ->
let (jumpend, C1) = makeJump C
let (labelse, C2) = addLabel (cStmt stmt2 varEnv funEnv C1)
cExpr e varEnv funEnv (IFZERO labelse
:: cStmt stmt1 varEnv funEnv (addJump jumpend C2))
| While(e, body) ->
let labbegin = newLabel()
let (jumptest, C1) =
makeJump (cExpr e varEnv funEnv (IFNZRO labbegin :: C))
addJump jumptest (Label labbegin :: cStmt body varEnv funEnv C1)
| Expr e ->
cExpr e varEnv funEnv (addINCSP -1 C)
| Block stmts ->
let rec pass1 stmts ((_, fdepth) as varEnv) =
match stmts with
| [] -> ([], fdepth)
| s1::sr ->
let (_, varEnv1) as res1 = bStmtordec s1 varEnv
let (resr, fdepthr) = pass1 sr varEnv1
(res1 :: resr, fdepthr)
let (stmtsback, fdepthend) = pass1 stmts varEnv
let rec pass2 pairs C =
match pairs with
| [] -> C
| (BDec code, varEnv) :: sr -> code @ pass2 sr C
| (BStmt stmt, varEnv) :: sr -> cStmt stmt varEnv funEnv (pass2 sr C)
pass2 stmtsback (addINCSP(snd varEnv - fdepthend) C)
| Return None ->
RET (snd varEnv - 1) :: deadcode C
| Return (Some e) ->
cExpr e varEnv funEnv (RET (snd varEnv) :: deadcode C)
and bStmtordec stmtOrDec varEnv : bstmtordec * VarEnv =
match stmtOrDec with
| Stmt stmt ->
(BStmt stmt, varEnv)
| Dec (typ, x) ->
let (varEnv1, code) = allocate Locvar (typ, x) varEnv
(BDec code, varEnv1)
(* Compiling micro-C expressions:
* e is the expression to compile
* varEnv is the compile-time variable environment
* funEnv is the compile-time environment
* C is the code following the code for this expression
Net effect principle: if the compilation (cExpr e varEnv funEnv C) of
expression e returns the instruction sequence instrs, then the
execution of instrs will have the same effect as an instruction
sequence that first computes the value of expression e on the stack
top and then executes C, but because of optimizations instrs may
actually achieve this in a different way.
*)
and cExpr (e : expr) (varEnv : VarEnv) (funEnv : FunEnv) (C : instr list) : instr list =
match e with
| Access acc -> cAccess acc varEnv funEnv (LDI :: C)
| Assign(acc, e) -> cAccess acc varEnv funEnv (cExpr e varEnv funEnv (STI :: C))
| CstI i -> addCST i C
| Addr acc -> cAccess acc varEnv funEnv C
| Prim1(ope, e1) ->
cExpr e1 varEnv funEnv
(match ope with
| "!" -> addNOT C
| "printi" -> PRINTI :: C
| "printc" -> PRINTC :: C
| _ -> failwith "unknown primitive 1")
| Prim2(ope, e1, e2) ->
cExpr e1 varEnv funEnv
(cExpr e2 varEnv funEnv
(match ope with
| "*" -> MUL :: C
| "+" -> ADD :: C
| "-" -> SUB :: C
| "/" -> DIV :: C
| "%" -> MOD :: C
| "==" -> EQ :: C
| "!=" -> EQ :: addNOT C
| "<" -> LT :: C
| ">=" -> LT :: addNOT C
| ">" -> SWAP :: LT :: C
| "<=" -> SWAP :: LT :: addNOT C
| _ -> failwith "unknown primitive 2"))
| Andalso(e1, e2) ->
match C with
| IFZERO lab :: _ ->
cExpr e1 varEnv funEnv (IFZERO lab :: cExpr e2 varEnv funEnv C)
| IFNZRO labthen :: C1 ->
let (labelse, C2) = addLabel C1
cExpr e1 varEnv funEnv
(IFZERO labelse
:: cExpr e2 varEnv funEnv (IFNZRO labthen :: C2))
| _ ->
let (jumpend, C1) = makeJump C
let (labfalse, C2) = addLabel (addCST 0 C1)
cExpr e1 varEnv funEnv
(IFZERO labfalse
:: cExpr e2 varEnv funEnv (addJump jumpend C2))
| Orelse(e1, e2) ->
match C with
| IFNZRO lab :: _ ->
cExpr e1 varEnv funEnv (IFNZRO lab :: cExpr e2 varEnv funEnv C)
| IFZERO labthen :: C1 ->
let(labelse, C2) = addLabel C1
cExpr e1 varEnv funEnv
(IFNZRO labelse :: cExpr e2 varEnv funEnv
(IFZERO labthen :: C2))
| _ ->
let (jumpend, C1) = makeJump C
let (labtrue, C2) = addLabel(addCST 1 C1)
cExpr e1 varEnv funEnv
(IFNZRO labtrue
:: cExpr e2 varEnv funEnv (addJump jumpend C2))
| Call(f, es) -> callfun f es varEnv funEnv C
(* Generate code to access variable, dereference pointer or index array: *)
and cAccess access varEnv funEnv C =
match access with
| AccVar x ->
match lookup (fst varEnv) x with
| Glovar addr, _ -> addCST addr C
| Locvar addr, _ -> GETBP :: addCST addr (ADD :: C)
| AccDeref e ->
cExpr e varEnv funEnv C
| AccIndex(acc, idx) ->
cAccess acc varEnv funEnv (LDI :: cExpr idx varEnv funEnv (ADD :: C))
(* Generate code to evaluate a list es of expressions: *)
and cExprs es varEnv funEnv C =
match es with
| [] -> C
| e1::er -> cExpr e1 varEnv funEnv (cExprs er varEnv funEnv C)
(* Generate code to evaluate arguments es and then call function f: *)
and callfun f es varEnv funEnv C : instr list =
let (labf, tyOpt, paramdecs) = lookup funEnv f
let argc = List.length es
if argc = List.length paramdecs then
cExprs es varEnv funEnv (makeCall argc labf C)
else
failwith (f + ": parameter/argument mismatch")
(* Compile a complete micro-C program: globals, call to main, functions *)
let cProgram (Prog topdecs) : instr list =
let _ = resetLabels ()
let ((globalVarEnv, _), funEnv, globalInit) = makeGlobalEnvs topdecs
let compilefun (tyOpt, f, xs, body) =
let (labf, _, paras) = lookup funEnv f
let (envf, fdepthf) = bindParams paras (globalVarEnv, 0)
let C0 = [RET (List.length paras-1)]
let code = cStmt body (envf, fdepthf) funEnv C0
Label labf :: code
let functions =
List.choose (function
| Fundec (rTy, name, argTy, body)
-> Some (compilefun (rTy, name, argTy, body))
| Vardec _ -> None)
topdecs
let (mainlab, _, mainparams) = lookup funEnv "main"
let argc = List.length mainparams
globalInit
@ [LDARGS argc; CALL(argc, mainlab); STOP]
@ List.concat functions
(* Compile the program (in abstract syntax) and write it to file
fname; also, return the program as a list of instructions.
*)
let intsToFile (inss : int list) (fname : string) =
printfn $"VM numeric code saved in file:\n\t{fname}"
File.WriteAllText(fname, String.concat " " (List.map string inss))
let writeInstr fname instrs =
let ins = String.concat "\n" (List.map string instrs)
File.WriteAllText(fname, ins)
printfn $"VM instructions saved in file:\n\t{fname}"
let contCompileToFile program fname =
let instrs = cProgram program
// printf "\nStack VM optimized instructions:\n %A\n" instrs
writeInstr (fname + ".opt.ins") instrs
let bytecode = code2ints instrs
// printf "\nStack VM optimized numeric code:\n %A\n" bytecode
intsToFile bytecode (fname+".opt.out"); instrs
(* Example programs are found in the files ex1.c, ex2.c, etc *)