2025-07-28 22:40:06 +08:00
|
|
|
|
module TComp
|
|
|
|
|
include("./parser.jl")
|
|
|
|
|
using .Parser
|
2025-08-19 23:57:14 +08:00
|
|
|
|
using Match
|
|
|
|
|
|
2025-08-21 00:00:59 +08:00
|
|
|
|
# For pass 2
|
|
|
|
|
# Intermediate result of pass 2 (remove-complex-operands).
#   binds : vector of `%let` statements that have to run before `body`
#   body  : the expression that remains once `binds` have been executed
# Both fields are deliberately untyped because the AST is built from plain
# vectors and tuples.
struct SimpleExp
    binds::Any
    body::Any
end
|
2025-08-19 23:57:14 +08:00
|
|
|
|
|
|
|
|
|
# Driver, step 0: read the program named by the first command-line argument
# and parse it.
inp = ARGS

# Fail with a readable message instead of a bare BoundsError when the script
# is started without an input file.
isempty(ARGS) && error("TComp: missing input file (expected the path of the program to compile as the first argument)")

# `f` stays open here; it is closed together with the output file at the end
# of the module.
f = open(ARGS[1], "r")
prog = read(f, String)
#print(prog)

parsed = Parser.totalParse(prog)
#print(parsed)

tmp_var_no = 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2025-08-21 00:00:59 +08:00
|
|
|
|
# Pass 1: uniquify variables (rename every let-bound variable so that no two bindings share a name)
|
|
|
|
|
# Pass 1 worker: rename every let-bound variable to `<name><n>` so that each
# binding in the program ends up with a distinct name.
#
# Arguments
#   parsed : an AST node; either an atom tuple `(text, kind)` with kind "id" or
#            "int", or a vector headed by ("%let", "id"), ("%prime", "id") or
#            ("%call", "id").
#   env    : vector of every source name bound so far. It is MUTATED: each
#            `%let` pushes its name, and the resulting length becomes the
#            numeric suffix of the new name, so suffixes never repeat.
#   scope  : optional Dict from source name to the unique name visible at this
#            point. Callers normally omit it; it is then seeded from `env` so
#            that names already in `env` resolve to their last occurrence.
#
# Returns the rewritten node. Raises an error for a variable that is not in
# scope and for a node of an unrecognised shape.
function uniquifyVar(parsed, env, scope = nothing)
    visible = scope
    if visible === nothing
        visible = Dict{Any,Any}()
        for (position, name) in enumerate(env)
            visible[name] = name * string(position)
        end
    end

    return @match parsed begin
        # letrec is not considered
        [("%let", "id"), [ty, var], val, body] =>
            begin
                name = var[1]
                # Record the binding program-wide; its position is the suffix.
                push!(env, name)
                newVar = (name * string(length(env)), "id")
                # The bound value is resolved in the *enclosing* scope, so
                # `let x = x + 1` refers to the outer x, not to itself.
                newVal = uniquifyVar(val, env, visible)
                # Only the body sees the new binding. Working on a copy keeps
                # it from leaking to expressions outside this let.
                bodyScope = copy(visible)
                bodyScope[name] = newVar[1]
                newBody = uniquifyVar(body, env, bodyScope)
                [("%let", "id"), [ty, newVar], newVal, newBody]
            end
        (var, "id") =>
            begin
                haskey(visible, var) || error("uniquifyVar: unbound variable `$var`")
                (visible[var], "id")
            end
        [("%prime", "id"), op, [lhs, rhs]] =>
            begin
                lhs_new = uniquifyVar(lhs, env, visible)
                rhs_new = uniquifyVar(rhs, env, visible)
                [("%prime", "id"), op, [lhs_new, rhs_new]]
            end
        [("%call", "id"), callee, args...] =>
            begin
                unifiedCallee = uniquifyVar(callee, env, visible)
                # `args` is the rest of the node; its first element is the
                # vector holding the actual arguments.
                unifiedArgs = map(x -> uniquifyVar(x, env, visible), args[1])
                vcat([("%call", "id"), unifiedCallee], [unifiedArgs])
            end
        (c, "int") => parsed
        # Returning a sentinel string here would only surface later as an
        # unrelated failure in pass 2, so report the bad node immediately.
        _ => error("uniquifyVar: unsupported expression: $(repr(parsed))")
    end
end
|
|
|
|
|
|
2025-08-21 00:00:59 +08:00
|
|
|
|
# PASS2: explicate control and remove complex operands
|
|
|
|
|
# Pass 2: flatten the (uniquified) program into a straight-line statement list.
#
# Every operand of a `%prime` / `%call` node that is not already an atom is
# evaluated into a fresh temporary `tmp<N>` first, and nested `%let`s are
# unrolled into a sequence of bindings.
#
# Argument
#   prog : AST as produced by `uniquifyVar`.
#
# Returns a vector of `[("%let", "id"), [type, var], value]` statements followed
# by one final `[("%return", "id"), atom]` statement, where `value` is an atom or
# a single operation on atoms. Raises an error for an expression shape it does
# not understand.
function explicitControlRemoveComplex(prog)
    # A lifted operation is reported as the binder `[("int", "id"), tmpVar]` of
    # the temporary that holds it; reduce that to the plain variable atom.
    # Atoms pass through unchanged.
    unwrapTmp(body) = body[1] == ("int", "id") ? body[2] : body

    # Entry point: temporaries are numbered from 0.
    function rmComplex(exp)
        return rmComplexAux1(exp, 0)
    end

    # Unroll leading `%let`s (if any), then simplify what is left.
    # Returns `(SimpleExp, nextVarNo)`.
    function rmComplexAux1(exp, varNo)
        if exp[1] == ("%let", "id")
            binds, rest, nextNo = splitLet([], exp, varNo)
            return rmComplexAux2(SimpleExp(binds, rest), nextNo)
        end
        return rmComplexAux2(SimpleExp([], exp), varNo)
    end

    # Simplify `exp.body`, which must no longer start with a `%let`.
    # Atoms are returned as they are; operations are lifted into a temporary.
    function rmComplexAux2(exp, varNo)
        return @match exp.body begin
            (_, "int") => (exp, varNo)
            (_, "id") => (exp, varNo)
            [(id, "id"), caller, callee] where (id == "%prime" || id == "%call") =>
                liftOperation(exp, id, caller, callee, varNo)
            # A sentinel return value would only fail later, at the first
            # field access on it, so report the offending expression here.
            _ => error("explicitControlRemoveComplex: unsupported expression: $(repr(exp.body))")
        end
    end

    # Bind the operation `(id caller operands...)` to a fresh temporary after
    # making every operand atomic. Returns `(SimpleExp, nextVarNo)` whose body
    # is the binder `[("int", "id"), (tmpName, "id")]` of that temporary.
    function liftOperation(exp, id, caller, operands, varNo)
        newResList = exp.binds
        new_exp_args = []
        for operand in operands
            simple, varNo = rmComplexAux1(operand, varNo)
            if !isempty(simple.binds)
                newResList = vcat(newResList, simple.binds)
            end
            # Use the operand's own simplified value. Taking the variable of
            # its last binding instead would be wrong for an operand such as
            # `(let y 2 x)`, whose value is `x`, not `y`.
            push!(new_exp_args, unwrapTmp(simple.body))
        end
        new_exp_body = Any[(id, "id"), caller, new_exp_args]

        newBindVar = [("int", "id"), ("tmp" * string(varNo), "id")]
        push!(newResList, [("%let", "id"), newBindVar, new_exp_body])
        return (SimpleExp(newResList, newBindVar), varNo + 1)
    end

    # Unroll a chain of nested `%let`s into `binds`.
    # Returns `(binds, innermostBody, nextVarNo)`.
    function splitLet(binds, exp, varNo)
        while exp[1] == ("%let", "id")
            valueExp, varNo = rmComplexAux1(exp[3], varNo)
            binds = vcat(binds, valueExp.binds)
            push!(binds, [("%let", "id"), exp[2], unwrapTmp(valueExp.body)])
            exp = exp[4]
        end
        return (binds, exp, varNo)
    end

    raw_res = rmComplex(prog)[1]
    raw_res_body = raw_res.body

    if raw_res_body[1] == ("int", "id")
        # Result lives in a temporary: [("int", "id"), ("tmp1", "id")]
        final_stmt = [("%return", "id"), raw_res_body[2]]
    elseif raw_res_body[2] == "int" || raw_res_body[2] == "id"
        # Result is an atom: a literal such as ("8", "int") or a plain variable.
        # Variables need the `%return` wrapper as well; without it the program
        # would end in a bare atom that produces no instruction.
        final_stmt = [("%return", "id"), raw_res_body]
    else
        final_stmt = raw_res_body
    end

    return push!(raw_res.binds, final_stmt)
end
|
|
|
|
|
|
2025-08-24 22:44:32 +08:00
|
|
|
|
### PASS 3 assign x86 instruction
|
|
|
|
|
### Pass 3: translate the flat statement list into pseudo-x86 instructions.
#
# Argument
#   inp : vector of statements as produced by pass 2.
#
# Returns a vector of instructions. Every instruction produced for `%return`
# and `%let` statements is a 3-element vector `[mnemonic, source, destination]`;
# variables are still referred to by name at this stage.
function assignInstruction(inp)
    # Mnemonic used for each primitive operator.
    # NOTE(review): `divq` is emitted here in two-operand form like the others;
    # confirm that this is what the assembler expects before relying on "/".
    mnemonics = Dict("+" => "addq", "-" => "subq", "*" => "imulq", "/" => "divq")
    # Operators for which `a op b == b op a`.
    commutative = ("+", "*")
    # Render an atom as an operand: integer literals become `$n` immediates.
    operand(text, kind) = kind == "int" ? "\$" * text : text

    resList = []
    for i in inp
        @match i begin
            [("%return", "id"), (val, t_val)] =>
                push!(resList, ["movq", operand(val, t_val), "%rax"])

            [("%let", "id"), [_ty, (id, "id")],
             [("%prime", "id"), (op, _), [(lhs, lhs_t), (rhs, rhs_t)]]] =>
                begin
                    haskey(mnemonics, op) || error("assignInstruction: unsupported operator `$op`")
                    instr = mnemonics[op]
                    src1 = operand(lhs, lhs_t)
                    src2 = operand(rhs, rhs_t)

                    if src2 != id
                        # id = lhs; id = id op rhs
                        push!(resList, ["movq", src1, id])
                        push!(resList, [instr, src2, id])
                    elseif op in commutative
                        # id = lhs op id  ==  id op lhs, so update in place.
                        push!(resList, [instr, src1, id])
                    else
                        # id = lhs op id with a non-commutative op: updating id
                        # in place would compute `id op lhs`, so go through
                        # %rax to keep the operand order.
                        push!(resList, ["movq", src1, "%rax"])
                        push!(resList, [instr, id, "%rax"])
                        push!(resList, ["movq", "%rax", id])
                    end
                    #TODO [("%call", "id"), (op, _), args] => ...
                end

            [("%let", "id"), [_ty, (id, "id")], (val, t_val)] =>
                push!(resList, ["movq", operand(val, t_val), id])

            # Bare atoms become single-element entries. They are not complete
            # instructions; the final emitter only prints 3-element entries.
            (c, "int") => push!(resList, ["\$" * c])
            (v, "id") => push!(resList, [v])

            # NOTE(review): an unsupported statement is only reported and then
            # skipped, so no instruction is generated for it.
            _ => println("Error")
        end
    end

    return resList
end
|
|
|
|
|
|
|
|
|
|
|
2025-08-21 00:00:59 +08:00
|
|
|
|
# Driver, passes 1-3. Uncomment the println lines to inspect intermediate results.

# Pass 1 starts with no variable bound.
emptyEnv = Any[]
res = uniquifyVar(parsed, emptyEnv)
#println("PASS1", res)

# Pass 2: flatten into a statement list.
res2 = explicitControlRemoveComplex(res)
#println("PASS2", Parser.prettyStringLisp(res2))

# Pass 3: select instructions.
res3 = assignInstruction(res2)
#println("PASS3", res3)
|
2025-08-24 22:44:32 +08:00
|
|
|
|
|
2025-08-19 23:57:14 +08:00
|
|
|
|
|
2025-09-01 01:21:11 +08:00
|
|
|
|
# PASS4 assign home
|
|
|
|
|
# Pass 4: give every variable a stack slot relative to %rbp.
#
# Argument
#   inp : vector of 3-element instructions `[mnemonic, source, destination]`.
#
# Returns `(instructions, variableCount)`. In the returned instructions every
# variable operand is replaced by `-<offset>(%rbp)`. Variables are numbered in
# order of first appearance (source before destination); the first one gets the
# largest offset, `8 * variableCount`, and the last one gets 8.
function assignHomes(inp)
    # An operand is a variable when it starts with neither `$` (immediate)
    # nor `%` (register).
    isVariable(operand) = match(r"(^[^\$%].*)", operand) !== nothing

    # First sweep: number the variables in order of first appearance.
    slotOf = Dict{Any,Int}()
    for instruction in inp
        for operand in (instruction[2], instruction[3])
            if isVariable(operand) && !haskey(slotOf, operand)
                slotOf[operand] = length(slotOf) + 1
            end
        end
    end
    varsLength = length(slotOf)

    # Stack address of a variable; any other operand is returned unchanged.
    function home(operand)
        slot = get(slotOf, operand, nothing)
        slot === nothing && return operand
        return "-$((varsLength - slot + 1) * 8)(%rbp)"
    end

    # Second sweep: rewrite the operands.
    res = Any[[instruction[1], home(instruction[2]), home(instruction[3])]
              for instruction in inp]
    return (res, varsLength)
end
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# PASS5 patch instructions (ensure no instruction has two memory operands, e.g. "instr x(%rbp), y(%rbp)")
|
|
|
|
|
# Pass 5: rewrite instructions whose operand combination cannot be encoded.
#
# Argument
#   inp : vector of 3-element instructions `[mnemonic, source, destination]`
#         in which variables have already been replaced by `N(%rbp)` operands.
#
# Returns a new vector of instructions in which
#   * `imulq` never has a non-register destination, and
#   * no instruction has two `(%rbp)` memory operands.
# %rax is used as the scratch register in both rewrites. Instructions that need
# no change are passed through as they are.
function patchInstruction(inp)
    memoryRegex = r".+[(]%rbp[)]$"
    registerRegex = r"^%.+"
    isMemory(operand) = match(memoryRegex, operand) !== nothing
    isRegister(operand) = match(registerRegex, operand) !== nothing

    res = []
    for i in inp
        inst, orig, dest = i[1], i[2], i[3]

        if inst == "imulq" && !isRegister(dest)
            # This case must be tested first: the generic two-memory-operand
            # rewrite below would leave the multiply with a memory destination.
            push!(res, ["movq", dest, "%rax"])
            push!(res, ["imulq", orig, "%rax"])
            push!(res, ["movq", "%rax", dest])
        elseif isMemory(orig) && isMemory(dest)
            # Route the source through %rax.
            push!(res, ["movq", orig, "%rax"])
            push!(res, [inst, "%rax", dest])
        else
            push!(res, i)
        end
    end

    return res
end
|
2025-08-19 23:57:14 +08:00
|
|
|
|
|
2025-09-01 01:21:11 +08:00
|
|
|
|
# Driver, passes 4-5.

# Pass 4 yields the rewritten instructions together with the number of
# stack-allocated variables.
res4 = assignHomes(res3)
res4_prog, varNumber = res4

# Pass 5: make every instruction encodable.
res5 = patchInstruction(res4_prog)
#println("PASS5",res5)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
## PASS6 add prelude and conclusion
|
|
|
|
|
# Pass 6: wrap the instruction list in a `main` prelude and a conclusion and
# render the whole program as assembly text.
#
# Arguments
#   prog      : vector of instructions; only 3-element entries
#               `[mnemonic, source, destination]` are printed, all other
#               entries are skipped.
#   varNumber : number of 8-byte stack slots the program uses.
#
# Returns the assembly program as a String, terminated by a newline.
function preludeConclude(prog, varNumber)
    # Reserve room for all slots, rounded up to a multiple of 16 bytes so that
    # %rsp keeps the 16-byte alignment it has right after `pushq %rbp`.
    frameBytes = 16 * cld(varNumber * 8, 16)

    out = IOBuffer()

    # Prelude: set up the frame and jump to the program body.
    print(out, ".globl main\nmain:\npushq %rbp\nmovq %rsp, %rbp\n")
    print(out, "\tsubq \$$frameBytes, %rsp\n\tjmp start\n\n")

    # Body.
    print(out, "start:\n")
    for i in prog
        if length(i) == 3
            print(out, "\t$(i[1])\t$(i[2]), $(i[3])\n")
        end
    end
    print(out, "\tjmp\tconclusion\n\n\n")

    # Conclusion: tear down the frame and return. The file ends with a newline
    # so that the last instruction is a complete line.
    print(out, "\nconclusion:\n")
    print(out, "\taddq \$$frameBytes, %rsp\n\tpopq %rbp\n\tretq\n")

    return String(take!(out))
end
|
|
|
|
|
|
|
|
|
|
# Driver, pass 6 and output: render the assembly and write it to ./a.s.
res6 = preludeConclude(res5, varNumber)
# println("PASS6",res6) # emit assembly code

f2 = open("./a.s", "w")
try
    write(f2, res6) #write the assembly code
finally
    # Release both file handles even when the write fails. The output file is
    # closed first so that its contents are flushed in any case.
    close(f2)
    close(f)
end
|
2025-07-28 22:40:06 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
end # module
|