diff --git a/code_generator.py b/code_generator.py index f4ac090..efdcce6 100644 --- a/code_generator.py +++ b/code_generator.py @@ -1,169 +1,264 @@ from tree_nodes import * -sd = 0 -jumpId = 65 -let_count = 0 -rho = {} -localVarCount = 1 +sd = 0 #stack distance +jumpId = 65 #Labels to jump to +let_count = 0 #Count lets to slide at the end +rho = {} #Address space +localVarCount = 1 #local variable count +varsUsedInFun = [] #to find all variables used in the function def inorder to find the free variables +otherType = ["add", "sub", "mul", "div", "if", "asgn", "let", "fun", "if","app"] #all tags for type 'Other' +opType = ["add", "sub", "mul", "div"] #binary operators +op2 = ["le", "lt", "ge", "gt", "eq"] #Comparision operators +localAssignmentCount = 0 -def parse_syntaxTree(tree): +###parsing of the code called from main +def parse_syntaxTree(tree): #Assume the program starts with only let, if and let_rec if(tree.tag == "if"): code_gen_for_if(tree.children) elif(tree.tag == "let"): code_gen_for_let(tree.children) print(str(sd) + " slide " + str(let_count)) + elif(tree.tag == "rec"): + code_gen_for_rec(tree.children) -#code_generation for let +###code_generation for let def code_gen_for_let(children): global let_count - let_count+=1 + let_count+=1 #increment every time a let statement is encountered + + #first child of let is an assignment always (to_be_confirmed) if(children[0].tag == "asgn"): code_gen_for_asgn(children[0].children) - + + #second child of let can be a let, binary operator or a function application if(children[1].tag == "let"): code_gen_for_let(children[1].children) - elif(children[1].tag == "add"): - code_gen_for_op(children[1].children, "add") - elif(children[1].tag == "mul"): - code_gen_for_op(children[1].children, "mul") - elif(children[1].tag == "sub"): - code_gen_for_op(children[1].children, "sub") - elif(children[1].tag == "div"): - code_gen_for_op(children[1].children, "div") + elif(children[1].tag in opType): + code_gen_for_op(children[1].children, children[1].tag) elif(children[1].tag == "app"): code_gen_for_application(children[1].children) + elif(children[1].tag == "uadd" or children[1].tag == "usub"): + code_gen_for_uop(children[1].children, children[1].tag) + +###code_generation for unary operators +def code_gen_for_uop(children, type): + if(children[0].tag == "var"): + code_gen_for_var(children[0].var) + elif(children[0].tag == "basic"): + code_gen_for_basic_val(children[0].value) + print(str(sd) + " " +type) + print(str(sd) + " mkbasic") -#code_gen for assignment +###code_gen for assignment def code_gen_for_asgn(children): global rho, localVarCount + #first child of assignment can be a var or an fvar. If its a var the second child will be a basic value, an if or a binary operator. If its an fvar, the second child is a function if(children[0].tag == "var"): - #print("Variable name: " + children[0].var + "added at" + str(localVarCount)) rho[children[0].var] = ("L",localVarCount) localVarCount += 1 if(children[1].tag == "basic"): code_gen_for_basic_val(children[1].value) - elif(children[1].tag == "mul"): - code_gen_for_op(children[1].children, "mul") + elif(children[1].tag in opType): + code_gen_for_op(children[1].children, children[1].tag) + elif(children[1].tag == "if"): + code_gen_for_if(children[1].children) if(children[0].tag == "fvar"): rho[children[0].var] = ("L",localVarCount) localVarCount+=1 - if(children[1].tag == "basic"): - print(children[1].value) - elif(children[1].tag == "fun"): + if(children[1].tag == "fun"): code_gen_for_fun(children[1].children) -#code_generation for basic -def code_gen_for_basic_val(value): +###code_generation for basic value +def code_gen_for_basic_val(value, makebasic = True): global sd print(str(sd) + " loadc "+ str(value)) sd+=1 - print(str(sd) + " mkbasic") + if (makebasic == True): #when the value is not used immediatly we make basic + print(str(sd) + " mkbasic") -#code_generation for var +###code_generation for var def code_gen_for_var(var_name, getbasic = True): global rho, sd - value = rho[var_name][1] varType = rho[var_name][0] - if varType == "L": + value = rho[var_name][1] + #check if the variable is local or global + if varType == "L": value = sd - value print(str(sd) + " pushloc " + str(value)) elif varType == "G": print(str(sd) + " pushglob " + str(value)) sd+=1 - if (getbasic): + if (getbasic): #if the value is used now print(str(sd) + " getbasic") -#code_genation for binary operators -def code_gen_for_op(children, type): +###code_generation for binary operators +def code_gen_for_op(children, type): #The children of operators can be var arg or basic global sd - if(children[0].tag == "var"): + if(children[0].tag == "var" or children[0].tag == "arg"): code_gen_for_var(children[0].var) elif(children[0].tag == "basic"): - code_gen_for_basic_val(children[0].value) + code_gen_for_basic_val(children[0].value, type in opType) if (children[1].tag == "var" or children[1].tag == "arg"): code_gen_for_var(children[1].var) elif(children[1].tag == "basic"): - code_gen_for_basic_val(children[1].value) + code_gen_for_basic_val(children[1].value, type in opType) print(str(sd) + " " + type) sd-=1 - print(str(sd) + " mkbasic") + if (type in opType): + print(str(sd) + " mkbasic") #TODO: check if mkbasic comes here or when call to this function returns + +''' +###code_generation for comparision operators +def code_gen_for_op2(children, type): + global sd + if(children[0].tag == "var" or children[0].tag == "arg"): + code_gen_for_var(children[0].var) + elif(children[0].tag == "basic"): + code_gen_for_basic_val(children[0].value, False) + + if (children[1].tag == "var" or children[1].tag == "arg"): + code_gen_for_var(children[1].var) + elif(children[1].tag == "basic"): + code_gen_for_basic_val(children[1].value, False) + + print(str(sd) + " " + type) + sd-=1 +''' -#code_generation for if -def code_gen_for_if(children): +###code_generation for if +def code_gen_for_if(children): global jumpId - if(children[0].tag == "basic"): + if(children[0].tag == "basic"): #the condition can be a basic type or a op2 type code_gen_for_basic_val(children[0].value) + elif(children[0].tag in op2): + code_gen_for_op(children[0].children, children[0].tag) - print("jumpz " + chr(jumpId)) + print(str(sd) + " jumpz " + chr(jumpId)) jumpId+= 1 - if(children[1].tag == "basic"): - code_gen_for_basic_val(children[1].value) + #then part of if can be basic, var or arg type + if(children[1].tag == "basic"): + code_gen_for_basic_val(children[1].value, False) + elif(children[1].tag == "var" or children[1].tag == "arg"): + code_gen_for_var(children[1].var, False) - print("jump " + chr(jumpId)) + print(str(sd) + " jump " + chr(jumpId)) + print(chr(jumpId - 1) + ":") jumpId+= 1 - - if(children[2].tag == "basic"): - code_gen_for_basic_val(children[2].value) -#code_generation for function + #else part of if can be either basic or application type + if(children[2].tag == "basic"): + code_gen_for_basic_val(children[2].value, False) + elif (children[2].tag == "app"): + code_gen_for_application(children[2].children) + print(chr(jumpId - 1) + ":") + +###code_generation for function def code_gen_for_fun(children): - global sd, rho - funArgVars = [] - for funArg in children: - if (funArg.tag == "arg"): + global sd, rho, jumpId + funArgVars = [] #the formal parameters + localFunNameLabel = jumpId #label for the function name to be created + jumpId += 1 + localFunJumpLabel = jumpId #label for the jump after the function call + jumpId += 1 + for funArg in children: #there could be 1-n parameters for the function + if (funArg.tag == "arg"): funArgVars.append(funArg.var) - else: - varsUsed = getVarsUsed() - freeVars = list(set(varsUsed) - set(funArgVars)) - #generate code for free-vars - for var in freeVars: + else: #the actual execution of the function + varsUsed = getVarsUsed(children) #all variables used inside the function definition + freeVars = list(set(varsUsed) - set(funArgVars)) #variables that are not formal parameters + varsUsedInFun = [] #reset the global variable + + for var in freeVars: #first generate code for free-vars code_gen_for_var(var, False) print(str(sd) + " mkvec " + str(len(freeVars))) - print(str(sd) + " mkfunval A") - print(str(sd) + " jump B") - oldSD = sd #new stack distance + print(str(sd) + " mkfunval " + chr(localFunNameLabel)) + print(str(sd) + " jump " + chr(localFunJumpLabel)) + + oldSD = sd #new stack distance and address space in the function definiton sd = 0 oldRHO = rho rho = {} formalParamCount = 0 globalFunVarCount = 0 - for var in funArgVars: + + for var in funArgVars: #define the address space of the local and formal parameters rho[var] = ("L",formalParamCount) formalParamCount-=1 for var in freeVars: rho[var] = ("G",globalFunVarCount) globalFunVarCount+=1 - print("A:") + + print(chr(localFunNameLabel) + ":") #start of the function definition code generation print (str(sd) + " targ " + str(len(funArgVars))) - if (funArg.tag == "add"): - code_gen_for_op(funArg.children, "add") - print (str(sd) + " return " + str(len(funArgVars))) - sd=oldSD + if (funArg.tag in opType): #the last child of a function can be an operator or an if + code_gen_for_op(funArg.children, funArg.tag) + elif (funArg.tag == "if"): + code_gen_for_if(funArg.children) + + print (str(sd) + " return " + str(len(funArgVars))) #end of the function definition code generation + + sd=oldSD #reset the sd and the address space rho = oldRHO - print("B:") + print(chr(localFunJumpLabel) + ":") #Return variables used inside a function inorder to determine the free variables -def getVarsUsed(): #TODO - return ["a", "b"] +def getVarsUsed(children): + global varsUsedInFun + for i in children: + if (i.tag == "var" or i.tag == "fvar" or i.tag == "arg"): + if(not i.var in varsUsedInFun): + varsUsedInFun.append(i.var) + elif (i.tag in otherType): + getVarsUsed(i.children) + return varsUsedInFun -#code generation for function application +###code generation for function application def code_gen_for_application(children): global sd preAppSD = sd - print(str(sd) + " mark C") - sd=sd+3 - for i in range((len(children)-1),-1, -1): + localMarkVar = jumpId #label for the jump after the function application + print(str(sd) + " mark " + chr(localMarkVar)) + sd=sd+3 #three org cells loaded + for i in range((len(children)-1),-1, -1): #the children are read in reverse order and are either basic, binary operator or a fvar if(children[i].tag == "basic"): code_gen_for_basic_val(children[i].value) - elif(children[i].tag == "add"): - code_gen_for_op(children[i].children,"add") + elif(children[i].tag in opType): + code_gen_for_op(children[i].children,children[i].tag) elif(children[i].tag == "fvar"): code_gen_for_var(children[i].var,False) print(str(sd) + " apply") - print("C:") - sd = preAppSD + 1 + print(chr(localMarkVar) + ":") + sd = preAppSD + 1 + +###code generation for rec +def code_gen_for_rec(children): + global sd + n = allocateLocalVars(children) #find no of local variables to be allocated + print(str(sd) + " alloc " + str(n)) + sd+=n + if(children[0].tag == "asgn"): #first child of let_rec is an assignment + code_gen_for_asgn(children[0].children) + print(str(sd) + " rewrite " + str(n)) + sd-=1 + if(children[1].tag == "app"): #second child of let_rec is an application + code_gen_for_application(children[1].children) + print(str(sd) + " slide " + str(n)) + +#find the value of n for rec definitions +def allocateLocalVars(children): + global localAssignmentCount + for i in children: + if (i.tag == "asgn"): + localAssignmentCount+=1 + elif (i.tag == "var" or i.tag == "fvar" or i.tag == "basic" or i.tag == "arg"): + pass + else: + allocateLocalVars(i.children) + return localAssignmentCount + + \ No newline at end of file diff --git a/main.py b/main.py index 7cb233d..a56eaea 100644 --- a/main.py +++ b/main.py @@ -64,5 +64,14 @@ #parse_syntaxTree(result) #result = parse_tree("let a = 17 in let f = fun b -> a + b in f (39 + 2)") #parse_syntaxTree(result) - result = parse_tree("let a = 17 in let f = fun b -> a + b in f 42") # 140 - parse_syntaxTree(result) \ No newline at end of file + #result = parse_tree("let a = 17 in let f = fun b -> a + b in f 42") # 140 + #parse_syntaxTree(result) + #result = parse_tree("let rec f = fun x y -> if y <= 1 then x else f ( x * y ) ( y - 1 ) in f 1") + #parse_syntaxTree(result) + #result = parse_tree("let x3 = 4 in + x3 ") + #parse_syntaxTree(result) + #result = parse_tree("let f = fun x y -> let a = 5 in let b = x + 2*y in b + a*x in f 0 1") + #parse_syntaxTree(result) + #result = parse_tree("if y > x then x else 7 + y * x") + #parse_syntaxTree(result) +