1
0
Fork 0

Add first part of IR Generator implementation

This commit is contained in:
Vili Sinervä 2025-02-05 17:16:17 +02:00
parent f059870e81
commit dc50ce64eb
No known key found for this signature in database
GPG key ID: DF8FEAF54EFAC996
5 changed files with 238 additions and 1 deletions

View file

@ -1,6 +1,8 @@
use std::io;
use interpreter::interpret;
use ir::IrInstruction;
use ir_generator::generate_ir;
use parser::parse;
use symtab::SymTab;
use tokenizer::tokenize;
@ -8,6 +10,8 @@ use type_checker::type_check;
mod ast;
mod interpreter;
mod ir;
mod ir_generator;
mod parser;
mod symtab;
mod token;
@ -15,10 +19,20 @@ mod tokenizer;
mod type_checker;
mod variable;
pub fn compile(code: &str) {
pub fn compile(code: &str) -> Vec<IrInstruction> {
let tokens = tokenize(code);
let mut ast = parse(&tokens);
type_check(&mut ast, &mut SymTab::new_type_table());
generate_ir(&ast)
}
pub fn start_compiler() {
let lines = io::stdin().lines();
for line in lines.map_while(Result::ok) {
for instruction in compile(&line) {
println!("{instruction}");
}
}
}
pub fn start_interpreter() {

98
src/compiler/ir.rs Normal file
View file

@ -0,0 +1,98 @@
use std::{collections::HashMap, fmt};
use crate::compiler::{token::CodeLocation, variable::Type};
#[derive(PartialEq, Clone, Eq, Hash)]
pub struct IrVar {
pub name: String,
}
impl fmt::Debug for IrVar {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "{}", self.name)
}
}
impl fmt::Display for IrVar {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "{}", self.name)
}
}
impl IrVar {
pub fn new(name: &str) -> Self {
Self {
name: name.to_owned(),
}
}
pub fn new_global_types() -> HashMap<IrVar, Type> {
use Type::*;
HashMap::from([
(IrVar::new("unit"), Unit),
(IrVar::new("print_bool"), Func(vec![Bool], Box::new(Unit))),
(IrVar::new("print_int"), Func(vec![Int], Box::new(Unit))),
(IrVar::new("read_int"), Func(vec![], Box::new(Int))),
(IrVar::new("+"), Func(vec![Int, Int], Box::new(Int))),
(IrVar::new("*"), Func(vec![Int, Int], Box::new(Int))),
(IrVar::new("-"), Func(vec![Int, Int], Box::new(Int))),
(IrVar::new("/"), Func(vec![Int, Int], Box::new(Int))),
(IrVar::new("%"), Func(vec![Int, Int], Box::new(Int))),
(IrVar::new("<"), Func(vec![Int, Int], Box::new(Bool))),
(IrVar::new("<="), Func(vec![Int, Int], Box::new(Bool))),
(IrVar::new(">"), Func(vec![Int, Int], Box::new(Bool))),
(IrVar::new(">="), Func(vec![Int, Int], Box::new(Bool))),
(IrVar::new("not"), Func(vec![Bool], Box::new(Bool))),
(IrVar::new("neg"), Func(vec![Int], Box::new(Int))),
(IrVar::new("or"), Func(vec![Bool, Bool], Box::new(Bool))),
(IrVar::new("and"), Func(vec![Bool, Bool], Box::new(Bool))),
])
}
}
impl fmt::Display for IrInstruction {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "{} # From {}", self.instruction, self.loc)
}
}
#[derive(Debug, PartialEq, Clone)]
pub struct IrInstruction {
pub loc: CodeLocation,
pub instruction: IrInstructionType,
}
impl IrInstruction {
pub fn new(loc: CodeLocation, instruction: IrInstructionType) -> Self {
Self { loc, instruction }
}
}
#[derive(Debug, PartialEq, Clone)]
pub enum IrInstructionType {
LoadBoolConst(bool, IrVar),
LoadIntConst(i64, IrVar),
Copy(IrVar, IrVar),
Call(IrVar, Vec<IrVar>, IrVar),
Jump(Box<IrInstruction>),
CondJump(IrVar, Box<IrInstruction>, Box<IrInstruction>),
Label(String),
}
impl fmt::Display for IrInstructionType {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
let string = match self {
IrInstructionType::LoadBoolConst(val, dest) => format!("LoadBoolConst({val}, {dest})"),
IrInstructionType::LoadIntConst(val, dest) => format!("LoadIntConst({val}, {dest})"),
IrInstructionType::Copy(src, dest) => format!("Copy({src}, {dest})"),
IrInstructionType::Call(f, args, res) => format!("Call({f}, {args:?}, {res})"),
IrInstructionType::Jump(dest) => format!("Jump({})", *dest),
IrInstructionType::CondJump(cond, then_dest, else_dest) => {
format!("CondJump({cond}, {then_dest}, {else_dest})")
}
IrInstructionType::Label(name) => format!("Label({name})"),
};
write!(f, "{}", string)
}
}

View file

@ -0,0 +1,115 @@
use std::collections::HashMap;
use crate::compiler::{
ast::{AstNode, Expression::*},
ir::{IrInstruction, IrInstructionType::*, IrVar},
symtab::SymTab,
variable::Type,
};
pub fn generate_ir(ast: &AstNode) -> Vec<IrInstruction> {
let mut instructions = Vec::new();
let mut symbols = SymTab::new();
let global_types = IrVar::new_global_types();
let mut types = global_types.clone();
for var in global_types.keys() {
symbols.insert(&var.name, var.clone());
}
let result = visit_ast_node(ast, &mut types, &mut symbols, &mut instructions);
match types.get(&result) {
Some(Type::Int) => {
let loc = instructions.last().unwrap().loc;
let fn_var = symbols.get("print_int").clone();
instructions.push(IrInstruction::new(
loc,
Call(fn_var, vec![result], symbols.get("unit").clone()),
));
}
Some(Type::Bool) => {
let loc = instructions.last().unwrap().loc;
let fn_var = symbols.get("print_bool").clone();
instructions.push(IrInstruction::new(
loc,
Call(fn_var, vec![result], symbols.get("unit").clone()),
));
}
_ => (),
}
instructions
}
fn add_var(var_type: &Type, types: &mut HashMap<IrVar, Type>) -> IrVar {
let mut i = 1;
//let type_str = match var_type {
// Type::Int => "i",
// Type::Bool => "b",
// Type::Func(_, _) => "f",
// Type::Unit => "u",
//};
let type_str = "x";
let mut var = IrVar::new(&format!("{}{}", type_str, i));
while types.contains_key(&var) {
i += 1;
var = IrVar::new(&format!("{}{}", type_str, i));
}
types.insert(var.clone(), var_type.clone());
var
}
fn visit_ast_node(
ast: &AstNode,
types: &mut HashMap<IrVar, Type>,
symbols: &mut SymTab<IrVar>,
instructions: &mut Vec<IrInstruction>,
) -> IrVar {
match &ast.expr {
EmptyLiteral() => symbols.get("unit").clone(),
IntLiteral(val) => {
let var = add_var(&Type::Int, types);
instructions.push(IrInstruction::new(ast.loc, LoadIntConst(*val, var.clone())));
var
}
BoolLiteral(val) => {
let var = add_var(&Type::Bool, types);
instructions.push(IrInstruction {
loc: ast.loc,
instruction: LoadBoolConst(*val, var.clone()),
});
var
}
Identifier(name) => symbols.get(name).clone(),
UnaryOp(_, _) => todo!(),
BinaryOp(left, op, right) => match *op {
"=" => todo!(), // TODO Special handling
"and" => todo!(), // TODO Special handling
"or" => todo!(), // TODO Special handling
_ => {
let op_var = symbols.get(op).clone();
let left_var = visit_ast_node(left, types, symbols, instructions);
let right_var = visit_ast_node(right, types, symbols, instructions);
let result_var = add_var(&ast.node_type, types);
instructions.push(IrInstruction::new(
ast.loc,
Call(op_var, vec![left_var, right_var], result_var.clone()),
));
result_var
}
},
VarDeclaration(_, _, _) => todo!(),
Conditional(_, _, _) => todo!(),
While(_, _) => todo!(),
FunCall(_, _) => todo!(),
Block(_) => todo!(),
}
}

View file

@ -37,6 +37,14 @@ impl<'source, T> SymTab<'source, T> {
}
}
impl<'source, T> SymTab<'source, T> {
pub fn new() -> SymTab<'source, T> {
SymTab {
tables: vec![HashMap::new()],
}
}
}
impl<'source> SymTab<'source, Type> {
pub fn new_type_table() -> SymTab<'source, Type> {
use Type::*;

View file

@ -9,6 +9,8 @@ fn main() {
if let Some(flag) = args.get(1) {
if flag == "-i" {
compiler::start_interpreter();
} else if flag == "-c" {
compiler::start_compiler();
}
} else {
server::start("::".parse().unwrap(), 3000);