mod dtype;
mod equiv;
mod interp;
mod parse;
mod visualize;
mod write_ir;
use core::convert::TryFrom;
use core::fmt;
use core::ops::{Deref, DerefMut};
use std::collections::{BTreeMap, HashMap};
use std::hash::{Hash, Hasher};
pub use dtype::{Dtype, DtypeError, HasDtype};
use hexf_parse::{parse_hexf32, parse_hexf64};
pub use interp::{Value, interp};
use itertools::Itertools;
use lang_c::ast;
use ordered_float::OrderedFloat;
pub use parse::Parse;
pub use visualize::Visualizer;
#[derive(Debug, Clone, PartialEq)]
pub struct TranslationUnit {
pub decls: BTreeMap<String, Declaration>,
pub structs: HashMap<String, Option<Dtype>>,
}
#[derive(Debug, Clone, PartialEq)]
pub enum Declaration {
Variable {
dtype: Dtype,
initializer: Option<ast::Initializer>,
},
Function {
signature: FunctionSignature,
definition: Option<FunctionDefinition>,
},
}
impl TryFrom<Dtype> for Declaration {
type Error = DtypeError;
fn try_from(dtype: Dtype) -> Result<Self, Self::Error> {
match &dtype {
Dtype::Unit { .. } => Err(DtypeError::Misc {
message: "A variable of type `void` cannot be declared".to_string(),
}),
Dtype::Int { .. }
| Dtype::Float { .. }
| Dtype::Pointer { .. }
| Dtype::Array { .. }
| Dtype::Struct { .. } => Ok(Declaration::Variable {
dtype,
initializer: None,
}),
Dtype::Function { .. } => Ok(Declaration::Function {
signature: FunctionSignature::new(dtype),
definition: None,
}),
Dtype::Typedef { .. } => panic!("typedef should be replaced by real dtype"),
}
}
}
impl Declaration {
pub fn get_variable(&self) -> Option<(&Dtype, &Option<ast::Initializer>)> {
if let Self::Variable { dtype, initializer } = self {
Some((dtype, initializer))
} else {
None
}
}
pub fn get_function(&self) -> Option<(&FunctionSignature, &Option<FunctionDefinition>)> {
if let Self::Function {
signature,
definition,
} = self
{
Some((signature, definition))
} else {
None
}
}
pub fn get_function_mut(
&mut self,
) -> Option<(&mut FunctionSignature, &mut Option<FunctionDefinition>)> {
if let Self::Function {
signature,
definition,
} = self
{
Some((signature, definition))
} else {
None
}
}
pub fn is_compatible(&self, other: &Declaration) -> bool {
match (self, other) {
(Self::Variable { dtype, .. }, Self::Variable { dtype: other, .. }) => dtype == other,
(
Self::Function { signature, .. },
Self::Function {
signature: other, ..
},
) => signature.dtype() == other.dtype(),
_ => false,
}
}
}
impl HasDtype for Declaration {
fn dtype(&self) -> Dtype {
match self {
Self::Variable { dtype, .. } => dtype.clone(),
Self::Function { signature, .. } => signature.dtype(),
}
}
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct FunctionSignature {
pub ret: Dtype,
pub params: Vec<Dtype>,
}
impl FunctionSignature {
pub fn new(dtype: Dtype) -> Self {
let (ret, params) = dtype
.get_function_inner()
.expect("function signature's dtype must be function type");
Self {
ret: ret.clone(),
params: params.clone(),
}
}
}
impl HasDtype for FunctionSignature {
fn dtype(&self) -> Dtype {
Dtype::function(self.ret.clone(), self.params.clone())
}
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct FunctionDefinition {
pub allocations: Vec<Named<Dtype>>,
pub blocks: BTreeMap<BlockId, Block>,
pub bid_init: BlockId,
}
#[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub struct BlockId(pub usize);
impl fmt::Display for BlockId {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "b{}", self.0)
}
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct Block {
pub phinodes: Vec<Named<Dtype>>,
pub instructions: Vec<Named<Instruction>>,
pub exit: BlockExit,
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum Instruction {
Nop,
Value {
value: Operand,
},
BinOp {
op: ast::BinaryOperator,
lhs: Operand,
rhs: Operand,
dtype: Dtype,
},
UnaryOp {
op: ast::UnaryOperator,
operand: Operand,
dtype: Dtype,
},
Store {
ptr: Operand,
value: Operand,
},
Load {
ptr: Operand,
},
Call {
callee: Operand,
args: Vec<Operand>,
return_type: Dtype,
},
TypeCast {
value: Operand,
target_dtype: Dtype,
},
GetElementPtr {
ptr: Operand,
offset: Operand,
dtype: Dtype,
},
}
impl HasDtype for Instruction {
fn dtype(&self) -> Dtype {
match self {
Self::Nop | Self::Store { .. } => Dtype::unit(),
Self::Value { value } => value.dtype(),
Self::BinOp { dtype, .. }
| Self::UnaryOp { dtype, .. }
| Self::Call {
return_type: dtype, ..
}
| Self::TypeCast {
target_dtype: dtype,
..
}
| Self::GetElementPtr { dtype, .. } => dtype.clone(),
Self::Load { ptr } => ptr
.dtype()
.get_pointer_inner()
.expect("Load instruction must have pointer value as operand")
.clone()
.set_const(false),
}
}
}
impl Instruction {
pub fn has_no_side_effects(&self) -> bool {
!matches!(self, Self::Store { .. } | Self::Call { .. })
}
}
pub trait WriteOp {
fn write_operation(&self) -> String;
}
impl WriteOp for ast::BinaryOperator {
fn write_operation(&self) -> String {
match self {
Self::Multiply => "mul",
Self::Divide => "div",
Self::Modulo => "mod",
Self::Plus => "add",
Self::Minus => "sub",
Self::ShiftLeft => "shl",
Self::ShiftRight => "shr",
Self::Equals => "cmp eq",
Self::NotEquals => "cmp ne",
Self::Less => "cmp lt",
Self::LessOrEqual => "cmp le",
Self::Greater => "cmp gt",
Self::GreaterOrEqual => "cmp ge",
Self::BitwiseAnd => "and",
Self::BitwiseXor => "xor",
Self::BitwiseOr => "or",
_ => todo!(
"ast::BinaryOperator::WriteOp: write operation for {:?} is needed",
self
),
}
.to_string()
}
}
impl WriteOp for ast::UnaryOperator {
fn write_operation(&self) -> String {
match self {
Self::Plus => "plus",
Self::Minus => "minus",
Self::Negate => "negate",
_ => todo!(
"ast::UnaryOperator::WriteOp: write operation for {:?} is needed",
self
),
}
.to_string()
}
}
impl fmt::Display for Instruction {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Instruction::Nop => write!(f, "nop"),
Instruction::Value { value } => write!(f, "{value}"),
Instruction::BinOp { op, lhs, rhs, .. } => {
write!(f, "{} {} {}", op.write_operation(), lhs, rhs)
}
Instruction::UnaryOp { op, operand, .. } => {
write!(f, "{} {}", op.write_operation(), operand)
}
Instruction::Store { ptr, value } => write!(f, "store {value} {ptr}"),
Instruction::Load { ptr } => write!(f, "load {ptr}"),
Instruction::Call { callee, args, .. } => {
write!(
f,
"call {}({})",
callee,
args.iter()
.format_with(", ", |operand, f| f(&format_args!("{operand}")))
)
}
Instruction::TypeCast {
value,
target_dtype,
} => write!(f, "typecast {value} to {target_dtype}"),
Instruction::GetElementPtr { ptr, offset, .. } => {
write!(f, "getelementptr {ptr} offset {offset}")
}
}
}
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum BlockExit {
Jump {
arg: JumpArg,
},
ConditionalJump {
condition: Operand,
arg_then: JumpArg,
arg_else: JumpArg,
},
Switch {
value: Operand,
default: JumpArg,
cases: Vec<(Constant, JumpArg)>,
},
Return {
value: Operand,
},
Unreachable,
}
impl BlockExit {
pub fn walk_jump_args<F>(&mut self, mut f: F)
where
F: FnMut(&mut JumpArg),
{
match self {
Self::Jump { arg } => f(arg),
Self::ConditionalJump {
arg_then, arg_else, ..
} => {
f(arg_then);
f(arg_else);
}
Self::Switch { default, cases, .. } => {
f(default);
for (_, arg) in cases {
f(arg);
}
}
Self::Return { .. } | Self::Unreachable => {}
}
}
}
impl fmt::Display for BlockExit {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
BlockExit::Jump { arg } => write!(f, "j {arg}"),
BlockExit::ConditionalJump {
condition,
arg_then,
arg_else,
} => write!(f, "br {condition}, {arg_then}, {arg_else}"),
BlockExit::Switch {
value,
default,
cases,
} => write!(
f,
"switch {} default {} [\n{}\n ]",
value,
default,
cases.iter().format_with("\n", |(v, b), f| f(&format_args!(
" {}:{} {}",
v,
v.dtype(),
b
)))
),
BlockExit::Return { value } => write!(f, "ret {value}"),
BlockExit::Unreachable => write!(f, "<unreachable>\t\t\t\t; error state"),
}
}
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct JumpArg {
pub bid: BlockId,
pub args: Vec<Operand>,
}
impl JumpArg {
pub fn new(bid: BlockId, args: Vec<Operand>) -> Self {
Self { bid, args }
}
}
impl fmt::Display for JumpArg {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(
f,
"{}({})",
self.bid,
self.args
.iter()
.format_with(", ", |a, f| f(&format_args!("{a}")))
)
}
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub enum Operand {
Constant(Constant),
Register { rid: RegisterId, dtype: Dtype },
}
impl Operand {
pub fn constant(value: Constant) -> Self {
Self::Constant(value)
}
pub fn register(rid: RegisterId, dtype: Dtype) -> Self {
Self::Register { rid, dtype }
}
pub fn get_constant(&self) -> Option<&Constant> {
if let Self::Constant(constant) = self {
Some(constant)
} else {
None
}
}
pub fn get_register(&self) -> Option<(&RegisterId, &Dtype)> {
if let Self::Register { rid, dtype } = self {
Some((rid, dtype))
} else {
None
}
}
pub fn get_register_mut(&mut self) -> Option<(&mut RegisterId, &mut Dtype)> {
if let Self::Register { rid, dtype } = self {
Some((rid, dtype))
} else {
None
}
}
}
impl fmt::Display for Operand {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Self::Constant(value) => write!(f, "{}:{}", value, value.dtype()),
Self::Register { rid, dtype } => write!(f, "{rid}:{dtype}"),
}
}
}
impl HasDtype for Operand {
fn dtype(&self) -> Dtype {
match self {
Self::Constant(value) => value.dtype(),
Self::Register { dtype, .. } => dtype.clone(),
}
}
}
#[derive(Debug, Eq, Clone, Copy)]
pub enum RegisterId {
Local { aid: usize },
Arg { bid: BlockId, aid: usize },
Temp { bid: BlockId, iid: usize },
}
impl RegisterId {
pub fn local(aid: usize) -> Self {
Self::Local { aid }
}
pub fn arg(bid: BlockId, aid: usize) -> Self {
Self::Arg { bid, aid }
}
pub fn temp(bid: BlockId, iid: usize) -> Self {
Self::Temp { bid, iid }
}
pub fn is_const(&self, bid_init: BlockId) -> bool {
match self {
Self::Local { .. } => true,
Self::Arg { bid, .. } => bid == &bid_init,
_ => false,
}
}
}
impl fmt::Display for RegisterId {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Self::Local { aid } => write!(f, "%l{aid}"),
Self::Arg { bid, aid } => write!(f, "%{bid}:p{aid}"),
Self::Temp { bid, iid } => write!(f, "%{bid}:i{iid}"),
}
}
}
impl PartialEq<RegisterId> for RegisterId {
fn eq(&self, other: &RegisterId) -> bool {
match (self, other) {
(Self::Local { aid }, Self::Local { aid: other_aid }) => aid == other_aid,
(
Self::Arg { bid, aid },
Self::Arg {
bid: other_bid,
aid: other_aid,
},
) => bid == other_bid && aid == other_aid,
(
Self::Temp { bid, iid },
Self::Temp {
bid: other_bid,
iid: other_iid,
},
) => bid == other_bid && iid == other_iid,
_ => false,
}
}
}
impl Hash for RegisterId {
fn hash<H: Hasher>(&self, state: &mut H) {
match self {
Self::Local { aid } => aid.hash(state),
Self::Arg { bid, aid } => {
bid.hash(state);
aid.hash(state);
}
Self::Temp { bid, iid } => {
bid.hash(state);
iid.hash(state);
}
}
}
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub enum Constant {
Undef {
dtype: Dtype,
},
Unit,
Int {
value: u128,
width: usize,
is_signed: bool,
},
Float {
value: OrderedFloat<f64>,
width: usize,
},
GlobalVariable {
name: String,
dtype: Dtype,
},
}
impl TryFrom<&ast::Constant> for Constant {
type Error = ();
fn try_from(constant: &ast::Constant) -> Result<Self, Self::Error> {
match constant {
ast::Constant::Integer(integer) => {
let dtype = match integer.suffix.size {
ast::IntegerSize::Int => Dtype::INT,
ast::IntegerSize::Long => Dtype::LONG,
ast::IntegerSize::LongLong => Dtype::LONGLONG,
};
let pat = match integer.base {
ast::IntegerBase::Decimal => Self::DECIMAL,
ast::IntegerBase::Octal => Self::OCTAL,
ast::IntegerBase::Hexadecimal => Self::HEXADECIMAL,
ast::IntegerBase::Binary => Self::BINARY,
};
let value = if integer.suffix.unsigned {
u128::from_str_radix(integer.number.deref(), pat).unwrap()
} else {
i128::from_str_radix(integer.number.deref(), pat).unwrap() as u128
};
let is_signed = !integer.suffix.unsigned && {
let width = dtype.get_int_width().unwrap();
let threshold = 1u128 << (width as u128 - 1);
value < threshold
};
Ok(Self::int(value, dtype.set_signed(is_signed)))
}
ast::Constant::Float(float) => {
let pat = match float.base {
ast::FloatBase::Decimal => Self::DECIMAL,
ast::FloatBase::Hexadecimal => Self::HEXADECIMAL,
};
let (dtype, value) = match float.suffix.format {
ast::FloatFormat::Float => {
let value = match pat {
Self::DECIMAL => float.number.parse::<f32>().unwrap() as f64,
Self::HEXADECIMAL => {
let mut hex_number = "0x".to_string();
hex_number.push_str(float.number.deref());
parse_hexf32(&hex_number, true).unwrap() as f64
}
_ => panic!(
"Constant::try_from::<&ast::Constant>: \
{pat:?} is not a pattern of `pat`"
),
};
(Dtype::FLOAT, value)
}
ast::FloatFormat::Double => {
let value = match pat {
Self::DECIMAL => float.number.parse::<f64>().unwrap(),
Self::HEXADECIMAL => {
let mut hex_number = "0x".to_string();
hex_number.push_str(float.number.deref());
parse_hexf64(&hex_number, true).unwrap()
}
_ => panic!(
"Constant::try_from::<&ast::Constant>: \
{pat:?} is not a pattern of `pat`"
),
};
(Dtype::DOUBLE, value)
}
ast::FloatFormat::LongDouble => {
panic!("`FloatFormat::LongDouble` is_unsupported")
}
ast::FloatFormat::TS18661Format(_) => {
panic!("`FloatFormat::TS18661Format` is_unsupported")
}
};
Ok(Self::float(value, dtype))
}
ast::Constant::Character(character) => {
let dtype = Dtype::CHAR;
let value = character.parse::<char>().unwrap() as u128;
Ok(Self::int(value, dtype))
}
}
}
}
impl TryFrom<&ast::Expression> for Constant {
type Error = ();
fn try_from(expr: &ast::Expression) -> Result<Self, Self::Error> {
match expr {
ast::Expression::Constant(constant) => Self::try_from(&constant.node),
ast::Expression::UnaryOperator(unary) => {
let constant = Self::try_from(&unary.node.operand.node)?;
match &unary.node.operator.node {
ast::UnaryOperator::Minus => Ok(constant.minus()),
ast::UnaryOperator::Plus => Ok(constant),
_ => Err(()),
}
}
_ => Err(()),
}
}
}
impl Constant {
const DECIMAL: u32 = 10;
const OCTAL: u32 = 8;
const HEXADECIMAL: u32 = 16;
const BINARY: u32 = 2;
#[inline]
pub fn is_integer_constant(&self) -> bool {
matches!(self, Self::Int { .. })
}
#[inline]
pub fn undef(dtype: Dtype) -> Self {
Self::Undef { dtype }
}
#[inline]
pub fn unit() -> Self {
Self::Unit
}
#[inline]
pub fn int(value: u128, dtype: Dtype) -> Self {
let width = dtype.get_int_width().expect("`dtype` must be `Dtype::Int`");
let is_signed = dtype.is_int_signed();
Self::Int {
value,
width,
is_signed,
}
}
#[inline]
pub fn float(value: f64, dtype: Dtype) -> Self {
let width = dtype
.get_float_width()
.expect("`dtype` must be `Dtype::Float`");
Self::Float {
value: value.into(),
width,
}
}
#[inline]
pub fn global_variable(name: String, dtype: Dtype) -> Self {
Self::GlobalVariable { name, dtype }
}
#[inline]
pub fn get_int(&self) -> Option<(u128, usize, bool)> {
if let Self::Int {
value,
width,
is_signed,
} = self
{
Some((*value, *width, *is_signed))
} else {
None
}
}
#[inline]
pub fn get_global_variable_name(&self) -> Option<String> {
if let Self::GlobalVariable { name, .. } = self {
Some(name.clone())
} else {
None
}
}
#[inline]
fn minus(self) -> Self {
match self {
Self::Int {
value,
width,
is_signed,
} => {
assert!(is_signed);
let minus_value = -(value as i128);
Self::Int {
value: minus_value as u128,
width,
is_signed,
}
}
Self::Float { mut value, width } => {
*value.as_mut() *= -1.0f64;
Self::Float { value, width }
}
_ => panic!(
"constant value generated by `Constant::from_ast_expression` \
must be `Constant(Int, Float)`"
),
}
}
pub fn is_undef(&self) -> bool {
matches!(self, Self::Undef { .. })
}
#[must_use]
pub fn typecast(self, target_dtype: Dtype) -> Self {
if self.dtype() == target_dtype {
return self;
}
match (&self, &target_dtype) {
(
Constant::Int { value, width, .. },
Dtype::Int {
width: target_width,
is_signed: target_signed,
..
},
) => {
let result = if *target_signed {
if *width >= *target_width {
let value = trim_unnecessary_bits(*value, *target_width as u128);
sign_extension(value, *target_width as u128)
} else {
*value
}
} else {
trim_unnecessary_bits(*value, *target_width as u128)
};
Constant::int(result, target_dtype)
}
(
Constant::Int {
value, is_signed, ..
},
Dtype::Float { .. },
) => {
let casted_value = if *is_signed {
*value as i128 as f64
} else {
*value as f64
};
Constant::float(casted_value, target_dtype)
}
(Constant::Float { value, .. }, Dtype::Int { is_signed, .. }) => {
let casted_value = if *is_signed {
value.into_inner() as i128 as u128
} else {
value.into_inner() as u128
};
Constant::int(casted_value, target_dtype)
}
(Constant::Float { value, .. }, Dtype::Float { .. }) => {
Constant::float(value.into_inner(), target_dtype)
}
_ => todo!("typecast ({:?}) {:?}", self, target_dtype),
}
}
}
#[inline]
pub fn sign_extension(value: u128, width: u128) -> u128 {
let base = 1u128 << (width - 1);
if value >= base {
let bit_mask = -1i128 << (width as i128);
value | bit_mask as u128
} else {
value
}
}
#[inline]
pub fn trim_unnecessary_bits(value: u128, width: u128) -> u128 {
let bit_mask = (1u128 << width) - 1;
value & bit_mask
}
impl fmt::Display for Constant {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Self::Undef { .. } => write!(f, "undef"),
Self::Unit => write!(f, "unit"),
Self::Int {
value, is_signed, ..
} => write!(
f,
"{}",
if *is_signed {
(*value as i128).to_string()
} else {
value.to_string()
}
),
Self::Float { value, .. } => {
let mut val_str = value.to_string();
if !val_str.contains('.') {
val_str += ".0"
};
write!(f, "{val_str}")
}
Self::GlobalVariable { name, .. } => write!(f, "@{name}"),
}
}
}
impl HasDtype for Constant {
fn dtype(&self) -> Dtype {
match self {
Self::Undef { dtype } => dtype.clone(),
Self::Unit => Dtype::unit(),
Self::Int {
width, is_signed, ..
} => Dtype::int(*width).set_signed(*is_signed),
Self::Float { width, .. } => Dtype::float(*width),
Self::GlobalVariable { dtype, .. } => Dtype::pointer(dtype.clone()),
}
}
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct Named<T> {
name: Option<String>,
inner: T,
}
impl<T> Deref for Named<T> {
type Target = T;
fn deref(&self) -> &Self::Target {
&self.inner
}
}
impl<T> DerefMut for Named<T> {
fn deref_mut(&mut self) -> &mut Self::Target {
&mut self.inner
}
}
impl<T> Named<T> {
pub fn new(name: Option<String>, inner: T) -> Self {
Self { name, inner }
}
pub fn name(&self) -> Option<&String> {
self.name.as_ref()
}
pub fn destruct(self) -> (T, Option<String>) {
(self.inner, self.name)
}
pub fn into_inner(self) -> T {
self.inner
}
}
impl<T: fmt::Display> fmt::Display for Named<T> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "{}", self.inner)
}
}