mirror of
https://github.com/pezkuwichain/revive.git
synced 2026-05-07 21:18:02 +00:00
94ec34c4d5
Separate between compilation and linker phases to allow deploy time linking and back-porting era compiler changes to fix #91. Unlinked contract binaries (caused by missing libraries or missing factory dependencies in turn) are emitted as raw ELF object. Few drive by fixes: - #98 - A compiler panic on missing libraries definitions. - Fixes some incosistent type forwarding in JSON output (empty string vs. null object). - Remove the unused fallback for size optimization setting. - Remove the broken `--lvm-ir` mode. - CI workflow fixes. --------- Signed-off-by: Cyrill Leutwiler <bigcyrill@hotmail.com> Signed-off-by: xermicus <bigcyrill@hotmail.com> Signed-off-by: xermicus <cyrill@parity.io>
239 lines
9.0 KiB
Rust
239 lines
9.0 KiB
Rust
//! The YUL source code literal.
|
|
|
|
use inkwell::values::BasicValue;
|
|
use num::Num;
|
|
use num::One;
|
|
use num::Zero;
|
|
use serde::Deserialize;
|
|
use serde::Serialize;
|
|
|
|
use revive_common::BASE_DECIMAL;
|
|
use revive_common::BASE_HEXADECIMAL;
|
|
use revive_common::BYTE_LENGTH_WORD;
|
|
use revive_llvm_context::PolkaVMArgument;
|
|
use revive_llvm_context::PolkaVMContext;
|
|
|
|
use crate::error::Error;
|
|
use crate::lexer::token::lexeme::literal::boolean::Boolean as BooleanLiteral;
|
|
use crate::lexer::token::lexeme::literal::integer::Integer as IntegerLiteral;
|
|
use crate::lexer::token::lexeme::literal::Literal as LexicalLiteral;
|
|
use crate::lexer::token::lexeme::symbol::Symbol;
|
|
use crate::lexer::token::lexeme::Lexeme;
|
|
use crate::lexer::token::location::Location;
|
|
use crate::lexer::token::Token;
|
|
use crate::lexer::Lexer;
|
|
use crate::parser::error::Error as ParserError;
|
|
use crate::parser::r#type::Type;
|
|
use crate::visitor::AstNode;
|
|
use crate::visitor::AstVisitor;
|
|
|
|
/// Represents a literal in YUL without differentiating its type.
|
|
#[derive(Debug, Serialize, Deserialize, Clone, PartialEq, Eq)]
|
|
pub struct Literal {
|
|
/// The location.
|
|
pub location: Location,
|
|
/// The lexical literal.
|
|
pub inner: LexicalLiteral,
|
|
/// The type, if it has been explicitly specified.
|
|
pub yul_type: Option<Type>,
|
|
}
|
|
|
|
impl Literal {
|
|
/// The element parser.
|
|
pub fn parse(lexer: &mut Lexer, initial: Option<Token>) -> Result<Self, Error> {
|
|
let token = crate::parser::take_or_next(initial, lexer)?;
|
|
|
|
let (location, literal) = match token {
|
|
Token {
|
|
lexeme: Lexeme::Literal(literal),
|
|
location,
|
|
..
|
|
} => (location, literal),
|
|
token => {
|
|
return Err(ParserError::InvalidToken {
|
|
location: token.location,
|
|
expected: vec!["{literal}"],
|
|
found: token.lexeme.to_string(),
|
|
}
|
|
.into());
|
|
}
|
|
};
|
|
|
|
let yul_type = match lexer.peek()? {
|
|
Token {
|
|
lexeme: Lexeme::Symbol(Symbol::Colon),
|
|
..
|
|
} => {
|
|
lexer.next()?;
|
|
Some(Type::parse(lexer, None)?)
|
|
}
|
|
_ => None,
|
|
};
|
|
|
|
Ok(Self {
|
|
location,
|
|
inner: literal,
|
|
yul_type,
|
|
})
|
|
}
|
|
|
|
/// Converts the literal into its LLVM.
|
|
pub fn into_llvm<'ctx>(
|
|
self,
|
|
context: &PolkaVMContext<'ctx>,
|
|
) -> anyhow::Result<PolkaVMArgument<'ctx>> {
|
|
match self.inner {
|
|
LexicalLiteral::Boolean(inner) => {
|
|
let value = self
|
|
.yul_type
|
|
.unwrap_or_default()
|
|
.into_llvm(context)
|
|
.const_int(
|
|
match inner {
|
|
BooleanLiteral::False => 0,
|
|
BooleanLiteral::True => 1,
|
|
},
|
|
false,
|
|
)
|
|
.as_basic_value_enum();
|
|
|
|
let constant = match inner {
|
|
BooleanLiteral::False => num::BigUint::zero(),
|
|
BooleanLiteral::True => num::BigUint::one(),
|
|
};
|
|
|
|
Ok(PolkaVMArgument::value(value).with_constant(constant))
|
|
}
|
|
LexicalLiteral::Integer(inner) => {
|
|
let r#type = self.yul_type.unwrap_or_default().into_llvm(context);
|
|
let value = match inner {
|
|
IntegerLiteral::Decimal { ref inner } => r#type.const_int_from_string(
|
|
inner.as_str(),
|
|
inkwell::types::StringRadix::Decimal,
|
|
),
|
|
IntegerLiteral::Hexadecimal { ref inner } => r#type.const_int_from_string(
|
|
&inner["0x".len()..],
|
|
inkwell::types::StringRadix::Hexadecimal,
|
|
),
|
|
}
|
|
.expect("The value is valid")
|
|
.as_basic_value_enum();
|
|
|
|
let constant = match inner {
|
|
IntegerLiteral::Decimal { ref inner } => {
|
|
num::BigUint::from_str_radix(inner.as_str(), BASE_DECIMAL)
|
|
}
|
|
IntegerLiteral::Hexadecimal { ref inner } => {
|
|
num::BigUint::from_str_radix(&inner["0x".len()..], BASE_HEXADECIMAL)
|
|
}
|
|
}
|
|
.expect("Always valid");
|
|
|
|
Ok(PolkaVMArgument::value(value).with_constant(constant))
|
|
}
|
|
LexicalLiteral::String(inner) => {
|
|
let string = inner.inner;
|
|
let r#type = self.yul_type.unwrap_or_default().into_llvm(context);
|
|
|
|
let mut hex_string = if inner.is_hexadecimal {
|
|
string.clone()
|
|
} else {
|
|
let mut hex_string = String::with_capacity(BYTE_LENGTH_WORD * 2);
|
|
let mut index = 0;
|
|
loop {
|
|
if index >= string.len() {
|
|
break;
|
|
}
|
|
|
|
if string[index..].starts_with('\\') {
|
|
index += 1;
|
|
|
|
if string[index..].starts_with('x') {
|
|
hex_string.push_str(&string[index + 1..index + 3]);
|
|
index += 3;
|
|
} else if string[index..].starts_with('u') {
|
|
let codepoint_str = &string[index + 1..index + 5];
|
|
let codepoint =
|
|
u32::from_str_radix(codepoint_str, BASE_HEXADECIMAL).map_err(
|
|
|error| {
|
|
anyhow::anyhow!(
|
|
"Invalid codepoint `{}`: {}",
|
|
codepoint_str,
|
|
error
|
|
)
|
|
},
|
|
)?;
|
|
let unicode_char = char::from_u32(codepoint).ok_or_else(|| {
|
|
anyhow::anyhow!("Invalid codepoint {}", codepoint)
|
|
})?;
|
|
let mut unicode_bytes = vec![0u8; 3];
|
|
unicode_char.encode_utf8(&mut unicode_bytes);
|
|
|
|
for byte in unicode_bytes.into_iter() {
|
|
hex_string.push_str(format!("{byte:02x}").as_str());
|
|
}
|
|
index += 5;
|
|
} else if string[index..].starts_with('t') {
|
|
hex_string.push_str("09");
|
|
index += 1;
|
|
} else if string[index..].starts_with('n') {
|
|
hex_string.push_str("0a");
|
|
index += 1;
|
|
} else if string[index..].starts_with('r') {
|
|
hex_string.push_str("0d");
|
|
index += 1;
|
|
} else if string[index..].starts_with('\n') {
|
|
index += 1;
|
|
} else {
|
|
hex_string
|
|
.push_str(format!("{:02x}", string.as_bytes()[index]).as_str());
|
|
index += 1;
|
|
}
|
|
} else {
|
|
hex_string
|
|
.push_str(format!("{:02x}", string.as_bytes()[index]).as_str());
|
|
index += 1;
|
|
}
|
|
}
|
|
hex_string
|
|
};
|
|
|
|
if hex_string.len() > BYTE_LENGTH_WORD * 2 {
|
|
return Ok(revive_llvm_context::PolkaVMArgument::value(
|
|
r#type.const_zero().as_basic_value_enum(),
|
|
)
|
|
.with_original(string));
|
|
}
|
|
|
|
if hex_string.len() < BYTE_LENGTH_WORD * 2 {
|
|
hex_string.push_str(
|
|
"0".repeat((BYTE_LENGTH_WORD * 2) - hex_string.len())
|
|
.as_str(),
|
|
);
|
|
}
|
|
|
|
let value = r#type
|
|
.const_int_from_string(
|
|
hex_string.as_str(),
|
|
inkwell::types::StringRadix::Hexadecimal,
|
|
)
|
|
.expect("The value is valid")
|
|
.as_basic_value_enum();
|
|
Ok(PolkaVMArgument::value(value).with_original(string))
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
impl AstNode for Literal {
|
|
fn accept(&self, ast_visitor: &mut impl AstVisitor) {
|
|
ast_visitor.visit_literal(self);
|
|
}
|
|
|
|
fn visit_children(&self, _ast_visitor: &mut impl AstVisitor) {}
|
|
|
|
fn location(&self) -> Location {
|
|
self.location
|
|
}
|
|
}
|