mirror of
https://github.com/zaphar/ucg.git
synced 2025-07-22 18:19:54 -04:00
1139 lines
32 KiB
Rust
1139 lines
32 KiB
Rust
// Copyright 2017 Jeremy Wall <jeremy@marzhillstudios.com>
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
//! The definitions of the ucg AST and Tokens.
|
|
use std;
|
|
use std::borrow::Borrow;
|
|
use std::cmp::Eq;
|
|
use std::cmp::Ordering;
|
|
use std::cmp::PartialEq;
|
|
use std::cmp::PartialOrd;
|
|
use std::collections::BTreeMap;
|
|
use std::convert::Into;
|
|
use std::fmt;
|
|
use std::hash::Hash;
|
|
use std::hash::Hasher;
|
|
use std::path::PathBuf;
|
|
use std::rc::Rc;
|
|
|
|
use abortable_parser;
|
|
|
|
use crate::build::scope::Scope;
|
|
use crate::build::Val;
|
|
|
|
pub mod printer;
|
|
pub mod rewrite;
|
|
pub mod typecheck;
|
|
pub mod walk;
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum TemplatePart {
|
|
Str(Vec<char>),
|
|
PlaceHolder(usize),
|
|
Expression(Expression),
|
|
}
|
|
|
|
macro_rules! enum_type_equality {
|
|
( $slf:ident, $r:expr, $( $l:pat ),* ) => {
|
|
match $slf {
|
|
$(
|
|
$l => {
|
|
if let $l = $r {
|
|
true
|
|
} else {
|
|
false
|
|
}
|
|
}
|
|
)*
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Represents a line and a column position in UCG code.
|
|
///
|
|
/// It is used for generating error messages mostly. Most all
|
|
/// parts of the UCG AST have a positioned associated with them.
|
|
#[derive(Debug, PartialEq, Eq, Clone, PartialOrd, Ord, Hash)]
|
|
pub struct Position {
|
|
pub file: Option<PathBuf>,
|
|
pub line: usize,
|
|
pub column: usize,
|
|
pub offset: usize,
|
|
}
|
|
|
|
impl Position {
|
|
/// Construct a new Position.
|
|
pub fn new(line: usize, column: usize, offset: usize) -> Self {
|
|
Position {
|
|
file: None,
|
|
line,
|
|
column,
|
|
offset,
|
|
}
|
|
}
|
|
|
|
pub fn with_file<P: Into<PathBuf>>(mut self, file: P) -> Self {
|
|
self.file = Some(file.into());
|
|
self
|
|
}
|
|
}
|
|
|
|
impl<'a> From<&'a Position> for Position {
|
|
fn from(source: &'a Position) -> Self {
|
|
source.clone()
|
|
}
|
|
}
|
|
|
|
impl std::fmt::Display for Position {
|
|
fn fmt(&self, f: &mut std::fmt::Formatter) -> Result<(), std::fmt::Error> {
|
|
if let Some(ref file) = self.file {
|
|
write!(f, "file: {} ", file.to_string_lossy().to_string())?;
|
|
}
|
|
write!(f, "line: {} column: {}", self.line, self.column)
|
|
}
|
|
}
|
|
|
|
/// Defines the types of tokens in UCG syntax.
|
|
#[derive(Debug, PartialEq, Eq, Clone, PartialOrd, Ord, Hash)]
|
|
pub enum TokenType {
|
|
EMPTY,
|
|
BOOLEAN,
|
|
END,
|
|
WS,
|
|
COMMENT,
|
|
QUOTED,
|
|
PIPEQUOTE,
|
|
DIGIT,
|
|
BAREWORD,
|
|
PUNCT,
|
|
}
|
|
|
|
/// Defines a Token representing a building block of UCG syntax.
|
|
///
|
|
/// Token's are passed to the parser stage to be parsed into an AST.
|
|
#[derive(Debug, PartialEq, Eq, Clone, PartialOrd, Ord, Hash)]
|
|
pub struct Token {
|
|
pub typ: TokenType,
|
|
pub fragment: Rc<str>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
impl Token {
|
|
/// Constructs a new Token with a type and line and column information.
|
|
pub fn new<S: Into<Rc<str>>, P: Into<Position>>(f: S, typ: TokenType, p: P) -> Self {
|
|
Self::new_with_pos(f, typ, p.into())
|
|
}
|
|
|
|
// Constructs a new Token with a type and a Position.
|
|
pub fn new_with_pos<S: Into<Rc<str>>>(f: S, typ: TokenType, pos: Position) -> Self {
|
|
Token {
|
|
typ,
|
|
fragment: f.into(),
|
|
pos,
|
|
}
|
|
}
|
|
}
|
|
|
|
impl<'a> From<&'a Token> for PositionedItem<Rc<str>> {
|
|
fn from(value: &'a Token) -> Self {
|
|
Self::new(value.fragment.clone(), value.pos.clone())
|
|
}
|
|
}
|
|
|
|
impl abortable_parser::Positioned for Token {
|
|
fn line(&self) -> usize {
|
|
self.pos.line
|
|
}
|
|
fn column(&self) -> usize {
|
|
self.pos.column
|
|
}
|
|
}
|
|
|
|
impl Borrow<str> for Token {
|
|
fn borrow(&self) -> &str {
|
|
&self.fragment
|
|
}
|
|
}
|
|
|
|
/// Helper macro for making a Positioned Value.
|
|
macro_rules! value_node {
|
|
($v:expr, $p:expr) => {
|
|
PositionedItem::new_with_pos($v, $p)
|
|
};
|
|
}
|
|
|
|
/// Helper macro for making a Token.
|
|
#[allow(unused_macros)]
|
|
macro_rules! make_tok {
|
|
(EOF => $i:expr) => {
|
|
Token::new("", TokenType::END, &$i)
|
|
};
|
|
|
|
(WS => $i:expr) => {
|
|
Token::new("", TokenType::WS, &$i)
|
|
};
|
|
|
|
(CMT => $e:expr, $i:expr) => {
|
|
Token::new($e, TokenType::COMMENT, &$i)
|
|
};
|
|
|
|
(QUOT => $e:expr, $i:expr) => {
|
|
Token::new($e, TokenType::QUOTED, &$i)
|
|
};
|
|
|
|
(PUNCT => $e:expr, $i:expr) => {
|
|
Token::new($e, TokenType::PUNCT, &$i)
|
|
};
|
|
|
|
(DIGIT => $e:expr, $i:expr) => {
|
|
Token::new($e, TokenType::DIGIT, &$i)
|
|
};
|
|
|
|
($e:expr, $i:expr) => {
|
|
Token::new($e, TokenType::BAREWORD, &$i)
|
|
};
|
|
}
|
|
|
|
/// Helper macro for making expressions.
|
|
#[allow(unused_macros)]
|
|
macro_rules! make_expr {
|
|
($e:expr, $i:expr) => {
|
|
Expression::Simple(Value::Symbol(PositionedItem::new_with_pos(
|
|
$e.to_string(),
|
|
$i,
|
|
)))
|
|
};
|
|
|
|
($e:expr => int, $i:expr) => {
|
|
Expression::Simple(Value::Int(PositionedItem::new_with_pos($e, $i)))
|
|
};
|
|
}
|
|
|
|
/// An ordered list of Name = Value pairs.
|
|
///
|
|
/// This is usually used as the body of a tuple in the UCG AST.
|
|
pub type FieldList = Vec<(Token, Expression)>; // Token is expected to be a symbol
|
|
|
|
pub type TupleShape = Vec<(PositionedItem<Rc<str>>, Shape)>;
|
|
pub type ShapeList = Vec<Shape>;
|
|
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct FuncShapeDef {
|
|
args: BTreeMap<Rc<str>, Shape>,
|
|
ret: Box<Shape>,
|
|
}
|
|
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct ModuleShape {
|
|
items: TupleShape,
|
|
ret: Box<Shape>,
|
|
}
|
|
|
|
#[doc = "Value types represent the Values that UCG can have."]
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub enum Value {
|
|
Empty(Position),
|
|
Boolean(PositionedItem<bool>),
|
|
Int(PositionedItem<i64>),
|
|
Float(PositionedItem<f64>),
|
|
Str(PositionedItem<Rc<str>>),
|
|
Symbol(PositionedItem<Rc<str>>),
|
|
Tuple(PositionedItem<FieldList>),
|
|
List(ListDef),
|
|
}
|
|
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub enum ImportShape {
|
|
Resolved(Position, TupleShape),
|
|
Unresolved(PositionedItem<Rc<str>>),
|
|
}
|
|
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct NarrowedShape {
|
|
pub pos: Position,
|
|
pub types: Vec<Shape>,
|
|
}
|
|
|
|
impl NarrowedShape {
|
|
pub fn new(types: Vec<Shape>, line: usize, column: usize, offset: usize) -> Self {
|
|
Self::new_with_pos(types, Position::new(line, column, offset))
|
|
}
|
|
|
|
pub fn new_with_pos(types: Vec<Shape>, pos: Position) -> Self {
|
|
Self { pos, types }
|
|
}
|
|
|
|
pub fn with_pos(mut self, pos: Position) -> Self {
|
|
self.pos = pos;
|
|
self
|
|
}
|
|
|
|
pub fn merge_in_shape(&mut self, shape: Shape, symbol_table: &mut BTreeMap<Rc<str>, Shape>) {
|
|
for s in self.types.iter() {
|
|
if s.equivalent(&shape, symbol_table) {
|
|
return;
|
|
}
|
|
}
|
|
self.types.push(shape)
|
|
}
|
|
}
|
|
|
|
// TODO(jwall): Display implementations for shapes.
|
|
/// Shapes represent the types that UCG values or expressions can have.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub enum Shape {
|
|
Boolean(Position),
|
|
Int(Position),
|
|
Float(Position),
|
|
Str(Position),
|
|
Tuple(PositionedItem<TupleShape>),
|
|
List(NarrowedShape),
|
|
Func(FuncShapeDef),
|
|
Module(ModuleShape),
|
|
Hole(PositionedItem<Rc<str>>), // A type hole We don't know what this type is yet.
|
|
Narrowed(NarrowedShape), // A narrowed type. We know *some* of the possible options.
|
|
Import(ImportShape), // A type hole We don't know what this type is yet.
|
|
TypeErr(Position, String), // A type hole We don't know what this type is yet.
|
|
}
|
|
|
|
impl Shape {
|
|
pub fn equivalent(&self, right: &Shape, symbol_table: &BTreeMap<Rc<str>, Shape>) -> bool {
|
|
match (self, right) {
|
|
(Shape::Str(_), Shape::Str(_))
|
|
| (Shape::Boolean(_), Shape::Boolean(_))
|
|
| (Shape::Int(_), Shape::Int(_))
|
|
| (Shape::Hole(_), Shape::Hole(_))
|
|
| (Shape::Float(_), Shape::Float(_)) => true,
|
|
(Shape::Narrowed(left_slist), Shape::Narrowed(right_slist))
|
|
| (Shape::List(left_slist), Shape::List(right_slist)) => {
|
|
for ls in left_slist.types.iter() {
|
|
let mut found = false;
|
|
for rs in right_slist.types.iter() {
|
|
if ls.equivalent(rs, symbol_table) {
|
|
found = true;
|
|
break;
|
|
}
|
|
}
|
|
if !found {
|
|
return false;
|
|
}
|
|
}
|
|
true
|
|
}
|
|
(Shape::Tuple(left_slist), Shape::Tuple(right_slist)) => {
|
|
for (lt, ls) in left_slist.val.iter() {
|
|
let mut found = false;
|
|
for (rt, rs) in right_slist.val.iter() {
|
|
if lt.val == rt.val && ls.equivalent(rs, symbol_table) {
|
|
found = true;
|
|
}
|
|
}
|
|
if !found {
|
|
return false;
|
|
}
|
|
}
|
|
true
|
|
}
|
|
(Shape::Func(left_opshape), Shape::Func(right_opshape)) => {
|
|
if left_opshape.args.len() != right_opshape.args.len() {
|
|
return false;
|
|
}
|
|
let left_args: Vec<&Shape> = dbg!(left_opshape.args.values().collect());
|
|
let right_args: Vec<&Shape> = dbg!(right_opshape.args.values().collect());
|
|
for idx in 0..left_args.len() {
|
|
let shap = left_args[idx];
|
|
if !shap.equivalent(right_args[idx], symbol_table) {
|
|
return false;
|
|
}
|
|
}
|
|
if !&left_opshape
|
|
.ret
|
|
.equivalent(&right_opshape.ret, symbol_table)
|
|
{
|
|
return false;
|
|
}
|
|
true
|
|
}
|
|
(Shape::Module(left_opshape), Shape::Module(right_opshape)) => {
|
|
todo!();
|
|
}
|
|
_ => false,
|
|
}
|
|
}
|
|
|
|
pub fn narrow(&self, right: &Shape, symbol_table: &mut BTreeMap<Rc<str>, Shape>) -> Self {
|
|
match (self, right) {
|
|
(Shape::Str(_), Shape::Str(_))
|
|
| (Shape::Boolean(_), Shape::Boolean(_))
|
|
| (Shape::Int(_), Shape::Int(_))
|
|
| (Shape::Float(_), Shape::Float(_)) => self.clone(),
|
|
(Shape::Hole(sym), other) | (other, Shape::Hole(sym)) => {
|
|
if symbol_table.contains_key(&sym.val) {
|
|
symbol_table.insert(sym.val.clone(), other.clone().with_pos(sym.pos.clone()));
|
|
}
|
|
other.clone()
|
|
}
|
|
(Shape::Narrowed(left_slist), Shape::Narrowed(right_slist))
|
|
| (Shape::List(left_slist), Shape::List(right_slist)) => {
|
|
self.narrow_list_shapes(left_slist, right_slist, right, symbol_table)
|
|
}
|
|
(Shape::Tuple(left_slist), Shape::Tuple(right_slist)) => {
|
|
self.narrow_tuple_shapes(left_slist, right_slist, right, symbol_table)
|
|
}
|
|
(Shape::Func(left_opshape), Shape::Func(right_opshape)) => {
|
|
todo!();
|
|
}
|
|
(Shape::Module(left_opshape), Shape::Module(right_opshape)) => {
|
|
todo!();
|
|
}
|
|
_ => Shape::TypeErr(
|
|
right.pos().clone(),
|
|
format!(
|
|
"Expected {} but got {}",
|
|
self.type_name(),
|
|
right.type_name()
|
|
),
|
|
),
|
|
}
|
|
}
|
|
|
|
fn narrow_tuple_shapes(
|
|
&self,
|
|
left_slist: &PositionedItem<Vec<(PositionedItem<Rc<str>>, Shape)>>,
|
|
right_slist: &PositionedItem<Vec<(PositionedItem<Rc<str>>, Shape)>>,
|
|
right: &Shape,
|
|
symbol_table: &mut BTreeMap<Rc<str>, Shape>,
|
|
) -> Shape {
|
|
let left_iter = left_slist.val.iter();
|
|
let right_iter = right_slist.val.iter();
|
|
if is_tuple_subset(left_iter, right_slist, symbol_table) {
|
|
self.clone()
|
|
} else if is_tuple_subset(right_iter, left_slist, symbol_table) {
|
|
right.clone()
|
|
} else {
|
|
Shape::TypeErr(right.pos().clone(), "Incompatible Tuple Shapes".to_owned())
|
|
}
|
|
}
|
|
|
|
fn narrow_list_shapes(
|
|
&self,
|
|
left_slist: &NarrowedShape,
|
|
right_slist: &NarrowedShape,
|
|
right: &Shape,
|
|
symbol_table: &mut BTreeMap<Rc<str>, Shape>,
|
|
) -> Shape {
|
|
let left_iter = left_slist.types.iter();
|
|
let right_iter = right_slist.types.iter();
|
|
if is_list_subset(left_iter, right_slist, symbol_table) {
|
|
self.clone()
|
|
} else if is_list_subset(right_iter, left_slist, symbol_table) {
|
|
right.clone()
|
|
} else {
|
|
Shape::TypeErr(right.pos().clone(), "Incompatible List Shapes".to_owned())
|
|
}
|
|
}
|
|
|
|
pub fn type_name(&self) -> &'static str {
|
|
match self {
|
|
Shape::Str(s) => "str",
|
|
Shape::Int(s) => "int",
|
|
Shape::Float(s) => "float",
|
|
Shape::Boolean(b) => "boolean",
|
|
// TODO(jwall): make these type names account for what they contain.
|
|
Shape::List(lst) => "list",
|
|
Shape::Tuple(flds) => "tuple",
|
|
Shape::Func(_) => "func",
|
|
Shape::Module(_) => "module",
|
|
Shape::Narrowed(_) => "narrowed",
|
|
Shape::Import(_) => "import",
|
|
Shape::Hole(_) => "type-hole",
|
|
Shape::TypeErr(_, _) => "type-error",
|
|
}
|
|
}
|
|
|
|
pub fn pos(&self) -> &Position {
|
|
match self {
|
|
Shape::Str(p) => &p,
|
|
Shape::Int(p) => &p,
|
|
Shape::Float(p) => &p,
|
|
Shape::Boolean(p) => &p,
|
|
Shape::List(lst) => &lst.pos,
|
|
Shape::Tuple(flds) => &flds.pos,
|
|
Shape::Func(def) => def.ret.pos(),
|
|
Shape::Module(def) => def.ret.pos(),
|
|
Shape::Narrowed(pi) => &pi.pos,
|
|
Shape::Hole(pi) => &pi.pos,
|
|
Shape::TypeErr(pos, _) => pos,
|
|
Shape::Import(ImportShape::Resolved(p, _)) => p,
|
|
Shape::Import(ImportShape::Unresolved(pi)) => &pi.pos,
|
|
}
|
|
}
|
|
|
|
pub fn with_pos(self, pos: Position) -> Self {
|
|
match self {
|
|
Shape::Str(_) => Shape::Str(pos.clone()),
|
|
Shape::Int(_) => Shape::Int(pos.clone()),
|
|
Shape::Float(_) => Shape::Float(pos.clone()),
|
|
Shape::Boolean(_) => Shape::Boolean(pos.clone()),
|
|
Shape::List(lst) => Shape::List(NarrowedShape::new_with_pos(lst.types, pos)),
|
|
Shape::Tuple(flds) => Shape::Tuple(PositionedItem::new(flds.val, pos)),
|
|
Shape::Func(_) | Shape::Module(_) => self.clone(),
|
|
Shape::Narrowed(pi) => Shape::Narrowed(pi.with_pos(pos)),
|
|
Shape::Hole(pi) => Shape::Hole(pi.with_pos(pos)),
|
|
Shape::Import(ImportShape::Resolved(_, s)) => {
|
|
Shape::Import(ImportShape::Resolved(pos, s))
|
|
}
|
|
Shape::Import(ImportShape::Unresolved(pi)) => {
|
|
Shape::Import(ImportShape::Unresolved(pi.with_pos(pos)))
|
|
}
|
|
Shape::TypeErr(_, msg) => Shape::TypeErr(pos, msg),
|
|
}
|
|
}
|
|
}
|
|
|
|
fn is_tuple_subset(
|
|
mut left_iter: std::slice::Iter<(PositionedItem<Rc<str>>, Shape)>,
|
|
right_slist: &PositionedItem<Vec<(PositionedItem<Rc<str>>, Shape)>>,
|
|
symbol_table: &mut BTreeMap<Rc<str>, Shape>,
|
|
) -> bool {
|
|
return loop {
|
|
if let Some((lt, ls)) = left_iter.next() {
|
|
let mut matched = false;
|
|
for (rt, rs) in right_slist.val.iter() {
|
|
if rt.val == lt.val {
|
|
if let Shape::TypeErr(_, _) = ls.narrow(rs, symbol_table) {
|
|
// noop
|
|
} else {
|
|
matched = true;
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
if !matched {
|
|
break false;
|
|
} else {
|
|
continue;
|
|
}
|
|
}
|
|
break true;
|
|
};
|
|
}
|
|
|
|
fn is_list_subset(
|
|
mut right_iter: std::slice::Iter<Shape>,
|
|
left_slist: &NarrowedShape,
|
|
symbol_table: &mut BTreeMap<Rc<str>, Shape>,
|
|
) -> bool {
|
|
let right_subset = loop {
|
|
let mut matches = false;
|
|
let ls = if let Some(ls) = right_iter.next() {
|
|
ls
|
|
} else {
|
|
break true;
|
|
};
|
|
for rs in left_slist.types.iter() {
|
|
let s = ls.narrow(rs, symbol_table);
|
|
if let Shape::TypeErr(_, _) = s {
|
|
// noop
|
|
} else {
|
|
matches = true;
|
|
}
|
|
}
|
|
if !matches {
|
|
break matches;
|
|
}
|
|
};
|
|
right_subset
|
|
}
|
|
|
|
impl Value {
|
|
/// Returns the type name of the Value it is called on as a string.
|
|
pub fn type_name(&self) -> String {
|
|
match self {
|
|
&Value::Empty(_) => "EmptyValue".to_string(),
|
|
&Value::Boolean(_) => "Boolean".to_string(),
|
|
&Value::Int(_) => "Integer".to_string(),
|
|
&Value::Float(_) => "Float".to_string(),
|
|
&Value::Str(_) => "String".to_string(),
|
|
&Value::Symbol(_) => "Symbol".to_string(),
|
|
&Value::Tuple(_) => "Tuple".to_string(),
|
|
&Value::List(_) => "List".to_string(),
|
|
}
|
|
}
|
|
|
|
fn fields_to_string(v: &FieldList) -> String {
|
|
let mut buf = String::new();
|
|
buf.push_str("{\n");
|
|
for ref t in v.iter() {
|
|
buf.push_str("\t");
|
|
buf.push_str(&t.0.fragment);
|
|
buf.push_str("\n");
|
|
}
|
|
buf.push_str("}");
|
|
return buf;
|
|
}
|
|
|
|
fn elems_to_string(v: &Vec<Expression>) -> String {
|
|
return format!("{}", v.len());
|
|
}
|
|
|
|
/// Returns a stringified version of the Value.
|
|
pub fn to_string(&self) -> String {
|
|
match self {
|
|
&Value::Empty(_) => "EmptyValue".to_string(),
|
|
&Value::Boolean(ref b) => format!("{}", b.val),
|
|
&Value::Int(ref i) => format!("{}", i.val),
|
|
&Value::Float(ref f) => format!("{}", f.val),
|
|
&Value::Str(ref s) => format!("{}", s.val),
|
|
&Value::Symbol(ref s) => format!("{}", s.val),
|
|
&Value::Tuple(ref fs) => format!("{}", Self::fields_to_string(&fs.val)),
|
|
&Value::List(ref def) => format!("[{}]", Self::elems_to_string(&def.elems)),
|
|
}
|
|
}
|
|
|
|
/// Returns the position for a Value.
|
|
pub fn pos(&self) -> &Position {
|
|
match self {
|
|
&Value::Empty(ref pos) => pos,
|
|
&Value::Boolean(ref b) => &b.pos,
|
|
&Value::Int(ref i) => &i.pos,
|
|
&Value::Float(ref f) => &f.pos,
|
|
&Value::Str(ref s) => &s.pos,
|
|
&Value::Symbol(ref s) => &s.pos,
|
|
&Value::Tuple(ref fs) => &fs.pos,
|
|
&Value::List(ref def) => &def.pos,
|
|
}
|
|
}
|
|
|
|
/// Returns true if called on a Value that is the same type as itself.
|
|
pub fn type_equal(&self, target: &Self) -> bool {
|
|
enum_type_equality!(
|
|
self,
|
|
target,
|
|
&Value::Empty(_),
|
|
&Value::Boolean(_),
|
|
&Value::Int(_),
|
|
&Value::Float(_),
|
|
&Value::Str(_),
|
|
&Value::Symbol(_),
|
|
&Value::Tuple(_),
|
|
&Value::List(_)
|
|
)
|
|
}
|
|
}
|
|
|
|
/// Represents an expansion of a Macro that is expected to already have been
|
|
/// defined.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct CallDef {
|
|
pub funcref: Value,
|
|
pub arglist: Vec<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// The allowable types to which you can perform a primitive cast.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub enum CastType {
|
|
Int,
|
|
Float,
|
|
Str,
|
|
Bool,
|
|
}
|
|
|
|
impl fmt::Display for CastType {
|
|
fn fmt(&self, w: &mut fmt::Formatter) -> fmt::Result {
|
|
write!(
|
|
w,
|
|
"{}",
|
|
match self {
|
|
CastType::Int => "int",
|
|
CastType::Float => "float",
|
|
CastType::Bool => "bool",
|
|
CastType::Str => "str",
|
|
}
|
|
)
|
|
}
|
|
}
|
|
|
|
/// Represents a cast of a target to a primitive type.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct CastDef {
|
|
pub cast_type: CastType,
|
|
pub target: Box<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Encodes a select expression in the UCG AST.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct SelectDef {
|
|
pub val: Box<Expression>,
|
|
pub default: Option<Box<Expression>>,
|
|
pub tuple: FieldList,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Adds position information to any type `T`.
|
|
#[derive(Debug, Clone)]
|
|
pub struct PositionedItem<T> {
|
|
pub pos: Position,
|
|
pub val: T,
|
|
}
|
|
|
|
impl<T: std::fmt::Display> std::fmt::Display for PositionedItem<T> {
|
|
fn fmt(&self, f: &mut std::fmt::Formatter) -> Result<(), std::fmt::Error> {
|
|
write!(f, "{}", self.val)
|
|
}
|
|
}
|
|
|
|
impl<T> PositionedItem<T> {
|
|
/// Constructs a new Positioned<T> with a value, line, and column information.
|
|
pub fn new<P: Into<Position>>(v: T, p: P) -> Self {
|
|
Self::new_with_pos(v, p.into())
|
|
}
|
|
|
|
/// Constructs a new Positioned<T> with a value and a Position.
|
|
pub fn new_with_pos(v: T, pos: Position) -> Self {
|
|
PositionedItem { pos, val: v }
|
|
}
|
|
|
|
pub fn with_pos(mut self, pos: Position) -> Self {
|
|
self.pos = pos;
|
|
self
|
|
}
|
|
}
|
|
|
|
impl<T: PartialEq> PartialEq for PositionedItem<T> {
|
|
fn eq(&self, other: &Self) -> bool {
|
|
self.val == other.val
|
|
}
|
|
}
|
|
|
|
impl<T: Eq> Eq for PositionedItem<T> {}
|
|
|
|
impl<T: Ord> Ord for PositionedItem<T> {
|
|
fn cmp(&self, other: &Self) -> Ordering {
|
|
self.val.cmp(&other.val)
|
|
}
|
|
}
|
|
|
|
impl<T: PartialOrd> PartialOrd for PositionedItem<T> {
|
|
fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
|
|
self.val.partial_cmp(&other.val)
|
|
}
|
|
}
|
|
|
|
impl<T: Hash> Hash for PositionedItem<T> {
|
|
fn hash<H: Hasher>(&self, state: &mut H) {
|
|
self.val.hash(state);
|
|
}
|
|
}
|
|
|
|
impl<'a> From<&'a Token> for PositionedItem<String> {
|
|
fn from(t: &'a Token) -> PositionedItem<String> {
|
|
PositionedItem {
|
|
pos: t.pos.clone(),
|
|
val: t.fragment.to_string(),
|
|
}
|
|
}
|
|
}
|
|
|
|
impl<'a> From<&'a PositionedItem<Rc<str>>> for PositionedItem<Rc<str>> {
|
|
fn from(t: &PositionedItem<Rc<str>>) -> PositionedItem<Rc<str>> {
|
|
PositionedItem {
|
|
pos: t.pos.clone(),
|
|
val: t.val.clone(),
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Encodes a func expression in the UCG AST..
|
|
///
|
|
/// A func is a pure function over a expression.
|
|
#[derive(PartialEq, Debug, Clone)]
|
|
pub struct FuncDef {
|
|
pub scope: Option<Scope>,
|
|
pub argdefs: Vec<PositionedItem<Rc<str>>>,
|
|
pub fields: Box<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Specifies the types of binary operations supported in
|
|
/// UCG expression.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum BinaryExprType {
|
|
// Math
|
|
Add,
|
|
Sub,
|
|
Mul,
|
|
Div,
|
|
Mod,
|
|
// Boolean
|
|
AND,
|
|
OR,
|
|
// Comparison
|
|
Equal,
|
|
GT,
|
|
LT,
|
|
NotEqual,
|
|
GTEqual,
|
|
LTEqual,
|
|
REMatch,
|
|
NotREMatch,
|
|
IN,
|
|
IS,
|
|
// Selector operator
|
|
DOT,
|
|
}
|
|
|
|
impl BinaryExprType {
|
|
/// Returns the precedence level for the binary operator.
|
|
///
|
|
/// Higher values bind tighter than lower values.
|
|
pub fn precedence_level(&self) -> u32 {
|
|
match self {
|
|
// Equality operators are least tightly bound
|
|
BinaryExprType::Equal => 1,
|
|
BinaryExprType::NotEqual => 1,
|
|
BinaryExprType::GTEqual => 1,
|
|
BinaryExprType::LTEqual => 1,
|
|
BinaryExprType::GT => 1,
|
|
BinaryExprType::LT => 1,
|
|
BinaryExprType::REMatch => 1,
|
|
BinaryExprType::NotREMatch => 1,
|
|
BinaryExprType::IN => 2,
|
|
BinaryExprType::IS => 2,
|
|
// Sum operators are next least tightly bound
|
|
BinaryExprType::Add => 3,
|
|
BinaryExprType::Sub => 3,
|
|
// Product operators are next tightly bound
|
|
BinaryExprType::Mul => 4,
|
|
BinaryExprType::Div => 4,
|
|
BinaryExprType::Mod => 4,
|
|
// Boolean operators bind tighter than math
|
|
BinaryExprType::AND => 5,
|
|
BinaryExprType::OR => 5,
|
|
// Dot operators are most tightly bound.
|
|
BinaryExprType::DOT => 6,
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Represents an expression with a left and a right side.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct BinaryOpDef {
|
|
pub kind: BinaryExprType,
|
|
pub left: Box<Expression>,
|
|
pub right: Box<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Encodes a tuple Copy expression in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct CopyDef {
|
|
pub selector: Value,
|
|
pub fields: FieldList,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Encodes one of two possible forms for format expression arguments.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum FormatArgs {
|
|
List(Vec<Expression>),
|
|
Single(Box<Expression>),
|
|
}
|
|
|
|
/// Encodes a format expression in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct FormatDef {
|
|
pub template: String,
|
|
pub args: FormatArgs,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// Encodes an import statement in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct IncludeDef {
|
|
pub pos: Position,
|
|
pub path: Token,
|
|
pub typ: Token,
|
|
}
|
|
|
|
/// Encodes a list expression in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct ListDef {
|
|
pub elems: Vec<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum FuncOpDef {
|
|
Reduce(ReduceOpDef),
|
|
Map(MapFilterOpDef),
|
|
Filter(MapFilterOpDef),
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct ReduceOpDef {
|
|
pub func: Box<Expression>,
|
|
pub acc: Box<Expression>,
|
|
pub target: Box<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
/// MapFilterOpDef implements the list operations in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct MapFilterOpDef {
|
|
pub func: Box<Expression>,
|
|
pub target: Box<Expression>,
|
|
pub pos: Position,
|
|
}
|
|
|
|
impl FuncOpDef {
|
|
pub fn pos(&self) -> &Position {
|
|
match self {
|
|
FuncOpDef::Map(def) => &def.pos,
|
|
FuncOpDef::Filter(def) => &def.pos,
|
|
FuncOpDef::Reduce(def) => &def.pos,
|
|
}
|
|
}
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct ModuleDef {
|
|
pub scope: Option<Scope>,
|
|
pub pos: Position,
|
|
pub arg_set: FieldList,
|
|
pub out_expr: Option<Box<Expression>>,
|
|
pub arg_tuple: Option<Rc<Val>>,
|
|
pub statements: Vec<Statement>,
|
|
}
|
|
|
|
impl ModuleDef {
|
|
pub fn new<P: Into<Position>>(arg_set: FieldList, stmts: Vec<Statement>, pos: P) -> Self {
|
|
ModuleDef {
|
|
scope: None,
|
|
pos: pos.into(),
|
|
arg_set,
|
|
out_expr: None,
|
|
arg_tuple: None,
|
|
statements: stmts,
|
|
}
|
|
}
|
|
|
|
pub fn set_out_expr(&mut self, expr: Expression) {
|
|
self.out_expr = Some(Box::new(expr));
|
|
}
|
|
|
|
pub fn derive_shape(&self, symbol_table: &mut BTreeMap<Rc<str>, Shape>) -> Shape {
|
|
todo!()
|
|
}
|
|
}
|
|
|
|
/// RangeDef defines a range with optional step.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct RangeDef {
|
|
pub pos: Position,
|
|
pub start: Box<Expression>,
|
|
pub step: Option<Box<Expression>>,
|
|
pub end: Box<Expression>,
|
|
}
|
|
|
|
/// Encodes an import expression in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct ImportDef {
|
|
pub pos: Position,
|
|
pub path: Token,
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct IsDef {
|
|
pub pos: Position,
|
|
pub target: Box<Expression>,
|
|
pub typ: Token,
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct FailDef {
|
|
pub pos: Position,
|
|
pub message: Box<Expression>,
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct NotDef {
|
|
pub pos: Position,
|
|
pub expr: Box<Expression>,
|
|
}
|
|
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct DebugDef {
|
|
pub pos: Position,
|
|
pub expr: Box<Expression>,
|
|
}
|
|
|
|
/// Encodes a ucg expression. Expressions compute a value from.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum Expression {
|
|
// Base Expression
|
|
Simple(Value),
|
|
Not(NotDef),
|
|
|
|
// Binary expressions
|
|
Binary(BinaryOpDef),
|
|
|
|
// Complex Expressions
|
|
Copy(CopyDef),
|
|
Range(RangeDef),
|
|
Grouped(Box<Expression>, Position),
|
|
Format(FormatDef),
|
|
Include(IncludeDef),
|
|
Import(ImportDef),
|
|
Call(CallDef),
|
|
Cast(CastDef),
|
|
Func(FuncDef),
|
|
Select(SelectDef),
|
|
FuncOp(FuncOpDef),
|
|
Module(ModuleDef),
|
|
|
|
// Declarative failure expressions
|
|
Fail(FailDef),
|
|
// Debugging assistance
|
|
Debug(DebugDef),
|
|
}
|
|
|
|
impl Expression {
|
|
/// Returns the position of the Expression.
|
|
pub fn pos(&self) -> &Position {
|
|
match self {
|
|
&Expression::Simple(ref v) => v.pos(),
|
|
&Expression::Binary(ref def) => &def.pos,
|
|
&Expression::Copy(ref def) => &def.pos,
|
|
&Expression::Range(ref def) => &def.pos,
|
|
&Expression::Grouped(_, ref pos) => pos,
|
|
&Expression::Format(ref def) => &def.pos,
|
|
&Expression::Call(ref def) => &def.pos,
|
|
&Expression::Cast(ref def) => &def.pos,
|
|
&Expression::Func(ref def) => &def.pos,
|
|
&Expression::Module(ref def) => &def.pos,
|
|
&Expression::Select(ref def) => &def.pos,
|
|
&Expression::FuncOp(ref def) => def.pos(),
|
|
&Expression::Include(ref def) => &def.pos,
|
|
&Expression::Import(ref def) => &def.pos,
|
|
&Expression::Fail(ref def) => &def.pos,
|
|
&Expression::Not(ref def) => &def.pos,
|
|
&Expression::Debug(ref def) => &def.pos,
|
|
}
|
|
}
|
|
}
|
|
|
|
impl fmt::Display for Expression {
|
|
fn fmt(&self, w: &mut fmt::Formatter) -> fmt::Result {
|
|
match self {
|
|
&Expression::Simple(ref v) => {
|
|
write!(w, "{}", v.to_string())?;
|
|
}
|
|
&Expression::Binary(_) => {
|
|
write!(w, "<Expr>")?;
|
|
}
|
|
&Expression::FuncOp(_) => {
|
|
write!(w, "<Expr>")?;
|
|
}
|
|
&Expression::Copy(_) => {
|
|
write!(w, "<Copy>")?;
|
|
}
|
|
&Expression::Range(_) => {
|
|
write!(w, "<Range>")?;
|
|
}
|
|
&Expression::Grouped(_, _) => {
|
|
write!(w, "(<Expr>)")?;
|
|
}
|
|
&Expression::Format(_) => {
|
|
write!(w, "<Format Expr>")?;
|
|
}
|
|
&Expression::Call(_) => {
|
|
write!(w, "<FuncCall>")?;
|
|
}
|
|
&Expression::Cast(_) => {
|
|
write!(w, "<Cast>")?;
|
|
}
|
|
&Expression::Func(_) => {
|
|
write!(w, "<Func>")?;
|
|
}
|
|
&Expression::Module(_) => {
|
|
write!(w, "<Module>")?;
|
|
}
|
|
&Expression::Select(_) => {
|
|
write!(w, "<Select>")?;
|
|
}
|
|
&Expression::Include(_) => {
|
|
write!(w, "<Include>")?;
|
|
}
|
|
&Expression::Import(_) => {
|
|
write!(w, "<Include>")?;
|
|
}
|
|
&Expression::Fail(_) => {
|
|
write!(w, "<Fail>")?;
|
|
}
|
|
&Expression::Not(ref def) => {
|
|
write!(w, "!{}", def.expr)?;
|
|
}
|
|
&Expression::Debug(ref def) => {
|
|
write!(w, "!{}", def.expr)?;
|
|
}
|
|
}
|
|
Ok(())
|
|
}
|
|
}
|
|
|
|
/// Encodes a let statement in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub struct LetDef {
|
|
pub pos: Position,
|
|
pub name: Token,
|
|
pub value: Expression,
|
|
}
|
|
|
|
/// Encodes a parsed statement in the UCG AST.
|
|
#[derive(Debug, PartialEq, Clone)]
|
|
pub enum Statement {
|
|
// simple expression
|
|
Expression(Expression),
|
|
|
|
// Named bindings
|
|
Let(LetDef),
|
|
|
|
// Assert statement
|
|
Assert(Position, Expression),
|
|
|
|
// Identify an Expression for output.
|
|
Output(Position, Token, Expression),
|
|
|
|
// Print the expression to stdout.
|
|
Print(Position, Token, Expression),
|
|
}
|
|
|
|
impl Statement {
|
|
fn pos(&self) -> &Position {
|
|
match self {
|
|
Statement::Expression(ref e) => e.pos(),
|
|
Statement::Let(ref def) => &def.pos,
|
|
Statement::Assert(ref pos, _) => pos,
|
|
Statement::Output(ref pos, _, _) => pos,
|
|
Statement::Print(ref pos, _, _) => pos,
|
|
}
|
|
}
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod test;
|