forked from M-Labs/nac3
Compare commits
3 Commits
Author | SHA1 | Date | |
---|---|---|---|
65d9b620fe | |||
075245f4c2 | |||
0e9dea0e65 |
@ -160,50 +160,50 @@ fn resolve_function<'a>(
|
||||
}
|
||||
}
|
||||
|
||||
fn get_expression_unknowns<'a>(
|
||||
defined: &[&'a str],
|
||||
fn get_expr_unknowns<'a>(
|
||||
defined: &mut Vec<&'a str>,
|
||||
unknowns: &mut Vec<&'a str>,
|
||||
expr: &'a ExpressionType,
|
||||
) {
|
||||
match expr {
|
||||
ExpressionType::BoolOp { values, .. } => {
|
||||
for v in values.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node)
|
||||
get_expr_unknowns(defined, unknowns, &v.node)
|
||||
}
|
||||
}
|
||||
ExpressionType::Binop { a, b, .. } => {
|
||||
get_expression_unknowns(defined, unknowns, &a.node);
|
||||
get_expression_unknowns(defined, unknowns, &b.node);
|
||||
get_expr_unknowns(defined, unknowns, &a.node);
|
||||
get_expr_unknowns(defined, unknowns, &b.node);
|
||||
}
|
||||
ExpressionType::Subscript { a, b } => {
|
||||
get_expression_unknowns(defined, unknowns, &a.node);
|
||||
get_expression_unknowns(defined, unknowns, &b.node);
|
||||
get_expr_unknowns(defined, unknowns, &a.node);
|
||||
get_expr_unknowns(defined, unknowns, &b.node);
|
||||
}
|
||||
ExpressionType::Unop { a, .. } => {
|
||||
get_expression_unknowns(defined, unknowns, &a.node);
|
||||
get_expr_unknowns(defined, unknowns, &a.node);
|
||||
}
|
||||
ExpressionType::Compare { vals, .. } => {
|
||||
for v in vals.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node)
|
||||
get_expr_unknowns(defined, unknowns, &v.node)
|
||||
}
|
||||
}
|
||||
ExpressionType::Attribute { value, .. } => {
|
||||
get_expression_unknowns(defined, unknowns, &value.node);
|
||||
get_expr_unknowns(defined, unknowns, &value.node);
|
||||
}
|
||||
ExpressionType::Call { function, args, .. } => {
|
||||
get_expression_unknowns(defined, unknowns, &function.node);
|
||||
get_expr_unknowns(defined, unknowns, &function.node);
|
||||
for v in args.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node)
|
||||
get_expr_unknowns(defined, unknowns, &v.node)
|
||||
}
|
||||
}
|
||||
ExpressionType::List { elements } => {
|
||||
for v in elements.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node)
|
||||
get_expr_unknowns(defined, unknowns, &v.node)
|
||||
}
|
||||
}
|
||||
ExpressionType::Tuple { elements } => {
|
||||
for v in elements.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node)
|
||||
get_expr_unknowns(defined, unknowns, &v.node)
|
||||
}
|
||||
}
|
||||
ExpressionType::Comprehension { kind, generators } => {
|
||||
@ -211,22 +211,22 @@ fn get_expression_unknowns<'a>(
|
||||
unimplemented!()
|
||||
}
|
||||
let g = &generators[0];
|
||||
get_expression_unknowns(defined, unknowns, &g.iter.node);
|
||||
let mut scoped = defined.to_owned();
|
||||
get_expression_unknowns(defined, &mut scoped, &g.target.node);
|
||||
get_expr_unknowns(defined, unknowns, &g.iter.node);
|
||||
let mut scoped = defined.clone();
|
||||
get_expr_unknowns(defined, &mut scoped, &g.target.node);
|
||||
for if_expr in g.ifs.iter() {
|
||||
get_expression_unknowns(&scoped, unknowns, &if_expr.node);
|
||||
get_expr_unknowns(&mut scoped, unknowns, &if_expr.node);
|
||||
}
|
||||
match kind.as_ref() {
|
||||
ComprehensionKind::List { element } => {
|
||||
get_expression_unknowns(&scoped, unknowns, &element.node);
|
||||
get_expr_unknowns(&mut scoped, unknowns, &element.node);
|
||||
}
|
||||
_ => unimplemented!(),
|
||||
}
|
||||
}
|
||||
ExpressionType::Slice { elements } => {
|
||||
for v in elements.iter() {
|
||||
get_expression_unknowns(defined, unknowns, &v.node);
|
||||
get_expr_unknowns(defined, unknowns, &v.node);
|
||||
}
|
||||
}
|
||||
ExpressionType::Identifier { name } => {
|
||||
@ -235,35 +235,81 @@ fn get_expression_unknowns<'a>(
|
||||
}
|
||||
}
|
||||
ExpressionType::IfExpression { test, body, orelse } => {
|
||||
get_expression_unknowns(defined, unknowns, &test.node);
|
||||
get_expression_unknowns(defined, unknowns, &body.node);
|
||||
get_expression_unknowns(defined, unknowns, &orelse.node);
|
||||
get_expr_unknowns(defined, unknowns, &test.node);
|
||||
get_expr_unknowns(defined, unknowns, &body.node);
|
||||
get_expr_unknowns(defined, unknowns, &orelse.node);
|
||||
}
|
||||
_ => (),
|
||||
};
|
||||
}
|
||||
|
||||
pub fn get_pattern_match_unknowns<'a>(
|
||||
defined: &mut Vec<&'a str>,
|
||||
unknowns: &mut Vec<&'a str>,
|
||||
expr: &'a ExpressionType,
|
||||
) {
|
||||
match expr {
|
||||
ExpressionType::Identifier { name } => {
|
||||
defined.push(&name.as_str());
|
||||
}
|
||||
ExpressionType::Tuple { elements } => {
|
||||
for v in elements.iter() {
|
||||
get_pattern_match_unknowns(defined, unknowns, &v.node);
|
||||
struct ExprPattern<'a>(&'a ExpressionType, Vec<usize>, bool);
|
||||
|
||||
impl<'a> ExprPattern<'a> {
|
||||
fn new(expr: &'a ExpressionType) -> ExprPattern {
|
||||
let mut pattern = ExprPattern(expr, Vec::new(), true);
|
||||
pattern.find_leaf();
|
||||
pattern
|
||||
}
|
||||
|
||||
fn pointed(&mut self) -> &'a ExpressionType {
|
||||
let mut current = self.0;
|
||||
for v in self.1.iter() {
|
||||
if let ExpressionType::Tuple { elements } = current {
|
||||
current = &elements[*v].node
|
||||
} else {
|
||||
unreachable!()
|
||||
}
|
||||
}
|
||||
_ => {
|
||||
get_expression_unknowns(defined, unknowns, expr);
|
||||
current
|
||||
}
|
||||
|
||||
fn find_leaf(&mut self) {
|
||||
let mut current = self.pointed();
|
||||
while let ExpressionType::Tuple { elements } = current {
|
||||
if elements.is_empty() {
|
||||
break;
|
||||
}
|
||||
current = &elements[0].node;
|
||||
self.1.push(0);
|
||||
}
|
||||
}
|
||||
|
||||
fn inc(&mut self) -> bool {
|
||||
loop {
|
||||
if self.1.is_empty() {
|
||||
return false;
|
||||
}
|
||||
let ind = self.1.pop().unwrap() + 1;
|
||||
let parent = self.pointed();
|
||||
if let ExpressionType::Tuple { elements } = parent {
|
||||
if ind < elements.len() {
|
||||
self.1.push(ind);
|
||||
self.find_leaf();
|
||||
return true;
|
||||
}
|
||||
} else {
|
||||
unreachable!()
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
pub fn get_statement_unknowns<'a>(
|
||||
impl<'a> Iterator for ExprPattern<'a> {
|
||||
type Item = &'a ExpressionType;
|
||||
fn next(&mut self) -> Option<Self::Item> {
|
||||
if self.2 {
|
||||
self.2 = false;
|
||||
Some(self.pointed())
|
||||
} else if self.inc() {
|
||||
Some(self.pointed())
|
||||
} else {
|
||||
None
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
fn get_stmt_unknowns<'a>(
|
||||
defined: &mut Vec<&'a str>,
|
||||
unknowns: &mut Vec<&'a str>,
|
||||
stmts: &'a [Statement],
|
||||
@ -271,59 +317,78 @@ pub fn get_statement_unknowns<'a>(
|
||||
for stmt in stmts.iter() {
|
||||
match &stmt.node {
|
||||
StatementType::Return { value } => {
|
||||
if let Some(v) = value {
|
||||
get_expression_unknowns(defined, unknowns, &v.node);
|
||||
if let Some(value) = value {
|
||||
get_expr_unknowns(defined, unknowns, &value.node);
|
||||
}
|
||||
}
|
||||
StatementType::Assign { targets, value } => {
|
||||
get_expression_unknowns(defined, unknowns, &value.node);
|
||||
for t in targets.iter() {
|
||||
get_pattern_match_unknowns(defined, unknowns, &t.node);
|
||||
get_expr_unknowns(defined, unknowns, &value.node);
|
||||
for target in targets.iter() {
|
||||
for node in ExprPattern::new(&target.node).into_iter() {
|
||||
if let ExpressionType::Identifier { name } = node {
|
||||
let name = name.as_str();
|
||||
if !defined.contains(&name) {
|
||||
defined.push(name);
|
||||
}
|
||||
} else {
|
||||
get_expr_unknowns(defined, unknowns, node);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
StatementType::AugAssign { target, value, .. } => {
|
||||
get_expression_unknowns(defined, unknowns, &target.node);
|
||||
get_expression_unknowns(defined, unknowns, &value.node);
|
||||
get_expr_unknowns(defined, unknowns, &target.node);
|
||||
get_expr_unknowns(defined, unknowns, &value.node);
|
||||
}
|
||||
StatementType::AnnAssign { target, value, .. } => {
|
||||
if let Some(v) = value {
|
||||
get_expression_unknowns(defined, unknowns, &v.node);
|
||||
get_expr_unknowns(defined, unknowns, &target.node);
|
||||
if let Some(value) = value {
|
||||
get_expr_unknowns(defined, unknowns, &value.node);
|
||||
}
|
||||
get_pattern_match_unknowns(defined, unknowns, &target.node);
|
||||
}
|
||||
StatementType::Expression { expression } => {
|
||||
get_expression_unknowns(defined, unknowns, &expression.node);
|
||||
get_expr_unknowns(defined, unknowns, &expression.node);
|
||||
}
|
||||
StatementType::Global { names } => {
|
||||
for name in names.iter() {
|
||||
let name = name.as_str();
|
||||
if !unknowns.contains(&name) {
|
||||
unknowns.push(name);
|
||||
}
|
||||
}
|
||||
}
|
||||
StatementType::If { test, body, orelse }
|
||||
| StatementType::While { test, body, orelse } => {
|
||||
get_expression_unknowns(defined, unknowns, &test.node);
|
||||
get_statement_unknowns(defined, unknowns, body.as_slice());
|
||||
get_expr_unknowns(defined, unknowns, &test.node);
|
||||
// we are not very strict at this point...
|
||||
// some identifiers not treated as unknowns may not be resolved
|
||||
// but should be checked during type inference
|
||||
get_stmt_unknowns(defined, unknowns, body.as_slice());
|
||||
if let Some(orelse) = orelse {
|
||||
get_statement_unknowns(defined, unknowns, orelse.as_slice());
|
||||
get_stmt_unknowns(defined, unknowns, orelse.as_slice());
|
||||
}
|
||||
}
|
||||
StatementType::For { is_async, target, body, orelse, iter } => {
|
||||
StatementType::For { is_async, target, iter, body, orelse } => {
|
||||
if *is_async {
|
||||
unimplemented!();
|
||||
unimplemented!()
|
||||
}
|
||||
let mut scoped = defined.to_owned();
|
||||
get_expression_unknowns(defined, unknowns, &iter.node);
|
||||
get_expression_unknowns(defined, &mut scoped, &target.node);
|
||||
get_statement_unknowns(&mut scoped, unknowns, body.as_slice());
|
||||
get_expr_unknowns(defined, unknowns, &iter.node);
|
||||
for node in ExprPattern::new(&target.node).into_iter() {
|
||||
if let ExpressionType::Identifier { name } = node {
|
||||
let name = name.as_str();
|
||||
if !defined.contains(&name) {
|
||||
defined.push(name);
|
||||
}
|
||||
} else {
|
||||
get_expr_unknowns(defined, unknowns, node);
|
||||
}
|
||||
}
|
||||
get_stmt_unknowns(defined, unknowns, body.as_slice());
|
||||
if let Some(orelse) = orelse {
|
||||
get_statement_unknowns(&mut scoped, unknowns, orelse.as_slice());
|
||||
get_stmt_unknowns(defined, unknowns, orelse.as_slice());
|
||||
}
|
||||
}
|
||||
StatementType::With { is_async, items, body } => {
|
||||
if *is_async {
|
||||
unimplemented!();
|
||||
}
|
||||
let mut scoped = defined.to_owned();
|
||||
for item in items.iter() {
|
||||
|
||||
}
|
||||
}
|
||||
_ => {}
|
||||
_ => (),
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -390,7 +455,7 @@ pub fn resolve_signatures<'a>(ctx: &mut TopLevelContext<'a>, stmts: &'a [Stateme
|
||||
mod tests {
|
||||
use super::*;
|
||||
use indoc::indoc;
|
||||
use rustpython_parser::parser::parse_program;
|
||||
use rustpython_parser::parser::{parse_program, parse_statement};
|
||||
|
||||
#[test]
|
||||
fn test_get_classes() {
|
||||
@ -400,14 +465,14 @@ mod tests {
|
||||
b: Test
|
||||
|
||||
def test(self, a: int32) -> Test2:
|
||||
return b
|
||||
return self.b
|
||||
|
||||
class Bar(Foo, 'FooBar'):
|
||||
def test2(self, a: list[Foo]) -> Test2:
|
||||
return b
|
||||
return self.b
|
||||
|
||||
def test3(self, a: list[FooBar2]) -> Test2:
|
||||
return b
|
||||
return self.b
|
||||
" })
|
||||
.unwrap();
|
||||
let (mut classes, mut unknowns) = get_typenames(&ast.statements);
|
||||
@ -420,4 +485,19 @@ mod tests {
|
||||
assert_eq!(&classes, &["Bar", "Foo"]);
|
||||
assert_eq!(&unknowns, &["FooBar", "FooBar2", "Test", "Test2"]);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn test_assignment() {
|
||||
let ast = parse_statement(indoc! {"
|
||||
((a, b), c[i]) = core.foo(x, get_y())
|
||||
" })
|
||||
.unwrap();
|
||||
let mut defined = Vec::new();
|
||||
let mut unknowns = Vec::new();
|
||||
get_stmt_unknowns(&mut defined, &mut unknowns, ast.as_slice());
|
||||
defined.sort();
|
||||
unknowns.sort();
|
||||
assert_eq!(defined.as_slice(), &["a", "b"]);
|
||||
assert_eq!(unknowns.as_slice(), &["c", "core", "get_y", "i", "x"]);
|
||||
}
|
||||
}
|
||||
|
19
todo.txt
19
todo.txt
@ -12,12 +12,23 @@ Errors:
|
||||
- Incorrect number of parameters
|
||||
|
||||
Symbol Resolution:
|
||||
- Add all files with annotated class/functions.
|
||||
- Find class references, load them all in TopLevelContext.
|
||||
- Find unbounded identifiers/functions in functions.
|
||||
- `inspect.getmodule(x)` every unknown `x` if not primitive/list of primitives,
|
||||
check their files recursively by getting their file path, cache with
|
||||
(normalized) path as key.
|
||||
- Find unbounded identifiers in the functions.
|
||||
- If it is a function/class name, record its object ID.
|
||||
- Otherwise, load its value. (check to see if specified with `global`)
|
||||
(Function implemented in python, with rust binding to add value to global
|
||||
variable dictionary)
|
||||
|
||||
Global variable dictionary:
|
||||
- Primitives, including integers, floats, bools, etc.
|
||||
- Primitive lists.
|
||||
- Numpy multi-dimensional array, with value + dimension vectors.
|
||||
- Reference array, with integer index referring to other things.
|
||||
- Symbol table: python id -> reference id.
|
||||
|
||||
TopLevelContext/InferenceContext:
|
||||
- Restrict visibility by user defined function.
|
||||
|
||||
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user