Compare commits

..

3 Commits

Author SHA1 Message Date
65d9b620fe Merge remote-tracking branch 'origin/master' 2021-01-27 16:00:47 +08:00
075245f4c2 get list of unknowns 2021-01-27 16:00:06 +08:00
0e9dea0e65 updated todo 2021-01-25 17:09:17 +08:00
2 changed files with 168 additions and 77 deletions

View File

@ -160,50 +160,50 @@ fn resolve_function<'a>(
} }
} }
fn get_expression_unknowns<'a>( fn get_expr_unknowns<'a>(
defined: &[&'a str], defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>, unknowns: &mut Vec<&'a str>,
expr: &'a ExpressionType, expr: &'a ExpressionType,
) { ) {
match expr { match expr {
ExpressionType::BoolOp { values, .. } => { ExpressionType::BoolOp { values, .. } => {
for v in values.iter() { for v in values.iter() {
get_expression_unknowns(defined, unknowns, &v.node) get_expr_unknowns(defined, unknowns, &v.node)
} }
} }
ExpressionType::Binop { a, b, .. } => { ExpressionType::Binop { a, b, .. } => {
get_expression_unknowns(defined, unknowns, &a.node); get_expr_unknowns(defined, unknowns, &a.node);
get_expression_unknowns(defined, unknowns, &b.node); get_expr_unknowns(defined, unknowns, &b.node);
} }
ExpressionType::Subscript { a, b } => { ExpressionType::Subscript { a, b } => {
get_expression_unknowns(defined, unknowns, &a.node); get_expr_unknowns(defined, unknowns, &a.node);
get_expression_unknowns(defined, unknowns, &b.node); get_expr_unknowns(defined, unknowns, &b.node);
} }
ExpressionType::Unop { a, .. } => { ExpressionType::Unop { a, .. } => {
get_expression_unknowns(defined, unknowns, &a.node); get_expr_unknowns(defined, unknowns, &a.node);
} }
ExpressionType::Compare { vals, .. } => { ExpressionType::Compare { vals, .. } => {
for v in vals.iter() { for v in vals.iter() {
get_expression_unknowns(defined, unknowns, &v.node) get_expr_unknowns(defined, unknowns, &v.node)
} }
} }
ExpressionType::Attribute { value, .. } => { ExpressionType::Attribute { value, .. } => {
get_expression_unknowns(defined, unknowns, &value.node); get_expr_unknowns(defined, unknowns, &value.node);
} }
ExpressionType::Call { function, args, .. } => { ExpressionType::Call { function, args, .. } => {
get_expression_unknowns(defined, unknowns, &function.node); get_expr_unknowns(defined, unknowns, &function.node);
for v in args.iter() { for v in args.iter() {
get_expression_unknowns(defined, unknowns, &v.node) get_expr_unknowns(defined, unknowns, &v.node)
} }
} }
ExpressionType::List { elements } => { ExpressionType::List { elements } => {
for v in elements.iter() { for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node) get_expr_unknowns(defined, unknowns, &v.node)
} }
} }
ExpressionType::Tuple { elements } => { ExpressionType::Tuple { elements } => {
for v in elements.iter() { for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node) get_expr_unknowns(defined, unknowns, &v.node)
} }
} }
ExpressionType::Comprehension { kind, generators } => { ExpressionType::Comprehension { kind, generators } => {
@ -211,22 +211,22 @@ fn get_expression_unknowns<'a>(
unimplemented!() unimplemented!()
} }
let g = &generators[0]; let g = &generators[0];
get_expression_unknowns(defined, unknowns, &g.iter.node); get_expr_unknowns(defined, unknowns, &g.iter.node);
let mut scoped = defined.to_owned(); let mut scoped = defined.clone();
get_expression_unknowns(defined, &mut scoped, &g.target.node); get_expr_unknowns(defined, &mut scoped, &g.target.node);
for if_expr in g.ifs.iter() { for if_expr in g.ifs.iter() {
get_expression_unknowns(&scoped, unknowns, &if_expr.node); get_expr_unknowns(&mut scoped, unknowns, &if_expr.node);
} }
match kind.as_ref() { match kind.as_ref() {
ComprehensionKind::List { element } => { ComprehensionKind::List { element } => {
get_expression_unknowns(&scoped, unknowns, &element.node); get_expr_unknowns(&mut scoped, unknowns, &element.node);
} }
_ => unimplemented!(), _ => unimplemented!(),
} }
} }
ExpressionType::Slice { elements } => { ExpressionType::Slice { elements } => {
for v in elements.iter() { for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node); get_expr_unknowns(defined, unknowns, &v.node);
} }
} }
ExpressionType::Identifier { name } => { ExpressionType::Identifier { name } => {
@ -235,35 +235,81 @@ fn get_expression_unknowns<'a>(
} }
} }
ExpressionType::IfExpression { test, body, orelse } => { ExpressionType::IfExpression { test, body, orelse } => {
get_expression_unknowns(defined, unknowns, &test.node); get_expr_unknowns(defined, unknowns, &test.node);
get_expression_unknowns(defined, unknowns, &body.node); get_expr_unknowns(defined, unknowns, &body.node);
get_expression_unknowns(defined, unknowns, &orelse.node); get_expr_unknowns(defined, unknowns, &orelse.node);
} }
_ => (), _ => (),
}; };
} }
pub fn get_pattern_match_unknowns<'a>( struct ExprPattern<'a>(&'a ExpressionType, Vec<usize>, bool);
defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>, impl<'a> ExprPattern<'a> {
expr: &'a ExpressionType, fn new(expr: &'a ExpressionType) -> ExprPattern {
) { let mut pattern = ExprPattern(expr, Vec::new(), true);
match expr { pattern.find_leaf();
ExpressionType::Identifier { name } => { pattern
defined.push(&name.as_str()); }
}
ExpressionType::Tuple { elements } => { fn pointed(&mut self) -> &'a ExpressionType {
for v in elements.iter() { let mut current = self.0;
get_pattern_match_unknowns(defined, unknowns, &v.node); for v in self.1.iter() {
if let ExpressionType::Tuple { elements } = current {
current = &elements[*v].node
} else {
unreachable!()
} }
} }
_ => { current
get_expression_unknowns(defined, unknowns, expr); }
fn find_leaf(&mut self) {
let mut current = self.pointed();
while let ExpressionType::Tuple { elements } = current {
if elements.is_empty() {
break;
}
current = &elements[0].node;
self.1.push(0);
}
}
fn inc(&mut self) -> bool {
loop {
if self.1.is_empty() {
return false;
}
let ind = self.1.pop().unwrap() + 1;
let parent = self.pointed();
if let ExpressionType::Tuple { elements } = parent {
if ind < elements.len() {
self.1.push(ind);
self.find_leaf();
return true;
}
} else {
unreachable!()
}
} }
} }
} }
pub fn get_statement_unknowns<'a>( impl<'a> Iterator for ExprPattern<'a> {
type Item = &'a ExpressionType;
fn next(&mut self) -> Option<Self::Item> {
if self.2 {
self.2 = false;
Some(self.pointed())
} else if self.inc() {
Some(self.pointed())
} else {
None
}
}
}
fn get_stmt_unknowns<'a>(
defined: &mut Vec<&'a str>, defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>, unknowns: &mut Vec<&'a str>,
stmts: &'a [Statement], stmts: &'a [Statement],
@ -271,59 +317,78 @@ pub fn get_statement_unknowns<'a>(
for stmt in stmts.iter() { for stmt in stmts.iter() {
match &stmt.node { match &stmt.node {
StatementType::Return { value } => { StatementType::Return { value } => {
if let Some(v) = value { if let Some(value) = value {
get_expression_unknowns(defined, unknowns, &v.node); get_expr_unknowns(defined, unknowns, &value.node);
} }
} }
StatementType::Assign { targets, value } => { StatementType::Assign { targets, value } => {
get_expression_unknowns(defined, unknowns, &value.node); get_expr_unknowns(defined, unknowns, &value.node);
for t in targets.iter() { for target in targets.iter() {
get_pattern_match_unknowns(defined, unknowns, &t.node); for node in ExprPattern::new(&target.node).into_iter() {
if let ExpressionType::Identifier { name } = node {
let name = name.as_str();
if !defined.contains(&name) {
defined.push(name);
}
} else {
get_expr_unknowns(defined, unknowns, node);
}
}
} }
} }
StatementType::AugAssign { target, value, .. } => { StatementType::AugAssign { target, value, .. } => {
get_expression_unknowns(defined, unknowns, &target.node); get_expr_unknowns(defined, unknowns, &target.node);
get_expression_unknowns(defined, unknowns, &value.node); get_expr_unknowns(defined, unknowns, &value.node);
} }
StatementType::AnnAssign { target, value, .. } => { StatementType::AnnAssign { target, value, .. } => {
if let Some(v) = value { get_expr_unknowns(defined, unknowns, &target.node);
get_expression_unknowns(defined, unknowns, &v.node); if let Some(value) = value {
get_expr_unknowns(defined, unknowns, &value.node);
} }
get_pattern_match_unknowns(defined, unknowns, &target.node);
} }
StatementType::Expression { expression } => { StatementType::Expression { expression } => {
get_expression_unknowns(defined, unknowns, &expression.node); get_expr_unknowns(defined, unknowns, &expression.node);
}
StatementType::Global { names } => {
for name in names.iter() {
let name = name.as_str();
if !unknowns.contains(&name) {
unknowns.push(name);
}
}
} }
StatementType::If { test, body, orelse } StatementType::If { test, body, orelse }
| StatementType::While { test, body, orelse } => { | StatementType::While { test, body, orelse } => {
get_expression_unknowns(defined, unknowns, &test.node); get_expr_unknowns(defined, unknowns, &test.node);
get_statement_unknowns(defined, unknowns, body.as_slice()); // we are not very strict at this point...
// some identifiers not treated as unknowns may not be resolved
// but should be checked during type inference
get_stmt_unknowns(defined, unknowns, body.as_slice());
if let Some(orelse) = orelse { if let Some(orelse) = orelse {
get_statement_unknowns(defined, unknowns, orelse.as_slice()); get_stmt_unknowns(defined, unknowns, orelse.as_slice());
} }
} }
StatementType::For { is_async, target, body, orelse, iter } => { StatementType::For { is_async, target, iter, body, orelse } => {
if *is_async { if *is_async {
unimplemented!(); unimplemented!()
} }
let mut scoped = defined.to_owned(); get_expr_unknowns(defined, unknowns, &iter.node);
get_expression_unknowns(defined, unknowns, &iter.node); for node in ExprPattern::new(&target.node).into_iter() {
get_expression_unknowns(defined, &mut scoped, &target.node); if let ExpressionType::Identifier { name } = node {
get_statement_unknowns(&mut scoped, unknowns, body.as_slice()); let name = name.as_str();
if !defined.contains(&name) {
defined.push(name);
}
} else {
get_expr_unknowns(defined, unknowns, node);
}
}
get_stmt_unknowns(defined, unknowns, body.as_slice());
if let Some(orelse) = orelse { if let Some(orelse) = orelse {
get_statement_unknowns(&mut scoped, unknowns, orelse.as_slice()); get_stmt_unknowns(defined, unknowns, orelse.as_slice());
} }
} }
StatementType::With { is_async, items, body } => { _ => (),
if *is_async {
unimplemented!();
}
let mut scoped = defined.to_owned();
for item in items.iter() {
}
}
_ => {}
} }
} }
} }
@ -390,7 +455,7 @@ pub fn resolve_signatures<'a>(ctx: &mut TopLevelContext<'a>, stmts: &'a [Stateme
mod tests { mod tests {
use super::*; use super::*;
use indoc::indoc; use indoc::indoc;
use rustpython_parser::parser::parse_program; use rustpython_parser::parser::{parse_program, parse_statement};
#[test] #[test]
fn test_get_classes() { fn test_get_classes() {
@ -400,14 +465,14 @@ mod tests {
b: Test b: Test
def test(self, a: int32) -> Test2: def test(self, a: int32) -> Test2:
return b return self.b
class Bar(Foo, 'FooBar'): class Bar(Foo, 'FooBar'):
def test2(self, a: list[Foo]) -> Test2: def test2(self, a: list[Foo]) -> Test2:
return b return self.b
def test3(self, a: list[FooBar2]) -> Test2: def test3(self, a: list[FooBar2]) -> Test2:
return b return self.b
" }) " })
.unwrap(); .unwrap();
let (mut classes, mut unknowns) = get_typenames(&ast.statements); let (mut classes, mut unknowns) = get_typenames(&ast.statements);
@ -420,4 +485,19 @@ mod tests {
assert_eq!(&classes, &["Bar", "Foo"]); assert_eq!(&classes, &["Bar", "Foo"]);
assert_eq!(&unknowns, &["FooBar", "FooBar2", "Test", "Test2"]); assert_eq!(&unknowns, &["FooBar", "FooBar2", "Test", "Test2"]);
} }
#[test]
fn test_assignment() {
let ast = parse_statement(indoc! {"
((a, b), c[i]) = core.foo(x, get_y())
" })
.unwrap();
let mut defined = Vec::new();
let mut unknowns = Vec::new();
get_stmt_unknowns(&mut defined, &mut unknowns, ast.as_slice());
defined.sort();
unknowns.sort();
assert_eq!(defined.as_slice(), &["a", "b"]);
assert_eq!(unknowns.as_slice(), &["c", "core", "get_y", "i", "x"]);
}
} }

View File

@ -12,12 +12,23 @@ Errors:
- Incorrect number of parameters - Incorrect number of parameters
Symbol Resolution: Symbol Resolution:
- Add all files with annotated class/functions.
- Find class references, load them all in TopLevelContext. - Find class references, load them all in TopLevelContext.
- Find unbounded identifiers/functions in functions. - Find unbounded identifiers in the functions.
- `inspect.getmodule(x)` every unknown `x` if not primitive/list of primitives, - If it is a function/class name, record its object ID.
check their files recursively by getting their file path, cache with - Otherwise, load its value. (check to see if specified with `global`)
(normalized) path as key. (Function implemented in python, with rust binding to add value to global
variable dictionary)
Global variable dictionary:
- Primitives, including integers, floats, bools, etc.
- Primitive lists.
- Numpy multi-dimensional array, with value + dimension vectors.
- Reference array, with integer index referring to other things.
- Symbol table: python id -> reference id.
TopLevelContext/InferenceContext: TopLevelContext/InferenceContext:
- Restrict visibility by user defined function. - Restrict visibility by user defined function.