Compare commits

..

3 Commits

Author SHA1 Message Date
65d9b620fe Merge remote-tracking branch 'origin/master' 2021-01-27 16:00:47 +08:00
075245f4c2 get list of unknowns 2021-01-27 16:00:06 +08:00
0e9dea0e65 updated todo 2021-01-25 17:09:17 +08:00
2 changed files with 168 additions and 77 deletions

View File

@ -160,50 +160,50 @@ fn resolve_function<'a>(
}
}
fn get_expression_unknowns<'a>(
defined: &[&'a str],
fn get_expr_unknowns<'a>(
defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>,
expr: &'a ExpressionType,
) {
match expr {
ExpressionType::BoolOp { values, .. } => {
for v in values.iter() {
get_expression_unknowns(defined, unknowns, &v.node)
get_expr_unknowns(defined, unknowns, &v.node)
}
}
ExpressionType::Binop { a, b, .. } => {
get_expression_unknowns(defined, unknowns, &a.node);
get_expression_unknowns(defined, unknowns, &b.node);
get_expr_unknowns(defined, unknowns, &a.node);
get_expr_unknowns(defined, unknowns, &b.node);
}
ExpressionType::Subscript { a, b } => {
get_expression_unknowns(defined, unknowns, &a.node);
get_expression_unknowns(defined, unknowns, &b.node);
get_expr_unknowns(defined, unknowns, &a.node);
get_expr_unknowns(defined, unknowns, &b.node);
}
ExpressionType::Unop { a, .. } => {
get_expression_unknowns(defined, unknowns, &a.node);
get_expr_unknowns(defined, unknowns, &a.node);
}
ExpressionType::Compare { vals, .. } => {
for v in vals.iter() {
get_expression_unknowns(defined, unknowns, &v.node)
get_expr_unknowns(defined, unknowns, &v.node)
}
}
ExpressionType::Attribute { value, .. } => {
get_expression_unknowns(defined, unknowns, &value.node);
get_expr_unknowns(defined, unknowns, &value.node);
}
ExpressionType::Call { function, args, .. } => {
get_expression_unknowns(defined, unknowns, &function.node);
get_expr_unknowns(defined, unknowns, &function.node);
for v in args.iter() {
get_expression_unknowns(defined, unknowns, &v.node)
get_expr_unknowns(defined, unknowns, &v.node)
}
}
ExpressionType::List { elements } => {
for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node)
get_expr_unknowns(defined, unknowns, &v.node)
}
}
ExpressionType::Tuple { elements } => {
for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node)
get_expr_unknowns(defined, unknowns, &v.node)
}
}
ExpressionType::Comprehension { kind, generators } => {
@ -211,22 +211,22 @@ fn get_expression_unknowns<'a>(
unimplemented!()
}
let g = &generators[0];
get_expression_unknowns(defined, unknowns, &g.iter.node);
let mut scoped = defined.to_owned();
get_expression_unknowns(defined, &mut scoped, &g.target.node);
get_expr_unknowns(defined, unknowns, &g.iter.node);
let mut scoped = defined.clone();
get_expr_unknowns(defined, &mut scoped, &g.target.node);
for if_expr in g.ifs.iter() {
get_expression_unknowns(&scoped, unknowns, &if_expr.node);
get_expr_unknowns(&mut scoped, unknowns, &if_expr.node);
}
match kind.as_ref() {
ComprehensionKind::List { element } => {
get_expression_unknowns(&scoped, unknowns, &element.node);
get_expr_unknowns(&mut scoped, unknowns, &element.node);
}
_ => unimplemented!(),
}
}
ExpressionType::Slice { elements } => {
for v in elements.iter() {
get_expression_unknowns(defined, unknowns, &v.node);
get_expr_unknowns(defined, unknowns, &v.node);
}
}
ExpressionType::Identifier { name } => {
@ -235,35 +235,81 @@ fn get_expression_unknowns<'a>(
}
}
ExpressionType::IfExpression { test, body, orelse } => {
get_expression_unknowns(defined, unknowns, &test.node);
get_expression_unknowns(defined, unknowns, &body.node);
get_expression_unknowns(defined, unknowns, &orelse.node);
get_expr_unknowns(defined, unknowns, &test.node);
get_expr_unknowns(defined, unknowns, &body.node);
get_expr_unknowns(defined, unknowns, &orelse.node);
}
_ => (),
};
}
pub fn get_pattern_match_unknowns<'a>(
defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>,
expr: &'a ExpressionType,
) {
match expr {
ExpressionType::Identifier { name } => {
defined.push(&name.as_str());
}
ExpressionType::Tuple { elements } => {
for v in elements.iter() {
get_pattern_match_unknowns(defined, unknowns, &v.node);
struct ExprPattern<'a>(&'a ExpressionType, Vec<usize>, bool);
impl<'a> ExprPattern<'a> {
fn new(expr: &'a ExpressionType) -> ExprPattern {
let mut pattern = ExprPattern(expr, Vec::new(), true);
pattern.find_leaf();
pattern
}
fn pointed(&mut self) -> &'a ExpressionType {
let mut current = self.0;
for v in self.1.iter() {
if let ExpressionType::Tuple { elements } = current {
current = &elements[*v].node
} else {
unreachable!()
}
}
_ => {
get_expression_unknowns(defined, unknowns, expr);
current
}
fn find_leaf(&mut self) {
let mut current = self.pointed();
while let ExpressionType::Tuple { elements } = current {
if elements.is_empty() {
break;
}
current = &elements[0].node;
self.1.push(0);
}
}
fn inc(&mut self) -> bool {
loop {
if self.1.is_empty() {
return false;
}
let ind = self.1.pop().unwrap() + 1;
let parent = self.pointed();
if let ExpressionType::Tuple { elements } = parent {
if ind < elements.len() {
self.1.push(ind);
self.find_leaf();
return true;
}
} else {
unreachable!()
}
}
}
}
pub fn get_statement_unknowns<'a>(
impl<'a> Iterator for ExprPattern<'a> {
type Item = &'a ExpressionType;
fn next(&mut self) -> Option<Self::Item> {
if self.2 {
self.2 = false;
Some(self.pointed())
} else if self.inc() {
Some(self.pointed())
} else {
None
}
}
}
fn get_stmt_unknowns<'a>(
defined: &mut Vec<&'a str>,
unknowns: &mut Vec<&'a str>,
stmts: &'a [Statement],
@ -271,59 +317,78 @@ pub fn get_statement_unknowns<'a>(
for stmt in stmts.iter() {
match &stmt.node {
StatementType::Return { value } => {
if let Some(v) = value {
get_expression_unknowns(defined, unknowns, &v.node);
if let Some(value) = value {
get_expr_unknowns(defined, unknowns, &value.node);
}
}
StatementType::Assign { targets, value } => {
get_expression_unknowns(defined, unknowns, &value.node);
for t in targets.iter() {
get_pattern_match_unknowns(defined, unknowns, &t.node);
get_expr_unknowns(defined, unknowns, &value.node);
for target in targets.iter() {
for node in ExprPattern::new(&target.node).into_iter() {
if let ExpressionType::Identifier { name } = node {
let name = name.as_str();
if !defined.contains(&name) {
defined.push(name);
}
} else {
get_expr_unknowns(defined, unknowns, node);
}
}
}
}
StatementType::AugAssign { target, value, .. } => {
get_expression_unknowns(defined, unknowns, &target.node);
get_expression_unknowns(defined, unknowns, &value.node);
get_expr_unknowns(defined, unknowns, &target.node);
get_expr_unknowns(defined, unknowns, &value.node);
}
StatementType::AnnAssign { target, value, .. } => {
if let Some(v) = value {
get_expression_unknowns(defined, unknowns, &v.node);
get_expr_unknowns(defined, unknowns, &target.node);
if let Some(value) = value {
get_expr_unknowns(defined, unknowns, &value.node);
}
get_pattern_match_unknowns(defined, unknowns, &target.node);
}
StatementType::Expression { expression } => {
get_expression_unknowns(defined, unknowns, &expression.node);
get_expr_unknowns(defined, unknowns, &expression.node);
}
StatementType::Global { names } => {
for name in names.iter() {
let name = name.as_str();
if !unknowns.contains(&name) {
unknowns.push(name);
}
}
}
StatementType::If { test, body, orelse }
| StatementType::While { test, body, orelse } => {
get_expression_unknowns(defined, unknowns, &test.node);
get_statement_unknowns(defined, unknowns, body.as_slice());
get_expr_unknowns(defined, unknowns, &test.node);
// we are not very strict at this point...
// some identifiers not treated as unknowns may not be resolved
// but should be checked during type inference
get_stmt_unknowns(defined, unknowns, body.as_slice());
if let Some(orelse) = orelse {
get_statement_unknowns(defined, unknowns, orelse.as_slice());
get_stmt_unknowns(defined, unknowns, orelse.as_slice());
}
}
StatementType::For { is_async, target, body, orelse, iter } => {
StatementType::For { is_async, target, iter, body, orelse } => {
if *is_async {
unimplemented!();
unimplemented!()
}
let mut scoped = defined.to_owned();
get_expression_unknowns(defined, unknowns, &iter.node);
get_expression_unknowns(defined, &mut scoped, &target.node);
get_statement_unknowns(&mut scoped, unknowns, body.as_slice());
get_expr_unknowns(defined, unknowns, &iter.node);
for node in ExprPattern::new(&target.node).into_iter() {
if let ExpressionType::Identifier { name } = node {
let name = name.as_str();
if !defined.contains(&name) {
defined.push(name);
}
} else {
get_expr_unknowns(defined, unknowns, node);
}
}
get_stmt_unknowns(defined, unknowns, body.as_slice());
if let Some(orelse) = orelse {
get_statement_unknowns(&mut scoped, unknowns, orelse.as_slice());
get_stmt_unknowns(defined, unknowns, orelse.as_slice());
}
}
StatementType::With { is_async, items, body } => {
if *is_async {
unimplemented!();
}
let mut scoped = defined.to_owned();
for item in items.iter() {
}
}
_ => {}
_ => (),
}
}
}
@ -390,7 +455,7 @@ pub fn resolve_signatures<'a>(ctx: &mut TopLevelContext<'a>, stmts: &'a [Stateme
mod tests {
use super::*;
use indoc::indoc;
use rustpython_parser::parser::parse_program;
use rustpython_parser::parser::{parse_program, parse_statement};
#[test]
fn test_get_classes() {
@ -400,14 +465,14 @@ mod tests {
b: Test
def test(self, a: int32) -> Test2:
return b
return self.b
class Bar(Foo, 'FooBar'):
def test2(self, a: list[Foo]) -> Test2:
return b
return self.b
def test3(self, a: list[FooBar2]) -> Test2:
return b
return self.b
" })
.unwrap();
let (mut classes, mut unknowns) = get_typenames(&ast.statements);
@ -420,4 +485,19 @@ mod tests {
assert_eq!(&classes, &["Bar", "Foo"]);
assert_eq!(&unknowns, &["FooBar", "FooBar2", "Test", "Test2"]);
}
#[test]
fn test_assignment() {
let ast = parse_statement(indoc! {"
((a, b), c[i]) = core.foo(x, get_y())
" })
.unwrap();
let mut defined = Vec::new();
let mut unknowns = Vec::new();
get_stmt_unknowns(&mut defined, &mut unknowns, ast.as_slice());
defined.sort();
unknowns.sort();
assert_eq!(defined.as_slice(), &["a", "b"]);
assert_eq!(unknowns.as_slice(), &["c", "core", "get_y", "i", "x"]);
}
}

View File

@ -12,12 +12,23 @@ Errors:
- Incorrect number of parameters
Symbol Resolution:
- Add all files with annotated class/functions.
- Find class references, load them all in TopLevelContext.
- Find unbounded identifiers/functions in functions.
- `inspect.getmodule(x)` every unknown `x` if not primitive/list of primitives,
check their files recursively by getting their file path, cache with
(normalized) path as key.
- Find unbounded identifiers in the functions.
- If it is a function/class name, record its object ID.
- Otherwise, load its value. (check to see if specified with `global`)
(Function implemented in python, with rust binding to add value to global
variable dictionary)
Global variable dictionary:
- Primitives, including integers, floats, bools, etc.
- Primitive lists.
- Numpy multi-dimensional array, with value + dimension vectors.
- Reference array, with integer index referring to other things.
- Symbol table: python id -> reference id.
TopLevelContext/InferenceContext:
- Restrict visibility by user defined function.