Skip to content

Commit

Permalink
[red-knot] support non-local name lookups (#13177)
Browse files Browse the repository at this point in the history
Add support for non-local name lookups.

There's one TODO around annotated assignments without a RHS; these need
a fair amount of attention, which they'll get in an upcoming PR about
declared vs inferred types.

Fixes #11663
  • Loading branch information
carljm committed Sep 3, 2024
1 parent 29c36a5 commit 3c4ec82
Show file tree
Hide file tree
Showing 3 changed files with 161 additions and 41 deletions.
4 changes: 4 additions & 0 deletions crates/red_knot_python_semantic/src/semantic_index/symbol.rs
Original file line number Diff line number Diff line change
Expand Up @@ -149,6 +149,10 @@ impl FileScopeId {
FileScopeId::from_u32(0)
}

pub fn is_global(self) -> bool {
self == FileScopeId::global()
}

pub fn to_scope_id(self, db: &dyn Db, file: File) -> ScopeId<'_> {
let index = semantic_index(db, file);
index.scope_ids_by_scope[self]
Expand Down
192 changes: 156 additions & 36 deletions crates/red_knot_python_semantic/src/types/infer.rs
Original file line number Diff line number Diff line change
Expand Up @@ -44,12 +44,13 @@ use crate::semantic_index::ast_ids::{HasScopedAstId, HasScopedUseId, ScopedExpre
use crate::semantic_index::definition::{Definition, DefinitionKind, DefinitionNodeKey};
use crate::semantic_index::expression::Expression;
use crate::semantic_index::semantic_index;
use crate::semantic_index::symbol::{FileScopeId, NodeWithScopeKind, NodeWithScopeRef, ScopeId};
use crate::semantic_index::symbol::{NodeWithScopeKind, NodeWithScopeRef, ScopeId};
use crate::semantic_index::SemanticIndex;
use crate::types::diagnostic::{TypeCheckDiagnostic, TypeCheckDiagnostics};
use crate::types::{
builtins_symbol_ty_by_name, definitions_ty, global_symbol_ty_by_name, symbol_ty,
BytesLiteralType, ClassType, FunctionType, StringLiteralType, Type, UnionBuilder,
symbol_ty_by_name, BytesLiteralType, ClassType, FunctionType, StringLiteralType, Type,
UnionBuilder,
};
use crate::Db;

Expand Down Expand Up @@ -301,7 +302,7 @@ impl<'db> TypeInferenceBuilder<'db> {
self.file.is_stub(self.db.upcast())
}

/// Are we currently inferred deferred types?
/// Are we currently inferring deferred types?
fn is_deferred(&self) -> bool {
matches!(self.region, InferenceRegion::Deferred(_))
}
Expand Down Expand Up @@ -1823,6 +1824,61 @@ impl<'db> TypeInferenceBuilder<'db> {
Type::Unknown
}

/// Look up a name reference that isn't bound in the local scope.
fn lookup_name(&self, name: &ast::name::Name) -> Type<'db> {
let file_scope_id = self.scope.file_scope_id(self.db);
let symbols = self.index.symbol_table(file_scope_id);
let symbol = symbols
.symbol_by_name(name)
.expect("Expected the symbol table to create a symbol for every Name node");

// In function-like scopes, any local variable (symbol that is defined in this
// scope) can only have a definition in this scope, or be undefined; it never references
// another scope. (At runtime, it would use the `LOAD_FAST` opcode.)
if !symbol.is_defined() || !self.scope.is_function_like(self.db) {
// Walk up parent scopes looking for a possible enclosing scope that may have a
// definition of this name visible to us (would be `LOAD_DEREF` at runtime.)
for (enclosing_scope_file_id, _) in self.index.ancestor_scopes(file_scope_id) {
// Class scopes are not visible to nested scopes, and we need to handle global
// scope differently (because an unbound name there falls back to builtins), so
// check only function-like scopes.
let enclosing_scope_id = enclosing_scope_file_id.to_scope_id(self.db, self.file);
if !enclosing_scope_id.is_function_like(self.db) {
continue;
}
let enclosing_symbol_table = self.index.symbol_table(enclosing_scope_file_id);
let Some(enclosing_symbol) = enclosing_symbol_table.symbol_by_name(name) else {
continue;
};
// TODO a "definition" that is just an annotated-assignment with no RHS should not
// count as "is_defined" here.
if enclosing_symbol.is_defined() {
// We can return early here, because the nearest function-like scope that
// defines a name must be the only source for the nonlocal reference (at
// runtime, it is the scope that creates the cell for our closure.) If the name
// isn't bound in that scope, we should get an unbound name, not continue
// falling back to other scopes / globals / builtins.
return symbol_ty_by_name(self.db, enclosing_scope_id, name);
}
}
// No nonlocal binding, check module globals. Avoid infinite recursion if `self.scope`
// already is module globals.
let ty = if file_scope_id.is_global() {
Type::Unbound
} else {
global_symbol_ty_by_name(self.db, self.file, name)
};
// Fallback to builtins (without infinite recursion if we're already in builtins.)
if ty.may_be_unbound(self.db) && Some(self.scope) != builtins_scope(self.db) {
ty.replace_unbound_with(self.db, builtins_symbol_ty_by_name(self.db, name))
} else {
ty
}
} else {
Type::Unbound
}
}

fn infer_name_expression(&mut self, name: &ast::ExprName) -> Type<'db> {
let ast::ExprName { range: _, id, ctx } = name;
let file_scope_id = self.scope.file_scope_id(self.db);
Expand All @@ -1843,30 +1899,7 @@ impl<'db> TypeInferenceBuilder<'db> {
let may_be_unbound = use_def.use_may_be_unbound(use_id);

let unbound_ty = if may_be_unbound {
let symbols = self.index.symbol_table(file_scope_id);
// SAFETY: the symbol table always creates a symbol for every Name node.
let symbol = symbols.symbol_by_name(id).unwrap();
if !symbol.is_defined() || !self.scope.is_function_like(self.db) {
// implicit global
let unbound_ty = if file_scope_id == FileScopeId::global() {
Type::Unbound
} else {
global_symbol_ty_by_name(self.db, self.file, id)
};
// fallback to builtins
if unbound_ty.may_be_unbound(self.db)
&& Some(self.scope) != builtins_scope(self.db)
{
Some(unbound_ty.replace_unbound_with(
self.db,
builtins_symbol_ty_by_name(self.db, id),
))
} else {
Some(unbound_ty)
}
} else {
Some(Type::Unbound)
}
Some(self.lookup_name(id))
} else {
None
};
Expand Down Expand Up @@ -2385,6 +2418,31 @@ mod tests {
assert_eq!(ty.display(db).to_string(), expected);
}

fn assert_scope_ty(
db: &TestDb,
file_name: &str,
scopes: &[&str],
symbol_name: &str,
expected: &str,
) {
let file = system_path_to_file(db, file_name).expect("Expected file to exist.");
let index = semantic_index(db, file);
let mut file_scope_id = FileScopeId::global();
let mut scope = file_scope_id.to_scope_id(db, file);
for expected_scope_name in scopes {
file_scope_id = index
.child_scopes(file_scope_id)
.next()
.unwrap_or_else(|| panic!("scope of {expected_scope_name}"))
.0;
scope = file_scope_id.to_scope_id(db, file);
assert_eq!(scope.name(db), *expected_scope_name);
}

let ty = symbol_ty_by_name(db, scope, symbol_name);
assert_eq!(ty.display(db).to_string(), expected);
}

#[test]
fn follow_import_to_class() -> anyhow::Result<()> {
let mut db = setup_db();
Expand Down Expand Up @@ -3601,15 +3659,6 @@ mod tests {
Ok(())
}

fn first_public_def<'db>(db: &'db TestDb, file: File, name: &str) -> Definition<'db> {
let scope = global_scope(db, file);
use_def_map(db, scope)
.public_definitions(symbol_table(db, scope).symbol_id_by_name(name).unwrap())
.next()
.unwrap()
.definition
}

#[test]
fn big_int() -> anyhow::Result<()> {
let mut db = setup_db();
Expand Down Expand Up @@ -3694,6 +3743,77 @@ mod tests {
Ok(())
}

#[test]
fn nonlocal_name_reference() -> anyhow::Result<()> {
let mut db = setup_db();

db.write_dedented(
"/src/a.py",
"
def f():
x = 1
def g():
y = x
",
)?;

assert_scope_ty(&db, "/src/a.py", &["f", "g"], "y", "Literal[1]");

Ok(())
}

#[test]
fn nonlocal_name_reference_multi_level() -> anyhow::Result<()> {
let mut db = setup_db();

db.write_dedented(
"/src/a.py",
"
def f():
x = 1
def g():
def h():
y = x
",
)?;

assert_scope_ty(&db, "/src/a.py", &["f", "g", "h"], "y", "Literal[1]");

Ok(())
}

#[test]
fn nonlocal_name_reference_skips_class_scope() -> anyhow::Result<()> {
let mut db = setup_db();

db.write_dedented(
"/src/a.py",
"
def f():
x = 1
class C:
x = 2
def g():
y = x
",
)?;

assert_scope_ty(&db, "/src/a.py", &["f", "C", "g"], "y", "Literal[1]");

Ok(())
}

// Incremental inference tests

fn first_public_def<'db>(db: &'db TestDb, file: File, name: &str) -> Definition<'db> {
let scope = global_scope(db, file);
use_def_map(db, scope)
.public_definitions(symbol_table(db, scope).symbol_id_by_name(name).unwrap())
.next()
.unwrap()
.definition
}

#[test]
fn dependency_public_symbol_type_change() -> anyhow::Result<()> {
let mut db = setup_db();
Expand Down
6 changes: 1 addition & 5 deletions crates/ruff_benchmark/benches/red_knot.rs
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,9 @@ struct Case {

const TOMLLIB_312_URL: &str = "https://raw.githubusercontent.com/python/cpython/8e8a4baf652f6e1cee7acde9d78c4b6154539748/Lib/tomllib";

// The "unresolved import" is because we don't understand `*` imports yet.
// The failed import from 'collections.abc' is due to lack of support for 'import *'.
static EXPECTED_DIAGNOSTICS: &[&str] = &[
"/src/tomllib/_parser.py:7:29: Module 'collections.abc' has no member 'Iterable'",
"/src/tomllib/_parser.py:686:23: Object of type 'Unbound' is not callable",
"Line 69 is too long (89 characters)",
"Use double quotes for strings",
"Use double quotes for strings",
Expand All @@ -33,10 +32,7 @@ static EXPECTED_DIAGNOSTICS: &[&str] = &[
"Use double quotes for strings",
"Use double quotes for strings",
"Use double quotes for strings",
"/src/tomllib/_parser.py:330:32: Name 'header' used when not defined.",
"/src/tomllib/_parser.py:330:41: Name 'key' used when not defined.",
"/src/tomllib/_parser.py:628:75: Name 'e' used when not defined.",
"/src/tomllib/_parser.py:686:23: Name 'parse_float' used when not defined.",
];

fn get_test_file(name: &str) -> TestFile {
Expand Down

0 comments on commit 3c4ec82

Please sign in to comment.