From f04a3bfe5c34243172333d776b1b93a117cca34b Mon Sep 17 00:00:00 2001 From: Alex Waygood Date: Thu, 22 Aug 2024 13:23:00 +0100 Subject: [PATCH 1/2] [red-knot] Improve the accuracy of the unresolved-import check --- crates/red_knot_python_semantic/src/types.rs | 17 +-- .../src/types/infer.rs | 129 +++++++++--------- crates/red_knot_wasm/tests/api.rs | 2 +- crates/ruff_benchmark/benches/red_knot.rs | 11 +- 4 files changed, 73 insertions(+), 86 deletions(-) diff --git a/crates/red_knot_python_semantic/src/types.rs b/crates/red_knot_python_semantic/src/types.rs index b649a6bfb238b..0dae3d286ef0f 100644 --- a/crates/red_knot_python_semantic/src/types.rs +++ b/crates/red_knot_python_semantic/src/types.rs @@ -444,7 +444,7 @@ mod tests { let foo = system_path_to_file(&db, "src/foo.py").context("Failed to resolve foo.py")?; let diagnostics = super::check_types(&db, foo); - assert_diagnostic_messages(&diagnostics, &["Import 'bar' could not be resolved."]); + assert_diagnostic_messages(&diagnostics, &["Cannot resolve import 'bar'."]); Ok(()) } @@ -457,7 +457,7 @@ mod tests { .unwrap(); let foo = system_path_to_file(&db, "src/foo.py").unwrap(); let diagnostics = super::check_types(&db, foo); - assert_diagnostic_messages(&diagnostics, &["Import 'bar' could not be resolved."]); + assert_diagnostic_messages(&diagnostics, &["Cannot resolve import 'bar'."]); } #[test] @@ -469,15 +469,9 @@ mod tests { let b_file = system_path_to_file(&db, "/src/b.py").unwrap(); let b_file_diagnostics = super::check_types(&db, b_file); - assert_diagnostic_messages( - &b_file_diagnostics, - &["Could not resolve import of 'thing' from 'a'"], - ); + assert_diagnostic_messages(&b_file_diagnostics, &["Module 'a' has no member 'thing'"]); } - #[ignore = "\ -A spurious second 'Unresolved import' diagnostic message is emitted on `b.py`, \ -despite the symbol existing in the symbol table for `a.py`"] #[test] fn resolved_import_of_symbol_from_unresolved_import() { let mut db = setup_db(); @@ -490,10 +484,7 @@ despite the symbol existing in the symbol table for `a.py`"] let a_file = system_path_to_file(&db, "/src/a.py").unwrap(); let a_file_diagnostics = super::check_types(&db, a_file); - assert_diagnostic_messages( - &a_file_diagnostics, - &["Import 'foo' could not be resolved."], - ); + assert_diagnostic_messages(&a_file_diagnostics, &["Cannot resolve import 'foo'."]); // Importing the unresolved import into a second first-party file should not trigger // an additional "unresolved import" violation diff --git a/crates/red_knot_python_semantic/src/types/infer.rs b/crates/red_knot_python_semantic/src/types/infer.rs index 69ae1e7cc4dec..4a65ecfa15bc6 100644 --- a/crates/red_knot_python_semantic/src/types/infer.rs +++ b/crates/red_knot_python_semantic/src/types/infer.rs @@ -941,24 +941,20 @@ impl<'db> TypeInferenceBuilder<'db> { asname: _, } = alias; - let module_ty = ModuleName::new(name) - .ok_or(ModuleResolutionError::InvalidSyntax) - .and_then(|module_name| self.module_ty_from_name(module_name)); - - let module_ty = match module_ty { - Ok(ty) => ty, - Err(ModuleResolutionError::InvalidSyntax) => { - tracing::debug!("Failed to resolve import due to invalid syntax"); - Type::Unknown - } - Err(ModuleResolutionError::UnresolvedModule) => { + let module_ty = if let Some(module_name) = ModuleName::new(name) { + if let Some(module) = self.module_ty_from_name(module_name) { + module + } else { self.add_diagnostic( AnyNodeRef::Alias(alias), "unresolved-import", - format_args!("Import '{name}' could not be resolved."), + format_args!("Cannot resolve import '{name}'."), ); Type::Unknown } + } else { + tracing::debug!("Failed to resolve import due to invalid syntax"); + Type::Unknown }; self.types.definitions.insert(definition, module_ty); @@ -998,6 +994,23 @@ impl<'db> TypeInferenceBuilder<'db> { self.infer_optional_expression(cause.as_deref()); } + fn unresolved_module_name( + &mut self, + import_from: &ast::StmtImportFrom, + level: usize, + module: Option<&str>, + ) { + self.add_diagnostic( + AnyNodeRef::StmtImportFrom(import_from), + "unresolved-import", + format_args!( + "Cannot resolve import '{}{}'.", + ".".repeat(level), + module.unwrap_or_default() + ), + ); + } + /// Given a `from .foo import bar` relative import, resolve the relative module /// we're importing `bar` from into an absolute [`ModuleName`] /// using the name of the module we're currently analyzing. @@ -1009,37 +1022,41 @@ impl<'db> TypeInferenceBuilder<'db> { /// - `from .foo import bar` => `tail == "foo"` /// - `from ..foo.bar import baz` => `tail == "foo.bar"` fn relative_module_name( - &self, + &mut self, tail: Option<&str>, level: NonZeroU32, - ) -> Result { + import_from: &ast::StmtImportFrom, + ) -> Option { + let mut level = level.get(); let Some(module) = file_to_module(self.db, self.file) else { tracing::debug!( "Relative module resolution '{}' failed; could not resolve file '{}' to a module", - format_import_from_module(level.get(), tail), + format_import_from_module(level, tail), self.file.path(self.db) ); - return Err(ModuleResolutionError::UnresolvedModule); + self.unresolved_module_name(import_from, level as usize, tail); + return None; }; - let mut level = level.get(); if module.kind().is_package() { level -= 1; } let mut module_name = module.name().to_owned(); for _ in 0..level { - module_name = module_name - .parent() - .ok_or(ModuleResolutionError::UnresolvedModule)?; + let Some(parent) = module_name.parent() else { + self.unresolved_module_name(import_from, level as usize, tail); + return None; + }; + module_name = parent; } if let Some(tail) = tail { if let Some(valid_tail) = ModuleName::new(tail) { module_name.extend(&valid_tail); } else { tracing::debug!("Relative module resolution failed: invalid syntax"); - return Err(ModuleResolutionError::InvalidSyntax); + return None; } } - Ok(module_name) + Some(module_name) } fn infer_import_from_definition( @@ -1067,19 +1084,27 @@ impl<'db> TypeInferenceBuilder<'db> { format_import_from_module(level.get(), module), self.file.path(self.db), ); - self.relative_module_name(module, level) + self.relative_module_name(module, level, import_from) } else { tracing::trace!( "Resolving imported object '{}' from module '{}'", alias.name, format_import_from_module(*level, module), ); - module - .and_then(ModuleName::new) - .ok_or(ModuleResolutionError::InvalidSyntax) + module.and_then(ModuleName::new) }; - let module_ty = module_name.and_then(|module_name| self.module_ty_from_name(module_name)); + let module_ty = if let Some(module_name) = module_name { + if let Some(module_ty) = self.module_ty_from_name(module_name) { + module_ty + } else { + self.unresolved_module_name(import_from, *level as usize, module); + Type::Unknown + } + } else { + tracing::debug!("Failed to resolve import due to invalid syntax"); + Type::Unknown + }; let ast::Alias { range: _, @@ -1087,39 +1112,30 @@ impl<'db> TypeInferenceBuilder<'db> { asname: _, } = alias; - // If a symbol is unbound in the module the symbol was originally defined in, - // when we're trying to import the symbol from that module into "our" module, - // the runtime error will occur immediately (rather than when the symbol is *used*, - // as would be the case for a symbol with type `Unbound`), so it's appropriate to - // think of the type of the imported symbol as `Unknown` rather than `Unbound` - let member_ty = module_ty - .unwrap_or(Type::Unbound) - .member(self.db, &Name::new(&name.id)) - .replace_unbound_with(self.db, Type::Unknown); + let member_ty = module_ty.member(self.db, &Name::new(&name.id)); - if matches!(module_ty, Err(ModuleResolutionError::UnresolvedModule)) { - self.add_diagnostic( - AnyNodeRef::StmtImportFrom(import_from), - "unresolved-import", - format_args!( - "Import '{}{}' could not be resolved.", - ".".repeat(*level as usize), - module.unwrap_or_default() - ), - ); - } else if module_ty.is_ok() && member_ty.is_unknown() { + // TODO: What if it's a union where one of the elements is `Unbound`? + if member_ty.is_unbound() { self.add_diagnostic( AnyNodeRef::Alias(alias), "unresolved-import", format_args!( - "Could not resolve import of '{name}' from '{}{}'", + "Module '{}{}' has no member '{name}'", ".".repeat(*level as usize), module.unwrap_or_default() ), ); } - self.types.definitions.insert(definition, member_ty); + // If a symbol is unbound in the module the symbol was originally defined in, + // when we're trying to import the symbol from that module into "our" module, + // the runtime error will occur immediately (rather than when the symbol is *used*, + // as would be the case for a symbol with type `Unbound`), so it's appropriate to + // think of the type of the imported symbol as `Unknown` rather than `Unbound` + self.types.definitions.insert( + definition, + member_ty.replace_unbound_with(self.db, Type::Unknown), + ); } fn infer_return_statement(&mut self, ret: &ast::StmtReturn) { @@ -1133,13 +1149,8 @@ impl<'db> TypeInferenceBuilder<'db> { } } - fn module_ty_from_name( - &self, - module_name: ModuleName, - ) -> Result, ModuleResolutionError> { - resolve_module(self.db, module_name) - .map(|module| Type::Module(module.file())) - .ok_or(ModuleResolutionError::UnresolvedModule) + fn module_ty_from_name(&self, module_name: ModuleName) -> Option> { + resolve_module(self.db, module_name).map(|module| Type::Module(module.file())) } fn infer_decorator(&mut self, decorator: &ast::Decorator) -> Type<'db> { @@ -1915,12 +1926,6 @@ fn format_import_from_module(level: u32, module: Option<&str>) -> String { ) } -#[derive(Debug, Copy, Clone, PartialEq, Eq)] -enum ModuleResolutionError { - InvalidSyntax, - UnresolvedModule, -} - #[cfg(test)] mod tests { use anyhow::Context; diff --git a/crates/red_knot_wasm/tests/api.rs b/crates/red_knot_wasm/tests/api.rs index edf76c0d1b71e..6a8dfd4eac850 100644 --- a/crates/red_knot_wasm/tests/api.rs +++ b/crates/red_knot_wasm/tests/api.rs @@ -19,6 +19,6 @@ fn check() { assert_eq!( result, - vec!["/test.py:1:8: Import 'random22' could not be resolved.",] + vec!["/test.py:1:8: Cannot resolve import 'random22'."] ); } diff --git a/crates/ruff_benchmark/benches/red_knot.rs b/crates/ruff_benchmark/benches/red_knot.rs index debcd6c2459d2..94a7a5edaaf03 100644 --- a/crates/ruff_benchmark/benches/red_knot.rs +++ b/crates/ruff_benchmark/benches/red_knot.rs @@ -22,17 +22,8 @@ struct Case { const TOMLLIB_312_URL: &str = "https://raw.githubusercontent.com/python/cpython/8e8a4baf652f6e1cee7acde9d78c4b6154539748/Lib/tomllib"; // This first "unresolved import" is because we don't understand `*` imports yet. -// The following "unresolved import" violations are because we can't distinguish currently from -// "Symbol exists in the module but its type is unknown" and -// "Symbol does not exist in the module" static EXPECTED_DIAGNOSTICS: &[&str] = &[ - "/src/tomllib/_parser.py:7:29: Could not resolve import of 'Iterable' from 'collections.abc'", - "/src/tomllib/_parser.py:10:20: Could not resolve import of 'Any' from 'typing'", - "/src/tomllib/_parser.py:13:5: Could not resolve import of 'RE_DATETIME' from '._re'", - "/src/tomllib/_parser.py:14:5: Could not resolve import of 'RE_LOCALTIME' from '._re'", - "/src/tomllib/_parser.py:15:5: Could not resolve import of 'RE_NUMBER' from '._re'", - "/src/tomllib/_parser.py:20:21: Could not resolve import of 'Key' from '._types'", - "/src/tomllib/_parser.py:20:26: Could not resolve import of 'ParseFloat' from '._types'", + "/src/tomllib/_parser.py:7:29: Module 'collections.abc' has no member 'Iterable'", "Line 69 is too long (89 characters)", "Use double quotes for strings", "Use double quotes for strings", From 097e24ddb5e92412310cbd9994b91a5baccb50f3 Mon Sep 17 00:00:00 2001 From: Alex Waygood Date: Tue, 27 Aug 2024 13:44:38 +0100 Subject: [PATCH 2/2] Add back an error enum (but use it more narrowly) --- .../src/types/infer.rs | 115 +++++++++++------- crates/ruff_benchmark/benches/red_knot.rs | 2 +- 2 files changed, 70 insertions(+), 47 deletions(-) diff --git a/crates/red_knot_python_semantic/src/types/infer.rs b/crates/red_knot_python_semantic/src/types/infer.rs index 4a65ecfa15bc6..cd317bc8d2eef 100644 --- a/crates/red_knot_python_semantic/src/types/infer.rs +++ b/crates/red_knot_python_semantic/src/types/infer.rs @@ -934,7 +934,7 @@ impl<'db> TypeInferenceBuilder<'db> { } } - fn infer_import_definition(&mut self, alias: &ast::Alias, definition: Definition<'db>) { + fn infer_import_definition(&mut self, alias: &'db ast::Alias, definition: Definition<'db>) { let ast::Alias { range: _, name, @@ -945,11 +945,7 @@ impl<'db> TypeInferenceBuilder<'db> { if let Some(module) = self.module_ty_from_name(module_name) { module } else { - self.add_diagnostic( - AnyNodeRef::Alias(alias), - "unresolved-import", - format_args!("Cannot resolve import '{name}'."), - ); + self.unresolved_module_diagnostic(alias, 0, Some(name)); Type::Unknown } } else { @@ -994,18 +990,18 @@ impl<'db> TypeInferenceBuilder<'db> { self.infer_optional_expression(cause.as_deref()); } - fn unresolved_module_name( + fn unresolved_module_diagnostic( &mut self, - import_from: &ast::StmtImportFrom, - level: usize, + import_node: impl Into>, + level: u32, module: Option<&str>, ) { self.add_diagnostic( - AnyNodeRef::StmtImportFrom(import_from), + import_node.into(), "unresolved-import", format_args!( "Cannot resolve import '{}{}'.", - ".".repeat(level), + ".".repeat(level as usize), module.unwrap_or_default() ), ); @@ -1022,46 +1018,32 @@ impl<'db> TypeInferenceBuilder<'db> { /// - `from .foo import bar` => `tail == "foo"` /// - `from ..foo.bar import baz` => `tail == "foo.bar"` fn relative_module_name( - &mut self, + &self, tail: Option<&str>, level: NonZeroU32, - import_from: &ast::StmtImportFrom, - ) -> Option { + ) -> Result { + let module = file_to_module(self.db, self.file) + .ok_or(ModuleNameResolutionError::UnknownCurrentModule)?; let mut level = level.get(); - let Some(module) = file_to_module(self.db, self.file) else { - tracing::debug!( - "Relative module resolution '{}' failed; could not resolve file '{}' to a module", - format_import_from_module(level, tail), - self.file.path(self.db) - ); - self.unresolved_module_name(import_from, level as usize, tail); - return None; - }; if module.kind().is_package() { level -= 1; } let mut module_name = module.name().to_owned(); for _ in 0..level { - let Some(parent) = module_name.parent() else { - self.unresolved_module_name(import_from, level as usize, tail); - return None; - }; - module_name = parent; + module_name = module_name + .parent() + .ok_or(ModuleNameResolutionError::TooManyDots)?; } if let Some(tail) = tail { - if let Some(valid_tail) = ModuleName::new(tail) { - module_name.extend(&valid_tail); - } else { - tracing::debug!("Relative module resolution failed: invalid syntax"); - return None; - } + let tail = ModuleName::new(tail).ok_or(ModuleNameResolutionError::InvalidSyntax)?; + module_name.extend(&tail); } - Some(module_name) + Ok(module_name) } fn infer_import_from_definition( &mut self, - import_from: &ast::StmtImportFrom, + import_from: &'db ast::StmtImportFrom, alias: &ast::Alias, definition: Definition<'db>, ) { @@ -1077,6 +1059,7 @@ impl<'db> TypeInferenceBuilder<'db> { let ast::StmtImportFrom { module, level, .. } = import_from; tracing::trace!("Resolving imported object {alias:?} from statement {import_from:?}"); let module = module.as_deref(); + let module_name = if let Some(level) = NonZeroU32::new(*level) { tracing::trace!( "Resolving imported object '{}' from module '{}' relative to file '{}'", @@ -1084,26 +1067,49 @@ impl<'db> TypeInferenceBuilder<'db> { format_import_from_module(level.get(), module), self.file.path(self.db), ); - self.relative_module_name(module, level, import_from) + self.relative_module_name(module, level) } else { tracing::trace!( "Resolving imported object '{}' from module '{}'", alias.name, format_import_from_module(*level, module), ); - module.and_then(ModuleName::new) + module + .and_then(ModuleName::new) + .ok_or(ModuleNameResolutionError::InvalidSyntax) }; - let module_ty = if let Some(module_name) = module_name { - if let Some(module_ty) = self.module_ty_from_name(module_name) { - module_ty - } else { - self.unresolved_module_name(import_from, *level as usize, module); + let module_ty = match module_name { + Ok(name) => { + if let Some(ty) = self.module_ty_from_name(name) { + ty + } else { + self.unresolved_module_diagnostic(import_from, *level, module); + Type::Unknown + } + } + Err(ModuleNameResolutionError::InvalidSyntax) => { + tracing::debug!("Failed to resolve import due to invalid syntax"); + // Invalid syntax diagnostics are emitted elsewhere. + Type::Unknown + } + Err(ModuleNameResolutionError::TooManyDots) => { + tracing::debug!( + "Relative module resolution '{}' failed: too many leading dots", + format_import_from_module(*level, module), + ); + self.unresolved_module_diagnostic(import_from, *level, module); + Type::Unknown + } + Err(ModuleNameResolutionError::UnknownCurrentModule) => { + tracing::debug!( + "Relative module resolution '{}' failed; could not resolve file '{}' to a module", + format_import_from_module(*level, module), + self.file.path(self.db) + ); + self.unresolved_module_diagnostic(import_from, *level, module); Type::Unknown } - } else { - tracing::debug!("Failed to resolve import due to invalid syntax"); - Type::Unknown }; let ast::Alias { @@ -1926,6 +1932,23 @@ fn format_import_from_module(level: u32, module: Option<&str>) -> String { ) } +/// Various ways in which resolving a [`ModuleName`] +/// from an [`ast::StmtImport`] or [`ast::StmtImportFrom`] node might fail +#[derive(Debug, Copy, Clone, PartialEq, Eq)] +enum ModuleNameResolutionError { + /// The import statement has invalid syntax + InvalidSyntax, + + /// We couldn't resolve the file we're currently analyzing back to a module + /// (Only necessary for relative import statements) + UnknownCurrentModule, + + /// The relative import statement seems to take us outside of the module search path + /// (e.g. our current module is `foo.bar`, and the relative import statement in `foo.bar` + /// is `from ....baz import spam`) + TooManyDots, +} + #[cfg(test)] mod tests { use anyhow::Context; diff --git a/crates/ruff_benchmark/benches/red_knot.rs b/crates/ruff_benchmark/benches/red_knot.rs index 94a7a5edaaf03..6996c42fadca7 100644 --- a/crates/ruff_benchmark/benches/red_knot.rs +++ b/crates/ruff_benchmark/benches/red_knot.rs @@ -21,7 +21,7 @@ struct Case { const TOMLLIB_312_URL: &str = "https://raw.githubusercontent.com/python/cpython/8e8a4baf652f6e1cee7acde9d78c4b6154539748/Lib/tomllib"; -// This first "unresolved import" is because we don't understand `*` imports yet. +// The "unresolved import" is because we don't understand `*` imports yet. static EXPECTED_DIAGNOSTICS: &[&str] = &[ "/src/tomllib/_parser.py:7:29: Module 'collections.abc' has no member 'Iterable'", "Line 69 is too long (89 characters)",