From 5e35a55d4af459746f448d7ac348c3cf66e27af0 Mon Sep 17 00:00:00 2001 From: Dhruv Manilawala Date: Thu, 21 Sep 2023 07:51:03 +0530 Subject: [PATCH] Detect `noqa` directives for multi-line f-strings (#7326) ## Summary This PR updates the NoQA directive detection to consider the new f-string tokens. The reason being that now there can be multi-line f-strings without triple-quotes: ```python f"{ x * y }" ``` Here, the `noqa` directive should go at the end of the last line. ## Test Plan * Add new test cases for f-strings * Tested with `--add-noqa` using the following command with the above code snippet: ```console $ cargo run --bin ruff -- check --select=F821 --no-cache --isolated ~/playground/ruff/fstring.py --add-noqa Added 1 noqa directive. ``` Output: ```python f"{ x * y }" # noqa: F821 ``` Running the same command again doesn't add `noqa` directive and without the `--add-noqa` flag, the violation isn't reported. fixes: #7291 --- crates/ruff_linter/src/directives.rs | 149 +++++++++++++++--- .../ruff_python_index/src/fstring_ranges.rs | 17 +- crates/ruff_python_index/src/indexer.rs | 12 +- 3 files changed, 154 insertions(+), 24 deletions(-) diff --git a/crates/ruff_linter/src/directives.rs b/crates/ruff_linter/src/directives.rs index 60f8c69b78651..87095f9ac65a7 100644 --- a/crates/ruff_linter/src/directives.rs +++ b/crates/ruff_linter/src/directives.rs @@ -1,5 +1,6 @@ //! Extract `# noqa`, `# isort: skip`, and `# TODO` directives from tokenized source. +use std::iter::Peekable; use std::str::FromStr; use bitflags::bitflags; @@ -85,6 +86,39 @@ pub fn extract_directives( } } +struct SortedMergeIter +where + L: Iterator, + R: Iterator, +{ + left: Peekable, + right: Peekable, +} + +impl Iterator for SortedMergeIter +where + L: Iterator, + R: Iterator, + Item: Ranged, +{ + type Item = Item; + + fn next(&mut self) -> Option { + match (self.left.peek(), self.right.peek()) { + (Some(left), Some(right)) => { + if left.start() <= right.start() { + Some(self.left.next().unwrap()) + } else { + Some(self.right.next().unwrap()) + } + } + (Some(_), None) => Some(self.left.next().unwrap()), + (None, Some(_)) => Some(self.right.next().unwrap()), + (None, None) => None, + } + } +} + /// Extract a mapping from logical line to noqa line. fn extract_noqa_line_for(lxr: &[LexResult], locator: &Locator, indexer: &Indexer) -> NoqaMapping { let mut string_mappings = Vec::new(); @@ -113,6 +147,29 @@ fn extract_noqa_line_for(lxr: &[LexResult], locator: &Locator, indexer: &Indexer } } + // The capacity allocated here might be more than we need if there are + // nested f-strings. + let mut fstring_mappings = Vec::with_capacity(indexer.fstring_ranges().len()); + + // For nested f-strings, we expect `noqa` directives on the last line of the + // outermost f-string. The last f-string range will be used to skip over + // the inner f-strings. + let mut last_fstring_range: TextRange = TextRange::default(); + for fstring_range in indexer.fstring_ranges().values() { + if !locator.contains_line_break(*fstring_range) { + continue; + } + if last_fstring_range.contains_range(*fstring_range) { + continue; + } + let new_range = TextRange::new( + locator.line_start(fstring_range.start()), + fstring_range.end(), + ); + fstring_mappings.push(new_range); + last_fstring_range = new_range; + } + let mut continuation_mappings = Vec::new(); // For continuations, we expect `noqa` directives on the last line of the @@ -137,27 +194,20 @@ fn extract_noqa_line_for(lxr: &[LexResult], locator: &Locator, indexer: &Indexer } // Merge the mappings in sorted order - let mut mappings = - NoqaMapping::with_capacity(continuation_mappings.len() + string_mappings.len()); + let mut mappings = NoqaMapping::with_capacity( + continuation_mappings.len() + string_mappings.len() + fstring_mappings.len(), + ); - let mut continuation_mappings = continuation_mappings.into_iter().peekable(); - let mut string_mappings = string_mappings.into_iter().peekable(); - - while let (Some(continuation), Some(string)) = - (continuation_mappings.peek(), string_mappings.peek()) - { - if continuation.start() <= string.start() { - mappings.push_mapping(continuation_mappings.next().unwrap()); - } else { - mappings.push_mapping(string_mappings.next().unwrap()); - } - } - - for mapping in continuation_mappings { - mappings.push_mapping(mapping); - } + let string_mappings = SortedMergeIter { + left: fstring_mappings.into_iter().peekable(), + right: string_mappings.into_iter().peekable(), + }; + let all_mappings = SortedMergeIter { + left: string_mappings.peekable(), + right: continuation_mappings.into_iter().peekable(), + }; - for mapping in string_mappings { + for mapping in all_mappings { mappings.push_mapping(mapping); } @@ -429,6 +479,67 @@ ghi NoqaMapping::from_iter([TextRange::new(TextSize::from(6), TextSize::from(28))]) ); + let contents = "x = f'abc { +a + * + b +}' +y = 2 +"; + assert_eq!( + noqa_mappings(contents), + NoqaMapping::from_iter([TextRange::new(TextSize::from(0), TextSize::from(32))]) + ); + + let contents = "x = f'''abc +def +ghi +''' +y = 2 +z = x + 1"; + assert_eq!( + noqa_mappings(contents), + NoqaMapping::from_iter([TextRange::new(TextSize::from(0), TextSize::from(23))]) + ); + + let contents = "x = 1 +y = f'''abc +def +ghi +''' +z = 2"; + assert_eq!( + noqa_mappings(contents), + NoqaMapping::from_iter([TextRange::new(TextSize::from(6), TextSize::from(29))]) + ); + + let contents = "x = 1 +y = f'''abc +def +ghi +'''"; + assert_eq!( + noqa_mappings(contents), + NoqaMapping::from_iter([TextRange::new(TextSize::from(6), TextSize::from(29))]) + ); + + let contents = "x = 1 +y = f'''abc +def {f'''nested +fstring''' f'another nested'} +end''' +"; + assert_eq!( + noqa_mappings(contents), + NoqaMapping::from_iter([TextRange::new(TextSize::from(6), TextSize::from(70))]) + ); + + let contents = "x = 1 +y = f'normal' +z = f'another but {f'nested but {f'still single line'} nested'}' +"; + assert_eq!(noqa_mappings(contents), NoqaMapping::default()); + let contents = r"x = \ 1"; assert_eq!( diff --git a/crates/ruff_python_index/src/fstring_ranges.rs b/crates/ruff_python_index/src/fstring_ranges.rs index d2d13802a5cf4..b95c9b665083b 100644 --- a/crates/ruff_python_index/src/fstring_ranges.rs +++ b/crates/ruff_python_index/src/fstring_ranges.rs @@ -50,9 +50,20 @@ impl FStringRanges { .map(|(_, range)| *range) } - #[cfg(test)] - pub(crate) fn ranges(&self) -> impl Iterator + '_ { - self.raw.values().copied() + /// Returns an iterator over all f-string [`TextRange`] sorted by their + /// start location. + /// + /// For nested f-strings, the outermost f-string is yielded first, moving + /// inwards with each iteration. + #[inline] + pub fn values(&self) -> impl Iterator + '_ { + self.raw.values() + } + + /// Returns the number of f-string ranges stored. + #[inline] + pub fn len(&self) -> usize { + self.raw.len() } } diff --git a/crates/ruff_python_index/src/indexer.rs b/crates/ruff_python_index/src/indexer.rs index a48eab6cb8c2d..78bf2606b2033 100644 --- a/crates/ruff_python_index/src/indexer.rs +++ b/crates/ruff_python_index/src/indexer.rs @@ -353,7 +353,11 @@ f"implicit " f"concatenation" let lxr: Vec = lexer::lex(contents, Mode::Module).collect(); let indexer = Indexer::from_tokens(lxr.as_slice(), &Locator::new(contents)); assert_eq!( - indexer.fstring_ranges().ranges().collect::>(), + indexer + .fstring_ranges() + .values() + .copied() + .collect::>(), &[ TextRange::new(TextSize::from(0), TextSize::from(18)), TextRange::new(TextSize::from(19), TextSize::from(55)), @@ -385,7 +389,11 @@ f-string"""} let lxr: Vec = lexer::lex(contents, Mode::Module).collect(); let indexer = Indexer::from_tokens(lxr.as_slice(), &Locator::new(contents)); assert_eq!( - indexer.fstring_ranges().ranges().collect::>(), + indexer + .fstring_ranges() + .values() + .copied() + .collect::>(), &[ TextRange::new(TextSize::from(0), TextSize::from(39)), TextRange::new(TextSize::from(40), TextSize::from(68)),