Skip to content

Commit

Permalink
Check for link error
Browse files Browse the repository at this point in the history
  • Loading branch information
evanrittenhouse committed Apr 25, 2023
1 parent 58bfb57 commit 4554c0c
Show file tree
Hide file tree
Showing 3 changed files with 57 additions and 22 deletions.
4 changes: 4 additions & 0 deletions crates/ruff/resources/test/fixtures/flake8_todo/TDO003.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,3 +8,7 @@
# TDO003 - errors
# TODO: this comment has no
# link after it

# TODO: here's a TODO with no link after it
def foo(x):
return x
57 changes: 39 additions & 18 deletions crates/ruff/src/rules/flake8_todo/rules.rs
Original file line number Diff line number Diff line change
Expand Up @@ -224,8 +224,7 @@ impl Violation for MissingSpaceAfterColonInTodo {
//
// Note: Regexes taken from https://github.com/orsinium-labs/flake8-todos/blob/master/flake8_todos/_rules.py#L12.
static TODO_REGEX: Lazy<Regex> = Lazy::new(|| {
Regex::new(r"^#\s*(?P<tag>[tT][oO][dD][oO]|BUG|FIXME|XXX)( {0,1}\(.*\))?(:)?( )?(.+)?$")
.unwrap()
Regex::new(r"^# (?P<tag>[tT][oO][dD][oO]|BUG|FIXME|XXX)( {0,1}\(.*\))?(:)?( )?(.+)?$").unwrap()
});

static ISSUE_LINK_REGEX_SET: Lazy<RegexSet> = Lazy::new(|| {
Expand All @@ -238,6 +237,7 @@ static ISSUE_LINK_REGEX_SET: Lazy<RegexSet> = Lazy::new(|| {
});

static NUM_CAPTURE_GROUPS: usize = 5usize;
static TODO_LENGTH: usize = 4usize;

pub fn check_todos(
tokens: &[LexResult],
Expand All @@ -246,11 +246,33 @@ pub fn check_todos(
) -> Vec<Diagnostic> {
let mut diagnostics: Vec<Diagnostic> = vec![];
let mut prev_token_is_todo = false;
let mut prev_token_todo_start = 2; // Default to 2, the position of "T" in a properly formed TODO

for (start, token, end) in tokens.iter().flatten() {
let diagnostics_ref = &mut diagnostics;
let range = Range::new(*start, *end);

let token_opt = match token {
Tok::Comment(s) => Some(s),
_ => None,
};

// Check for errors due to a missing link: TDO003.
if prev_token_is_todo {
if token_opt.is_some() && ISSUE_LINK_REGEX_SET.is_match(token_opt.unwrap()) {
prev_token_is_todo = false;
continue;
}

diagnostics_ref.push(Diagnostic::new(
MissingLinkInTodo,
Range::new(
Location::new(start.row() - 1, prev_token_todo_start),
Location::new(end.row() - 1, prev_token_todo_start + TODO_LENGTH),
),
));
}

let Some(comment) = token_opt else {
prev_token_is_todo = false;
continue;
Expand All @@ -264,7 +286,7 @@ pub fn check_todos(
continue;
};

// Check for errors on the tag.
// Check for errors on the tag: TDO001/TDO006.
// Unwrap is safe because the "tag" capture group is required to get here.
let captures = captures_opt.peek().unwrap();
let tag = captures.name("tag").unwrap().as_str();
Expand All @@ -285,25 +307,12 @@ pub fn check_todos(
)
.with_fix(
if should_autofix(autofix, settings, Rule::InvalidCapitalizationInTodo) {
// The TODO regex allows for any number of spaces, so let's find where the first "t"
// or "T" is. We know the unwrap is safe because of the mandatory regex
// match. We'll use position() since "#" is 2 bytes which could throw
// off an implementation that uses byte-indexing.
let first_t_position = comment
.chars()
.position(|c| c.to_string() == "t" || c.to_string() == "T")
.unwrap();
let first_t_position = find_first_t_position(comment);

Fix::new(vec![Edit::replacement(
"TODO".to_string(),
Location::new(range.location.row(), first_t_position),
Location::new(
range.location.row(),
// We know `tag` is 4 bytes long because we've already ensured
// it's some variant of "TODO", so we're guaranteed to have
// consistency.
first_t_position + tag.len(),
),
Location::new(range.location.row(), first_t_position + TODO_LENGTH),
)])
} else {
Fix::empty()
Expand All @@ -327,6 +336,7 @@ pub fn check_todos(
}

prev_token_is_todo = true;
prev_token_todo_start = find_first_t_position(comment);
}

diagnostics
Expand Down Expand Up @@ -360,3 +370,14 @@ fn should_autofix(autofix: flags::Autofix, settings: &Settings, rule: Rule) -> b
fn get_captured_matches(text: &str) -> Peekable<CaptureMatches> {
TODO_REGEX.captures_iter(text).peekable()
}

fn find_first_t_position(comment: &str) -> usize {
// The TODO regex allows for any number of spaces, so let's find where the first "t"
// or "T" is. We know the unwrap is safe because of the mandatory regex
// match. We'll use position() since "#" is 2 bytes which could throw
// off an implementation that uses byte-indexing.
comment
.chars()
.position(|c| c.to_string() == "t" || c.to_string() == "T")
.unwrap()
}
Original file line number Diff line number Diff line change
@@ -1,12 +1,22 @@
---
source: crates/ruff/src/rules/flake8_todo/mod.rs
---
TDO003.py:10:1: TDO003 Missing issue link in TODO
TDO003.py:9:3: TDO003 Missing issue link following TODO
|
9 | # TDO003 - errors
10 | # TODO: this comment has no
| ^^^^ TDO003
11 | # link after it
|

TDO003.py:12:3: TDO003 Missing issue link following TODO
|
10 | # TDO003 - errors
11 | # TODO: this comment has no
12 | # link after it
| ^^^^^^^^^^^^^^^ TDO003
13 |
14 | # TODO: here's a TODO with no link after it
| ^^^^ TDO003
15 | def foo(x):
16 | return x
|


0 comments on commit 4554c0c

Please sign in to comment.