astral-sh · dhruvmanila · Jul 2, 2024 · Jun 28, 2024 · dhruvmanila · Jun 28, 2024
diff --git a/crates/ruff_linter/resources/test/fixtures/flake8_commas/COM81_syntax_error.py b/crates/ruff_linter/resources/test/fixtures/flake8_commas/COM81_syntax_error.py
@@ -1,3 +1,8 @@
+# Check for `flake8-commas` violation for a file containing syntax errors.
 (
     *args
 )
+
+def foo[(param1='test', param2='test',):
+    pass
+
diff --git a/crates/ruff_linter/resources/test/fixtures/flake8_implicit_str_concat/ISC_syntax_error.py b/crates/ruff_linter/resources/test/fixtures/flake8_implicit_str_concat/ISC_syntax_error.py
@@ -0,0 +1,29 @@
+# The lexer doesn't emit a string token if it's unterminated
+"a" "b
+"a" "b" "c
+"a" """b
+c""" "d
+
+# For f-strings, the `FStringRanges` won't contain the range for
+# unterminated f-strings.
+f"a" f"b
+f"a" f"b" f"c
+f"a" f"""b
+c""" f"d {e
+
+(
+    "a"
+    "b
+    "c"
+    "d"
+)
+
+
+# Triple-quoted strings, if unterminated, consume everything that comes after
+# the opening quote. So, no test code should raise the violation after this.
+(
+    """abc"""
+    f"""def
+    "g" "h"
+    "i" "j"
+)
diff --git a/crates/ruff_linter/resources/test/fixtures/pycodestyle/E30_syntax_error.py b/crates/ruff_linter/resources/test/fixtures/pycodestyle/E30_syntax_error.py
@@ -0,0 +1,26 @@
+# Check for E30 errors in a file containing syntax errors with unclosed
+# parenthesis.
+
+def foo[T1, T2():
+    pass
+
+def bar():
+    pass
+
+
+
+class Foo:
+    def __init__(
+        pass
+    def method():
+        pass
+
+foo = Foo(
+
+
+def top(
+    def nested1():
+        pass
+    def nested2():
+        pass
+
diff --git a/crates/ruff_linter/resources/test/fixtures/pylint/invalid_characters_syntax_error.py b/crates/ruff_linter/resources/test/fixtures/pylint/invalid_characters_syntax_error.py
@@ -0,0 +1,13 @@
+# These test cases contain syntax errors. The characters within the unterminated
+# strings shouldn't be highlighted.
+
+# Before any syntax error
+b = ''
+# Unterminated string
+b = '
+b = ''
+# Unterminated f-string
+b = f'
+b = f''
+# Implicitly concatenated
+b = '' f'' '
diff --git a/crates/ruff_linter/src/checkers/tokens.rs b/crates/ruff_linter/src/checkers/tokens.rs
@@ -93,7 +93,7 @@ pub(crate) fn check_tokens(
         Rule::InvalidCharacterNul,
         Rule::InvalidCharacterZeroWidthSpace,
     ]) {
-        for token in tokens.up_to_first_unknown() {
+        for token in tokens {
             pylint::rules::invalid_string_characters(
                 &mut diagnostics,
                 token.kind(),

diff --git a/crates/ruff_linter/src/directives.rs b/crates/ruff_linter/src/directives.rs
@@ -107,14 +107,9 @@ where
 fn extract_noqa_line_for(tokens: &Tokens, locator: &Locator, indexer: &Indexer) -> NoqaMapping {
     let mut string_mappings = Vec::new();
 
-    for token in tokens.up_to_first_unknown() {
+    for token in tokens {
         match token.kind() {
-            TokenKind::EndOfFile => {
-                break;
-            }
-
-            // For multi-line strings, we expect `noqa` directives on the last line of the
-            // string.
+            // For multi-line strings, we expect `noqa` directives on the last line of the string.
             TokenKind::String if token.is_triple_quoted_string() => {
                 if locator.contains_line_break(token.range()) {
                     string_mappings.push(TextRange::new(

diff --git a/crates/ruff_linter/src/doc_lines.rs b/crates/ruff_linter/src/doc_lines.rs
@@ -24,7 +24,7 @@ pub(crate) struct DocLines<'a> {
 impl<'a> DocLines<'a> {
     fn new(tokens: &'a Tokens) -> Self {
         Self {
-            inner: tokens.up_to_first_unknown().iter(),
+            inner: tokens.iter(),
             prev: TextSize::default(),
         }
     }

diff --git a/crates/ruff_linter/src/rules/flake8_commas/rules/trailing_commas.rs b/crates/ruff_linter/src/rules/flake8_commas/rules/trailing_commas.rs
@@ -231,7 +231,7 @@ pub(crate) fn trailing_commas(
     indexer: &Indexer,
 ) {
     let mut fstrings = 0u32;
-    let simple_tokens = tokens.up_to_first_unknown().iter().filter_map(|token| {
+    let simple_tokens = tokens.iter().filter_map(|token| {
         match token.kind() {
             // Completely ignore comments -- they just interfere with the logic.
             TokenKind::Comment => None,

diff --git a/...ke8_commas/snapshots/ruff_linter__rules__flake8_commas__tests__COM81_syntax_error.py.snap b/...ke8_commas/snapshots/ruff_linter__rules__flake8_commas__tests__COM81_syntax_error.py.snap
@@ -1,10 +1,30 @@
 ---
 source: crates/ruff_linter/src/rules/flake8_commas/mod.rs
 ---
-COM81_syntax_error.py:2:5: SyntaxError: Starred expression cannot be used here
+COM81_syntax_error.py:3:5: SyntaxError: Starred expression cannot be used here
   |
-1 | (
-2 |     *args
+1 | # Check for `flake8-commas` violation for a file containing syntax errors.
+2 | (
+3 |     *args
   |     ^
-3 | )
+4 | )
   |
+
+COM81_syntax_error.py:6:9: SyntaxError: Type parameter list cannot be empty
+  |
+4 | )
+5 | 
+6 | def foo[(param1='test', param2='test',):
+  |         ^
+7 |     pass
+  |
+
+COM81_syntax_error.py:6:38: COM819 Trailing comma prohibited
+  |
+4 | )
+5 | 
+6 | def foo[(param1='test', param2='test',):
+  |                                      ^ COM819
+7 |     pass
+  |
+  = help: Remove trailing comma
diff --git a/crates/ruff_linter/src/rules/flake8_implicit_str_concat/mod.rs b/crates/ruff_linter/src/rules/flake8_implicit_str_concat/mod.rs
@@ -15,6 +15,14 @@ mod tests {
 
     #[test_case(Rule::SingleLineImplicitStringConcatenation, Path::new("ISC.py"))]
     #[test_case(Rule::MultiLineImplicitStringConcatenation, Path::new("ISC.py"))]
+    #[test_case(
+        Rule::SingleLineImplicitStringConcatenation,
+        Path::new("ISC_syntax_error.py")
+    )]
+    #[test_case(
+        Rule::MultiLineImplicitStringConcatenation,
+        Path::new("ISC_syntax_error.py")
+    )]
     #[test_case(Rule::ExplicitStringConcatenation, Path::new("ISC.py"))]
     fn rules(rule_code: Rule, path: &Path) -> Result<()> {
         let snapshot = format!("{}_{}", rule_code.noqa_code(), path.to_string_lossy());

diff --git a/crates/ruff_linter/src/rules/flake8_implicit_str_concat/rules/implicit.rs b/crates/ruff_linter/src/rules/flake8_implicit_str_concat/rules/implicit.rs
@@ -98,7 +98,6 @@ pub(crate) fn implicit(
     indexer: &Indexer,
 ) {
     for (a_token, b_token) in tokens
-        .up_to_first_unknown()
         .iter()
         .filter(|token| {
             token.kind() != TokenKind::Comment

diff --git a/...ts/ruff_linter__rules__flake8_implicit_str_concat__tests__ISC001_ISC_syntax_error.py.snap b/...ts/ruff_linter__rules__flake8_implicit_str_concat__tests__ISC001_ISC_syntax_error.py.snap
@@ -0,0 +1,181 @@
+---
+source: crates/ruff_linter/src/rules/flake8_implicit_str_concat/mod.rs
+---
+ISC_syntax_error.py:2:5: SyntaxError: missing closing quote in string literal
+  |
+1 | # The lexer doesn't emit a string token if it's unterminated
+2 | "a" "b
+  |     ^
+3 | "a" "b" "c
+4 | "a" """b
+  |
+
+ISC_syntax_error.py:2:7: SyntaxError: Expected a statement
+  |
+1 | # The lexer doesn't emit a string token if it's unterminated
+2 | "a" "b
+  |       ^
+3 | "a" "b" "c
+4 | "a" """b
+5 | c""" "d
+  |
+
+ISC_syntax_error.py:3:1: ISC001 Implicitly concatenated string literals on one line
+  |
+1 | # The lexer doesn't emit a string token if it's unterminated
+2 | "a" "b
+3 | "a" "b" "c
+  | ^^^^^^^ ISC001
+4 | "a" """b
+5 | c""" "d
+  |
+  = help: Combine string literals
+
+ISC_syntax_error.py:3:9: SyntaxError: missing closing quote in string literal
+  |
+1 | # The lexer doesn't emit a string token if it's unterminated
+2 | "a" "b
+3 | "a" "b" "c
+  |         ^
+4 | "a" """b
+5 | c""" "d
+  |
+
+ISC_syntax_error.py:3:11: SyntaxError: Expected a statement
+  |
+1 | # The lexer doesn't emit a string token if it's unterminated
+2 | "a" "b
+3 | "a" "b" "c
+  |           ^
+4 | "a" """b
+5 | c""" "d
+  |
+
+ISC_syntax_error.py:4:1: ISC001 Implicitly concatenated string literals on one line
+  |
+2 |   "a" "b
+3 |   "a" "b" "c
+4 | / "a" """b
+5 | | c""" "d
+  | |____^ ISC001
+6 |   
+7 |   # For f-strings, the `FStringRanges` won't contain the range for
+  |
+  = help: Combine string literals
+
+ISC_syntax_error.py:5:6: SyntaxError: missing closing quote in string literal
+  |
+3 | "a" "b" "c
+4 | "a" """b
+5 | c""" "d
+  |      ^
+6 | 
+7 | # For f-strings, the `FStringRanges` won't contain the range for
+  |
+
+ISC_syntax_error.py:5:8: SyntaxError: Expected a statement
+  |
+3 | "a" "b" "c
+4 | "a" """b
+5 | c""" "d
+  |        ^
+6 | 
+7 | # For f-strings, the `FStringRanges` won't contain the range for
+8 | # unterminated f-strings.
+  |
+
+ISC_syntax_error.py:9:8: SyntaxError: f-string: unterminated string
+   |
+ 7 | # For f-strings, the `FStringRanges` won't contain the range for
+ 8 | # unterminated f-strings.
+ 9 | f"a" f"b
+   |        ^
+10 | f"a" f"b" f"c
+11 | f"a" f"""b
+   |
+
+ISC_syntax_error.py:9:9: SyntaxError: Expected FStringEnd, found newline
+   |
+ 7 | # For f-strings, the `FStringRanges` won't contain the range for
+ 8 | # unterminated f-strings.
+ 9 | f"a" f"b
+   |         ^
+10 | f"a" f"b" f"c
+11 | f"a" f"""b
+12 | c""" f"d {e
+   |
+
+ISC_syntax_error.py:10:1: ISC001 Implicitly concatenated string literals on one line
+   |
+ 8 | # unterminated f-strings.
+ 9 | f"a" f"b
+10 | f"a" f"b" f"c
+   | ^^^^^^^^^ ISC001
+11 | f"a" f"""b
+12 | c""" f"d {e
+   |
+   = help: Combine string literals
+
+ISC_syntax_error.py:10:13: SyntaxError: f-string: unterminated string
+   |
+ 8 | # unterminated f-strings.
+ 9 | f"a" f"b
+10 | f"a" f"b" f"c
+   |             ^
+11 | f"a" f"""b
+12 | c""" f"d {e
+   |
+
+ISC_syntax_error.py:10:14: SyntaxError: Expected FStringEnd, found newline
+   |
+ 8 | # unterminated f-strings.
+ 9 | f"a" f"b
+10 | f"a" f"b" f"c
+   |              ^
+11 | f"a" f"""b
+12 | c""" f"d {e
+   |
+
+ISC_syntax_error.py:11:1: ISC001 Implicitly concatenated string literals on one line
+   |
+ 9 |   f"a" f"b
+10 |   f"a" f"b" f"c
+11 | / f"a" f"""b
+12 | | c""" f"d {e
+   | |____^ ISC001
+13 |   
+14 |   (
+   |
+   = help: Combine string literals
+
+ISC_syntax_error.py:16:5: SyntaxError: missing closing quote in string literal
+   |
+14 | (
+15 |     "a"
+16 |     "b
+   |     ^
+17 |     "c"
+18 |     "d"
+   |
+
+ISC_syntax_error.py:26:9: SyntaxError: f-string: unterminated triple-quoted string
+   |
+24 | (
+25 |     """abc"""
+26 |     f"""def
+   |         ^
+27 |     "g" "h"
+28 |     "i" "j"
+   |
+
+ISC_syntax_error.py:30:1: SyntaxError: unexpected EOF while parsing
+   |
+28 |     "i" "j"
+29 | )
+   |
+
+ISC_syntax_error.py:30:1: SyntaxError: f-string: unterminated string
+   |
+28 |     "i" "j"
+29 | )
+   |