-
Notifications
You must be signed in to change notification settings - Fork 1.1k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Sven Hager
committed
Oct 13, 2023
1 parent
4454fbf
commit 4ba7b3e
Showing
8 changed files
with
242 additions
and
0 deletions.
There are no files selected for viewing
44 changes: 44 additions & 0 deletions
44
crates/ruff_linter/resources/test/fixtures/pylint/unspecified_encoding.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,44 @@ | ||
import io | ||
import sys | ||
import tempfile | ||
import io as hugo | ||
import codecs | ||
|
||
# Errors. | ||
open("test.txt") | ||
io.TextIOWrapper(io.FileIO("test.txt")) | ||
hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
tempfile.NamedTemporaryFile("w") | ||
tempfile.TemporaryFile("w") | ||
codecs.open("test.txt") | ||
tempfile.SpooledTemporaryFile(0, "w") | ||
|
||
# Non-errors.
# An explicit `encoding` keyword is given.
open("test.txt", encoding="utf-8")
# A constant mode string containing "b" is treated as binary mode.
open("test.bin", "wb")
open("test.bin", mode="wb")
# `encoding` is supplied positionally as the fourth argument.
open("test.txt", "r", -1, "utf-8")
# The mode is not a constant string, so the rule treats it as unknown and stays silent.
open("test.txt", mode=sys.argv[1])

def func(*args, **kwargs):
    # `*args` / `**kwargs` might carry the encoding, so neither call is reported.
    open(*args)
    open("text.txt", **kwargs)

# `encoding` given by keyword, then positionally as the second argument.
io.TextIOWrapper(io.FileIO("test.txt"), encoding="utf-8")
io.TextIOWrapper(io.FileIO("test.txt"), "utf-8")
# tempfile helpers: encoding given, binary mode requested, or no mode at all
# (the rule treats a missing mode as the binary default).
tempfile.TemporaryFile("w", encoding="utf-8")
tempfile.TemporaryFile("w", -1, "utf-8")
tempfile.TemporaryFile("wb")
tempfile.TemporaryFile()
tempfile.NamedTemporaryFile("w", encoding="utf-8")
tempfile.NamedTemporaryFile("w", -1, "utf-8")
tempfile.NamedTemporaryFile("wb")
tempfile.NamedTemporaryFile()
# codecs.open: encoding keyword, binary mode, or positional arguments that reach
# past the encoding slot.
codecs.open("test.txt", encoding="utf-8")
codecs.open("test.bin", "wb")
codecs.open("test.bin", mode="wb")
# NOTE(review): Python documents codecs.open as (filename, mode, encoding, errors,
# buffering), so `-1` lands in `encoding` at runtime here -- confirm this case is intended.
codecs.open("test.txt", "r", -1, "utf-8")
# SpooledTemporaryFile takes `max_size` first, so `mode` is the second positional argument.
tempfile.SpooledTemporaryFile(0, "w", encoding="utf-8")
tempfile.SpooledTemporaryFile(0, "w", -1, "utf-8")
tempfile.SpooledTemporaryFile(0, "wb")
tempfile.SpooledTemporaryFile(0, )
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
118 changes: 118 additions & 0 deletions
118
crates/ruff_linter/src/rules/pylint/rules/unspecified_encoding.rs
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,118 @@ | ||
use ruff_diagnostics::{Diagnostic, Violation}; | ||
use ruff_macros::{derive_message_formats, violation}; | ||
use ruff_python_ast as ast; | ||
use ruff_text_size::Ranged; | ||
|
||
use crate::checkers::ast::Checker; | ||
|
||
/// ## What it does | ||
/// Checks for uses of `open` or similar calls without an explicit `encoding` argument. | ||
/// | ||
/// ## Why is this bad? | ||
/// Using `open` in text mode without an explicit encoding specified can lead to | ||
/// unportable code that leads to different behaviour on different systems. | ||
/// | ||
/// Instead, consider using the `encoding` parameter to explicitly enforce a specific encoding. | ||
/// | ||
/// ## Example | ||
/// ```python | ||
/// open("file.txt") | ||
/// ``` | ||
/// | ||
/// Use instead: | ||
/// ```python | ||
/// open("file.txt", encoding="utf-8") | ||
/// ``` | ||
/// | ||
/// ## References | ||
/// - [Python documentation: `open`](https://docs.python.org/3/library/functions.html#open) | ||
#[violation] | ||
pub struct UnspecifiedEncoding { | ||
function_name: String, | ||
} | ||
|
||
impl Violation for UnspecifiedEncoding { | ||
#[derive_message_formats] | ||
fn message(&self) -> String { | ||
format!( | ||
"`{}` {}without explicit `encoding` argument", | ||
self.function_name, | ||
if self.function_name == "open" { | ||
"in text mode " | ||
} else { | ||
"" | ||
} | ||
) | ||
} | ||
} | ||
|
||
fn is_binary_mode(expr: &ast::Expr) -> Option<bool> { | ||
Some(expr.as_constant_expr()?.value.as_str()?.value.contains("b")) | ||
} | ||
|
||
fn is_violation(call: &ast::ExprCall, path: &[&str]) -> bool { | ||
// this checks if we have something like *args which might contain the encoding argument | ||
if call.arguments.args.iter().any(|a| a.is_starred_expr()) { | ||
return false; | ||
} | ||
// this checks if we have something like **kwargs which might contain the encoding argument | ||
if call.arguments.keywords.iter().any(|a| a.arg.is_none()) { | ||
return false; | ||
} | ||
match path { | ||
["" | "codecs", "open"] => { | ||
if let Some(mode_arg) = call.arguments.find_argument("mode", 1) { | ||
if is_binary_mode(mode_arg).unwrap_or(true) { | ||
// binary mode or unknown mode is no violation | ||
return false; | ||
} | ||
} | ||
// else mode not specified, defaults to text mode | ||
call.arguments.find_argument("encoding", 3).is_none() | ||
} | ||
["io", "TextIOWrapper"] => call.arguments.find_argument("encoding", 1).is_none(), | ||
["tempfile", "TemporaryFile" | "NamedTemporaryFile" | "SpooledTemporaryFile"] => { | ||
let mode_pos = if path[1] == "SpooledTemporaryFile" { | ||
1 | ||
} else { | ||
0 | ||
}; | ||
|
||
if let Some(mode_arg) = call.arguments.find_argument("mode", mode_pos) { | ||
if is_binary_mode(mode_arg).unwrap_or(true) { | ||
// binary mode or unknown mode is no violation | ||
return false; | ||
} | ||
} else { | ||
// defaults to binary mode | ||
return false; | ||
} | ||
call.arguments | ||
.find_argument("encoding", mode_pos + 2) | ||
.is_none() | ||
} | ||
_ => false, | ||
} | ||
} | ||
|
||
/// PLW1514 | ||
pub(crate) fn unspecified_encoding(checker: &mut Checker, call: &ast::ExprCall) { | ||
let Some(path) = checker.semantic().resolve_call_path(&call.func) else { | ||
return; | ||
}; | ||
if is_violation(call, path.as_slice()) { | ||
let path_slice = if path[0] == "" { | ||
&path[1..] | ||
} else { | ||
&path[0..] | ||
}; | ||
let result = Diagnostic::new( | ||
UnspecifiedEncoding { | ||
function_name: path_slice.join("."), | ||
}, | ||
call.func.range(), | ||
); | ||
drop(path); | ||
checker.diagnostics.push(result); | ||
} | ||
} |
72 changes: 72 additions & 0 deletions
72
.../pylint/snapshots/ruff_linter__rules__pylint__tests__PLW1514_unspecified_encoding.py.snap
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,72 @@ | ||
--- | ||
source: crates/ruff_linter/src/rules/pylint/mod.rs | ||
--- | ||
unspecified_encoding.py:8:1: PLW1514 `open` in text mode without explicit `encoding` argument | ||
| | ||
7 | # Errors. | ||
8 | open("test.txt") | ||
| ^^^^ PLW1514 | ||
9 | io.TextIOWrapper(io.FileIO("test.txt")) | ||
10 | hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
| | ||
|
||
unspecified_encoding.py:9:1: PLW1514 `io.TextIOWrapper` without explicit `encoding` argument | ||
| | ||
7 | # Errors. | ||
8 | open("test.txt") | ||
9 | io.TextIOWrapper(io.FileIO("test.txt")) | ||
| ^^^^^^^^^^^^^^^^ PLW1514 | ||
10 | hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
11 | tempfile.NamedTemporaryFile("w") | ||
| | ||
|
||
unspecified_encoding.py:10:1: PLW1514 `io.TextIOWrapper` without explicit `encoding` argument | ||
| | ||
8 | open("test.txt") | ||
9 | io.TextIOWrapper(io.FileIO("test.txt")) | ||
10 | hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
| ^^^^^^^^^^^^^^^^^^ PLW1514 | ||
11 | tempfile.NamedTemporaryFile("w") | ||
12 | tempfile.TemporaryFile("w") | ||
| | ||
|
||
unspecified_encoding.py:11:1: PLW1514 `tempfile.NamedTemporaryFile` without explicit `encoding` argument | ||
| | ||
9 | io.TextIOWrapper(io.FileIO("test.txt")) | ||
10 | hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
11 | tempfile.NamedTemporaryFile("w") | ||
| ^^^^^^^^^^^^^^^^^^^^^^^^^^^ PLW1514 | ||
12 | tempfile.TemporaryFile("w") | ||
13 | codecs.open("test.txt") | ||
| | ||
|
||
unspecified_encoding.py:12:1: PLW1514 `tempfile.TemporaryFile` without explicit `encoding` argument | ||
| | ||
10 | hugo.TextIOWrapper(hugo.FileIO("test.txt")) | ||
11 | tempfile.NamedTemporaryFile("w") | ||
12 | tempfile.TemporaryFile("w") | ||
| ^^^^^^^^^^^^^^^^^^^^^^ PLW1514 | ||
13 | codecs.open("test.txt") | ||
14 | tempfile.SpooledTemporaryFile(0, "w") | ||
| | ||
|
||
unspecified_encoding.py:13:1: PLW1514 `codecs.open` without explicit `encoding` argument | ||
| | ||
11 | tempfile.NamedTemporaryFile("w") | ||
12 | tempfile.TemporaryFile("w") | ||
13 | codecs.open("test.txt") | ||
| ^^^^^^^^^^^ PLW1514 | ||
14 | tempfile.SpooledTemporaryFile(0, "w") | ||
| | ||
|
||
unspecified_encoding.py:14:1: PLW1514 `tempfile.SpooledTemporaryFile` without explicit `encoding` argument | ||
| | ||
12 | tempfile.TemporaryFile("w") | ||
13 | codecs.open("test.txt") | ||
14 | tempfile.SpooledTemporaryFile(0, "w") | ||
| ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ PLW1514 | ||
15 | | ||
16 | # Non-errors. | ||
| | ||
|
||
|
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Oops, something went wrong.