Unfortunately, checking for strings without context is exceedingly prone to false positives, while missing anything that indirectly opens a file. Python 3.10 has a feature to warn about this though -- and it uses a runtime check which runs at the same time that the code fails to open files in the broken Windows locale. Set this up automatically when running the testsuite. Sadly, Python's built-in feature to change the warning level, e.g. by setting EncodingWarning to error at startup, is utterly broken if you want to limit it to only certain modules. This is tracked, in order to be more efficiently ignored, at https://bugs.python.org/issue34624 and https://github.com/python/cpython/pull/9358. It is also very trigger-happy, and passing the setting around via an environment variable either messes with the testsuite, or with third-party programs which are implemented in Python *such as lots of gnome*, or perhaps both. Instead, add runtime code to meson itself, to add a hidden "feature". In the application source code, using the 'warnings' module, you can actually get the expected behavior that $PYTHONWARNINGS doesn't have. So check for a magic testsuite variable every time meson starts up, and if it is set, then go ahead and initialize a warnings filter that makes EncodingWarning fatal, but *only* when triggered via Meson and not arbitrary subprocess scripts.
pull/10112/head
parent
aa2b277c1a
commit
d910966991
5 changed files with 13 additions and 86 deletions
@ -1,76 +0,0 @@ |
||||
#!/usr/bin/env python3 |
||||
|
||||
from pathlib import Path |
||||
import typing as T |
||||
|
||||
# Absolute path of the directory that contains this script; files are
# globbed from here and reported relative to it.
root = Path(__file__).absolute().parent
# The 'mesonbuild' directory directly under root.
# NOTE(review): not referenced by the visible code -- confirm before removing.
mesonbuild = root.joinpath('mesonbuild')

# Only files whose root-relative POSIX path starts with one of these
# prefixes are scanned.
whitelist = [
    'mesonbuild/',
    'run_',
    'ci/',
    'tools/',
    'docs/',
]
||||
|
||||
def check_missing_encoding(lines: T.List[str], path: str) -> int:
    """Count file-opening calls in *lines* that lack an ``encoding=`` argument.

    Every line is searched for the first occurrence of a call to
    ``read_text``, ``write_text`` or ``open``.  A match is ignored when the
    name is merely the tail of a longer identifier (e.g. ``my_open(``), when
    the line contains the marker ``[ignore encoding]``, or -- for ``open``
    only -- when one of the known binary mode strings is passed.

    This is a purely textual, single-line heuristic: only the part of the
    argument list that sits on the same line as the call is inspected.

    Args:
        lines: Source lines of one file.
        path: File name, used only in the printed diagnostics.

    Returns:
        The number of offending calls.  One error line is printed to stdout
        for each of them.
    """
    functions = ['read_text', 'write_text', 'open']
    binary_modes = ['rb', 'br', 'r+b', 'wb', 'bw', 'ab', 'ba']
    errors = 0
    for num, line in enumerate(lines):
        # Lines carrying the opt-out marker are exempt for every function.
        if '[ignore encoding]' in line:
            continue

        for func in functions:
            # Do we have a match?
            loc = line.find(func + '(')
            if loc < 0:
                continue
            # A preceding identifier character means this is a different,
            # longer name (my_open, gzopen, ...), not one of the calls we
            # are looking for.
            if loc > 0:
                prev = line[loc - 1]
                if prev == '_' or prev.isalnum():
                    continue

            # Some preprocessing to make parsing easier: keep only the text
            # after the opening parenthesis, drop whitespace and normalise
            # quotes so the mode strings below can be matched literally.
            rest = line[loc + len(func) + 1:]
            rest = rest.replace(' ', '').replace('\t', '').replace('\n', '')
            rest = rest.replace('\'', '"')

            # Collect the top-level argument text of the call.  Text inside
            # nested parentheses is dropped (their opening '(' is kept).
            args = ''
            depth = 1
            for c in rest:
                if c == ')':
                    depth -= 1
                    if depth == 0:
                        break
                elif depth == 1:
                    args += c
                if c == '(':
                    depth += 1

            is_binary = any(f'"{mode}"' in args for mode in binary_modes)
            if 'encoding=' not in args and not (func == 'open' and is_binary):
                location = f'\x1b[33;1m[\x1b[0;1m{path}:{num+1}\x1b[33m]\x1b[0m'
                print(f'{location:<72}: \x1b[31;1mERROR:\x1b[0m Missing `encoding=` parameter in `{func}` call')
                errors += 1
    return errors
||||
|
||||
def main() -> int:
    """Scan the whitelisted Python files below ``root`` for missing ``encoding=``.

    Every ``*.py`` file found recursively under ``root`` whose root-relative
    POSIX path starts with one of the ``whitelist`` prefixes is read as UTF-8
    and passed to ``check_missing_encoding``.

    Returns:
        0 when no errors were found, 1 otherwise, so the value can be used
        directly as the process exit status.
    """
    print('Scanning mesonbuild...')
    prefixes = tuple(whitelist)
    errors = 0
    for i in sorted(root.glob('**/*.py')):
        filename = i.relative_to(root).as_posix()

        # Filter before reading, so files outside the whitelist are never
        # opened or decoded (an undecodable one must not abort the scan).
        if not filename.startswith(prefixes):
            continue

        lines = i.read_text(encoding='utf-8').splitlines()
        errors += check_missing_encoding(lines, filename)
    print(f'Found {errors} errors while scanning mesonbuild')
    return 0 if errors == 0 else 1
||||
|
||||
if __name__ == '__main__':
    # Run the scan and hand its result to the interpreter as the exit status.
    exit_status = main()
    raise SystemExit(exit_status)
Loading…
Reference in new issue