We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 705b606 commit d2d7453 (Copy full SHA for d2d7453)
gixy/core/regexp.py
@@ -26,7 +26,10 @@ def _build_reverse_list(original):
26
FIX_NAMED_GROUPS_RE = re.compile(r"(?<!\\)\(\?[<'](\w+)[>']")
27
28
CATEGORIES = {
29
- # Note: ASCII only, unicode not supported
+ # Note: ASCII-only character classes. While NGINX configs can contain unicode
30
+ # strings, NGINX's PCRE regex engine typically uses ASCII semantics for \w, \d, \s
31
+ # unless explicitly compiled with unicode support. This conservative approach is
32
+ # correct for security analysis since URLs are ASCII (unicode gets percent-encoded).
33
sre_parse.CATEGORY_SPACE: sre_parse.WHITESPACE,
34
sre_parse.CATEGORY_NOT_SPACE: _build_reverse_list(sre_parse.WHITESPACE),
35
sre_parse.CATEGORY_DIGIT: sre_parse.DIGITS,
0 commit comments