Current Path: > > lib64 > > python3.8
Operation : Linux premium107.web-hosting.com 4.18.0-553.44.1.lve.el8.x86_64 #1 SMP Thu Mar 13 14:29:12 UTC 2025 x86_64 Software : Apache Server IP : 198.54.126.246 | Your IP: 216.73.216.181 Domains : 1034 Domain(s) Permission : [ 0755 ]
| Name | Type | Size | Last Modified | Actions |
|---|---|---|---|---|
| __pycache__ | Directory | - | - | |
| asyncio | Directory | - | - | |
| collections | Directory | - | - | |
| concurrent | Directory | - | - | |
| config-3.8-x86_64-linux-gnu | Directory | - | - | |
| ctypes | Directory | - | - | |
| curses | Directory | - | - | |
| dbm | Directory | - | - | |
| distutils | Directory | - | - | |
| email | Directory | - | - | |
| encodings | Directory | - | - | |
| ensurepip | Directory | - | - | |
| html | Directory | - | - | |
| http | Directory | - | - | |
| importlib | Directory | - | - | |
| json | Directory | - | - | |
| lib-dynload | Directory | - | - | |
| lib2to3 | Directory | - | - | |
| logging | Directory | - | - | |
| multiprocessing | Directory | - | - | |
| pydoc_data | Directory | - | - | |
| site-packages | Directory | - | - | |
| sqlite3 | Directory | - | - | |
| tkinter | Directory | - | - | |
| turtledemo | Directory | - | - | |
| unittest | Directory | - | - | |
| urllib | Directory | - | - | |
| venv | Directory | - | - | |
| wsgiref | Directory | - | - | |
| xml | Directory | - | - | |
| xmlrpc | Directory | - | - | |
| LICENSE.txt | File | 13937 bytes | June 06 2023 13:32:21. | |
| __future__.py | File | 5147 bytes | June 06 2023 13:32:21. | |
| __phello__.foo.py | File | 64 bytes | June 06 2023 13:32:21. | |
| _bootlocale.py | File | 1801 bytes | June 06 2023 13:32:21. | |
| _collections_abc.py | File | 26100 bytes | June 06 2023 13:32:21. | |
| _compat_pickle.py | File | 8749 bytes | June 06 2023 13:32:21. | |
| _compression.py | File | 5340 bytes | June 06 2023 13:32:21. | |
| _dummy_thread.py | File | 6027 bytes | June 06 2023 13:32:21. | |
| _markupbase.py | File | 14598 bytes | June 06 2023 13:32:21. | |
| _osx_support.py | File | 21774 bytes | June 06 2023 13:32:21. | |
| _py_abc.py | File | 6189 bytes | June 06 2023 13:32:21. | |
| _pydecimal.py | File | 228666 bytes | June 06 2023 13:32:21. | |
| _pyio.py | File | 93177 bytes | June 06 2023 13:32:21. | |
| _sitebuiltins.py | File | 3115 bytes | June 06 2023 13:32:21. | |
| _strptime.py | File | 25268 bytes | June 06 2023 13:32:21. | |
| _sysconfigdata__linux_x86_64-linux-gnu.py | File | 38510 bytes | October 17 2023 18:12:19. | |
| _sysconfigdata_d_linux_x86_64-linux-gnu.py | File | 38237 bytes | October 17 2023 18:03:44. | |
| _threading_local.py | File | 7220 bytes | June 06 2023 13:32:21. | |
| _weakrefset.py | File | 5735 bytes | June 06 2023 13:32:21. | |
| abc.py | File | 4489 bytes | June 06 2023 13:32:21. | |
| aifc.py | File | 32814 bytes | June 06 2023 13:32:21. | |
| antigravity.py | File | 477 bytes | June 06 2023 13:32:21. | |
| argparse.py | File | 96015 bytes | June 06 2023 13:32:21. | |
| ast.py | File | 19234 bytes | June 06 2023 13:32:21. | |
| asynchat.py | File | 11328 bytes | June 06 2023 13:32:21. | |
| asyncore.py | File | 20094 bytes | June 06 2023 13:32:21. | |
| base64.py | File | 20382 bytes | June 06 2023 13:32:21. | |
| bdb.py | File | 32056 bytes | June 06 2023 13:32:21. | |
| binhex.py | File | 13954 bytes | June 06 2023 13:32:21. | |
| bisect.py | File | 2214 bytes | June 06 2023 13:32:21. | |
| bz2.py | File | 12558 bytes | June 06 2023 13:32:21. | |
| cProfile.py | File | 7010 bytes | June 06 2023 13:32:21. | |
| calendar.py | File | 24832 bytes | June 06 2023 13:32:21. | |
| cgi.py | File | 33934 bytes | October 17 2023 18:02:14. | |
| cgitb.py | File | 12096 bytes | June 06 2023 13:32:21. | |
| chunk.py | File | 5435 bytes | June 06 2023 13:32:21. | |
| cmd.py | File | 14860 bytes | June 06 2023 13:32:21. | |
| code.py | File | 10622 bytes | June 06 2023 13:32:21. | |
| codecs.py | File | 36667 bytes | June 06 2023 13:32:21. | |
| codeop.py | File | 6330 bytes | June 06 2023 13:32:21. | |
| colorsys.py | File | 4064 bytes | June 06 2023 13:32:21. | |
| compileall.py | File | 13678 bytes | June 06 2023 13:32:21. | |
| configparser.py | File | 54374 bytes | June 06 2023 13:32:21. | |
| contextlib.py | File | 24995 bytes | June 06 2023 13:32:21. | |
| contextvars.py | File | 129 bytes | June 06 2023 13:32:21. | |
| copy.py | File | 8661 bytes | June 06 2023 13:32:21. | |
| copyreg.py | File | 7135 bytes | June 06 2023 13:32:21. | |
| crypt.py | File | 3610 bytes | June 06 2023 13:32:21. | |
| csv.py | File | 16144 bytes | June 06 2023 13:32:21. | |
| dataclasses.py | File | 49973 bytes | June 06 2023 13:32:21. | |
| datetime.py | File | 88287 bytes | June 06 2023 13:32:21. | |
| decimal.py | File | 320 bytes | June 06 2023 13:32:21. | |
| difflib.py | File | 84058 bytes | June 06 2023 13:32:21. | |
| dis.py | File | 20570 bytes | June 06 2023 13:32:21. | |
| doctest.py | File | 104543 bytes | June 06 2023 13:32:21. | |
| dummy_threading.py | File | 2815 bytes | June 06 2023 13:32:21. | |
| enum.py | File | 38136 bytes | June 06 2023 13:32:21. | |
| filecmp.py | File | 9830 bytes | June 06 2023 13:32:21. | |
| fileinput.py | File | 14709 bytes | June 06 2023 13:32:21. | |
| fnmatch.py | File | 4079 bytes | June 06 2023 13:32:21. | |
| formatter.py | File | 15143 bytes | June 06 2023 13:32:21. | |
| fractions.py | File | 24329 bytes | June 06 2023 13:32:21. | |
| ftplib.py | File | 35129 bytes | June 06 2023 13:32:21. | |
| functools.py | File | 37406 bytes | June 06 2023 13:32:21. | |
| genericpath.py | File | 4975 bytes | June 06 2023 13:32:21. | |
| getopt.py | File | 7489 bytes | June 06 2023 13:32:21. | |
| getpass.py | File | 5994 bytes | June 06 2023 13:32:21. | |
| gettext.py | File | 27138 bytes | June 06 2023 13:32:21. | |
| glob.py | File | 5697 bytes | June 06 2023 13:32:21. | |
| gzip.py | File | 21413 bytes | June 06 2023 13:32:21. | |
| hashlib.py | File | 8333 bytes | October 17 2023 18:02:14. | |
| heapq.py | File | 22877 bytes | June 06 2023 13:32:21. | |
| hmac.py | File | 7850 bytes | October 17 2023 18:02:14. | |
| imaplib.py | File | 53606 bytes | June 06 2023 13:32:21. | |
| imghdr.py | File | 3808 bytes | June 06 2023 13:32:21. | |
| imp.py | File | 10536 bytes | June 06 2023 13:32:21. | |
| inspect.py | File | 118550 bytes | June 06 2023 13:32:21. | |
| io.py | File | 3541 bytes | June 06 2023 13:32:21. | |
| ipaddress.py | File | 71644 bytes | June 06 2023 13:32:21. | |
| keyword.py | File | 945 bytes | June 06 2023 13:32:21. | |
| linecache.py | File | 5330 bytes | June 06 2023 13:32:21. | |
| locale.py | File | 78191 bytes | June 06 2023 13:32:21. | |
| lzma.py | File | 12983 bytes | June 06 2023 13:32:21. | |
| mailbox.py | File | 78661 bytes | June 06 2023 13:32:21. | |
| mailcap.py | File | 9067 bytes | June 06 2023 13:32:21. | |
| mimetypes.py | File | 21664 bytes | June 06 2023 13:32:21. | |
| modulefinder.py | File | 24430 bytes | June 06 2023 13:32:21. | |
| netrc.py | File | 5566 bytes | June 06 2023 13:32:21. | |
| nntplib.py | File | 43261 bytes | June 06 2023 13:32:21. | |
| ntpath.py | File | 27734 bytes | June 06 2023 13:32:21. | |
| nturl2path.py | File | 2887 bytes | June 06 2023 13:32:21. | |
| numbers.py | File | 10244 bytes | June 06 2023 13:32:21. | |
| opcode.py | File | 5808 bytes | June 06 2023 13:32:21. | |
| operator.py | File | 10711 bytes | June 06 2023 13:32:21. | |
| optparse.py | File | 60369 bytes | June 06 2023 13:32:21. | |
| os.py | File | 38995 bytes | June 06 2023 13:32:21. | |
| pathlib.py | File | 52610 bytes | June 06 2023 13:32:21. | |
| pdb.py | File | 62738 bytes | June 06 2023 13:32:21. | |
| pickle.py | File | 64467 bytes | June 06 2023 13:32:21. | |
| pickletools.py | File | 93486 bytes | June 06 2023 13:32:21. | |
| pipes.py | File | 8916 bytes | June 06 2023 13:32:21. | |
| pkgutil.py | File | 21500 bytes | June 06 2023 13:32:21. | |
| platform.py | File | 40425 bytes | June 06 2023 13:32:21. | |
| plistlib.py | File | 32220 bytes | June 06 2023 13:32:21. | |
| poplib.py | File | 15077 bytes | June 06 2023 13:32:21. | |
| posixpath.py | File | 15627 bytes | June 06 2023 13:32:21. | |
| pprint.py | File | 21484 bytes | June 06 2023 13:32:21. | |
| profile.py | File | 23546 bytes | June 06 2023 13:32:21. | |
| pstats.py | File | 27345 bytes | June 06 2023 13:32:21. | |
| pty.py | File | 4807 bytes | June 06 2023 13:32:21. | |
| py_compile.py | File | 8203 bytes | October 17 2023 18:02:14. | |
| pyclbr.py | File | 15255 bytes | June 06 2023 13:32:21. | |
| pydoc.py | File | 106700 bytes | October 17 2023 18:12:57. | |
| queue.py | File | 11356 bytes | June 06 2023 13:32:21. | |
| quopri.py | File | 7252 bytes | June 06 2023 13:32:21. | |
| random.py | File | 28802 bytes | June 06 2023 13:32:21. | |
| re.py | File | 15861 bytes | June 06 2023 13:32:21. | |
| reprlib.py | File | 5267 bytes | June 06 2023 13:32:21. | |
| rlcompleter.py | File | 7097 bytes | June 06 2023 13:32:21. | |
| runpy.py | File | 12052 bytes | June 06 2023 13:32:21. | |
| sched.py | File | 6442 bytes | June 06 2023 13:32:21. | |
| secrets.py | File | 2038 bytes | June 06 2023 13:32:21. | |
| selectors.py | File | 18561 bytes | June 06 2023 13:32:21. | |
| shelve.py | File | 8527 bytes | June 06 2023 13:32:21. | |
| shlex.py | File | 13325 bytes | June 06 2023 13:32:21. | |
| shutil.py | File | 51761 bytes | June 06 2023 13:32:21. | |
| signal.py | File | 2273 bytes | June 06 2023 13:32:21. | |
| site.py | File | 21838 bytes | October 17 2023 18:02:14. | |
| smtpd.py | File | 34709 bytes | June 06 2023 13:32:21. | |
| smtplib.py | File | 45001 bytes | June 06 2023 13:32:21. | |
| sndhdr.py | File | 7099 bytes | June 06 2023 13:32:21. | |
| socket.py | File | 35243 bytes | June 06 2023 13:32:21. | |
| socketserver.py | File | 27296 bytes | June 06 2023 13:32:21. | |
| sre_compile.py | File | 26695 bytes | June 06 2023 13:32:21. | |
| sre_constants.py | File | 7154 bytes | June 06 2023 13:32:21. | |
| sre_parse.py | File | 40230 bytes | June 06 2023 13:32:21. | |
| ssl.py | File | 50760 bytes | June 06 2023 13:32:21. | |
| stat.py | File | 5485 bytes | June 06 2023 13:32:21. | |
| statistics.py | File | 39690 bytes | June 06 2023 13:32:21. | |
| string.py | File | 10535 bytes | June 06 2023 13:32:21. | |
| stringprep.py | File | 12917 bytes | June 06 2023 13:32:21. | |
| struct.py | File | 257 bytes | June 06 2023 13:32:21. | |
| subprocess.py | File | 78250 bytes | June 06 2023 13:32:21. | |
| sunau.py | File | 18375 bytes | June 06 2023 13:32:21. | |
| symbol.py | File | 2109 bytes | October 17 2023 18:04:15. | |
| symtable.py | File | 8021 bytes | June 06 2023 13:32:21. | |
| sysconfig.py | File | 24896 bytes | October 17 2023 18:12:55. | |
| tabnanny.py | File | 11406 bytes | June 06 2023 13:32:21. | |
| tarfile.py | File | 106473 bytes | October 17 2023 18:02:14. | |
| telnetlib.py | File | 23254 bytes | June 06 2023 13:32:21. | |
| tempfile.py | File | 27537 bytes | June 06 2023 13:32:21. | |
| textwrap.py | File | 19407 bytes | June 06 2023 13:32:21. | |
| this.py | File | 1003 bytes | June 06 2023 13:32:21. | |
| threading.py | File | 50820 bytes | June 06 2023 13:32:21. | |
| timeit.py | File | 13480 bytes | June 06 2023 13:32:21. | |
| token.py | File | 2368 bytes | June 06 2023 13:32:21. | |
| tokenize.py | File | 25841 bytes | June 06 2023 13:32:21. | |
| trace.py | File | 29870 bytes | June 06 2023 13:32:21. | |
| traceback.py | File | 23611 bytes | June 06 2023 13:32:21. | |
| tracemalloc.py | File | 17076 bytes | June 06 2023 13:32:21. | |
| tty.py | File | 879 bytes | June 06 2023 13:32:21. | |
| turtle.py | File | 143716 bytes | June 06 2023 13:32:21. | |
| types.py | File | 9713 bytes | June 06 2023 13:32:21. | |
| typing.py | File | 68962 bytes | June 06 2023 13:32:21. | |
| uu.py | File | 7277 bytes | October 17 2023 18:12:57. | |
| uuid.py | File | 30515 bytes | October 17 2023 18:02:14. | |
| warnings.py | File | 19688 bytes | June 06 2023 13:32:21. | |
| wave.py | File | 18230 bytes | June 06 2023 13:32:21. | |
| weakref.py | File | 21387 bytes | June 06 2023 13:32:21. | |
| webbrowser.py | File | 24083 bytes | June 06 2023 13:32:21. | |
| xdrlib.py | File | 5913 bytes | June 06 2023 13:32:21. | |
| zipapp.py | File | 7535 bytes | June 06 2023 13:32:21. | |
| zipfile.py | File | 87728 bytes | June 06 2023 13:32:21. | |
| zipimport.py | File | 30765 bytes | June 06 2023 13:32:21. |
#
# Secret Labs' Regular Expression Engine
#
# convert template to internal format
#
# Copyright (c) 1997-2001 by Secret Labs AB. All rights reserved.
#
# See the sre.py file for information on usage and redistribution.
#
"""Internal support module for sre"""
import _sre
import sre_parse
from sre_constants import *
assert _sre.MAGIC == MAGIC, "SRE module mismatch"
# Opcode groups used for membership tests while compiling.
# _compile() dispatches on the first four; _simple() consults _UNIT_CODES.
_LITERAL_CODES = {LITERAL, NOT_LITERAL}
_REPEATING_CODES = {REPEAT, MIN_REPEAT, MAX_REPEAT}
_SUCCESS_CODES = {SUCCESS, FAILURE}
_ASSERT_CODES = {ASSERT, ASSERT_NOT}
# Single-item operators: the literal codes plus ANY and IN.
_UNIT_CODES = _LITERAL_CODES | {ANY, IN}
# Groups of lowercase code points whose members all share one uppercase form.
_equivalences = (
    (0x69, 0x131),            # LATIN SMALL LETTER I / DOTLESS I
    (0x73, 0x17f),            # LATIN SMALL LETTER S / LONG S
    (0xb5, 0x3bc),            # MICRO SIGN / GREEK SMALL LETTER MU
    (0x345, 0x3b9, 0x1fbe),   # COMBINING GREEK YPOGEGRAMMENI / IOTA / PROSGEGRAMMENI
    (0x390, 0x1fd3),          # GREEK IOTA WITH DIALYTIKA AND TONOS / AND OXIA
    (0x3b0, 0x1fe3),          # GREEK UPSILON WITH DIALYTIKA AND TONOS / AND OXIA
    (0x3b2, 0x3d0),           # GREEK SMALL LETTER BETA / BETA SYMBOL
    (0x3b5, 0x3f5),           # GREEK SMALL LETTER EPSILON / LUNATE EPSILON SYMBOL
    (0x3b8, 0x3d1),           # GREEK SMALL LETTER THETA / THETA SYMBOL
    (0x3ba, 0x3f0),           # GREEK SMALL LETTER KAPPA / KAPPA SYMBOL
    (0x3c0, 0x3d6),           # GREEK SMALL LETTER PI / PI SYMBOL
    (0x3c1, 0x3f1),           # GREEK SMALL LETTER RHO / RHO SYMBOL
    (0x3c2, 0x3c3),           # GREEK SMALL LETTER FINAL SIGMA / SIGMA
    (0x3c6, 0x3d5),           # GREEK SMALL LETTER PHI / PHI SYMBOL
    (0x1e61, 0x1e9b),         # LATIN SMALL S WITH DOT ABOVE / LONG S WITH DOT ABOVE
    (0xfb05, 0xfb06),         # LATIN SMALL LIGATURE LONG S T / LIGATURE ST
)

# For each code point in a group above: the tuple of the *other* members of
# that group, i.e. the extra lowercase codes with the same uppercase.
_ignorecase_fixes = {
    code: tuple(other for other in group if code != other)
    for group in _equivalences
    for code in group
}
def _combine_flags(flags, add_flags, del_flags,
                   TYPE_FLAGS=sre_parse.TYPE_FLAGS):
    """Return *flags* with *add_flags* switched on and *del_flags* switched off.

    If *add_flags* carries any of the TYPE_FLAGS bits, every TYPE_FLAGS bit
    is first cleared from *flags*, so the added type flag replaces the
    inherited one instead of being combined with it.
    """
    base = flags & ~TYPE_FLAGS if add_flags & TYPE_FLAGS else flags
    return (base | add_flags) & ~del_flags
def _compile(code, pattern, flags):
    """Compile a parsed (sub)pattern into opcodes appended to *code*.

    code    -- list that receives the emitted opcodes and operands
               (mutated in place; nothing is returned).
    pattern -- iterable of (op, av) pairs.
    flags   -- SRE_FLAG_* bit mask selecting case/locale/unicode handling.

    Raises ``error`` for a repeat under SRE_FLAG_TEMPLATE, for a
    look-behind whose minimum and maximum widths differ, and for an
    operator this function does not recognise.
    """
    # internal: compile a (sub)pattern
    # Bind frequently used callables and module globals to local names.
    emit = code.append
    _len = len
    LITERAL_CODES = _LITERAL_CODES
    REPEATING_CODES = _REPEATING_CODES
    SUCCESS_CODES = _SUCCESS_CODES
    ASSERT_CODES = _ASSERT_CODES
    # Case helpers stay None unless IGNORECASE is set without LOCALE;
    # `fixes` is only set for the Unicode case.
    iscased = None
    tolower = None
    fixes = None
    if flags & SRE_FLAG_IGNORECASE and not flags & SRE_FLAG_LOCALE:
        if flags & SRE_FLAG_UNICODE:
            iscased = _sre.unicode_iscased
            tolower = _sre.unicode_tolower
            fixes = _ignorecase_fixes
        else:
            iscased = _sre.ascii_iscased
            tolower = _sre.ascii_tolower
    for op, av in pattern:
        if op in LITERAL_CODES:
            if not flags & SRE_FLAG_IGNORECASE:
                emit(op)
                emit(av)
            elif flags & SRE_FLAG_LOCALE:
                emit(OP_LOCALE_IGNORE[op])
                emit(av)
            elif not iscased(av):
                # Uncased character: the plain opcode is sufficient.
                emit(op)
                emit(av)
            else:
                lo = tolower(av)
                if not fixes: # ascii
                    emit(OP_IGNORE[op])
                    emit(lo)
                elif lo not in fixes:
                    emit(OP_UNICODE_IGNORE[op])
                    emit(lo)
                else:
                    # The lowercase form has extra equivalents: emit a small
                    # set holding `lo` and every code listed in fixes[lo].
                    emit(IN_UNI_IGNORE)
                    # Reserve a slot for the skip count; patched below.
                    skip = _len(code); emit(0)
                    if op is NOT_LITERAL:
                        emit(NEGATE)
                    for k in (lo,) + fixes[lo]:
                        emit(LITERAL)
                        emit(k)
                    emit(FAILURE)
                    code[skip] = _len(code) - skip
        elif op is IN:
            charset, hascased = _optimize_charset(av, iscased, tolower, fixes)
            if flags & SRE_FLAG_IGNORECASE and flags & SRE_FLAG_LOCALE:
                emit(IN_LOC_IGNORE)
            elif not hascased:
                emit(IN)
            elif not fixes: # ascii
                emit(IN_IGNORE)
            else:
                emit(IN_UNI_IGNORE)
            # Reserve the skip slot, emit the set body, then patch the slot.
            skip = _len(code); emit(0)
            _compile_charset(charset, flags, code)
            code[skip] = _len(code) - skip
        elif op is ANY:
            if flags & SRE_FLAG_DOTALL:
                emit(ANY_ALL)
            else:
                emit(ANY)
        elif op in REPEATING_CODES:
            if flags & SRE_FLAG_TEMPLATE:
                raise error("internal: unsupported template operator %r" % (op,))
            if _simple(av[2]):
                # Body is a single simple item: use the *_ONE opcodes.
                if op is MAX_REPEAT:
                    emit(REPEAT_ONE)
                else:
                    emit(MIN_REPEAT_ONE)
                skip = _len(code); emit(0)
                emit(av[0])
                emit(av[1])
                _compile(code, av[2], flags)
                emit(SUCCESS)
                code[skip] = _len(code) - skip
            else:
                # General repeat: REPEAT <skip> <av[0]> <av[1]> body, followed
                # by MAX_UNTIL or MIN_UNTIL.
                emit(REPEAT)
                skip = _len(code); emit(0)
                emit(av[0])
                emit(av[1])
                _compile(code, av[2], flags)
                code[skip] = _len(code) - skip
                if op is MAX_REPEAT:
                    emit(MAX_UNTIL)
                else:
                    emit(MIN_UNTIL)
        elif op is SUBPATTERN:
            group, add_flags, del_flags, p = av
            # A truthy group number is bracketed by a pair of MARK opcodes
            # with indices (group-1)*2 and (group-1)*2+1.
            if group:
                emit(MARK)
                emit((group-1)*2)
            # _compile_info(code, p, _combine_flags(flags, add_flags, del_flags))
            _compile(code, p, _combine_flags(flags, add_flags, del_flags))
            if group:
                emit(MARK)
                emit((group-1)*2+1)
        elif op in SUCCESS_CODES:
            emit(op)
        elif op in ASSERT_CODES:
            emit(op)
            skip = _len(code); emit(0)
            if av[0] >= 0:
                emit(0) # look ahead
            else:
                lo, hi = av[1].getwidth()
                if lo != hi:
                    raise error("look-behind requires fixed-width pattern")
                emit(lo) # look behind
            _compile(code, av[1], flags)
            emit(SUCCESS)
            code[skip] = _len(code) - skip
        elif op is CALL:
            emit(op)
            skip = _len(code); emit(0)
            _compile(code, av, flags)
            emit(SUCCESS)
            code[skip] = _len(code) - skip
        elif op is AT:
            emit(op)
            # Remap the position code for MULTILINE, then for LOCALE or
            # UNICODE; codes missing from a table are left unchanged.
            if flags & SRE_FLAG_MULTILINE:
                av = AT_MULTILINE.get(av, av)
            if flags & SRE_FLAG_LOCALE:
                av = AT_LOCALE.get(av, av)
            elif flags & SRE_FLAG_UNICODE:
                av = AT_UNICODE.get(av, av)
            emit(av)
        elif op is BRANCH:
            emit(op)
            # `tail` collects the positions of each alternative's JUMP operand
            # so they can all be patched to point past the whole branch.
            tail = []
            tailappend = tail.append
            # NOTE: the loop variable rebinds `av` to each alternative.
            for av in av[1]:
                skip = _len(code); emit(0)
                # _compile_info(code, av, flags)
                _compile(code, av, flags)
                emit(JUMP)
                tailappend(_len(code)); emit(0)
                code[skip] = _len(code) - skip
            emit(FAILURE) # end of branch
            # NOTE: the loop variable rebinds `tail` to each saved position.
            for tail in tail:
                code[tail] = _len(code) - tail
        elif op is CATEGORY:
            emit(op)
            if flags & SRE_FLAG_LOCALE:
                av = CH_LOCALE[av]
            elif flags & SRE_FLAG_UNICODE:
                av = CH_UNICODE[av]
            emit(av)
        elif op is GROUPREF:
            if not flags & SRE_FLAG_IGNORECASE:
                emit(op)
            elif flags & SRE_FLAG_LOCALE:
                emit(GROUPREF_LOC_IGNORE)
            elif not fixes: # ascii
                emit(GROUPREF_IGNORE)
            else:
                emit(GROUPREF_UNI_IGNORE)
            emit(av-1)
        elif op is GROUPREF_EXISTS:
            emit(op)
            emit(av[0]-1)
            skipyes = _len(code); emit(0)
            _compile(code, av[1], flags)
            if av[2]:
                # There is an else-part: jump over it after the yes-part.
                emit(JUMP)
                skipno = _len(code); emit(0)
                code[skipyes] = _len(code) - skipyes + 1
                _compile(code, av[2], flags)
                code[skipno] = _len(code) - skipno
            else:
                code[skipyes] = _len(code) - skipyes + 1
        else:
            raise error("internal: unsupported operand type %r" % (op,))
def _compile_charset(charset, flags, code):
    """Append the set subprogram for *charset* to *code*.

    Each (op, av) item is written as its opcode followed by its operands;
    the subprogram is terminated with FAILURE.  CATEGORY operands are
    remapped through CH_LOCALE or CH_UNICODE when the matching flag is set.
    Raises ``error`` for an operator that is not a known set operator.
    """
    push = code.append
    for opcode, arg in charset:
        push(opcode)
        if opcode is NEGATE:
            # NEGATE carries no operand.
            continue
        if opcode is LITERAL:
            push(arg)
        elif opcode is RANGE or opcode is RANGE_UNI_IGNORE:
            push(arg[0])
            push(arg[1])
        elif opcode is CHARSET or opcode is BIGCHARSET:
            # Both bitmap forms store their words inline.
            code.extend(arg)
        elif opcode is CATEGORY:
            if flags & SRE_FLAG_LOCALE:
                arg = CH_LOCALE[arg]
            elif flags & SRE_FLAG_UNICODE:
                arg = CH_UNICODE[arg]
            push(arg)
        else:
            raise error("internal: unsupported set operator %r" % (opcode,))
    push(FAILURE)
def _optimize_charset(charset, iscased=None, fixup=None, fixes=None):
    """Return ``(charset, hascased)`` with *charset* in a compact form.

    charset -- list of (op, av) set items.
    iscased -- optional predicate called on character codes; only used
               when *fixup* is given.
    fixup   -- optional callable applied to each code before it is recorded
               (_compile passes its ``tolower`` helper here).
    fixes   -- optional mapping from a code to further codes that must be
               recorded together with it.

    The result is one of: at most two LITERAL/RANGE runs, a CHARSET bitmap
    (all codes below 256), or a BIGCHARSET chunked bitmap (codes below
    65536), each followed by the items that could not be put in the map.
    ``hascased`` reports whether a cased character was seen while *fixup*
    was active.
    """
    # internal: optimize character set
    out = []      # NEGATE markers first, then the compacted items
    tail = []     # items kept verbatim (not representable in charmap)
    charmap = bytearray(256)
    hascased = False
    for op, av in charset:
        # The loop retries the same item once after growing charmap.
        while True:
            try:
                if op is LITERAL:
                    if fixup:
                        lo = fixup(av)
                        charmap[lo] = 1
                        if fixes and lo in fixes:
                            for k in fixes[lo]:
                                charmap[k] = 1
                        if not hascased and iscased(av):
                            hascased = True
                    else:
                        charmap[av] = 1
                elif op is RANGE:
                    r = range(av[0], av[1]+1)
                    if fixup:
                        if fixes:
                            for i in map(fixup, r):
                                charmap[i] = 1
                                if i in fixes:
                                    for k in fixes[i]:
                                        charmap[k] = 1
                        else:
                            for i in map(fixup, r):
                                charmap[i] = 1
                        if not hascased:
                            hascased = any(map(iscased, r))
                    else:
                        for i in r:
                            charmap[i] = 1
                elif op is NEGATE:
                    out.append((op, av))
                else:
                    tail.append((op, av))
            except IndexError:
                # A code did not fit in charmap.
                if len(charmap) == 256:
                    # character set contains non-UCS1 character codes
                    # Grow the map from 256 to 65536 entries and retry.
                    charmap += b'\0' * 0xff00
                    continue
                # Character set contains non-BMP character codes.
                if fixup:
                    hascased = True
                    # There are only two ranges of cased non-BMP characters:
                    # 10400-1044F (Deseret) and 118A0-118DF (Warang Citi),
                    # and for both ranges RANGE_UNI_IGNORE works.
                    if op is RANGE:
                        op = RANGE_UNI_IGNORE
                tail.append((op, av))
            break
    # compress character map
    # Collect runs of consecutive set entries as half-open (start, end)
    # pairs; give up (runs = None) when a third run is found.
    runs = []
    q = 0
    while True:
        p = charmap.find(1, q)
        if p < 0:
            break
        if len(runs) >= 2:
            runs = None
            break
        q = charmap.find(0, p)
        if q < 0:
            runs.append((p, len(charmap)))
            break
        runs.append((p, q))
    if runs is not None:
        # use literal/range
        for p, q in runs:
            if q - p == 1:
                out.append((LITERAL, p))
            else:
                out.append((RANGE, (p, q - 1)))
        out += tail
        # if the case was changed or new representation is more compact
        if hascased or len(out) < len(charset):
            return out, hascased
        # else original character set is good enough
        return charset, hascased
    # use bitmap
    if len(charmap) == 256:
        data = _mk_bitmap(charmap)
        out.append((CHARSET, data))
        out += tail
        return out, hascased
    # To represent a big charset, first a bitmap of all characters in the
    # set is constructed. Then, this bitmap is sliced into chunks of 256
    # characters, duplicate chunks are eliminated, and each chunk is
    # given a number. In the compiled expression, the charset is
    # represented by a 32-bit word sequence, consisting of one word for
    # the number of different chunks, a sequence of 256 bytes (64 words)
    # of chunk numbers indexed by their original chunk position, and a
    # sequence of 256-bit chunks (8 words each).
    # Compression is normally good: in a typical charset, large ranges of
    # Unicode will be either completely excluded (e.g. if only cyrillic
    # letters are to be matched), or completely included (e.g. if large
    # subranges of Kanji match). These ranges will be represented by
    # chunks of all one-bits or all zero-bits.
    # Matching can be also done efficiently: the more significant byte of
    # the Unicode character is an index into the chunk number, and the
    # less significant byte is a bit index in the chunk (just like the
    # CHARSET matching).
    charmap = bytes(charmap) # should be hashable
    comps = {}                  # chunk bytes -> assigned chunk number
    mapping = bytearray(256)    # chunk position -> chunk number
    block = 0                   # count of distinct chunks so far
    data = bytearray()          # the distinct chunks, concatenated
    for i in range(0, 65536, 256):
        chunk = charmap[i: i + 256]
        if chunk in comps:
            mapping[i // 256] = comps[chunk]
        else:
            mapping[i // 256] = comps[chunk] = block
            block += 1
            data += chunk
    data = _mk_bitmap(data)
    # Prepend the chunk count and the position-to-chunk mapping words.
    data[0:0] = [block] + _bytes_to_codes(mapping)
    out.append((BIGCHARSET, data))
    out += tail
    return out, hascased
# Number of bits in one code word, and the largest value a word can hold.
_CODEBITS = _sre.CODESIZE * 8
MAXCODE = (1 << _CODEBITS) - 1
# bytes.translate() table: byte 0 becomes b'0', every other byte b'1'.
_BITS_TRANS = b'0' + b'1' * 255


def _mk_bitmap(bits, _CODEBITS=_CODEBITS, _int=int):
    """Pack a bytes-like map of 0/non-0 flags into a list of code words.

    Entry ``k`` of *bits* becomes bit ``k % _CODEBITS`` of word
    ``k // _CODEBITS`` in the returned list.
    """
    # Reverse the digit string so the first flag ends up as the least
    # significant digit, then cut words from the end of the string.
    digits = bits.translate(_BITS_TRANS)[::-1]
    words = []
    for stop in range(len(digits), 0, -_CODEBITS):
        words.append(_int(digits[stop - _CODEBITS: stop], 2))
    return words
def _bytes_to_codes(b):
    """Reinterpret the buffer *b* as native unsigned ints and return a list.

    Used to turn a byte array of block indices into code words.  The
    assertions check that the 'I' item size equals ``_sre.CODESIZE`` and
    that the view covers the whole buffer.
    """
    view = memoryview(b)
    words = view.cast('I')
    assert words.itemsize == _sre.CODESIZE
    assert len(words) * words.itemsize == len(b)
    return words.tolist()
def _simple(p):
    """Tell whether subpattern *p* is a single "simple" operator.

    *p* must hold exactly one item.  That item is simple when its opcode is
    in _UNIT_CODES, or when it is a SUBPATTERN whose first field is None
    and whose last field is itself simple.
    """
    if len(p) != 1:
        return False
    op, av = p[0]
    if op is not SUBPATTERN:
        return op in _UNIT_CODES
    return av[0] is None and _simple(av[-1])
def _generate_overlap_table(prefix):
    """
    Build the self-overlap table for *prefix*.

    The result has one entry per element of *prefix*:
    - table[i] == 0 means no proper suffix of prefix[:i+1] is also a
      leading part of prefix;
    - table[i] == k (0 < k <= i) means prefix[i-k+1:i+1] equals
      prefix[0:k].
    """
    size = len(prefix)
    table = [0] * size
    for pos in range(1, size):
        matched = table[pos - 1]
        # Fall back to shorter overlaps until one can be extended.
        while matched and prefix[pos] != prefix[matched]:
            matched = table[matched - 1]
        if prefix[pos] == prefix[matched]:
            matched += 1
        table[pos] = matched
    return table
def _get_iscased(flags):
    """Return the is-cased predicate selected by *flags*.

    Without SRE_FLAG_IGNORECASE the result is None; otherwise it is the
    Unicode predicate when SRE_FLAG_UNICODE is set and the ASCII one
    when it is not.
    """
    if flags & SRE_FLAG_IGNORECASE:
        if flags & SRE_FLAG_UNICODE:
            return _sre.unicode_iscased
        return _sre.ascii_iscased
    return None
def _get_literal_prefix(pattern, flags):
    """Collect the leading run of literal codes of *pattern*.

    Returns ``(prefix, prefix_skip, got_all)``:
    prefix      -- list of literal character codes found at the start;
    prefix_skip -- length of the prefix collected before the first
                   numbered group was entered, or None if none was met;
    got_all     -- True only when every item of the pattern was consumed.

    Scanning stops at the first cased literal (when case is ignored), at
    a subpattern that combines IGNORECASE with LOCALE, at a subpattern
    that was not fully consumed, or at any other operator.
    """
    literals = []
    skip = None
    is_cased = _get_iscased(flags)
    for op, av in pattern.data:
        if op is LITERAL:
            if is_cased and is_cased(av):
                return literals, skip, False
            literals.append(av)
            continue
        if op is not SUBPATTERN:
            return literals, skip, False
        group, add_flags, del_flags, sub = av
        sub_flags = _combine_flags(flags, add_flags, del_flags)
        if sub_flags & SRE_FLAG_IGNORECASE and sub_flags & SRE_FLAG_LOCALE:
            return literals, skip, False
        sub_literals, sub_skip, complete = _get_literal_prefix(sub, sub_flags)
        if skip is None:
            if group is not None:
                skip = len(literals)
            elif sub_skip is not None:
                skip = len(literals) + sub_skip
        literals.extend(sub_literals)
        if not complete:
            return literals, skip, False
    return literals, skip, True
def _get_charset_prefix(pattern, flags):
    """Return a charset describing the first character of *pattern*, or None.

    Leading subpatterns are unwrapped (merging their flag changes) until a
    non-group item is reached.  A charset is produced for a LITERAL, for a
    BRANCH whose every alternative starts with a LITERAL, and for an IN
    set.  None is returned when the pattern is empty, when IGNORECASE and
    LOCALE are both in effect, when case is ignored and a cased character
    is involved, or when an IN range ends above 0xffff while case is
    ignored.
    """
    items = pattern.data
    if not items:
        return None
    op, av = items[0]
    while op is SUBPATTERN:
        _group, add_flags, del_flags, inner = av
        flags = _combine_flags(flags, add_flags, del_flags)
        if flags & SRE_FLAG_IGNORECASE and flags & SRE_FLAG_LOCALE:
            return None
        items = inner.data
        if not items:
            return None
        op, av = items[0]

    is_cased = _get_iscased(flags)
    if op is LITERAL:
        if is_cased and is_cased(av):
            return None
        return [(op, av)]
    if op is BRANCH:
        members = []
        for alternative in av[1]:
            if not alternative:
                return None
            first_op, first_av = alternative[0]
            if first_op is not LITERAL or (is_cased and is_cased(first_av)):
                return None
            members.append((first_op, first_av))
        return members
    if op is IN:
        if is_cased:
            for item_op, item_av in av:
                if item_op is LITERAL:
                    if is_cased(item_av):
                        return None
                elif item_op is RANGE:
                    if item_av[1] > 0xffff:
                        return None
                    if any(map(is_cased, range(item_av[0], item_av[1]+1))):
                        return None
        return av
    return None
def _compile_info(code, pattern, flags):
    """Append an INFO block describing *pattern* to *code*.

    The block is laid out as ``INFO, skip, mask, min, max`` followed by
    either a literal prefix (length, prefix_skip, the prefix codes and
    their overlap table) or a compiled charset.  When the minimum width is
    0 only the five-word header is written.

    code    -- list of code words, extended in place.
    pattern -- parsed pattern; must provide getwidth().
    flags   -- SRE_FLAG_* bit mask.
    """
    # internal: compile an info block. in the current version,
    # this contains min/max pattern width, and an optional literal
    # prefix or a character map
    lo, hi = pattern.getwidth()
    if hi > MAXCODE:
        hi = MAXCODE
    if lo == 0:
        # Header only: skip count 4, mask 0, then min and max width.
        code.extend([INFO, 4, 0, lo, hi])
        return
    # look for a literal prefix
    prefix = []
    prefix_skip = 0
    charset = [] # not used
    if not (flags & SRE_FLAG_IGNORECASE and flags & SRE_FLAG_LOCALE):
        # look for literal prefix
        # NOTE: got_all is only bound on this path; it is only read below
        # when `prefix` is non-empty, which also requires this path.
        prefix, prefix_skip, got_all = _get_literal_prefix(pattern, flags)
        # if no prefix, look for charset prefix
        if not prefix:
            charset = _get_charset_prefix(pattern, flags)
    ## if prefix:
    ## print("*** PREFIX", prefix, prefix_skip)
    ## if charset:
    ## print("*** CHARSET", charset)
    # add an info block
    emit = code.append
    emit(INFO)
    # Reserve the skip slot; it is patched on the last line.
    skip = len(code); emit(0)
    # literal flag
    mask = 0
    if prefix:
        mask = SRE_INFO_PREFIX
        if prefix_skip is None and got_all:
            mask = mask | SRE_INFO_LITERAL
    elif charset:
        mask = mask | SRE_INFO_CHARSET
    emit(mask)
    # pattern length
    if lo < MAXCODE:
        emit(lo)
    else:
        emit(MAXCODE)
        # Keep the stored prefix within MAXCODE entries.
        prefix = prefix[:MAXCODE]
    emit(min(hi, MAXCODE))
    # add literal prefix
    if prefix:
        emit(len(prefix)) # length
        if prefix_skip is None:
            prefix_skip = len(prefix)
        emit(prefix_skip) # skip
        code.extend(prefix)
        # generate overlap table
        code.extend(_generate_overlap_table(prefix))
    elif charset:
        charset, hascased = _optimize_charset(charset)
        assert not hascased
        _compile_charset(charset, flags, code)
    code[skip] = len(code) - skip
def isstring(obj):
    """Return True if *obj* is a ``str`` or ``bytes`` instance."""
    return isinstance(obj, str) or isinstance(obj, bytes)
def _code(p, flags):
    """Return the complete code list for the parsed pattern *p*.

    The flags stored on ``p.state`` are OR-ed with *flags*; the result is
    an INFO block, the compiled pattern body and a final SUCCESS opcode.
    """
    merged_flags = p.state.flags | flags
    program = []
    # Info block first, then the pattern itself.
    _compile_info(program, p, merged_flags)
    _compile(program, p.data, merged_flags)
    program.append(SUCCESS)
    return program
def _hex_code(code):
    """Format the code words in *code* as a bracketed list of hex literals.

    Each word is zero-padded so that it shows two hex digits per byte of
    ``_sre.CODESIZE`` after the ``0x`` prefix.
    """
    width = _sre.CODESIZE*2+2
    rendered = ['%#0*x' % (width, word) for word in code]
    return '[%s]' % ', '.join(rendered)
def dis(code):
    """Print a human-readable listing of the compiled *code* list.

    Each line starts with the word offset; offsets already recorded as jump
    targets are marked with ':' and all others with '.'.  Nested
    subprograms are listed recursively with deeper padding.  Raises
    ValueError on an opcode this function does not know how to print.
    """
    import sys
    labels = set()   # offsets recorded as jump/skip targets so far
    level = 0        # current nesting depth, shared by the closures below
    offset_width = len(str(len(code) - 1))
    def dis_(start, end):
        # List code[start:end]; `start` is rebound to the offset of the
        # instruction being printed so that print_ shows the right offset.
        # NOTE(review): this copy of the file appears to have had its
        # whitespace collapsed; confirm the padding string literals below
        # (' ', ' prefix', ...) against a pristine copy.
        def print_(*args, to=None):
            # Print one instruction line; `to` is a target offset that is
            # recorded in `labels` and appended as "(to N)".
            if to is not None:
                labels.add(to)
                args += ('(to %d)' % (to,),)
            print('%*d%s ' % (offset_width, start, ':' if start in labels else '.'),
                  end=' '*(level-1))
            print(*args)
        def print_2(*args):
            # Print a continuation line without an offset column.
            print(end=' '*(offset_width + 2*level))
            print(*args)
        nonlocal level
        level += 1
        i = start
        while i < end:
            start = i
            op = code[i]
            i += 1
            op = OPCODES[op]
            if op in (SUCCESS, FAILURE, ANY, ANY_ALL,
                      MAX_UNTIL, MIN_UNTIL, NEGATE):
                # Opcodes without operands.
                print_(op)
            elif op in (LITERAL, NOT_LITERAL,
                        LITERAL_IGNORE, NOT_LITERAL_IGNORE,
                        LITERAL_UNI_IGNORE, NOT_LITERAL_UNI_IGNORE,
                        LITERAL_LOC_IGNORE, NOT_LITERAL_LOC_IGNORE):
                arg = code[i]
                i += 1
                print_(op, '%#02x (%r)' % (arg, chr(arg)))
            elif op is AT:
                arg = code[i]
                i += 1
                arg = str(ATCODES[arg])
                assert arg[:3] == 'AT_'
                print_(op, arg[3:])
            elif op is CATEGORY:
                arg = code[i]
                i += 1
                arg = str(CHCODES[arg])
                assert arg[:9] == 'CATEGORY_'
                print_(op, arg[9:])
            elif op in (IN, IN_IGNORE, IN_UNI_IGNORE, IN_LOC_IGNORE):
                # Skip word followed by the set subprogram.
                skip = code[i]
                print_(op, skip, to=i+skip)
                dis_(i+1, i+skip)
                i += skip
            elif op in (RANGE, RANGE_UNI_IGNORE):
                lo, hi = code[i: i+2]
                i += 2
                print_(op, '%#02x %#02x (%r-%r)' % (lo, hi, chr(lo), chr(hi)))
            elif op is CHARSET:
                # A 256-bit bitmap stored as 256//_CODEBITS words.
                print_(op, _hex_code(code[i: i + 256//_CODEBITS]))
                i += 256//_CODEBITS
            elif op is BIGCHARSET:
                # Chunk count, then 256 mapping bytes packed into words,
                # then `arg` bitmaps of 256 bits each.
                arg = code[i]
                i += 1
                mapping = list(b''.join(x.to_bytes(_sre.CODESIZE, sys.byteorder)
                                        for x in code[i: i + 256//_sre.CODESIZE]))
                print_(op, arg, mapping)
                i += 256//_sre.CODESIZE
                level += 1
                for j in range(arg):
                    print_2(_hex_code(code[i: i + 256//_CODEBITS]))
                    i += 256//_CODEBITS
                level -= 1
            elif op in (MARK, GROUPREF, GROUPREF_IGNORE, GROUPREF_UNI_IGNORE,
                        GROUPREF_LOC_IGNORE):
                arg = code[i]
                i += 1
                print_(op, arg)
            elif op is JUMP:
                skip = code[i]
                print_(op, skip, to=i+skip)
                i += 1
            elif op is BRANCH:
                # Alternatives are chained by skip words; a zero skip word
                # ends the chain and is printed as FAILURE.
                skip = code[i]
                print_(op, skip, to=i+skip)
                while skip:
                    dis_(i+1, i+skip)
                    i += skip
                    start = i
                    skip = code[i]
                    if skip:
                        print_('branch', skip, to=i+skip)
                    else:
                        print_(FAILURE)
                i += 1
            elif op in (REPEAT, REPEAT_ONE, MIN_REPEAT_ONE):
                skip, min, max = code[i: i+3]
                if max == MAXREPEAT:
                    max = 'MAXREPEAT'
                print_(op, skip, min, max, to=i+skip)
                dis_(i+3, i+skip)
                i += skip
            elif op is GROUPREF_EXISTS:
                arg, skip = code[i: i+2]
                print_(op, arg, skip, to=i+skip)
                i += 2
            elif op in (ASSERT, ASSERT_NOT):
                skip, arg = code[i: i+2]
                print_(op, skip, arg, to=i+skip)
                dis_(i+2, i+skip)
                i += skip
            elif op is INFO:
                skip, flags, min, max = code[i: i+4]
                if max == MAXREPEAT:
                    max = 'MAXREPEAT'
                print_(op, skip, bin(flags), min, max, to=i+skip)
                start = i+4
                if flags & SRE_INFO_PREFIX:
                    # Prefix length and skip, the prefix codes, then an
                    # overlap table of the same length.
                    prefix_len, prefix_skip = code[i+4: i+6]
                    print_2(' prefix_skip', prefix_skip)
                    start = i + 6
                    prefix = code[start: start+prefix_len]
                    print_2(' prefix',
                            '[%s]' % ', '.join('%#02x' % x for x in prefix),
                            '(%r)' % ''.join(map(chr, prefix)))
                    start += prefix_len
                    print_2(' overlap', code[start: start+prefix_len])
                    start += prefix_len
                if flags & SRE_INFO_CHARSET:
                    level += 1
                    print_2('in')
                    dis_(start, i+skip)
                    level -= 1
                i += skip
            else:
                raise ValueError(op)
        level -= 1
    dis_(0, len(code))
def compile(p, flags=0):
    """Convert a pattern to the engine's internal format.

    *p* is either a ``str``/``bytes`` pattern, which is parsed first, or
    an already parsed pattern, in which case no source pattern is passed
    on.  With SRE_FLAG_DEBUG set the generated code is also printed.
    Returns the object built by ``_sre.compile``.
    """
    source = None
    if isstring(p):
        source = p
        p = sre_parse.parse(p, flags)

    code = _code(p, flags)

    if flags & SRE_FLAG_DEBUG:
        print()
        dis(code)

    # Build the reverse lookup: group number -> group name (or None).
    state = p.state
    groupindex = state.groupdict
    names_by_index = [None] * state.groups
    for name, index in groupindex.items():
        names_by_index[index] = name

    return _sre.compile(
        source, flags | state.flags, code,
        state.groups-1,
        groupindex, tuple(names_by_index)
    )
SILENT KILLER Tool