Linux vmi2545633.contaboserver.net 6.1.0-32-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.1.129-1 (2025-03-06) x86_64
Apache/2.4.62 (Debian)
Server IP : 127.0.0.1 & Your IP : 127.0.0.1
Domains :
Cant Read [ /etc/named.conf ]
User : www-data
Terminal
Auto Root
Create File
Create Folder
Localroot Suggester
Backdoor Destroyer
Readme
/
usr /
lib /
python3.11 /
Delete
Unzip
Name
Size
Permission
Date
Action
__phello__
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
__pycache__
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
asyncio
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
collections
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
concurrent
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
config-3.11-x86_64-linux-gnu
[ DIR ]
drwxr-xr-x
2025-04-08 16:44
ctypes
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
curses
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
dbm
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
distutils
[ DIR ]
drwxr-xr-x
2025-04-08 16:44
email
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
encodings
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
html
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
http
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
importlib
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
json
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
lib-dynload
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
lib2to3
[ DIR ]
drwxr-xr-x
2025-04-08 16:44
logging
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
multiprocessing
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
pydoc_data
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
re
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
sqlite3
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
test
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
tomllib
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
unittest
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
urllib
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
venv
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
wsgiref
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
xml
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
xmlrpc
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
zoneinfo
[ DIR ]
drwxr-xr-x
2025-04-07 20:15
EXTERNALLY-MANAGED
645
B
-rw-r--r--
2024-11-30 21:22
LICENSE.txt
13.61
KB
-rw-r--r--
2024-11-30 21:22
__future__.py
5.1
KB
-rw-r--r--
2024-11-30 21:22
__hello__.py
227
B
-rw-r--r--
2024-11-30 21:22
_aix_support.py
3.31
KB
-rw-r--r--
2024-11-30 21:22
_bootsubprocess.py
2.61
KB
-rw-r--r--
2024-11-30 21:22
_collections_abc.py
29.49
KB
-rw-r--r--
2024-11-30 21:22
_compat_pickle.py
8.56
KB
-rw-r--r--
2024-11-30 21:22
_compression.py
5.55
KB
-rw-r--r--
2024-11-30 21:22
_distutils_system_mod.py
6.16
KB
-rw-r--r--
2024-11-30 21:22
_markupbase.py
14.31
KB
-rw-r--r--
2024-11-30 21:22
_osx_support.py
21.28
KB
-rw-r--r--
2024-11-30 21:22
_py_abc.py
6.04
KB
-rw-r--r--
2024-11-30 21:22
_pydecimal.py
223.83
KB
-rw-r--r--
2024-11-30 21:22
_pyio.py
91.83
KB
-rw-r--r--
2024-11-30 21:22
_sitebuiltins.py
3.05
KB
-rw-r--r--
2024-11-30 21:22
_strptime.py
24.68
KB
-rw-r--r--
2024-11-30 21:22
_sysconfigdata__linux_x86_64-linux-gnu.py
42.36
KB
-rw-r--r--
2024-11-30 21:22
_sysconfigdata__x86_64-linux-gnu.py
42.36
KB
-rw-r--r--
2024-11-30 21:22
_threading_local.py
7.05
KB
-rw-r--r--
2024-11-30 21:22
_weakrefset.py
5.75
KB
-rw-r--r--
2024-11-30 21:22
abc.py
6.37
KB
-rw-r--r--
2024-11-30 21:22
aifc.py
33.41
KB
-rw-r--r--
2024-11-30 21:22
antigravity.py
500
B
-rw-r--r--
2024-11-30 21:22
argparse.py
97.28
KB
-rw-r--r--
2024-11-30 21:22
ast.py
59.25
KB
-rw-r--r--
2024-11-30 21:22
asynchat.py
11.3
KB
-rw-r--r--
2024-11-30 21:22
asyncore.py
19.83
KB
-rw-r--r--
2024-11-30 21:22
base64.py
20.53
KB
-rwxr-xr-x
2024-11-30 21:22
bdb.py
31.59
KB
-rw-r--r--
2024-11-30 21:22
bisect.py
3.06
KB
-rw-r--r--
2024-11-30 21:22
bz2.py
11.57
KB
-rw-r--r--
2024-11-30 21:22
cProfile.py
6.19
KB
-rwxr-xr-x
2024-11-30 21:22
calendar.py
24.17
KB
-rw-r--r--
2024-11-30 21:22
cgi.py
33.61
KB
-rwxr-xr-x
2024-11-30 21:22
cgitb.py
12.13
KB
-rw-r--r--
2024-11-30 21:22
chunk.py
5.37
KB
-rw-r--r--
2024-11-30 21:22
cmd.py
14.52
KB
-rw-r--r--
2024-11-30 21:22
code.py
10.37
KB
-rw-r--r--
2024-11-30 21:22
codecs.py
35.85
KB
-rw-r--r--
2024-11-30 21:22
codeop.py
5.47
KB
-rw-r--r--
2024-11-30 21:22
colorsys.py
3.93
KB
-rw-r--r--
2024-11-30 21:22
compileall.py
19.78
KB
-rw-r--r--
2024-11-30 21:22
configparser.py
53.96
KB
-rw-r--r--
2024-11-30 21:22
contextlib.py
26.44
KB
-rw-r--r--
2024-11-30 21:22
contextvars.py
129
B
-rw-r--r--
2024-11-30 21:22
copy.py
8.48
KB
-rw-r--r--
2024-11-30 21:22
copyreg.py
7.5
KB
-rw-r--r--
2024-11-30 21:22
crypt.py
3.82
KB
-rw-r--r--
2024-11-30 21:22
csv.py
15.65
KB
-rw-r--r--
2024-11-30 21:22
dataclasses.py
56.5
KB
-rw-r--r--
2024-11-30 21:22
datetime.py
89.85
KB
-rw-r--r--
2024-11-30 21:22
decimal.py
320
B
-rw-r--r--
2024-11-30 21:22
difflib.py
81.36
KB
-rw-r--r--
2024-11-30 21:22
dis.py
28.28
KB
-rw-r--r--
2024-11-30 21:22
doctest.py
102.71
KB
-rw-r--r--
2024-11-30 21:22
enum.py
76.81
KB
-rw-r--r--
2024-11-30 21:22
filecmp.py
9.94
KB
-rw-r--r--
2024-11-30 21:22
fileinput.py
15.33
KB
-rw-r--r--
2024-11-30 21:22
fnmatch.py
5.86
KB
-rw-r--r--
2024-11-30 21:22
fractions.py
28
KB
-rw-r--r--
2024-11-30 21:22
ftplib.py
34.66
KB
-rw-r--r--
2024-11-30 21:22
functools.py
37.51
KB
-rw-r--r--
2024-11-30 21:22
genericpath.py
4.86
KB
-rw-r--r--
2024-11-30 21:22
getopt.py
7.31
KB
-rw-r--r--
2024-11-30 21:22
getpass.py
5.85
KB
-rw-r--r--
2024-11-30 21:22
gettext.py
20.8
KB
-rw-r--r--
2024-11-30 21:22
glob.py
8.48
KB
-rw-r--r--
2024-11-30 21:22
graphlib.py
9.43
KB
-rw-r--r--
2024-11-30 21:22
gzip.py
23.51
KB
-rw-r--r--
2024-11-30 21:22
hashlib.py
11.49
KB
-rw-r--r--
2024-11-30 21:22
heapq.py
22.48
KB
-rw-r--r--
2024-11-30 21:22
hmac.py
7.54
KB
-rw-r--r--
2024-11-30 21:22
imaplib.py
53.58
KB
-rw-r--r--
2024-11-30 21:22
imghdr.py
3.86
KB
-rw-r--r--
2024-11-30 21:22
imp.py
10.36
KB
-rw-r--r--
2024-11-30 21:22
inspect.py
121.28
KB
-rw-r--r--
2024-11-30 21:22
io.py
4.14
KB
-rw-r--r--
2024-11-30 21:22
ipaddress.py
76.45
KB
-rw-r--r--
2024-11-30 21:22
keyword.py
1.04
KB
-rw-r--r--
2024-11-30 21:22
linecache.py
5.56
KB
-rw-r--r--
2024-11-30 21:22
locale.py
77.15
KB
-rw-r--r--
2024-11-30 21:22
lzma.py
12.97
KB
-rw-r--r--
2024-11-30 21:22
mailbox.py
76.95
KB
-rw-r--r--
2024-11-30 21:22
mailcap.py
9.15
KB
-rw-r--r--
2024-11-30 21:22
mimetypes.py
22.26
KB
-rw-r--r--
2024-11-30 21:22
modulefinder.py
23.14
KB
-rw-r--r--
2024-11-30 21:22
netrc.py
6.77
KB
-rw-r--r--
2024-11-30 21:22
nntplib.py
40.12
KB
-rw-r--r--
2024-11-30 21:22
ntpath.py
28.95
KB
-rw-r--r--
2024-11-30 21:22
nturl2path.py
2.82
KB
-rw-r--r--
2024-11-30 21:22
numbers.py
10.11
KB
-rw-r--r--
2024-11-30 21:22
opcode.py
10.2
KB
-rw-r--r--
2024-11-30 21:22
operator.py
10.71
KB
-rw-r--r--
2024-11-30 21:22
optparse.py
58.95
KB
-rw-r--r--
2024-11-30 21:22
os.py
38.58
KB
-rw-r--r--
2024-11-30 21:22
pathlib.py
47.44
KB
-rw-r--r--
2024-11-30 21:22
pdb.py
62.4
KB
-rwxr-xr-x
2024-11-30 21:22
pickle.py
63.43
KB
-rw-r--r--
2024-11-30 21:22
pickletools.py
91.29
KB
-rw-r--r--
2024-11-30 21:22
pipes.py
8.77
KB
-rw-r--r--
2024-11-30 21:22
pkgutil.py
24.04
KB
-rw-r--r--
2024-11-30 21:22
platform.py
41.28
KB
-rwxr-xr-x
2024-11-30 21:22
plistlib.py
27.59
KB
-rw-r--r--
2024-11-30 21:22
poplib.py
14.84
KB
-rw-r--r--
2024-11-30 21:22
posixpath.py
16.61
KB
-rw-r--r--
2024-11-30 21:22
pprint.py
23.92
KB
-rw-r--r--
2024-11-30 21:22
profile.py
22.33
KB
-rwxr-xr-x
2024-11-30 21:22
pstats.py
28.67
KB
-rw-r--r--
2024-11-30 21:22
pty.py
5.09
KB
-rw-r--r--
2024-11-30 21:22
py_compile.py
7.69
KB
-rw-r--r--
2024-11-30 21:22
pyclbr.py
11.13
KB
-rw-r--r--
2024-11-30 21:22
pydoc.py
106.57
KB
-rwxr-xr-x
2024-11-30 21:22
queue.py
11.23
KB
-rw-r--r--
2024-11-30 21:22
quopri.py
7.1
KB
-rwxr-xr-x
2024-11-30 21:22
random.py
31.41
KB
-rw-r--r--
2024-11-30 21:22
reprlib.py
5.31
KB
-rw-r--r--
2024-11-30 21:22
rlcompleter.py
7.64
KB
-rw-r--r--
2024-11-30 21:22
runpy.py
12.85
KB
-rw-r--r--
2024-11-30 21:22
sched.py
6.2
KB
-rw-r--r--
2024-11-30 21:22
secrets.py
1.98
KB
-rw-r--r--
2024-11-30 21:22
selectors.py
19.03
KB
-rw-r--r--
2024-11-30 21:22
shelve.py
8.36
KB
-rw-r--r--
2024-11-30 21:22
shlex.py
13.18
KB
-rw-r--r--
2024-11-30 21:22
shutil.py
53.58
KB
-rw-r--r--
2024-11-30 21:22
signal.py
2.38
KB
-rw-r--r--
2024-11-30 21:22
site.py
23.17
KB
-rw-r--r--
2024-11-30 21:22
sitecustomize.py
155
B
-rw-r--r--
2023-03-13 12:18
smtpd.py
30.43
KB
-rwxr-xr-x
2024-11-30 21:22
smtplib.py
44.35
KB
-rwxr-xr-x
2024-11-30 21:22
sndhdr.py
7.27
KB
-rw-r--r--
2024-11-30 21:22
socket.py
36.41
KB
-rw-r--r--
2024-11-30 21:22
socketserver.py
26.94
KB
-rw-r--r--
2024-11-30 21:22
sre_compile.py
231
B
-rw-r--r--
2024-11-30 21:22
sre_constants.py
232
B
-rw-r--r--
2024-11-30 21:22
sre_parse.py
229
B
-rw-r--r--
2024-11-30 21:22
ssl.py
52.71
KB
-rw-r--r--
2024-11-30 21:22
stat.py
5.36
KB
-rw-r--r--
2024-11-30 21:22
statistics.py
46.59
KB
-rw-r--r--
2024-11-30 21:22
string.py
11.51
KB
-rw-r--r--
2024-11-30 21:22
stringprep.py
12.61
KB
-rw-r--r--
2024-11-30 21:22
struct.py
257
B
-rw-r--r--
2024-11-30 21:22
subprocess.py
83.74
KB
-rw-r--r--
2024-11-30 21:22
sunau.py
18.05
KB
-rw-r--r--
2024-11-30 21:22
symtable.py
10.13
KB
-rw-r--r--
2024-11-30 21:22
sysconfig.py
31.35
KB
-rw-r--r--
2024-11-30 21:22
tabnanny.py
11.03
KB
-rwxr-xr-x
2024-11-30 21:22
tarfile.py
95.25
KB
-rwxr-xr-x
2024-11-30 21:22
telnetlib.py
22.75
KB
-rw-r--r--
2024-11-30 21:22
tempfile.py
34.66
KB
-rw-r--r--
2024-11-30 21:22
textwrap.py
19.26
KB
-rw-r--r--
2024-11-30 21:22
this.py
1003
B
-rw-r--r--
2024-11-30 21:22
threading.py
56.46
KB
-rw-r--r--
2024-11-30 21:22
timeit.py
13.18
KB
-rwxr-xr-x
2024-11-30 21:22
token.py
2.33
KB
-rw-r--r--
2024-11-30 21:22
tokenize.py
25.72
KB
-rw-r--r--
2024-11-30 21:22
trace.py
28.52
KB
-rwxr-xr-x
2024-11-30 21:22
traceback.py
37.52
KB
-rw-r--r--
2024-11-30 21:22
tracemalloc.py
17.62
KB
-rw-r--r--
2024-11-30 21:22
tty.py
879
B
-rw-r--r--
2024-11-30 21:22
turtle.py
140.97
KB
-rw-r--r--
2024-11-30 21:22
types.py
9.83
KB
-rw-r--r--
2024-11-30 21:22
typing.py
114.35
KB
-rw-r--r--
2024-11-30 21:22
uu.py
6.86
KB
-rwxr-xr-x
2024-11-30 21:22
uuid.py
26.95
KB
-rw-r--r--
2024-11-30 21:22
warnings.py
20.53
KB
-rw-r--r--
2024-11-30 21:22
wave.py
21.33
KB
-rw-r--r--
2024-11-30 21:22
weakref.py
21.01
KB
-rw-r--r--
2024-11-30 21:22
webbrowser.py
24.5
KB
-rwxr-xr-x
2024-11-30 21:22
xdrlib.py
5.84
KB
-rw-r--r--
2024-11-30 21:22
zipapp.py
7.36
KB
-rw-r--r--
2024-11-30 21:22
zipfile.py
90.81
KB
-rw-r--r--
2024-11-30 21:22
zipimport.py
30.17
KB
-rw-r--r--
2024-11-30 21:22
Save
Rename
"""Shared support for scanning document type declarations in HTML and XHTML.

This module is used as a foundation for the html.parser module.  It has no
documented public API and should not be used directly.

"""

import re

_declname_match = re.compile(r'[a-zA-Z][-_.a-zA-Z0-9]*\s*').match
_declstringlit_match = re.compile(r'(\'[^\']*\'|"[^"]*")\s*').match
_commentclose = re.compile(r'--\s*>')
_markedsectionclose = re.compile(r']\s*]\s*>')

# An analysis of the MS-Word extensions is available at
# http://www.planetpublish.com/xmlarena/xap/Thursday/WordtoXML.pdf

_msmarkedsectionclose = re.compile(r']\s*>')

del re


class ParserBase:
    """Parser base class which provides some common support methods used
    by the SGML/HTML and XHTML parsers.

    Subclasses are expected to provide the ``rawdata`` buffer (a str) and the
    ``handle_decl`` / ``handle_comment`` callbacks that the scanners invoke.
    Every ``parse_*`` / ``_parse_*`` method returns the index just past the
    construct it consumed, or a negative value when the buffer ends before
    the construct is complete.
    """

    def __init__(self):
        if self.__class__ is ParserBase:
            raise RuntimeError(
                "_markupbase.ParserBase must be subclassed")

    def reset(self):
        """Reset the position tracking to line 1, offset 0."""
        self.lineno = 1
        self.offset = 0

    def getpos(self):
        """Return current line number and offset."""
        return self.lineno, self.offset

    # Internal -- update line number and offset.  This should be
    # called for each piece of data exactly once, in order -- in other
    # words the concatenation of all the input strings to this
    # function should be exactly the entire input.
    def updatepos(self, i, j):
        """Advance lineno/offset over rawdata[i:j] and return j."""
        if i >= j:
            return j
        rawdata = self.rawdata
        nlines = rawdata.count("\n", i, j)
        if nlines:
            self.lineno = self.lineno + nlines
            pos = rawdata.rindex("\n", i, j)  # Should not fail
            self.offset = j - (pos + 1)
        else:
            self.offset = self.offset + j - i
        return j

    _decl_otherchars = ''

    # Internal -- parse declaration (for use by subclasses).
    def parse_declaration(self, i):
        """Parse the ``<!...>`` declaration starting at rawdata[i].

        Returns the index just past the closing '>', or a negative value if
        the declaration is incomplete.  Raises AssertionError on malformed or
        unsupported declaration syntax.
        """
        # This is some sort of declaration; in "HTML as
        # deployed," this should only be the document type
        # declaration ("<!DOCTYPE html...>").
        # ISO 8879:1986, however, has more complex
        # declaration syntax for elements in <!...>, including:
        # --comment--
        # [marked section]
        # name in the following list: ENTITY, DOCTYPE, ELEMENT,
        # ATTLIST, NOTATION, SHORTREF, USEMAP,
        # LINKTYPE, LINK, IDLINK, USELINK, SYSTEM
        rawdata = self.rawdata
        j = i + 2
        # Raised explicitly (not via ``assert``) so the check survives -O,
        # consistent with parse_comment().
        if rawdata[i:j] != "<!":
            raise AssertionError("unexpected call to parse_declaration")
        if rawdata[j:j+1] == ">":
            # the empty comment <!>
            return j + 1
        if rawdata[j:j+2] == '--':  # comment
            # Locate --.*-- as the body of the comment.  This must be tested
            # before the lone "-" check below, otherwise it is unreachable.
            return self.parse_comment(i)
        if rawdata[j:j+1] in ("-", ""):
            # Start of comment followed by buffer boundary,
            # or just a buffer boundary.
            return -1
        # A simple, practical version could look like: ((name|stringlit) S*) + '>'
        n = len(rawdata)
        if rawdata[j] == '[':  # marked section
            # Locate [statusWord [...arbitrary SGML...]] as the body of the marked section
            # Where statusWord is one of TEMP, CDATA, IGNORE, INCLUDE, RCDATA
            # Note that this is extended by Microsoft Office "Save as Web" function
            # to include [if...] and [endif].
            return self.parse_marked_section(i)
        # all other declaration elements
        decltype, j = self._scan_name(j, i)
        if j < 0:
            return j
        if decltype == "doctype":
            self._decl_otherchars = ''
        while j < n:
            c = rawdata[j]
            if c == ">":
                # end of declaration syntax
                data = rawdata[i+2:j]
                if decltype == "doctype":
                    self.handle_decl(data)
                else:
                    # According to the HTML5 specs sections "8.2.4.44 Bogus
                    # comment state" and "8.2.4.45 Markup declaration open
                    # state", a comment token should be emitted.
                    # Calling unknown_decl provides more flexibility though.
                    self.unknown_decl(data)
                return j + 1
            if c in "\"'":
                m = _declstringlit_match(rawdata, j)
                if not m:
                    return -1  # incomplete
                j = m.end()
            elif c in "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ":
                name, j = self._scan_name(j, i)
            elif c in self._decl_otherchars:
                j = j + 1
            elif c == "[":
                # this could be handled in a separate doctype parser
                if decltype == "doctype":
                    j = self._parse_doctype_subset(j + 1, i)
                elif decltype in {"attlist", "linktype", "link", "element"}:
                    # must tolerate []'d groups in a content model in an element declaration
                    # also in data attribute specifications of attlist declaration
                    # also link type declaration subsets in linktype declarations
                    # also link attribute specification lists in link declarations
                    raise AssertionError("unsupported '[' char in %s declaration" % decltype)
                else:
                    raise AssertionError("unexpected '[' char in declaration")
            else:
                raise AssertionError("unexpected %r char in declaration" % rawdata[j])
            if j < 0:
                return j
        return -1  # incomplete

    # Internal -- parse a marked section
    # Override this to handle MS-word extension syntax <![if word]>content<![endif]>
    def parse_marked_section(self, i, report=1):
        """Parse the ``<![...]`` marked section starting at rawdata[i].

        When *report* is true the section body is passed to unknown_decl().
        Returns the index just past the terminator, or a negative value if
        the section is incomplete.  Raises AssertionError for an unknown
        status keyword.
        """
        rawdata = self.rawdata
        # Explicit raise rather than ``assert`` so the check survives -O.
        if rawdata[i:i+3] != '<![':
            raise AssertionError("unexpected call to parse_marked_section()")
        sectName, j = self._scan_name(i+3, i)
        if j < 0:
            return j
        if sectName in {"temp", "cdata", "ignore", "include", "rcdata"}:
            # look for standard ]]> ending
            match = _markedsectionclose.search(rawdata, i+3)
        elif sectName in {"if", "else", "endif"}:
            # look for MS Office ]> ending
            match = _msmarkedsectionclose.search(rawdata, i+3)
        else:
            raise AssertionError(
                'unknown status keyword %r in marked section' % rawdata[i+3:j]
            )
        if not match:
            return -1
        if report:
            j = match.start(0)
            self.unknown_decl(rawdata[i+3: j])
        return match.end(0)

    # Internal -- parse comment, return length or -1 if not terminated
    def parse_comment(self, i, report=1):
        """Parse the ``<!--`` comment starting at rawdata[i].

        When *report* is true the comment body is passed to handle_comment().
        Returns the index just past the closing ``-->``, or -1 if the comment
        is not terminated within the buffer.
        """
        rawdata = self.rawdata
        if rawdata[i:i+4] != '<!--':
            raise AssertionError('unexpected call to parse_comment()')
        match = _commentclose.search(rawdata, i+4)
        if not match:
            return -1
        if report:
            j = match.start(0)
            self.handle_comment(rawdata[i+4: j])
        return match.end(0)

    # Internal -- scan past the internal subset in a <!DOCTYPE declaration,
    # returning the index just past any whitespace following the trailing ']'.
    def _parse_doctype_subset(self, i, declstartpos):
        rawdata = self.rawdata
        n = len(rawdata)
        j = i
        while j < n:
            c = rawdata[j]
            if c == "<":
                s = rawdata[j:j+2]
                if s == "<":
                    # end of buffer; incomplete
                    return -1
                if s != "<!":
                    self.updatepos(declstartpos, j + 1)
                    raise AssertionError(
                        "unexpected char in internal subset (in %r)" % s
                    )
                if (j + 4) > n:
                    # end of buffer; incomplete (also covers j + 2 == n)
                    return -1
                if rawdata[j:j+4] == "<!--":
                    j = self.parse_comment(j, report=0)
                    if j < 0:
                        return j
                    continue
                name, j = self._scan_name(j + 2, declstartpos)
                if j == -1:
                    return -1
                if name not in {"attlist", "element", "entity", "notation"}:
                    self.updatepos(declstartpos, j + 2)
                    raise AssertionError(
                        "unknown declaration %r in internal subset" % name
                    )
                # handle the individual names
                meth = getattr(self, "_parse_doctype_" + name)
                j = meth(j, declstartpos)
                if j < 0:
                    return j
            elif c == "%":
                # parameter entity reference
                if (j + 1) == n:
                    # end of buffer; incomplete
                    return -1
                s, j = self._scan_name(j + 1, declstartpos)
                if j < 0:
                    return j
                if rawdata[j] == ";":
                    j = j + 1
            elif c == "]":
                j = j + 1
                while j < n and rawdata[j].isspace():
                    j = j + 1
                if j < n:
                    if rawdata[j] == ">":
                        return j
                    self.updatepos(declstartpos, j)
                    raise AssertionError("unexpected char after internal subset")
                else:
                    return -1
            elif c.isspace():
                j = j + 1
            else:
                self.updatepos(declstartpos, j)
                raise AssertionError("unexpected char %r in internal subset" % c)
        # end of buffer reached
        return -1

    # Internal -- scan past <!ELEMENT declarations
    def _parse_doctype_element(self, i, declstartpos):
        name, j = self._scan_name(i, declstartpos)
        if j == -1:
            return -1
        # style content model; just skip until '>'
        # A single find() avoids copying the buffer tail and scanning twice.
        end = self.rawdata.find(">", j)
        if end >= 0:
            return end + 1
        return -1

    # Internal -- scan past <!ATTLIST declarations
    def _parse_doctype_attlist(self, i, declstartpos):
        rawdata = self.rawdata
        name, j = self._scan_name(i, declstartpos)
        if j < 0:
            # incomplete; checked explicitly instead of relying on
            # rawdata[-1:0] happening to be empty
            return j
        c = rawdata[j:j+1]
        if c == "":
            return -1
        if c == ">":
            return j + 1
        while 1:
            # scan a series of attribute descriptions; simplified:
            #   name type [value] [#constraint]
            name, j = self._scan_name(j, declstartpos)
            if j < 0:
                return j
            c = rawdata[j:j+1]
            if c == "":
                return -1
            if c == "(":
                # an enumerated type; look for ')'
                close = rawdata.find(")", j)
                if close < 0:
                    return -1
                j = close + 1
                while rawdata[j:j+1].isspace():
                    j = j + 1
                if j >= len(rawdata):
                    # end of buffer, incomplete
                    return -1
            else:
                name, j = self._scan_name(j, declstartpos)
                if j < 0:
                    return j
            c = rawdata[j:j+1]
            if not c:
                return -1
            if c in "'\"":
                m = _declstringlit_match(rawdata, j)
                if m:
                    j = m.end()
                else:
                    return -1
                c = rawdata[j:j+1]
                if not c:
                    return -1
            if c == "#":
                if j + 1 == len(rawdata):
                    # end of buffer
                    return -1
                name, j = self._scan_name(j + 1, declstartpos)
                if j < 0:
                    return j
                c = rawdata[j:j+1]
                if not c:
                    return -1
            if c == '>':
                # all done
                return j + 1

    # Internal -- scan past <!NOTATION declarations
    def _parse_doctype_notation(self, i, declstartpos):
        name, j = self._scan_name(i, declstartpos)
        if j < 0:
            return j
        rawdata = self.rawdata
        while 1:
            c = rawdata[j:j+1]
            if not c:
                # end of buffer; incomplete
                return -1
            if c == '>':
                return j + 1
            if c in "'\"":
                m = _declstringlit_match(rawdata, j)
                if not m:
                    return -1
                j = m.end()
            else:
                name, j = self._scan_name(j, declstartpos)
                if j < 0:
                    return j

    # Internal -- scan past <!ENTITY declarations
    def _parse_doctype_entity(self, i, declstartpos):
        rawdata = self.rawdata
        if rawdata[i:i+1] == "%":
            # parameter entity: skip the '%' and any whitespace after it
            j = i + 1
            while 1:
                c = rawdata[j:j+1]
                if not c:
                    return -1
                if c.isspace():
                    j = j + 1
                else:
                    break
        else:
            j = i
        name, j = self._scan_name(j, declstartpos)
        if j < 0:
            return j
        while 1:
            c = rawdata[j:j+1]
            if not c:
                return -1
            if c in "'\"":
                m = _declstringlit_match(rawdata, j)
                if m:
                    j = m.end()
                else:
                    return -1    # incomplete
            elif c == ">":
                return j + 1
            else:
                name, j = self._scan_name(j, declstartpos)
                if j < 0:
                    return j

    # Internal -- scan a name token starting at rawdata[i].  Returns the
    # pair (lower-cased name, index just past the name and any trailing
    # whitespace), or (None, -1) if the end of the buffer is reached before
    # the token is known to be complete.
    def _scan_name(self, i, declstartpos):
        rawdata = self.rawdata
        n = len(rawdata)
        if i == n:
            return None, -1
        m = _declname_match(rawdata, i)
        if m:
            s = m.group()
            name = s.strip()
            if (i + len(s)) == n:
                return None, -1  # end of buffer
            return name.lower(), m.end()
        else:
            self.updatepos(declstartpos, i)
            raise AssertionError(
                "expected name token at %r" % rawdata[declstartpos:declstartpos+20]
            )

    # To be overridden -- handlers for unknown objects
    def unknown_decl(self, data):
        pass