Server : Apache System : Linux indy02.toastserver.com 3.10.0-962.3.2.lve1.5.85.el7.x86_64 #1 SMP Thu Apr 18 15:18:36 UTC 2024 x86_64 User : palandch ( 1163) PHP Version : 7.1.33 Disable Function : NONE Directory : /opt/alt/python37/lib64/python3.7/site-packages/guppy/gsl/ |
class GsmlHandler: # To be mixed in with something like HTMLParser.HTMLParser def handle_starttag(self, tag, attrs): self.stack.append(self.out) self.out = [] if attrs: at = [] for k, v in attrs: at.append(self.mod.node_of_taci(k, v)) self.out.append(self.mod.node_of_taci('with', '', at)) def handle_endtag(self, tag): node = self.mod.node_of_taci(tag, '', self.out) self.out = self.stack.pop() self.out.append(node) def handle_charref(self, name): if name[:1] == "x": char = int(name[1:], 16) name = '0'+name else: char = int(name) if 0 <= char < 128: char = chr(char) self.handle_data(char) else: self.out.append(self.mod.node_of_taci('char', name)) def handle_entityref(self, name): if name not in self.mod.entitydefs: self.unknown_entityref(name) self.out.append(self.mod.node_of_taci('char', name)) def unknown_entityref(self, name): raise SyntaxError('Unknown entity ref: %r' % name) def handle_data(self, data): # data = data.strip() if data.strip(): self.out.extend(self.mod.nodes_of_text(data)) def handle_comment(self, data): self.out.append(self.mod.node_of_taci('comment', data, (), 0)) def handle_decl(self, decl): self.out.append(self.mod.node_of_taci('html_declaration', decl)) def handle_pi(self, data): self.out.append(self.mod.node_of_taci('processing_instruction', data)) class _GLUECLAMP_: _imports_ = ( '_root.html.parser:HTMLParser', '_parent.SpecNodes:node_of_taci', '_parent.SpecNodes:nodes_of_text', '_root.htmlentitydefs:entitydefs', ) encoding = "iso-8859-1" def node_of_gsml(self, text): class Parser(GsmlHandler, self.HTMLParser): def __init__(self, mod): mod.HTMLParser.__init__(self) self.mod = mod self.out = [] self.stack = [] p = Parser(self) p.feed(text) p.close() if p.stack: raise SyntaxError('Missing end tag') node = self.node_of_taci('block', '', p.out, 0) return node def _test_main_(self): x = """ <!DOCTYPE html...> This is an <em> emphasized </em> word. See also <a href="guppy-pe.sf.net"> Guppy. </a> Defined as <use_my_macro/>. Handle char ref: d. Handle char ref: <. <!-- A comment --> <?A processing instruction> <namespace:tag /> """ node = self.node_of_gsml(x) # FIXME: Assert equals to something? print(node)