# -*- coding: utf-8 -*-
#
# Copyright (C) 2012 Ben Kurtovic
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

import re

from . import tokens
from ..nodes import Heading, HTMLEntity, Tag, Template, Text
from ..nodes.extras import Attribute, Parameter
from ..smart_list import SmartList
from ..wikicode import Wikicode

__all__ = ["Builder"]


class Builder(object):
    """Combine a flat list of tokens into a tree of nodes.

    The builder keeps two pieces of state:

    - ``_tokens``: the tokens that still have to be consumed. While a build
      is in progress the list is stored in *reverse* order, so the next
      token is always the last element and can be taken with ``pop()`` (and
      pushed back with ``append()``) in constant time.
    - ``_stacks``: a stack of node lists. Each handler pushes a fresh list,
      writes the nodes it produces into it, and pops it again once the
      construct it is building is complete.
    """

    def __init__(self):
        self._tokens = []
        self._stacks = []

    def _wrap(self, nodes):
        """Return *nodes* wrapped as ``Wikicode(SmartList(nodes))``."""
        return Wikicode(SmartList(nodes))

    def _push(self):
        """Start collecting nodes in a new, empty list."""
        self._stacks.append([])

    def _pop(self, wrap=True):
        """Remove and return the list of nodes that is currently collected.

        If *wrap* is true (the default) the list is passed through
        :meth:`_wrap` first; otherwise the plain list is returned.
        """
        if wrap:
            return self._wrap(self._stacks.pop())
        return self._stacks.pop()

    def _write(self, item):
        """Append *item* to the list of nodes that is currently collected."""
        self._stacks[-1].append(item)

    def _handle_parameter(self, key):
        """Build a single template parameter and return it.

        *key* is the name used if the parameter has no explicit one. If a
        ``TemplateParamEquals`` token is met, everything collected so far
        becomes the key instead and the parameter is marked as showing its
        key. The ``TemplateParamSeparator`` / ``TemplateClose`` token that
        ends the parameter is pushed back for the caller to handle.

        Falls off the end (returning ``None``) if the tokens run out before
        a terminating token is seen.
        """
        showkey = False
        self._push()
        while self._tokens:
            token = self._tokens.pop()
            if isinstance(token, tokens.TemplateParamEquals):
                key = self._pop()
                showkey = True
                self._push()
            elif isinstance(token, (tokens.TemplateParamSeparator,
                                    tokens.TemplateClose)):
                # Not ours to consume: hand it back to _handle_template().
                self._tokens.append(token)
                value = self._pop()
                return Parameter(key, value, showkey)
            else:
                self._write(self._handle_token(token))

    def _handle_template(self):
        """Build a template (name plus parameters) and return it.

        Called after the ``TemplateOpen`` token has been consumed; reads up
        to and including the matching ``TemplateClose``. Falls off the end
        (returning ``None``) if the tokens run out first.
        """
        params = []
        # Integer keys seen so far, and the candidate pool from which the
        # default key of the next parameter is drawn (smallest unused one).
        int_keys = set()
        int_key_range = {1}
        self._push()
        while self._tokens:
            token = self._tokens.pop()
            if isinstance(token, tokens.TemplateParamSeparator):
                if not params:
                    # First separator: what was collected is the name.
                    name = self._pop()
                default = unicode(min(int_key_range - int_keys))
                param = self._handle_parameter(self._wrap([Text(default)]))
                if re.match(r"[1-9][0-9]*$", param.name.strip()):
                    # We try a more restrictive test for integers than
                    # try: int(), because "01" as a key will pass through
                    # int() correctly but is not a valid integer key in
                    # wikicode:
                    int_keys.add(int(unicode(param.name)))
                    int_key_range.add(len(int_keys) + 1)
                params.append(param)
            elif isinstance(token, tokens.TemplateClose):
                if not params:
                    # Template without parameters: the name is still
                    # sitting on the stack.
                    name = self._pop()
                return Template(name, params)
            else:
                self._write(self._handle_token(token))

    def _handle_entity(self):
        """Build an HTML entity and return it.

        Called after the ``HTMLEntityStart`` token has been consumed. Three
        token sequences are understood: a single token carrying the text
        (named entity), ``HTMLEntityNumeric`` followed by the text token
        (decimal entity), and ``HTMLEntityNumeric``, ``HTMLEntityHex`` and
        the text token (hexadecimal entity). In every case one trailing
        token is consumed as well.
        """
        token = self._tokens.pop()
        if isinstance(token, tokens.HTMLEntityNumeric):
            token = self._tokens.pop()
            if isinstance(token, tokens.HTMLEntityHex):
                text = self._tokens.pop()
                self._tokens.pop()  # Remove HTMLEntityEnd
                return HTMLEntity(text.text, named=False, hexadecimal=True,
                                  hex_char=token.char)
            self._tokens.pop()  # Remove HTMLEntityEnd
            return HTMLEntity(token.text, named=False, hexadecimal=False)
        self._tokens.pop()  # Remove HTMLEntityEnd
        return HTMLEntity(token.text, named=True, hexadecimal=False)

    def _handle_heading(self, token):
        """Build a heading and return it.

        *token* is the opening ``HeadingBlock`` token, which supplies the
        level. Everything up to the next ``HeadingBlock`` token becomes the
        title. Falls off the end (returning ``None``) if no such token
        follows.
        """
        level = token.level
        self._push()
        while self._tokens:
            token = self._tokens.pop()
            if isinstance(token, tokens.HeadingBlock):
                title = self._pop()
                return Heading(title, level)
            else:
                self._write(self._handle_token(token))

    def _handle_attribute(self):
        """Build a single tag attribute and return it.

        Called after a ``TagAttrStart`` token has been consumed. The
        attribute ends at the next ``TagAttrStart``, ``TagCloseOpen`` or
        ``TagCloseSelfclose`` token, which is pushed back for
        :meth:`_handle_tag` to handle. Falls off the end (returning
        ``None``) if the tokens run out first.
        """
        name, quoted = None, False
        self._push()
        while self._tokens:
            token = self._tokens.pop()
            if isinstance(token, tokens.TagAttrEquals):
                name = self._pop()
                self._push()
            elif isinstance(token, tokens.TagAttrQuote):
                quoted = True
            elif isinstance(token, (tokens.TagAttrStart,
                                    tokens.TagCloseOpen,
                                    tokens.TagCloseSelfclose)):
                # TagCloseSelfclose must end the attribute too; otherwise
                # the last attribute of a self-closing tag would swallow
                # the closing token and everything after it.
                self._tokens.append(token)
                if name is not None:
                    return Attribute(name, self._pop(), quoted)
                # No "=" was seen: what was collected is the name itself.
                return Attribute(self._pop(), quoted=quoted)
            else:
                self._write(self._handle_token(token))

    def _handle_tag(self, token):
        """Build a tag and return it.

        *token* is the opening ``TagOpenOpen`` token, which supplies the
        tag's type and ``showtag`` flag. The tag ends either at a
        ``TagCloseSelfclose`` token (self-closing tag) or at a
        ``TagCloseClose`` token (tag with contents).

        NOTE(review): ``tag``, ``open_pad`` and ``contents`` are only bound
        once ``TagCloseOpen`` / ``TagOpenClose`` have been seen, so this
        relies on the tokens arriving in the expected order.
        """
        type_, showtag = token.type, token.showtag
        attrs = []
        self._push()
        while self._tokens:
            token = self._tokens.pop()
            if isinstance(token, tokens.TagAttrStart):
                attrs.append(self._handle_attribute())
            elif isinstance(token, tokens.TagCloseOpen):
                open_pad = token.padding
                tag = self._pop()
                # From here on we are collecting the tag's contents.
                self._push()
            elif isinstance(token, tokens.TagCloseSelfclose):
                tag = self._pop()
                return Tag(type_, tag, attrs=attrs, showtag=showtag,
                           self_closing=True, open_padding=token.padding)
            elif isinstance(token, tokens.TagOpenClose):
                contents = self._pop()
            elif isinstance(token, tokens.TagCloseClose):
                return Tag(type_, tag, contents, attrs, showtag, False,
                           open_pad, token.padding)
            else:
                self._write(self._handle_token(token))

    def _handle_token(self, token):
        """Turn *token* into a node, consuming further tokens as needed.

        ``Text`` tokens map directly to ``Text`` nodes; tokens that open a
        template, HTML entity, heading or tag are dispatched to the
        matching handler. Any other token type yields ``None``.
        """
        if isinstance(token, tokens.Text):
            return Text(token.text)
        elif isinstance(token, tokens.TemplateOpen):
            return self._handle_template()
        elif isinstance(token, tokens.HTMLEntityStart):
            return self._handle_entity()
        elif isinstance(token, tokens.HeadingBlock):
            return self._handle_heading(token)
        elif isinstance(token, tokens.TagOpenOpen):
            return self._handle_tag(token)

    def build(self, tokenlist):
        """Build and return the wrapped node list described by *tokenlist*.

        *tokenlist* is consumed: it is reversed in place and tokens are
        popped off it as they are handled, so it is normally empty once
        this method returns.
        """
        self._tokens = tokenlist
        # Reverse once so that taking the next token (pop) and pushing one
        # back (append) both work on the tail of the list in O(1), instead
        # of shifting the whole list with pop(0) / insert(0, ...).
        self._tokens.reverse()
        self._push()
        while self._tokens:
            node = self._handle_token(self._tokens.pop())
            self._write(node)
        return self._pop()