|
- # -*- coding: utf-8 -*-
- #
- # Copyright (C) 2012 Ben Kurtovic <ben.kurtovic@verizon.net>
- #
- # Permission is hereby granted, free of charge, to any person obtaining a copy
- # of this software and associated documentation files (the "Software"), to deal
- # in the Software without restriction, including without limitation the rights
- # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
- # copies of the Software, and to permit persons to whom the Software is
- # furnished to do so, subject to the following conditions:
- #
- # The above copyright notice and this permission notice shall be included in
- # all copies or substantial portions of the Software.
- #
- # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- # SOFTWARE.
-
- import re
-
- from . import tokens
- from ..nodes import Heading, HTMLEntity, Tag, Template, Text
- from ..nodes.extras import Attribute, Parameter
- from ..smart_list import SmartList
- from ..wikicode import Wikicode
-
- __all__ = ["Builder"]
-
class Builder(object):
    """Combine a flat list of tokens into a tree of wikicode nodes.

    The builder keeps two pieces of state: ``_tokens``, the list of tokens
    still to be consumed (always read from the front), and ``_stacks``, a
    stack of node lists. Each nested construct (template, parameter, heading,
    tag, attribute) pushes a fresh node list while it is being assembled and
    pops it when the matching closing token is reached.
    """

    def __init__(self):
        self._tokens = []
        self._stacks = []

    def _wrap(self, nodes):
        """Return *nodes* wrapped in a ``Wikicode`` backed by a ``SmartList``."""
        return Wikicode(SmartList(nodes))

    def _push(self):
        """Start collecting nodes on a new, empty stack."""
        self._stacks.append([])

    def _pop(self, wrap=True):
        """Remove and return the current stack.

        If *wrap* is true (the default) the node list is returned wrapped via
        ``_wrap()``; otherwise the raw list is returned.
        """
        if wrap:
            return self._wrap(self._stacks.pop())
        return self._stacks.pop()

    def _write(self, item):
        """Append *item* to the current stack."""
        self._stacks[-1].append(item)

    def _handle_parameter(self, key):
        """Build one template ``Parameter``, using *key* as its default name.

        If a ``TemplateParamEquals`` token is seen, everything collected so
        far becomes the key (replacing *key*) and ``showkey`` is set. The
        terminating ``TemplateParamSeparator``/``TemplateClose`` token is put
        back on the token list so that the caller can act on it.

        Returns ``None`` implicitly if the tokens run out first.
        """
        showkey = False
        self._push()
        while self._tokens:
            token = self._tokens.pop(0)
            if isinstance(token, tokens.TemplateParamEquals):
                key = self._pop()
                showkey = True
                self._push()
            elif isinstance(token, (tokens.TemplateParamSeparator,
                                    tokens.TemplateClose)):
                self._tokens.insert(0, token)
                value = self._pop()
                return Parameter(key, value, showkey)
            else:
                self._write(self._handle_token(token))

    def _handle_template(self):
        """Build a ``Template`` from the tokens following a ``TemplateOpen``.

        Parameters without an explicit key are given the lowest positive
        integer not already used as a key.

        Returns ``None`` implicitly if the tokens run out before a
        ``TemplateClose`` is found.
        """
        params = []
        int_keys = set()
        # Invariant: contains every integer in 1..len(int_keys)+1, so the set
        # difference below always has at least one candidate.
        int_key_range = {1}
        self._push()
        while self._tokens:
            token = self._tokens.pop(0)
            if isinstance(token, tokens.TemplateParamSeparator):
                if not params:
                    # First separator: what was collected so far is the name.
                    name = self._pop()
                # NOTE: ``unicode`` is the Python 2 builtin text type.
                default = unicode(min(int_key_range - int_keys))
                param = self._handle_parameter(self._wrap([Text(default)]))
                if re.match(r"[1-9][0-9]*$", param.name.strip()):
                    # We try a more restrictive test for integers than
                    # try: int(), because "01" as a key will pass through
                    # int() correctly but is not a valid integer key in
                    # wikicode:
                    int_keys.add(int(unicode(param.name)))
                    int_key_range.add(len(int_keys) + 1)
                params.append(param)
            elif isinstance(token, tokens.TemplateClose):
                if not params:
                    # No parameters at all: the stack holds only the name.
                    name = self._pop()
                return Template(name, params)
            else:
                self._write(self._handle_token(token))

    def _handle_entity(self):
        """Build an ``HTMLEntity`` from the tokens after ``HTMLEntityStart``.

        Three token layouts are handled: named (one text token), decimal
        numeric (``HTMLEntityNumeric`` then text) and hexadecimal numeric
        (``HTMLEntityNumeric``, ``HTMLEntityHex``, then text). In every case
        the token following the text is consumed as the end marker.
        """
        token = self._tokens.pop(0)
        if isinstance(token, tokens.HTMLEntityNumeric):
            token = self._tokens.pop(0)
            if isinstance(token, tokens.HTMLEntityHex):
                text = self._tokens.pop(0)
                self._tokens.pop(0)  # Remove HTMLEntityEnd
                return HTMLEntity(text.text, named=False, hexadecimal=True,
                                  hex_char=token.char)
            self._tokens.pop(0)  # Remove HTMLEntityEnd
            return HTMLEntity(token.text, named=False, hexadecimal=False)
        self._tokens.pop(0)  # Remove HTMLEntityEnd
        return HTMLEntity(token.text, named=True, hexadecimal=False)

    def _handle_heading(self, token):
        """Build a ``Heading`` whose level is taken from the opening *token*.

        Nodes are collected until the next ``HeadingBlock`` token, which
        closes the heading. Returns ``None`` implicitly if the tokens run out
        first.
        """
        level = token.level
        self._push()
        while self._tokens:
            token = self._tokens.pop(0)
            if isinstance(token, tokens.HeadingBlock):
                title = self._pop()
                return Heading(title, level)
            else:
                self._write(self._handle_token(token))

    def _handle_attribute(self):
        """Build one tag ``Attribute`` following a ``TagAttrStart`` token.

        The attribute ends at the next ``TagAttrStart``, ``TagCloseOpen`` or
        ``TagCloseSelfclose`` token, which is put back on the token list for
        ``_handle_tag()`` to process. If no ``TagAttrEquals`` was seen, the
        collected nodes are used as the attribute's name and no value is
        passed.

        Returns ``None`` implicitly if the tokens run out first.
        """
        name, quoted = None, False
        self._push()
        while self._tokens:
            token = self._tokens.pop(0)
            if isinstance(token, tokens.TagAttrEquals):
                name = self._pop()
                self._push()
            elif isinstance(token, tokens.TagAttrQuote):
                quoted = True
            elif isinstance(token, (tokens.TagAttrStart,
                                    tokens.TagCloseOpen,
                                    tokens.TagCloseSelfclose)):
                # TagCloseSelfclose must end the attribute as well; otherwise
                # the last attribute of a self-closing tag would swallow the
                # closing token and everything after it.
                self._tokens.insert(0, token)
                if name is not None:
                    return Attribute(name, self._pop(), quoted)
                return Attribute(self._pop(), quoted=quoted)
            else:
                self._write(self._handle_token(token))

    def _handle_tag(self, token):
        """Build a ``Tag`` from the tokens following the ``TagOpenOpen`` *token*.

        Token sequence for a regular tag: tag name nodes, zero or more
        attributes, ``TagCloseOpen``, content nodes, ``TagOpenClose``,
        (closing tag name), ``TagCloseClose``. A self-closing tag ends at
        ``TagCloseSelfclose`` instead.

        Returns ``None`` implicitly if the tokens run out first.
        """
        type_, showtag = token.type, token.showtag
        attrs = []
        self._push()
        while self._tokens:
            token = self._tokens.pop(0)
            if isinstance(token, tokens.TagAttrStart):
                attrs.append(self._handle_attribute())
            elif isinstance(token, tokens.TagCloseOpen):
                open_pad = token.padding
                tag = self._pop()
                self._push()
            elif isinstance(token, tokens.TagCloseSelfclose):
                tag = self._pop()
                return Tag(type_, tag, attrs=attrs, showtag=showtag,
                           self_closing=True, open_padding=token.padding)
            elif isinstance(token, tokens.TagOpenClose):
                contents = self._pop()
                # Collect whatever appears inside the closing tag on a
                # scratch stack so it cannot leak into the enclosing stack.
                self._push()
            elif isinstance(token, tokens.TagCloseClose):
                # Drop the scratch stack holding the closing tag's own nodes;
                # Tag is built from the opening tag's name.
                self._pop(wrap=False)
                return Tag(type_, tag, contents, attrs, showtag, False,
                           open_pad, token.padding)
            else:
                self._write(self._handle_token(token))

    def _handle_token(self, token):
        """Dispatch *token* to its handler and return the resulting node.

        Returns ``None`` implicitly for any token type not listed here.
        """
        if isinstance(token, tokens.Text):
            return Text(token.text)
        elif isinstance(token, tokens.TemplateOpen):
            return self._handle_template()
        elif isinstance(token, tokens.HTMLEntityStart):
            return self._handle_entity()
        elif isinstance(token, tokens.HeadingBlock):
            return self._handle_heading(token)
        elif isinstance(token, tokens.TagOpenOpen):
            return self._handle_tag(token)

    def build(self, tokenlist):
        """Build and return a ``Wikicode`` tree from *tokenlist*.

        *tokenlist* is consumed in place: tokens are popped from its front
        until it is empty.
        """
        self._tokens = tokenlist
        self._push()
        while self._tokens:
            node = self._handle_token(self._tokens.pop(0))
            self._write(node)
        return self._pop()
|