[temp] ~stack tokenizer

2013-08-04 16:30:06 +02:00 · 2013-08-04 16:30:06 +02:00 · 3dc85536ad
commit 3dc85536ad
parent aa740e8a4a
1 changed files with 129 additions and 2 deletions
--- a/tests/test_core_util.py
+++ b/tests/test_core_util.py
@ -239,6 +239,130 @@ class KeyConstraintDictAdvancedTests(unittest.TestCase):
        del kcd["foo"]
        assert kcd.missing() == set(["foo"])
 import re
 def formatp(string, **kwargs):
    """
    Function for advanced format strings with partial formatting
    This function consumes format strings with groups enclosed in brackets. A
    group enclosed in brackets will only become part of the result if all fields
    inside the group evaluate True in boolean contexts.
    Groups can be nested. The fields in a nested group do not count as fields in
    the enclosing group, i.e. the enclosing group will evaluate to an empty
    string even if a nested group would be eligible for formatting. Nesting is
    thus equivalent to a logical or of all enclosing groups with the enclosed
    group.
    Escaped brackets, i.e. \[ and \] are copied verbatim to output.
    """
    class Token:
        def __repr__(self):
            return "<%s> " % self.__class__.__name__
    class OpeningBracket(Token):
        def __repr__(self):
            return "<Group>"
    class ClosingBracket(Token):
        def __repr__(self):
            return "</Group>"
    class String(Token):
        def __init__(self, str):
            self.string = str
        def __repr__(self):
            return super().__repr__() + repr(self.string)
    TOKENS = {
        "[": OpeningBracket,
        "]": ClosingBracket,
    }
    print("==")
    print(string)
    print("==")
    stack = []
    # Index of next unconsumed char
    next = 0
    # Last consumed char
    prev = ""
    # Current char
    char = ""
    while next < len(string):
        prev = char
        char = string[next]
        next += 1
        if prev != "\\" and char in TOKENS:
            token = TOKENS[char]()
            token.index = next
            stack.append(token)
        else:
            if stack and isinstance(stack[-1], String):
                stack[-1].string += c
            else:
                stack.append(String(c))
    print("-----")
    print("Dumping decomposition of")
    print(string)
    print("----")
    output = ""
    i = 0
    for token in stack:
        if token.__class__ == ClosingBracket:
            i-=1
        print("  " * i, repr(token))
        if token.__class__ == OpeningBracket:
            i+=1
    print("----")
    """pbracket = formatp.obracket_re.search(string)
    if not pbracket:
        return string.format(**kwargs)
    pbracket = pbracket.start()
    sbracket = list(formatp.cbracket_re.finditer(string))[-1].end()-1
    prefix = string[:pbracket].format(**kwargs)
    suffix = string[sbracket+1:].format(**kwargs)
    string = string[pbracket+1:sbracket]
    while True:
        b = formatp.obracket_re.search(string)
        e = list(formatp.cbracket_re.finditer(string))
        if b and e:
            b = b.start()
            e = e[-1].end()
            string = string[:b] + formatp(string[b:e], **kwargs) + string[e:]
        else:
            break
    fields = formatp.field_re.findall(string)
    successful_fields = 0
    for fieldspec, fieldname in fields:
        if kwargs.get(fieldname, False):
            successful_fields += 1
    if successful_fields != len(fields):
        return prefix + suffix
    else:
        string = string.replace("\[", "[").replace("\]", "]")
        return prefix + string.format(**kwargs) + suffix"""
 formatp.field_re = re.compile(r"({(\w+)[^}]*})")
 formatp.obracket_re = re.compile(r"(?<!\\)\[")
 formatp.cbracket_re = re.compile(r"(?<!\\)\]")
 util.formatp = formatp
 class FormatPTests(unittest.TestCase):
    def test_escaping(self):
        assert util.formatp("[razamba \[ mabe \]]") == "razamba [ mabe ]"
@ -264,5 +388,8 @@ class FormatPTests(unittest.TestCase):
        assert util.formatp("[{t}]grml") == "grml"
    def test_generic(self):
-        s = "{status} [{artist} / {album} / ]{title}[ {song_elapsed}/{song_length}]"
+        s = "{status} [{artist} / [{album} / ]]{title}[ {song_elapsed}/{song_length}]"
-        assert util.formatp(s, status="▷", title="Only For The Weak", song_elapsed="1:41", song_length="4:55") == "▷ Only For The Weal 1:41/4:55"
+        assert util.formatp(s, status="▷", title="Only For The Weak", song_elapsed="1:41", song_length="4:55") == "▷ Only For The Weak 1:41/4:55"
 fpt = FormatPTests()
 fpt.test_generic()