import matplotlib.pyplot as plt
import re

def parse_test_line(line):
    """
    Parse one whitespace-separated data row of a test log.

    The first five fields must be a float, an int, a float, an int and
    the literal "Yes" or "No".  They are converted in place to float,
    int, float, int and bool (True for "Yes").  Any fields after the
    fifth stay in the returned list as unconverted strings.

    Returns the list of fields, or None when the line is not a data row
    (fewer than five fields, a field that does not convert, or a fifth
    field other than "Yes"/"No").
    """
    fields = line.rstrip().split()
    try:
        fields[0] = float(fields[0])
        fields[1] = int(fields[1])
        fields[2] = float(fields[2])
        fields[3] = int(fields[3])
        flag = fields[4]
    except (IndexError, ValueError):
        # Too few fields, or a field that is not numeric: not a data row.
        return None
    # Checked explicitly rather than with assert, which "python -O" strips.
    if flag not in ("Yes", "No"):
        return None
    fields[4] = (flag == "Yes")
    return fields

def parse_test_label(line):
    """
    Extract a parenthesised label from a line of the test log.

    The pattern is anchored at the start of the line and needs at least
    one character before an opening parenthesis, plus a closing
    parenthesis later on the same line.  Returns the captured text
    (which may be the empty string), or None when the line does not
    match.
    """
    found = re.match(r"..*\((.*)\)", line)
    return found.group(1) if found else None

def read_test(f):
    """
    Read the next test (a label line plus its data rows) from file f.

    Lines are skipped until parse_test_label finds a non-empty label,
    then skipped again until parse_test_line accepts one; the
    consecutive data rows from there on are collected.

    Returns (label, entries), where entries is the list of parsed rows.

    Raises EOFError (a subclass of Exception) if the file ends before
    both a label and a first data row have been found.

    NOTE(review): the first non-data line after the rows is read and
    discarded.  If that line is the next test's label, the following
    call will not see it -- confirm the log always has a separator line
    between tests.
    """
    line = f.readline()
    label = parse_test_label(line)
    while not label:
        line = f.readline()
        if line == "":
            raise EOFError("end of file")
        label = parse_test_label(line)

    # Each line is parsed once and the result reused; the label line
    # itself is the first candidate, as before.
    entry = parse_test_line(line)
    while not entry:
        line = f.readline()
        if line == "":
            raise EOFError("end of file")
        entry = parse_test_line(line)

    entries = []
    while entry:
        entries.append(entry)
        line = f.readline()
        if line == "":
            # End of file right after the last row is a normal ending.
            break
        entry = parse_test_line(line)
    return label, entries
        
def plot_tests(filename, colors, limit=None, alpha=1.0, linewidth=1):
    """
    Plot coding efficiency against -lg(p_A) for the tests in a log file.

    One test is read from the file (with read_test) per entry in colors
    and drawn as one curve, labelled with the test's label plus
    " (12-bit)".  The figure is shown once all curves are drawn.

    filename  -- path of the test log to read.
    colors    -- matplotlib format strings, one per test to plot.
    limit     -- if not None, a curve stops at the first entry whose
                 lg_p_A is below this value.
    alpha, linewidth -- passed to plt.plot for every curve.
    """
    y_lim = 0

    # The with-block closes the file even when read_test raises.
    with open(filename) as f:
        for color in colors:
            xs = []
            ys = []
            label, entries = read_test(f)
            for lg_p_A, n_sym, n_bits_ideal, n_bits_actual, does_match in entries:
                if limit is not None and lg_p_A < limit:
                    break

                x = -lg_p_A
                y = 100.0 * n_bits_ideal / n_bits_actual
                if y < y_lim:
                    # Clip the curve where it crosses y_lim: interpolate
                    # between the last stored point and this one.  With
                    # no stored point there is nothing to interpolate
                    # from, so the curve simply ends.
                    if xs:
                        x_prev, y_prev = xs[-1], ys[-1]
                        frac = (y_lim - y_prev) / (y - y_prev)
                        xs.append(x_prev + frac * (x - x_prev))
                        ys.append(y_prev + frac * (y - y_prev))
                    break

                xs.append(x)
                ys.append(y)
            plt.plot(xs, ys, color, label=(label + " (12-bit)"),
                     alpha=alpha, linewidth=linewidth)
            plt.xlabel("- lg ( p_A )")
            plt.ylabel("coding efficiency (%)")
            plt.legend(loc="lower left", framealpha=0.5)
    plt.show()


# Three views of the first three tests in test1_12.out, drawn with the
# matplotlib format strings "b", "r" and "g".
# 1) No limit, with wide half-transparent lines.
plot_tests("test1_12.out", ["b", "r", "g"], alpha=0.5, linewidth=2)
# 2) Same styling, each curve cut at its first entry with lg_p_A < -12.5.
plot_tests("test1_12.out", ["b", "r", "g"], limit=-12.5, 
           alpha=0.5, linewidth=2)
# 3) Cut at lg_p_A < -11.5, with the default alpha and line width.
plot_tests("test1_12.out", ["b", "r", "g"], limit=-11.5)


from walrus_piece import *

def transitions_const_p_A(coder_nbits, p_A):
    """
    Build the coder's state-transition table for a constant p_A.

    States are widths.  Exploration starts at the full width
    (1 << coder_nbits) and expands every width reachable from it.  Each
    expanded width contributes two tuples
        (width, probability, next_width, n_bits)
    to the returned list: a walrus transition, then an eggman
    transition.  p_A must not exceed .5.
    """
    assert p_A <= .5

    top = 1 << coder_nbits
    # p_A scaled by P_A_STOP and rounded to the nearest integer.
    scaled_p_A = int(p_A * P_A_STOP + .5)
    pending = {top}     # widths still to expand
    visited = set()     # widths already expanded
    table = []
    while pending:
        width = pending.pop()

        # Smallest shift for which (top >> shift) no longer exceeds width.
        shift = 0
        while (top >> shift) > width:
            shift += 1

        walrus_len, w, e = choose_walrus_len(scaled_p_A, "A", "B",
                                             coder_nbits, width, shift)
        walrus_width = top >> walrus_len
        if w == "A":
            walrus_prob = p_A
            eggman_prob = 1.0 - p_A
        else:
            walrus_prob = 1.0 - p_A
            eggman_prob = p_A

        # Walrus transition: always returns to the start state.
        table.append((width, walrus_prob, top, walrus_len))
        successors = {top}

        # Eggman transition.  When the width left over is top >> i for
        # some i in shift..coder_nbits, the coder goes back to the start
        # state emitting i bits; otherwise it moves to the leftover
        # width and emits nothing.
        remainder = width - walrus_width
        shift_up = next((i for i in range(shift, coder_nbits + 1)
                         if remainder == top >> i), None)
        if shift_up is not None:
            table.append((width, eggman_prob, top, shift_up))
        else:
            assert remainder > 1, (width, walrus_len, remainder, shift)
            table.append((width, eggman_prob, remainder, 0))
            successors.add(remainder)

        visited.add(width)
        for state in successors:
            if state not in visited:
                pending.add(state)
    return table

# Show the 12-bit transition table for a few fixed values of p_A, each
# followed by a blank line.  A parenthesised single argument prints the
# same text under the Python 2 print statement and the Python 3 print
# function; print("") replaces the bare "print", which is a silent
# no-op on Python 3.
print(transitions_const_p_A(12, .5))
print("")
print(transitions_const_p_A(12, .376))
print("")
print(transitions_const_p_A(12, .374))
print("")
print(transitions_const_p_A(12, .25))
print("")

[(4096, 0.5, 4096, 1), (4096, 0.5, 4096, 1)]

[(4096, 0.624, 4096, 1), (4096, 0.376, 4096, 1)]

[(4096, 0.374, 4096, 2), (4096, 0.626, 3072, 0), (3072, 0.626, 4096, 1), (3072, 0.374, 4096, 2)]

[(4096, 0.25, 4096, 2), (4096, 0.75, 3072, 0), (3072, 0.75, 4096, 1), (3072, 0.25, 4096, 2)]


from collections import Counter, defaultdict
from math import log # fer chrissakes.

def trans_tree_to_loops(transitions):
    """
    Flatten a transition tree into its loops through the start state.

    transitions is a list of
        (in_state, prob, out_state, n_bits)
    tuples.  The start state is the highest-numbered in_state.  Apart
    from transitions back to the start state, the graph must be a tree:
    every other state is entered by exactly one transition.

    Returns a list with one tuple per path that leaves the start state
    and comes back to it:
        (probability, n_syms, n_bits)
    where probability is the product of the probabilities along the
    path, n_syms the number of transitions taken and n_bits the sum of
    their n_bits.  The order of the list is not specified.
    """
    outgoing = defaultdict(list)
    for src, prob, dst, bits in transitions:
        outgoing[src].append((prob, dst, bits))
    states = list(outgoing.keys())
    root = max(states)

    # Tree check: as many distinct targets as sources, and every state
    # other than the root has exactly one incoming transition.
    incoming = Counter(tran[2] for tran in transitions)
    assert len(outgoing) == len(incoming)
    for state in states:
        if state != root:
            assert incoming[state] == 1

    loops = []
    # Work set of partial paths: (state reached, prob, n_syms, n_bits).
    frontier = {(root, 1.0, 0, 0)}
    while frontier:
        here, path_prob, path_syms, path_bits = frontier.pop()
        for step_prob, there, step_bits in outgoing[here]:
            reached = (path_prob * step_prob,
                       path_syms + 1,
                       path_bits + step_bits)
            if there == root:
                loops.append(reached)
            else:
                frontier.add((there,) + reached)
    return loops

def loops_demo(p_A, coder_nbits=12):
    """
    Print a table of loops for the given p_A.

    One row is printed per loop that trans_tree_to_loops finds in
    transitions_const_p_A(coder_nbits, p_A): the loop's probability,
    symbols in, bits out, probability-weighted bits, entropy (-log2 of
    the probability) and probability-weighted entropy.  A totals row
    follows, then the expected efficiency (total weighted entropy over
    total weighted bits) and the worst-case efficiency (the smallest
    entropy / bits ratio of any loop, never reported above 1.0).
    """
    def emit(*items):
        # Same text as the Python 2 statement "print a, b, ...": the
        # str() of each item joined by single spaces.  One parenthesised
        # argument keeps the call valid on both Python 2 and Python 3.
        print(" ".join(str(item) for item in items))

    trans = transitions_const_p_A(coder_nbits, p_A)
    loops = trans_tree_to_loops(trans)
    emit("Loops for fixed p_A ==", p_A)
    fmt1 = "%8f  |%6d  |  %4i  %8f  |  %8.5f  %8f"   # one loop per row
    fmt2 = "%8f  |%6s  |  %4s  %8f  |  %8s  %8f"     # totals row
    fmt0 = "%8s  |%6s  |  %4s  %8s  |  %8s  %8s"     # header rows
    emit(fmt0 % ("", "syms", "bits", "", "", ""))
    emit(fmt0 % ("prob", "in ", "out", "weighted", "entropy", "weighted"))
    horiz_line = "----------+--------+------------------+--------------------"
    emit(horiz_line)
    weighted_n_bits = 0.0
    weighted_entropy = 0.0
    total_prob = 0.0
    worst_effish = 1.0
    for prob, n_syms, n_bits in loops:
        entropy = -log(prob, 2)
        emit(fmt1 % (prob, n_syms, n_bits, prob * n_bits, entropy, prob * entropy))
        weighted_n_bits += prob * n_bits
        weighted_entropy += prob * entropy
        worst_effish = min(worst_effish, entropy / n_bits)
        total_prob += prob
    emit(horiz_line)
    emit(fmt2 % (total_prob, "", "", weighted_n_bits, "", weighted_entropy))
    emit()
    emit("expected efficiency:", weighted_entropy / weighted_n_bits)
    emit("worst-case efficiency:", worst_effish)
    
# Print the loop table for a range of fixed p_A values, with a blank
# line after each.  print("") replaces the bare Python 2 "print", which
# is a silent no-op on Python 3; on Python 2 it prints the same blank
# line.
loops_demo(.376)
print("")

loops_demo(.374)
print("")

loops_demo(.333)
print("")

loops_demo(.26)
print("")

loops_demo(.24)
print("")

loops_demo(.125)
print("")

Loops for fixed p_A == 0.376
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.624000  |     1  |     1  0.624000  |   0.68038  0.424558
0.376000  |     1  |     1  0.376000  |   1.41120  0.530609
----------+--------+------------------+--------------------
1.000000  |        |        1.000000  |            0.955168

expected efficiency: 0.955167891861
worst-case efficiency: 0.6803820658

Loops for fixed p_A == 0.374
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.374000  |     1  |     2  0.748000  |   1.41889  0.530665
0.391876  |     2  |     1  0.391876  |   1.35153  0.529633
0.234124  |     2  |     2  0.468248  |   2.09466  0.490409
----------+--------+------------------+--------------------
1.000000  |        |        1.608124  |            1.550706

expected efficiency: 0.964295276046
worst-case efficiency: 0.709444912387

Loops for fixed p_A == 0.333
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.333000  |     1  |     2  0.666000  |   1.58641  0.528273
0.444889  |     2  |     1  0.444889  |   1.16848  0.519845
0.222111  |     2  |     2  0.444222  |   2.17065  0.482125
----------+--------+------------------+--------------------
1.000000  |        |        1.555111  |            1.530243

expected efficiency: 0.984008786099
worst-case efficiency: 0.793202958795

Loops for fixed p_A == 0.26
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.260000  |     1  |     2  0.520000  |   1.94342  0.505288
0.547600  |     2  |     1  0.547600  |   0.86881  0.475758
0.192400  |     2  |     2  0.384800  |   2.37782  0.457492
----------+--------+------------------+--------------------
1.000000  |        |        1.452400  |            1.438539

expected efficiency: 0.990456271094
worst-case efficiency: 0.868805648292

Loops for fixed p_A == 0.24
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.240000  |     1  |     2  0.480000  |   2.05889  0.494134
0.182400  |     2  |     3  0.547200  |   2.45482  0.447760
0.438976  |     3  |     1  0.438976  |   1.18779  0.521410
0.138624  |     3  |     3  0.415872  |   2.85075  0.395183
----------+--------+------------------+--------------------
1.000000  |        |        1.882048  |            1.858486

expected efficiency: 0.987480742834
worst-case efficiency: 0.818274121795

Loops for fixed p_A == 0.125
          |  syms  |  bits            |                    
    prob  |   in   |   out  weighted  |   entropy  weighted
----------+--------+------------------+--------------------
0.125000  |     1  |     3  0.375000  |   3.00000  0.375000
0.109375  |     2  |     3  0.328125  |   3.19265  0.349196
0.095703  |     3  |     3  0.287109  |   3.38529  0.323983
0.083740  |     4  |     4  0.334961  |   3.57794  0.299617
0.512909  |     5  |     1  0.512909  |   0.96323  0.494047
0.073273  |     5  |     4  0.293091  |   3.77058  0.276281
----------+--------+------------------+--------------------
1.000000  |        |        2.131195  |            2.118123

expected efficiency: 0.993866351017
worst-case efficiency: 0.894483808457


def loops_performance(loops):
    """
    Returns expected efficiency, worst-case efficiency,
    and expected bits/symbol.

    loops is a list of (probability, n_syms, n_bits) tuples, as built
    by trans_tree_to_loops.  With entropy = -log2(probability):
      * expected efficiency is sum(prob * entropy) / sum(prob * n_bits);
      * worst-case efficiency is the smallest entropy / n_bits of any
        loop, starting from 1.0, so it is never above 1.0;
      * expected bits/symbol is sum(prob * n_bits) / sum(prob * n_syms).
    """
    weighted_n_bits = 0.0
    weighted_entropy = 0.0
    weighted_n_syms = 0.0
    worst_effish = 1.0
    for (prob, n_syms, n_bits) in loops:
        entropy = -log(prob, 2)
        weighted_n_bits += prob * n_bits
        weighted_entropy += prob * entropy
        weighted_n_syms += prob * n_syms
        worst_effish = min(worst_effish, entropy / n_bits)
    return (weighted_entropy / weighted_n_bits, worst_effish,
            weighted_n_bits / weighted_n_syms)

def performance_graph(graph_type, coder_nbits=12,
                      x_axis_type="log", y_axis_type="linear",
                      lg_p_A_start=-1.0, lg_p_A_stop=-4.0,
                      lg_p_A_step=-.01):
    """
    Plot the modelled performance of the coder over a sweep of p_A.

    graph_type   -- "bits/sym" (expected bits per symbol, plus the ideal
                    binary entropy), "efficiency" (expected and
                    worst-case, in percent) or "inefficiency" (one minus
                    each efficiency; points whose expected efficiency is
                    exactly 1.0 are left out).  Anything else raises
                    ValueError.
    coder_nbits  -- coder width passed to transitions_const_p_A.
    x_axis_type  -- "log" plots against -lg(p_A); any other value plots
                    against p_A on an inverted x axis.
    y_axis_type  -- "log" selects a base-2 logarithmic y axis; any other
                    value a linear one.
    lg_p_A_start, lg_p_A_stop, lg_p_A_step -- the range of lg(p_A)
                    values, handed to arange.

    NOTE(review): arange is not imported in the visible part of this
    file; presumably it arrives through a star import or pylab --
    confirm.
    """
    if graph_type == "bits/sym":
        title_fmt = "%d-bit pessimistic walrus expected bits per symbol"
        ylabel = "bits/sym"
    elif graph_type == "efficiency":
        title_fmt = "%d-bit pessimistic walrus coding efficiency"
        ylabel = "coding efficiency (%)"
    elif graph_type == "inefficiency":
        title_fmt = "%d-bit pessimistic walrus coding inefficiency"
        ylabel = "coding inefficiency (fraction)"
    else:
        raise ValueError(str(graph_type) + " isn't a valid graph_type")
    title = title_fmt % coder_nbits
    log_x = (x_axis_type == "log")

    plt.figure(figsize=(6, 6), dpi=75)
    xs, ys, ys_worst, ys_ideal = [], [], [], []
    for lg_p_A in arange(lg_p_A_start, lg_p_A_stop, lg_p_A_step):
        p_A = 2 ** lg_p_A
        loops = trans_tree_to_loops(transitions_const_p_A(coder_nbits, p_A))
        expected_effish, worst_effish, expected_bits_per_sym = \
            loops_performance(loops)

        # Store the y value(s) for this p_A, or skip the point entirely.
        if graph_type == "bits/sym":
            ys.append(expected_bits_per_sym)
            ideal = -log(p_A, 2) * p_A - log(1 - p_A, 2) * (1 - p_A)
            ys_ideal.append(ideal)
        elif graph_type == "efficiency":
            ys.append(100.0 * expected_effish)
            ys_worst.append(100.0 * worst_effish)
        else:
            # graph_type was validated above, so this is "inefficiency".
            if expected_effish == 1.0:
                continue
            ys.append(1.0 - expected_effish)
            ys_worst.append(1.0 - worst_effish)

        # Only reached for points that were kept: store the matching x.
        xs.append(-lg_p_A if log_x else p_A)

    plt.title(title)
    if log_x:
        plt.xlabel("- lg ( p_A )")
    else:
        plt.xlabel("p_A")
        plt.gca().invert_xaxis()
    if y_axis_type == "log":
        plt.yscale("log", basey=2)
    else:
        plt.yscale("linear")

    # A single point drawn in white ("w") 2% above the highest expected
    # value -- apparently there to leave headroom above the curve.
    ymax = max(ys)
    plt.plot(xs[:1], [ymax * 1.02], "w")

    plt.ylabel(ylabel)
    plt.plot(xs, ys, "g", label="expected")
    if ys_worst:
        plt.plot(xs, ys_worst, "r", label="worst-case")
        plt.legend(loc="lower left", framealpha=0.5)
    if ys_ideal:
        plt.plot(xs, ys_ideal, "b", label="ideal")
        plt.legend(loc="lower left", framealpha=0.5)
    plt.show()

# Graphs produced for the default 12-bit coder.  The commented-out calls
# are alternative views that are currently disabled.
# performance_graph("bits/sym", coder_nbits=4,
#                   lg_p_A_stop=-6.0, lg_p_A_step=-.05, 
#                   x_axis_type="log", y_axis_type="log")
# Expected and worst-case efficiency for lg(p_A) from -1 down to -13.
performance_graph("efficiency", lg_p_A_stop=-13.0)
# The same sweep as inefficiency, starting at lg(p_A) = -1.1, on a
# logarithmic y axis.
performance_graph("inefficiency", lg_p_A_start=-1.1, lg_p_A_stop=-13.0, 
                  y_axis_type="log")
# performance_graph("efficiency", lg_p_A_start=-1.0, lg_p_A_stop=-5.0,
#                   lg_p_A_step=-.002, x_axis_type="log")
# Expected versus ideal bits per symbol for lg(p_A) from -1 down to -2.5.
performance_graph("bits/sym", lg_p_A_stop=-2.5, y_axis_type="linear")
# Expected versus ideal bits per symbol for lg(p_A) from -11 down to
# -16, in steps of -.05, on a logarithmic y axis.
performance_graph("bits/sym", lg_p_A_start=-11.0, lg_p_A_stop=-16.0,
                  lg_p_A_step=-.05, 
                  x_axis_type="log", y_axis_type="log")

Walrus coder vs. Arithmetic coder Efficiency Comparisons

Empirical tests using `test1_12.out`

Generating Markov models for constant p_A

Transition table format

From transitions to loops

Walrus coder vs. Arithmetic coder Efficiency Comparisons

Empirical tests using `test1_12.out`

Generating Markov models for constant p_A

Transition table format

From transitions to loops

Empirical tests using `test1_12.out`