from flippy import infer, condition, keep_deterministic, mem, \
    Categorical
from flippy.distributions import Dirichlet
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
from frozendict import frozendict

# The inverse temperature controls the sharpness of the right-hand-side
# expansion probabilities: every Dirichlet weight is raised to this power
# before the expansion probabilities are sampled. When rules that branch have
# lower Dirichlet weights than rules that do not, a higher inverse temperature
# leads to a bias towards shorter rules.
inv_temp = 1.0

# We set a maximum depth for expressions to avoid generating extremely large
# programs. BOOL conditions on `depth < max_depth` each time it is expanded.
max_depth = 5

@mem
def expansion_dist(rhs_probs: dict) -> Categorical:
    # Build the distribution over right-hand-side expansions of one rule.
    # `rhs_probs` maps each expansion symbol to a positive weight; the weights
    # are tempered by the module-level `inv_temp` and used as Dirichlet
    # parameters, so the returned Categorical has sampled (not fixed)
    # probabilities over the same symbols.
    symbols = list(rhs_probs.keys())
    tempered_weights = [weight**inv_temp for weight in list(rhs_probs.values())]
    sampled_probs = Dirichlet(tempered_weights).sample()
    return Categorical(symbols, probabilities=sampled_probs)

def simple_boolean():
    # Sample one boolean concept from a small probabilistic grammar and return
    # it as the source text of a one-argument lambda ("lambda x: ...").
    # Nothing is evaluated here; the result is a plain string.
    #
    # Grammar:
    #   START     -> lambda x: BOOL
    #   BOOL      -> (BOOL or BOOL) | (BOOL and BOOL) | not BOOL | PREDICATE(x)
    #   PREDICATE -> equality test on the 'color', 'shape' or 'size' entry
    #
    # The numbers in each dict below are the weights handed to
    # `expansion_dist`, which turns them into expansion probabilities.
    # NOTE(review): `expansion_dist` is wrapped in `mem`, so presumably every
    # expansion of the same rule shares one sampled probability vector --
    # confirm against flippy's `mem` semantics.
    def PREDICATE():
        # First pick which feature is tested, then which value it must equal.
        # Returns the source of a parenthesised lambda over `obj`.
        feature_dist = expansion_dist({
            "SIZE": 2.0,
            "SHAPE": 1.4,
            "COLOR": 1.9,
        })
        attribute = feature_dist.sample()
        if attribute == 'COLOR':
            color_dist = expansion_dist({
                "yellow": .6,
                "green": .5,
                "blue": 1.5
            })
            return f"(lambda obj: obj['color'] == '{color_dist.sample()}')"
        elif attribute == 'SHAPE':
            shape_dist = expansion_dist({
                "triangle": 1.0,
                "rectangle": 0.4,
                "circle": 1.9
            })
            return f"(lambda obj: obj['shape'] == '{shape_dist.sample()}')"
        elif attribute == 'SIZE':
            size_dist = expansion_dist({
                "large": 1.0,
                "medium": 0.3,
                "small": 1,
            })
            return f"(lambda obj: obj['size'] == '{size_dist.sample()}')"

    def BOOL(depth):
        # Enforce the depth bound before sampling anything at this level.
        condition(depth < max_depth)
        bool_dist = expansion_dist({
            "or": 1.,
            "and": 0.25,
            "not": 2.0,
            "PREDICATE": 1.6,
        })
        symbol = bool_dist.sample()
        if symbol in ("or", "and"):
            # Binary connectives are parenthesised; the left operand is
            # expanded before the right one.
            expr = f"({BOOL(depth+1)} {symbol} {BOOL(depth+1)})"
        elif symbol == "not":
            # No parentheses are added: the operand is a predicate call, a
            # parenthesised binary expression, or another `not` (which the
            # condition below rules out).
            expr = f"not {BOOL(depth+1)}"
        elif symbol == "PREDICATE":
            # Apply the sampled predicate to the concept's argument `x`.
            expr = f"{PREDICATE()}(x)"
        # Avoid some trivial cases: a directly nested negation shows up as the
        # substring "not not" and is conditioned away.
        condition("not not" not in expr)
        return expr

    def START(depth):
        # Wrap the boolean body in the outer lambda; BOOL is entered one level
        # deeper than START.
        return f"lambda x: {BOOL(depth+1)}"

    # START is called with depth 0, so the top-level BOOL runs at depth 1.
    expr = START(0)
    return expr

def print_sorted_dist(dist, top=None):
    """Print a distribution's outcomes as a table, most probable first.

    Args:
        dist: Object exposing ``support`` (an iterable of outcomes) and
            ``prob(outcome)`` returning that outcome's probability.
        top: If given, print only the first ``top`` rows; ``None`` prints
            every outcome.
    """
    ranked = [(outcome, dist.prob(outcome)) for outcome in dist.support]
    # Stable descending sort: equally likely outcomes keep their support order.
    ranked.sort(key=lambda row: row[1], reverse=True)
    print("Prob\tExpression")
    # Slicing with None keeps the whole list, so no separate branch is needed.
    for outcome, probability in ranked[:top]:
        print(f"{probability:.4f}\t{outcome}")

# Approximate the distribution over concept strings defined by
# `simple_boolean` using 30 likelihood-weighted samples (fixed seed), then
# print every distinct expression found, most probable first.
dist = infer(method="LikelihoodWeighting", samples=30, seed=42)(simple_boolean)()
print_sorted_dist(dist)

Prob	Expression
0.2941	lambda x: (lambda obj: obj['color'] == 'blue')(x)
0.1765	lambda x: not (lambda obj: obj['color'] == 'blue')(x)
0.1765	lambda x: not (lambda obj: obj['size'] == 'large')(x)
0.0588	lambda x: (lambda obj: obj['size'] == 'medium')(x)
0.0588	lambda x: not (lambda obj: obj['shape'] == 'circle')(x)
0.0588	lambda x: (lambda obj: obj['shape'] == 'circle')(x)
0.0588	lambda x: ((lambda obj: obj['color'] == 'blue')(x) or ((lambda obj: obj['color'] == 'blue')(x) and ((lambda obj: obj['shape'] == 'triangle')(x) and (lambda obj: obj['size'] == 'small')(x))))
0.0588	lambda x: (lambda obj: obj['size'] == 'large')(x)
0.0588	lambda x: ((lambda obj: obj['size'] == 'small')(x) or (lambda obj: obj['shape'] == 'triangle')(x))

# Concepts are sampled as source strings, so making one executable requires a
# deterministic transformation of that string into a callable.
@keep_deterministic
def convert_to_executable(func):
    # `func` is the source text of a lambda expression. `eval` executes
    # arbitrary code, so only strings generated by the grammar should ever be
    # passed in.
    compiled = eval(func)
    # The returned callable is itself invoked later, so it must be marked as
    # deterministic too.
    return keep_deterministic(compiled)

@infer(method="MetropolisHastings", samples=2000, seed=1234, burn_in=2000)
def posterior(pcfg, data):
    # Posterior over concept strings given labelled examples.
    # `pcfg` is a zero-argument sampler returning a concept's source string;
    # `data` is an iterable of (object, label) pairs. Each observed label is
    # taken to agree with the concept's prediction with probability 0.95, so
    # a mismatch is down-weighted rather than ruled out.
    noise_free_prob = 0.95
    concept = pcfg()
    classify = convert_to_executable(concept)
    for obj, label in data:
        prediction_matches = classify(obj) == label
        condition(noise_free_prob if prediction_matches else 1 - noise_free_prob)
    return concept

# Labelled observations as (object, label) pairs. Each object is a frozendict
# with 'color', 'shape' and 'size' entries; the two yellow objects are
# labelled True and the blue and green ones False.
# NOTE(review): frozendict is presumably used so the objects are hashable and
# immutable inside inference -- confirm whether flippy requires this.
examples = (
    (frozendict({'color': 'yellow', 'shape': 'circle', 'size': 'small'}), True),
    (frozendict({'color': 'blue', 'shape': 'rectangle', 'size': 'medium'}), False),
    (frozendict({'color': 'yellow', 'shape': 'triangle', 'size': 'large'}), True),
    (frozendict({'color': 'green', 'shape': 'circle', 'size': 'small'}), False)
)
# Run the Metropolis-Hastings posterior over concepts for these examples.
dist = posterior(simple_boolean, examples)

# Show only the ten most probable concepts.
print_sorted_dist(dist, top=10)

Prob	Expression
0.5155	lambda x: (lambda obj: obj['color'] == 'yellow')(x)
0.1485	lambda x: (lambda obj: obj['size'] == 'large')(x)
0.1040	lambda x: ((lambda obj: obj['size'] == 'large')(x) or (lambda obj: obj['color'] == 'yellow')(x))
0.0590	lambda x: (lambda obj: obj['shape'] == 'triangle')(x)
0.0425	lambda x: ((lambda obj: obj['color'] == 'yellow')(x) or (lambda obj: obj['color'] == 'yellow')(x))
0.0260	lambda x: not (lambda obj: obj['color'] == 'blue')(x)
0.0245	lambda x: (lambda obj: obj['shape'] == 'circle')(x)
0.0225	lambda x: not (not (lambda obj: obj['color'] == 'yellow')(x) or not (lambda obj: obj['color'] == 'yellow')(x))
0.0100	lambda x: (lambda obj: obj['size'] == 'small')(x)
0.0080	lambda x: not (not (lambda obj: obj['color'] == 'yellow')(x) and not (lambda obj: obj['color'] == 'yellow')(x))

Probabilistic Language of Thought¶

Prerequisites¶

Learning Objectives¶

What is the Language of Thought?¶

The Prior over Concepts¶

Performing Inference¶

Summary¶