The code is adapted from the Pyro example to fit the educational structure of the Problang chapter. I attempted to stay as close to the webbook as possible, but some minor alterations have been made. ~ Marv
# first some imports
import torch
torch.set_default_dtype(torch.float64) # double precision for numerical stability
import collections
from collections import namedtuple
import argparse
import matplotlib.pyplot as plt
import pyro
import pyro.distributions as dist
import pyro.poutine as poutine
from pyro_rsa_book_utils.search_inference import Marginal, marginalize
from pyro_rsa_book_utils import visualize
In this chapter, we will see how politeness can be formalized within the RSA framework by adding a social component to the speaker's utility function.
When using language, speakers aim to get listeners to believe the things that they believe. But sometimes, we don’t want listeners to know exactly how we feel. Imagine your date bakes you a batch of flax seed, sugar-free, gluten-free cookies before your big presentation next week. (What a sweetheart.) You are grateful for them — something to take your mind off impending doom. But then you bite into them, and you wonder if they actually qualify as cookies and not just fragments of seed glued together. Your date asks you what you think. You look up and say “They’re good.”
Politeness violates a critical principle of cooperative communication: exchanging information efficiently and accurately. If information transfer were the only currency in communication, a cooperative speaker would find polite utterances undesirable because they are potentially misleading. But polite language use is critical to making sure your date doesn’t charge out of the room before you can qualify what you meant by the more truthful and informative “These cookies are terrible.”
Brown and Levinson (1987) recast the notion of a cooperative speaker as one who has both an epistemic goal to correctly update the listener’s knowledge state and a social goal to minimize any potential damage to the hearer’s (and the speaker’s own) self-image, which they called face. Yoon, Tessler, et al. (2016) formalize a version of this idea in the RSA framework by introducing a new component to the speaker’s utility function: social utility.
The usual speaker utility from RSA is a surprisal-based, epistemic utility:
$$U^{S_1}_{epistemic}(u;s)=\log P_{L_0}(s|u)$$

Social utility can be defined as the expected subjective utility of the state the listener would infer given the utterance $u$:
$$U^{S_1}_{social}(u;s) = \mathbb{E}_{P_{L_0}(s'|u)}[V(s')] =\sum_{s'}V(s')P_{L_0}(s'|u),$$where $V$ is a value function that maps states to subjective utility values - this captures the affective consequences for the listener of being in state $s$.
Speaker utility is then a mixture of these components:
$$U^{S_1}(u;s;\varphi)=\varphi\cdot U_{epistemic}(u;s)+(1-\varphi)\cdot U_{social}(u;s),$$where $\varphi\in [0,1]$ is a model parameter determined by experiment (see below).
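To make the trade-off concrete, here is a small worked example with made-up numbers: suppose that for some utterance $u$ and true state $s$ the literal listener yields $\log P_{L_0}(s|u) = -1.6$ and an expected subjective value of $\mathbb{E}_{P_{L_0}(s'|u)}[V(s')] = 4.0$. With $\varphi = 0.8$, the speaker's utility for $u$ is

$$U^{S_1}(u;s;0.8) = 0.8\cdot(-1.6) + 0.2\cdot 4.0 = -0.48,$$

whereas a purely kind speaker ($\varphi = 0$) would assign the same utterance a utility of $4.0$, ignoring its informativity entirely.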
Note that at this point, we do not differentiate subjective state value to the listener from subjective state value to the speaker, though in many situations these could in principle be different. Also at this point, we do not allow for deception or meanness, which would be the exact opposites of the epistemic and social utilities, respectively - though this could very naturally be incorporated: Yoon et al. (2016) model meanness by having independent weights on the two utilities.
In Pyro, this could look like the following:
# these could be given like in the introduction
state = ... # s
l0_dist = ... # p(s|u)
value_function = ... # V()
# expected value of func(x) under distr: sum over the support of P(x) * func(x)
expectation = lambda distr, func: \
    torch.sum(torch.stack([distr.log_prob(x).exp() * func(x) for x in distr.enumerate_support()]))
Utility = namedtuple("Utility", ("epistemic","social"))
# util = Utility(
# l0_dist.log_prob(state),
# expectation(literal_listener_dist, value_function)
# )
phi = 0.8
# speaker_utility = phi * util.epistemic + (1-phi) * util.social
`expectation` computes the expected value (or mean) of the distribution supplied to it as the first argument. The second argument is a projection function, for when you want the expectation computed with respect to some transformation of the distribution's support:

$$\mathbb{E}_{P}[f(X)]=\sum_{i=1}^{n}f(x_i)\,P(x_i)$$

for finite support $x_1,\ldots,x_n$. Think of it as a weighted average.

Here, `value_function` should project the listener's distribution from world states onto subjective valuations of those world states (e.g., the subjective value of a listener believing the cookies they baked were rated 4.5 out of a possible 5 stars).
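As a quick illustration with made-up numbers: if the listener's distribution over the heart-states $1,\ldots,5$ (introduced below) were $(0.1, 0.2, 0.4, 0.2, 0.1)$ and the value function were simply $V(s) = s$, the expected subjective value would be

$$\sum_{s'} V(s')\,P(s'|u) = 0.1\cdot 1 + 0.2\cdot 2 + 0.4\cdot 3 + 0.2\cdot 4 + 0.1\cdot 5 = 3.0.$$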
We consider a simplified case study of the example given at the beginning, shown in Figure 1 below. The listener has completed some task or produced some product (e.g., baked a cake) and solicits the speaker's feedback. Performance on the task maps to a scale ranging from 1 to 5 hearts (shown below; cf. online product reviews). These are the states of the world that the speaker can be informative with respect to. Below, the speaker thinks the cake deserves 3 out of 5 hearts.
Fig. 1: Politeness case study
At the same time, these states of the world also have some inherent subjective value: 5 hearts is better than 3 hearts. $\varphi$ governs how much the speaker seeks to communicate information about the state vs. make the listener believe she is in a highly valued state.
We start once again with a literal listener whose task is to interpret value judgments (e.g. "terrible", "okay", "amazing") according to their literal semantics. The literal listener model assumed here is the exact same as in the vanilla RSA model of Chapter 1:
$$P_{L_0}(s|u)\propto[[u]](s)\cdot P(s)$$

# speaker's possible secret true judgements
states = [1, 2, 3, 4, 5]
# uniform distribution over speaker states
def state_prior():
prior_dist = dist.Categorical(probs=torch.ones(len(states))/len(states))
idx = pyro.sample("state", prior_dist)
return states[idx]
# what we let the speaker choose from
utterances = [
"terrible",
"bad",
"okay",
"good",
"amazing"
]
# correspondence of utterances to states
# (empirically measured)
literal_semantics = {
"terrible":[.95,.85,.02,.02,.02],
"bad":[.85,.95,.02,.02,.02],
"okay":[0.02,0.25,0.95,.65,.35],
"good":[.02,.05,.55,.95,.93],
"amazing":[.02,.02,.02,.65,0.95]
}
# helper function
# to determine whether the utterance describes the state
# by flipping a coin with
# the literal_semantics[utterance][state] weight
def meaning(utterance, state):
# meaning(u, s) := [[u]](s) in the notation above
weight = literal_semantics[utterance][state-1]
bernoulli = dist.Bernoulli(probs=weight)
m = pyro.sample("meaning", bernoulli)
return m
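To get a feel for this soft semantics, we can sample the meaning function a few times. The snippet below is just an illustrative check (the exact counts will vary from run to run):

# how often does "amazing" describe a 2-heart state vs. a 5-heart state?
print(int(sum(meaning("amazing", 2) for _ in range(1000))))  # roughly 20 out of 1000
print(int(sum(meaning("amazing", 5) for _ in range(1000))))  # roughly 950 out of 1000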
# literal listener
@Marginal
def literal_listener(utterance):
state = state_prior()
# values below are log probs
pyro.factor("literal_meaning", 0. if meaning(utterance, state) else -999999.)
return state
utterance = "okay"
l0_dist = literal_listener(utterance)
visualize(l0_dist)
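We can also query the resulting marginal numerically. The snippet below is only an illustrative check; it relies on the `log_prob` and `enumerate_support` behavior of the marginal distributions from the book utilities, just as the speaker model further below does:

# probability the literal listener assigns to each state after hearing "okay"
for s in states:
    print(s, l0_dist.log_prob(s).exp().item())
# expected state under the literal listener (a weighted average, as described above)
print(expectation(l0_dist, lambda s: float(s)))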
Exercises:
1. Why does a given list in `literal_semantics` not sum to one? Can a given list be interpreted as either of $P(s|\cdot)$, $P(\cdot|u)$, $P(\cdot|s)$ or $P(u|\cdot)$? Which one? Is this a probability distribution?
2. Explore the output of `literal_listener` for the various utterances.

Next, we add in the speaker, who reasons about the literal listener with respect to an epistemic and a social goal. The speaker model assumed here is exactly like in the vanilla RSA model of Chapter 1, except that we use the utility function introduced above:
$$P_{S_1}(u|s;\varphi)\propto\exp(\alpha\cdot U^{S_1}(u;s;\varphi))$$

# value function scales social utility by a parameter lambda
lambda_ = 1.25 # MAP estimate from Yoon, Tessler, et al. (2016)
value_function = lambda state: lambda_ * state
# alpha = 10 # MAP estimate from Yoon, Tessler, et al. (2016)
alpha = 1
def utterance_prior():
prior_dist = dist.Categorical( probs = torch.ones(len(utterances)) / len(utterances) )
idx = pyro.sample("utterance", prior_dist)
return utterances[idx]
@Marginal
def speaker1(state, phi=1):
utterance = utterance_prior()
l0_posterior = literal_listener(utterance)
Util = Utility(
l0_posterior.log_prob(state),
expectation(l0_posterior, value_function)
)
s1_utility = phi * Util.epistemic + (1-phi) * Util.social
pyro.factor("s1_util", alpha * s1_utility)
return utterance
s1_dist = speaker1(1, 0.8)
visualize(s1_dist)
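Before moving on, it can be instructive to compare the two extremes of the mixture. The calls below are just an illustrative comparison for the same true state of 1 heart:

# a mostly-honest speaker (phi close to 1) vs. a mostly-kind speaker (phi close to 0)
visualize(speaker1(1, 0.99))
visualize(speaker1(1, 0.05))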
Exercises:
1. Describe the kind of speaker assumed by the model above (e.g., `speaker1(1, 0.8)`).
2. Change the value of `lambda_` and examine the results.
3. Change the value of `alpha` and interpret the parameter.

If different speakers can have different weights on the mixture parameter `phi`, which governs the trade-off between kindness and informativity, listeners may have uncertainty about what kind of speaker they are interacting with (another motivation is to interpret the kindness vs. informativity behind a single utterance, for a known speaker). This can be captured by endowing the `pragmatic_listener` from Chapter 1 with a prior distribution over `phi`, corresponding to uncertainty about the parameter of the speaker's utility function. The resulting pragmatic listener is a joint-inference model that infers the world state and the `phi` parameter at the same time:
def phi_prior():
# possible phis:
phis = torch.arange(start=0.00, end=1.0, step=0.05)
uniform = dist.Categorical(torch.ones(len(phis)) / len(phis))
idx = pyro.sample("phi", uniform)
return phis[idx]
@Marginal
def pragmatic_listener(utterance):
# your code here
return state, phi
l1_dist = pragmatic_listener("good")
visualize(l1_dist, x_name="state", y_name="phi")
Above, we have a listener who hears that they did "good" and infers how well they actually did, as well as how much the speaker values honesty vs. kindness.
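For reference, here is one way the body of the pragmatic listener above could be filled in. This is only a sketch: it assumes that the speaker marginal supports `log_prob` on utterance strings in the same way the literal listener marginal supports it on states, and the name `pragmatic_listener_sketch` is ours, chosen so as not to replace the exercise stub above:

@Marginal
def pragmatic_listener_sketch(utterance):
    # jointly sample a candidate state and a candidate politeness weight
    state = state_prior()
    phi = phi_prior().item()  # plain Python float, so the returned pair stays easy to tabulate
    # weight the (state, phi) pair by how likely the speaker would have been
    # to produce the observed utterance in that situation
    s1_posterior = speaker1(state, phi)
    pyro.factor("l1_factor", s1_posterior.log_prob(utterance))
    return state, phi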
Exercises:
1. Examine the marginal posterior over `state`. Does this make sense? Compare it to what the `literal_listener` would believe upon hearing the same utterance.
2. Examine the marginal posterior over `phi`. Does this make sense? What different utterance would make the `pragmatic_listener` infer something different about `phi`? Test your prediction by running that utterance through the `pragmatic_listener`.
3. Modify the `pragmatic_listener` so that they know what state of the world they are in. Come up with your own interesting situations (i.e., choose a state and an utterance) and show the model predictions. Are the predictions in accord with your intuitions? Why or why not?
4. Modify the `pragmatic_listener` so that they know the speaker either: …

Above, we modeled the case study of white lies, utterances which convey misleading information for purposes of politeness. There are other ways to be polite, however. Speakers may deliberately be indirect for considerations of politeness. Consider a listener who just gave an objectively terrible presentation. They look fragile as they come to you for your feedback. You tell them "It wasn't bad."
Why would somebody produce such an indirect speech act? If the speaker wanted to actually be nice, they would say "It was fine." or "It was great." If the speaker wanted to actually convey information, they would say "It was terrible."
Yoon et al. (2017) and Yoon, Tessler et al. (2018) hypothesize that speakers produce indirect speech acts in order to appear to care both about conveying information and saving the listener's face.
Can we elaborate the model above to account for politeness by being indirect?
First, we define the speaker's utilities, now with respect to the pragmatic listener $L_1$:
\begin{align} U^{S_2}_{epistemic}(u;s) &= \log P_{L_1}(s|u) \\ U^{S_2}_{social}(u) &= \mathbb{E}_{P_{L_1}(s^\prime|u)}[V(s^\prime)]=\sum_{s^\prime}V(s^\prime)\cdot P_{L_1}(s^\prime|u) \\ P_{L_1}(s|u) &= \int_\varphi P_{L_1}(s,\varphi|u) d\varphi \end{align}

Here, $V$ is again the value function from before that maps states to subjective utility values. With our higher-order speaker, however, we have a new utility component: a self-presentational utility, defined with respect to the pragmatic listener's inferences about the politeness mixture component $\varphi$:
$$U^{S_2}_{presentational}(u;\varphi)=\log P_{L_1}(\varphi|u)=\log \int_sP_{L_1}(s,\varphi|u)ds$$

Speaker utility is then a mixture of these three components, weighted by the mixture component vector $\omega$:

$$U^{S_2}(u;s;\varphi;\omega)=\omega_{epistemic}\cdot U^{S_2}_{epistemic}(u;s)+\omega_{social}\cdot U^{S_2}_{social}(u)+\omega_{presentational}\cdot U^{S_2}_{presentational}(u;\varphi)$$

and the new speaker model is again simply a softmax utility speaker:
$$P_{S_2}(u|s,\varphi)\propto\exp(\alpha\cdot U^{S_2}(u;s;\varphi;\omega))$$

The code below defines such a speaker:
alpha2 = 1
@Marginal
def speaker2(state, phi, omega):
# your code here
# ---- marginal posterior distributions ----
# speaker's simulation of l1's marginal state posterior
# ("what state would l1 probably infer from this utterance?")
l1_state = marginalize(l1_dist, 0)
# speaker's simulation of l1's marginal goal posterior
# ("what goal would l1 probably infer from this utterance?")
l1_goal = marginalize(l1_dist, 1)
# your code here
return utterance
Omega = namedtuple("Omega", ("epistemic", "social", "presentational"))
s2_dist = speaker2(1, 0.0, Omega(0.8, 0.1, 0.1))
visualize(s2_dist)
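For reference (and to check your own attempt at the exercise below), here is one possible completion, sketched under some assumptions: it presumes that `pragmatic_listener` has been filled in along the lines of the earlier sketch, and that the `phi` argument matches one of the values in `phi_prior`'s support so that `log_prob` can score it:

# a reference sketch, not the only possible solution
@Marginal
def speaker2_sketch(state, phi, omega):
    utterance = utterance_prior()
    # the speaker simulates the pragmatic listener's joint posterior over (state, phi)
    l1_joint = pragmatic_listener(utterance)
    # marginal over states: P_L1(s | u)
    l1_state = marginalize(l1_joint, 0)
    # marginal over politeness weights: P_L1(phi | u)
    l1_goal = marginalize(l1_joint, 1)
    # three-component utility, as in the equations above
    s2_utility = (omega.epistemic * l1_state.log_prob(state)
                  + omega.social * expectation(l1_state, value_function)
                  + omega.presentational * l1_goal.log_prob(phi))
    pyro.factor("s2_util", alpha2 * s2_utility)
    return utterance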
Exercise: Complete the definition of `speaker2` based on the description given above.

Pragmatics concerns how assumptions about cooperation, context and shared knowledge can be used in conversation to enrich utterances beyond their literal semantics, and how this ultimately leads to more efficient communication.
The most well-known set of assumptions is the Gricean Maxims (Grice, 1975):
- Maxim of Quality: be truthful; do not say what you believe to be false or lack evidence for.
- Maxim of Quantity: make your contribution as informative as required, but not more informative than required.
- Maxim of Relation: be relevant.
- Maxim of Manner: be perspicuous; avoid obscurity and ambiguity, be brief and orderly.
Grice argued that: