piantado/Fleet/_quantifier_2_my_hypothesis_8h_source.html

 #pragma once

 #include "DeterministicLOTHypothesis.h"
 #include "CachedCallHypothesis.h"

 /**
  * The hypothesis stored for a single word: a deterministic LOT hypothesis mapping an
  * Utterance to a TruthValue, combined with CachedCallHypothesis so that its outputs
  * are kept in `cache`.
  */
 class InnerHypothesis : public DeterministicLOTHypothesis<InnerHypothesis,Utterance,TruthValue,MyGrammar,&grammar>,
                         public CachedCallHypothesis<InnerHypothesis,Utterance,TruthValue>  {
 public:
     using Super = DeterministicLOTHypothesis<InnerHypothesis,Utterance,TruthValue,MyGrammar,&grammar>;
     using Super::Super; // bring in the base-class constructors
     using CCH = CachedCallHypothesis<InnerHypothesis,Utterance,TruthValue>;

     // Both base subobjects are initialized from the same source object. The rvalue
     // overload takes a const reference and hands it to the bases as a const lvalue.
     InnerHypothesis(const InnerHypothesis& other) : Super(other), CCH(other) {}
     InnerHypothesis(const InnerHypothesis&& other) : Super(other), CCH(other) {}

     /// Assign both base subobjects from `other`.
     InnerHypothesis& operator=(const InnerHypothesis& other) {
         Super::operator=(other);
         CCH::operator=(other);
         return *this;
     }

     /// Same as the overload above; `other` is const, so it is forwarded as a const lvalue.
     InnerHypothesis& operator=(const InnerHypothesis&& other) {
         Super::operator=(other);
         CCH::operator=(other);
         return *this;
     }

     /// Install a new program tree and discard the cached outputs.
     void set_value(Node& tree) {
         Super::set_value(tree);
         CCH::clear_cache();
     }

     /// Rvalue overload: install the tree, then discard the cached outputs.
     void set_value(Node&& tree) {
         Super::set_value(tree);
         CCH::clear_cache();
     }

     /// Stores and returns the prior: the base-class prior when the tree has fewer than
     /// MAX_NODES nodes, and -infinity otherwise.
     virtual double compute_prior() override {
         if(get_value().count() < MAX_NODES) {
             prior = Super::compute_prior();
         }
         else {
             prior = -infinity;
         }
         return prior;
     }

     /// Pick one proposal kernel with a cascade of coin flips and apply it to `value`.
     [[nodiscard]] virtual ProposalType propose() const override {

         ProposalType proposal;

         // the flips are drawn in this order; a later flip is drawn only if all earlier ones failed
         if(flip(0.85)) {
             proposal = Proposals::regenerate(&grammar, value);
         }
         else if(flip(0.5)) {
             proposal = Proposals::sample_function_leaving_args(&grammar, value);
         }
         else if(flip(0.5)) {
             proposal = Proposals::swap_args(&grammar, value);
         }
         else if(flip()) {
             proposal = Proposals::insert_tree(&grammar, value);
         }
         else {
             proposal = Proposals::delete_tree(&grammar, value);
         }

         return proposal;
     }

     /// Weight of this word computed from `cache`: 1 / (0.1 + fraction of cached values
     /// equal to TruthValue::True). An empty cache gives a weight of 1.0.
     double get_weight_fromcache() const {
         const auto total = cache.size();
         if(total == 0) {
             return 1.0; // nothing cached yet
         }

         int true_count = 0;
         for(const auto& tv : cache) {
             if(tv == TruthValue::True) {
                 ++true_count;
             }
         }

         const double true_fraction = double(true_count) / total;
         return 1.0 / (0.1 + true_fraction);
     }


     /// Hook used by cached_call to evaluate a single datum; TruthValue::Undefined is
     /// passed to call() as the error value.
     virtual TruthValue cached_call_wrapper(const Utterance& di) override {
         const TruthValue on_error = TruthValue::Undefined;
         return this->call(di, on_error);
     }


 };

 #include "Lexicon.h"

 // Empty placeholder type; MyHypothesis passes it for two of Lexicon's template parameters.
 struct ignore_t  {};
 /**
  * A lexicon that maps each word (a std::string key) to an InnerHypothesis.
  * The likelihood of an utterance depends on the truth values of every word on that
  * utterance, combined through per-word weights (see compute_likelihood).
  */
 class MyHypothesis : public Lexicon<MyHypothesis, std::string, InnerHypothesis, ignore_t,ignore_t, Utterance> {
     using Super = Lexicon<MyHypothesis, std::string, InnerHypothesis, ignore_t,ignore_t, Utterance>;
     using Super::Super; // inherit the constructors
 public:

     /// Discard the cached outputs of every factor.
     void clear_cache() {
         for(auto& [k,f] : factors) {
             f.clear_cache();
         }
     }


     /**
      * Compute, store and return the log likelihood of `data`.
      *
      * Every factor is first evaluated on all of `data` through cached_call; if any factor
      * reports an error the likelihood is -infinity. Each datum then contributes log(p),
      * with p given by the three-term mixture below.
      *
      * @param data      the utterances to score; data[i] is matched with cache entry i of each factor
      * @param breakout  not used by this implementation
      * @return the value stored in `likelihood`
      *
      * Note: weights.at(utterance.word) throws std::out_of_range if an utterance uses a
      * word that has no factor.
      */
     virtual double compute_likelihood(const data_t& data, double breakout=-infinity) override {

         // need to set this; probably not necessary?
         for(auto& [k,f] : factors)
             f.program.loader = this;

         // fill each factor's cache for this data, bailing out on the first error
         for(auto& [k,f] : factors) {
             f.cached_call(data);

             if(f.got_error)
                 return likelihood = -infinity;
         }

         // first compute the weights -- these depend on how often each word is true
         std::map<key_t,double> weights;
         double W = 0.0; // total weight
         for(auto& [k, f] : factors) {
             weights[k] = f.get_weight_fromcache();
             W += weights[k];
         }


         likelihood = 0.0;
         for(size_t i=0;i<data.size();i++) {
             const Utterance& utterance = data[i];

             // Check all the words that are true and select
             bool wtrue   = false; // was the uttered word true?
             bool wpresup = false; // was the uttered word presuppositionally valid?
             double Wpt = 0.0; // total weight of the words that are true (presupposition met and true)
             double Wp = 0.0;  // total weight of the words whose presupposition is met (not Undefined)

             // must loop over each word and see when it is true
             for(auto& [k,f] : factors) {
                 // we just read the right factor's cached value for this utterance -- note that
                 // the "word" in the utterance is ignored within the function call
                 auto tv = f.cache.at(i);

                 if(tv != TruthValue::Undefined) {
                     const double wk = weights.at(k); // every key of factors was inserted above
                     Wp += wk; // presup met
                     if(tv == TruthValue::True) {
                         Wpt += wk;
                     }
                 }

                 if(utterance.word == k) {
                     wtrue   = (tv == TruthValue::True);
                     wpresup = (tv != TruthValue::Undefined);
                 }
             }


             // compute p -- equation (13) in the paper
             double w = weights.at(utterance.word);
             double p = (wtrue and wpresup ? alpha_p*alpha_t*w/Wpt : 0)  +
                        (wpresup ? alpha_p*(1-alpha_t)*w/Wp : 0)  +
                        (1.0-alpha_p)*w/W;
             likelihood += log(p);
         }

         return likelihood;
     }

     /**
      * Build a multi-line description: `prefix`, followed by one line per word containing
      * the word, its cache-based weight, the target's weight for that word, the fraction of
      * the first PRDATA entries of `prdata` on which it agrees with `target`, whether it was
      * conservative on all of them, and its quoted program string.
      *
      * The final newline is removed. With no factors the result is just `prefix`.
      */
     virtual std::string string(std::string prefix="") const override {
         extern MyHypothesis target;

         std::string out = prefix;
         for(auto& [k,f] : factors) {

             // TODO: get precision and recall relative to the target for presup and for
             bool conservative = true;
             int agr = 0;
             for(size_t i=0;i<PRDATA;i++) {
                 auto& di = prdata[i];

                 auto o = const_cast<InnerHypothesis*>(&f)->call(di); // we have to const_cast here since call is not const,
                 auto to = target.at(k).call(di);
                 agr += (to == o);

                 // we compute whether we give the same answer on <A,intersection(A,B)> as <A,B>
                 auto conservative_di = di; // copy the datum
                 conservative_di.color = DSL::intersection(conservative_di.shape, conservative_di.color);
                 auto co = const_cast<InnerHypothesis*>(&f)->call(conservative_di);
                 if(co != o) {
                     conservative = false;
                 }
             }

             out += str("\t", k,
                              f.get_weight_fromcache(),
                              target.at(k).get_weight_fromcache(),
                              double(agr)/PRDATA,
                              conservative,
                              QQ(f.string())) + "\n";
         }

         // Remove the last newline, but only if there is one: with no factors `out` is just
         // the prefix (possibly empty) and must be left untouched.
         if(!out.empty() && out.back() == '\n') {
             out.pop_back();
         }

         return out;
     }

     /// Print a summary line (posterior, prior, likelihood, and the likelihoods of three
     /// reference hypotheses) followed by string().
     virtual void show(std::string prefix="") override {
         extern MyHypothesis target;
         extern MyHypothesis bunny_spread;
         extern MyHypothesis classical_spread;

         print(":", prefix, this->posterior, this->prior, this->likelihood, target.likelihood, bunny_spread.likelihood, classical_spread.likelihood);
         print(this->string());
     }
 };
LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::get_value
Node & get_value()
Definition: LOTHypothesis.h:161

Lexicon.h
A lexicon stores an association of numbers (in a vector) to some other kind of hypotheses (typically ...

grammar
MyGrammar grammar

Proposals::sample_function_leaving_args
std::optional< std::pair< Node, double > > sample_function_leaving_args(GrammarType *grammar, const Node &from)
This samples functions f(a,b) -> g(a,b) (e.g. without destroying what's below). This uses a little tr...
Definition: Proposers.h:331

QQ
std::string QQ(const std::string &x)
Definition: Strings.h:190

Bayesable< Args... >::likelihood
double likelihood
Definition: Bayesable.h:43

TruthValue::True

InnerHypothesis::set_value
void set_value(Node &v)
Definition: MyHypothesis.h:27

Node
Definition: Node.h:22

DeterministicLOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar,&grammar >::Super
LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t > Super
Definition: DeterministicLOTHypothesis.h:17

InnerHypothesis::compute_prior
virtual double compute_prior() override
Compute the prior – defaultly just the PCFG (grammar) prior.
Definition: MyHypothesis.h:36

LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::set_value
void set_value(Node &v, bool should_compile=true)
Set the value to v. (NOTE: This compiles into a program)
Definition: LOTHypothesis.h:168

TruthValue
TruthValue
Definition: Main.cpp:32

MyHypothesis::compute_likelihood
virtual double compute_likelihood(const data_t &data, double breakout=-infinity) override
Compute the likelihood of a collection of data, by calling compute_single_likelihood on each...
Definition: MyHypothesis.h:94

LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::value
Node value
Definition: LOTHypothesis.h:72

InnerHypothesis::Super
DeterministicLOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar,&grammar > Super
Definition: InnerHypothesis.h:14

bunny_spread
MyHypothesis bunny_spread
Definition: Main.cpp:56

InnerHypothesis
Definition: InnerHypothesis.h:9

Bayesable< Args... >::prior
double prior
Definition: Bayesable.h:42

DeterministicLOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar,&grammar >::call
virtual output_t call(const input_t x, const output_t &err=output_t{})
A variant of call that assumes no stochasticity and therefore outputs only a single value...
Definition: DeterministicLOTHypothesis.h:32

PRDATA
const int PRDATA
Definition: Main.cpp:27

InnerHypothesis::operator=
InnerHypothesis & operator=(const InnerHypothesis &c)
Definition: MyHypothesis.h:16

flip
bool flip(float p=0.5)
Definition: Random.h:25

MyHypothesis::clear_cache
void clear_cache()
Definition: MyHypothesis.h:87

str
std::string str(BindingTree *t)
Definition: BindingTree.h:195

Bayesable< Args... >::posterior
double posterior
Definition: Bayesable.h:44

InnerHypothesis::propose
virtual ProposalType propose() const override
Default proposal is rational-rules style regeneration.
Definition: MyHypothesis.h:40

CachedCallHypothesis
Definition: CachedCallHypothesis.h:14

MyHypothesis
we don't need inputs/outputs for our MyHypothesis
Definition: MyHypothesis.h:6

MyHypothesis::show
virtual void show(std::string prefix="") override
Definition: MyHypothesis.h:197

DeterministicLOTHypothesis.h

DSL::intersection
const auto intersection
Definition: DSL.h:32

print
void print(FIRST f, ARGS... args)
Lock output_lock and print to std::cout.
Definition: IO.h:53

Proposals::delete_tree
std::optional< std::pair< Node, double > > delete_tree(GrammarType *grammar, const Node &from)
Definition: Proposers.h:275

InnerHypothesis::set_value
void set_value(Node &&v)
Definition: MyHypothesis.h:31

CachedCallHypothesis::clear_cache
void clear_cache()
Definition: CachedCallHypothesis.h:23

infinity
constexpr double infinity
Definition: Numerics.h:20

Utterance
Definition: Main.cpp:40

DeterministicLOTHypothesis
Definition: DeterministicLOTHypothesis.h:14

classical_spread
MyHypothesis classical_spread
Definition: Main.cpp:57

prdata
MyHypothesis::data_t prdata
Definition: Main.cpp:42

InnerHypothesis::cached_call_wrapper
virtual TruthValue cached_call_wrapper(const Utterance &di) override
This is how we access the data before calling – needed to say how this interfaces with the data...
Definition: MyHypothesis.h:70

InnerHypothesis::operator=
InnerHypothesis & operator=(const InnerHypothesis &&c)
Definition: MyHypothesis.h:21

ignore_t
Definition: MyHypothesis.h:80

Proposals::regenerate
std::optional< std::pair< Node, double > > regenerate(GrammarType *grammar, const Node &from)
A little helper function that resamples everything below when we can. If we can't, then we'll recurse.
Definition: Proposers.h:107

target
MyHypothesis target
Definition: Main.cpp:55

Lexicon
Definition: Lexicon.h:27

InnerHypothesis::get_weight_fromcache
double get_weight_fromcache() const
This computes the weight of this factor from its cached values.
Definition: MyHypothesis.h:57

MyHypothesis::string
virtual std::string string(std::string prefix="") const override
Definition: MyHypothesis.h:159

LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::ProposalType
std::optional< std::pair< InnerHypothesis, double > > ProposalType
Definition: LOTHypothesis.h:55

InnerHypothesis::InnerHypothesis
InnerHypothesis(const InnerHypothesis &&c)
Definition: MyHypothesis.h:14

CachedCallHypothesis.h
This is a hypothesis that allows you to cache an entire call on data. NOTE: This only catches std::ex...

LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::operator=
LOTHypothesis & operator=(const LOTHypothesis &c)
Definition: LOTHypothesis.h:100

InnerHypothesis::InnerHypothesis
InnerHypothesis(const InnerHypothesis &c)
Definition: MyHypothesis.h:13

Proposals::insert_tree
std::optional< std::pair< Node, double > > insert_tree(GrammarType *grammar, const Node &from)
Definition: Proposers.h:192

LOTHypothesis< InnerHypothesis, BindingTree *, bool, MyGrammar, grammar, defaultdatum_t< BindingTree *, bool >, std::vector< defaultdatum_t< BindingTree *, bool > >, typename MyGrammar ::VirtualMachineState_t >::compute_prior
virtual double compute_prior() override
Compute the prior – defaultly just the PCFG (grammar) prior.
Definition: LOTHypothesis.h:185

InnerHypothesis::MAX_NODES
const double MAX_NODES
Definition: InnerHypothesis.h:20

Utterance::word
std::string word
Definition: Main.cpp:44

Bayesable< Args... >::data_t
std::vector< Args... > data_t
Definition: Bayesable.h:39

TruthValue::Undefined

Proposals::swap_args
std::optional< std::pair< Node, double > > swap_args(GrammarType *grammar, const Node &from)
This proposal swaps around arguments of the same type.
Definition: Proposers.h:389

BaseNode::count
virtual size_t count() const
How many nodes total are below me?
Definition: BaseNode.h:358

Lexicon::at
INNER & at(const key_t &k)
Definition: Lexicon.h:60

cache
Definition: LRUCache.h:19