Fleet  0.0.9
Inference in the LOT
BaseGrammarHypothesis.h
#pragma once

// Tune up eigen wrt thread safety
#include <assert.h>
#include <utility>
#include <regex>
#include <signal.h>
#include <unordered_map>

#include "EigenLib.h"
#include "Errors.h"
#include "Numerics.h"
#include "DiscreteDistribution.h"

#include "Vector2D.h"
#include "HumanDatum.h"
#include "Control.h"
#include "TopN.h"
#include "MCMCChain.h"

//extern volatile sig_atomic_t CTRL_C;

#include "VectorNormalHypothesis.h"
#include "TNormalVariable.h"
#include "Batch.h"
#include "LOTHypothesis.h"
#include "Grammar.h"
template<typename this_t,
         typename _HYP,
         typename datum_t=HumanDatum<_HYP>,
         typename data_t=std::vector<datum_t>,
         typename _Predict_t=Vector2D<DiscreteDistribution<typename _HYP::output_t>> > // The type of Predict_t depends on the subtype (deterministic or not; thunk or not)
class BaseGrammarHypothesis : public MCMCable<this_t, datum_t, data_t>,
                              public Serializable<this_t> {
public:
    using HYP = _HYP;

    // The type for predictions varies between subclasses -- it might be a Vector2D of DiscreteDistribution
    // (for FullGrammarHypothesis), a Vector2D of single outputs (for deterministic hypotheses), or a Vector2D
    // with only one value in the second dimension when the hypothesis is a thunk. These variants are the whole
    // reason we have subclasses, although there is a lot of repeated code, so this might change in the future.
    // NOTE: These do NOT mix in alpha -- that happens in compute_likelihood.
    using Predict_t = _Predict_t;
    // maps a data pointer to, for each hypothesis, a vector of log-likelihoods, one per item of that data
    using LL_t = std::unordered_map<typename datum_t::data_t*, std::vector<Vector>>;

    typename HYP::Grammar_t* grammar;

    // Here is a list of built-in parameters that we can use. Each stores a standard
    // normal and a value under the specified transformation, which is chosen here to give
    // a reasonably shaped prior.
public:
    // if this is true, then we don't propose to any of logA, and we treat logA just as a bunch of zeros
    bool flat_prior;

    // where we store the logA values
    VectorHalfNormalHypothesis logA;
protected:
    // These are protected because when they are set, we sometimes have to recompute cached quantities.
    // Parameters for inference:
    UniformVariable alpha;     // uniform in [0,1]
    ExponentialVariable decay; // exponential decay parameter
//  TNormalVariable< +[](float x)->float { return expf((x-0.33)/1.50); }> llt;
//  TNormalVariable< +[](float x)->float { return expf(x/5.0); }> pt; // NOTE: pt is not currently in use!
public:

    // All of these are shared_ptr so that we can copy hypotheses quickly
    // without recomputing them. NOTE that this assumes that the data does not change
    // between hypotheses of this class.

    std::shared_ptr<Matrix> C;  // counts of each grammar rule in each hypothesis
    std::shared_ptr<LL_t> LL;   // likelihoods of each hypothesis on each data set

    std::shared_ptr<Predict_t> P;

    // These variables store some parameters and get recomputed
    // in proposals when necessary
    std::shared_ptr<Matrix> decayedLikelihood;

    // stored so we can remember what we computed for
    const data_t* which_data;
    std::vector<HYP>* which_hypotheses;


    BaseGrammarHypothesis() : flat_prior(false) {
        decay.set_untransformed(0.1);
        alpha.set_untransformed(1.0);
    }

    BaseGrammarHypothesis(std::vector<HYP>& hypotheses, const data_t* human_data) : flat_prior(false) {
        // This has to take human_data as a pointer because of how MCMCable::make works -- it can't forward a reference.
        // The rest of this class prefers references, so we convert here.
        decay.set_untransformed(0.1);
        alpha.set_untransformed(1.0);
        this->set_hypotheses_and_data(hypotheses, *human_data);
    }

    // These parameters must be set through the setters below, so that cached quantities stay in sync.
    void set_decay(const ExponentialVariable& ev) {
        if(ev != decay) {
            decay = ev;
            this->recompute_decayedLikelihood(*which_data);
        }
    }

    void set_decay_untransformed(double v) {
        if(v != decay.get_untransformed()) {
            decay.set_untransformed(v);
            this->recompute_decayedLikelihood(*which_data);
        }
    }

    void set_alpha(const UniformVariable& a) {
        if(a != alpha) {
            alpha = a;
            this->recompute_LL(*which_hypotheses, *which_data);
        }
    }

    void set_alpha_untransformed(double v) {
        if(v != alpha.get_untransformed()) {
            alpha.set_untransformed(v);
            this->recompute_LL(*which_hypotheses, *which_data);
        }
    }

    void copy_parameters(const BaseGrammarHypothesis& h) {
        // sometimes we want the parameters of h, but on some new (e.g. held-out) data
        this->logA = h.logA;
//      this->llt = h.llt;
//      this->pt = h.pt;
        this->set_alpha(h.alpha);
        this->set_decay(h.decay); // NOTE: this calls recompute_decayedLikelihood on my OWN data
    }

    // We write these as functions so that subclasses can override them (and drop llt if we want).
//  float get_llt() const { return llt.get(); }
    float get_alpha() const { return alpha.get(); }
    float get_decay() const { return decay.get(); }

    size_t ndata() const { return which_data->size(); }

    // We override this because the MCMCable version wants to check get_value, which is not defined here.
    [[nodiscard]] static this_t sample(std::vector<HYP>& hypotheses, const data_t* human_data) {
        // NOTE: Cannot use templates because then it doesn't pass the hypotheses reference the right way
        auto h = this_t(hypotheses, human_data);
        return h.restart();
    }
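
    // An illustrative sketch (not part of this class) of how sample() is typically used. It assumes
    // a concrete subclass MyGrammarHypothesis and pre-enumerated hypotheses/human_data (all three
    // names are hypothetical here), and assumes the Bayesable base provides compute_posterior as
    // elsewhere in Fleet:
    //
    //   auto h0 = MyGrammarHypothesis::sample(hypotheses, &human_data);
    //   h0.compute_posterior(human_data); // prior over logA/alpha/decay plus fit to human responses
    //
    // From there, h0 can seed an MCMCChain over the grammar parameters.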

    // This is the primary function for setting hypotheses and data on construction.
    virtual void set_hypotheses_and_data(std::vector<HYP>& hypotheses, const data_t& human_data) {

        // set these first because they're required below
        which_data = std::addressof(human_data);
        which_hypotheses = std::addressof(hypotheses);

        // read the grammar from the first hypothesis, and check that it's the same for all of them
        grammar = hypotheses.at(0).get_grammar();
        for(auto& h: hypotheses) {
            assert(h.get_grammar() == grammar && "*** It's bad news for GrammarHypothesis if your hypotheses don't all have the same grammar.");
        }

        if(logA.size() != grammar->count_rules()) {
            if(logA.size() > 0) print("*** Warning: resizing and zeroing logA");
            logA.set_size(grammar->count_rules());
        }

        // when we are initialized this way, we compute C, LL, P, and the decayed likelihood
        COUT "# Computing prior counts" ENDL;
        this->recompute_C(hypotheses);
        COUT "# Computing model predictions" ENDL;
        this->recompute_P(hypotheses, human_data); // note this comes before LL because LL might use P
        COUT "# Computing incremental likelihoods" ENDL;
        this->recompute_LL(hypotheses, human_data);
        COUT "# Computing decayedLikelihood" ENDL;
        this->recompute_decayedLikelihood(human_data);
        COUT "# Done." ENDL;
    }

    // Set whether we can propose to the i'th value of logA -- the mechanics are handled by the logA vector hypothesis.
    virtual void set_can_propose(size_t i, bool b) {
        logA.set_can_propose(i,b);

        if(not b and logA(i) != 0.0) { CERR "# Warning: set_can_propose is freezing logA(" << str(i) << ") at a nonzero value (this is untransformed space)" ENDL; }
    }


    void set_flat_prior(bool fp) {
        flat_prior = fp;
        if(flat_prior) {
            for(size_t i=0;i<logA.size();i++) {
                logA.set(i,0.0);
            }
        }
    }

    // A convenient function that uses C to say how many hypotheses we have.
    virtual size_t nhypotheses() const { return C->rows(); }

    // Computes our matrix C[h,r] of hypotheses (rows) by counts of each grammar rule (columns).
    // (Requires that every hypothesis use the same grammar.)
    virtual void recompute_C(const std::vector<HYP>& hypotheses) {

        assert(hypotheses.size() > 0);

        size_t nRules = hypotheses[0].get_grammar()->count_rules();

        C.reset(new Matrix(hypotheses.size(), nRules));

        const auto indexer = grammar->get_rule_indexer(); // maps rules to column indices
        const auto R = grammar->count_rules();

        #pragma omp parallel for
        for(size_t i=0;i<hypotheses.size();i++) {
            assert(hypotheses[i].get_grammar() == grammar); // this only works if they share the same grammar, since they share an indexer

            // hypotheses here are factors so we have to sum them
            Vector cv = Vector::Zero(R);

            auto c = grammar->get_counts(hypotheses[i].get_value(), indexer); // extract counts using the indexer
            for(size_t r=0;r<R;r++) // update cv
                cv[r] += c[r];

            #pragma omp critical
            C->row(i) = std::move(cv);
        }

        assert( (size_t)C->rows() == hypotheses.size());
    }

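    // A worked illustration (hypothetical numbers): if the grammar has R=3 rules
    // {and, or, not} and hypothesis h's tree uses "and" twice and "not" once, then
    // C.row(h) = [2, 0, 1]. These per-rule counts are all that hypothesis_prior()
    // below needs in order to score h.
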
    // Recompute LL: for each unique data pointer and each hypothesis, a vector of incremental
    // (per-item) log-likelihoods, computed at the current alpha.
    virtual void recompute_LL(std::vector<HYP>& hypotheses, const data_t& human_data) {
        assert(which_data == std::addressof(human_data));

        // For each HumanDatum::data, figure out the max amount of data it contains
        std::unordered_map<typename datum_t::data_t*, size_t> max_sizes;
        for(auto& d : human_data) {
            if( (not max_sizes.contains(d.data)) or max_sizes[d.data] < d.ndata) {
                max_sizes[d.data] = d.ndata;
            }
        }

        auto a = this->alpha.get();

        LL.reset(new LL_t());
        LL->reserve(max_sizes.size()); // reserve for the same number of elements

        // now go through and compute the likelihood of each hypothesis on each data set
        for(const auto& [dptr, sz] : max_sizes) {
            if(CTRL_C) break;

            LL->emplace(dptr, nhypotheses()); // in this slot, make something of size nhypotheses

            #pragma omp parallel for
            for(size_t h=0;h<nhypotheses();h++) {

                // set up all the likelihoods here
                Vector data_lls = Vector::Zero(sz);

                // read the max size from above and compute all the likelihoods
                for(size_t i=0;i<sz;i++) {

                    // Here we could do
                    //   data_lls(i) = hypotheses[h].compute_single_likelihood(dptr->at(i));
                    // but that isn't defined for some hypotheses, so we take the slightly
                    // slower route of building a one-element dataset:
                    typename HYP::data_t d = { dptr->at(i) };
                    for(auto& di : d) {
                        di.reliability = a; // set to our alpha value
                    }

                    data_lls(i) = hypotheses[h].compute_likelihood(d);

                    assert(not std::isnan(data_lls(i))); // NaNs will really mess everything up
                }

                #pragma omp critical
                LL->at(dptr)[h] = std::move(data_lls);
            }
        }
    }

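    // For example (hypothetical numbers): if a concept's data pointer has max size 3, then
    // LL->at(dptr)[h] is a length-3 vector whose i'th entry is hypothesis h's log-likelihood
    // of item i alone, with reliability alpha already folded in by compute_likelihood.
    // recompute_decayedLikelihood below then takes decay-weighted sums over these entries.
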
    // Recomputes the decayed likelihood: at the current decay level, the total log-likelihood
    // of each hypothesis on each human data point.
    virtual void recompute_decayedLikelihood(const data_t& human_data) {
        assert(which_data == std::addressof(human_data));

        // we need a NEW decayed likelihood matrix if we change it
        decayedLikelihood.reset(new Matrix(nhypotheses(), human_data.size()));

        // find the max power we'll ever need
        int MX = 0; // we could start this at -1 but then for zero data things go bad
        for(auto& di : human_data) {
            MX = std::max(MX, di.decay_index+1); // need +1 since 0 decay needs one value
        }

        // just compute the powers once -- might be faster still with vector intrinsics
        Vector powers = Vector::Ones(MX);
        auto dc = get_decay();
        for(int i=1;i<MX;i++) { // intentionally leaving powers(0) = 1 here
            powers(i) = powf(i, -dc);
        }

        // sum up with the memory decay
        #pragma omp parallel for
        for(size_t h=0;h<nhypotheses();h++) {
            for(int di=0;di<(int)human_data.size();di++) {
                const datum_t& d = human_data[di];
                const Vector& v = LL->at(d.data)[h]; // the pre-computed vector of per-item log-likelihoods

                double dl = 0.0; // the decayed likelihood value
                for(size_t k=0;k<d.ndata;k++) {
                    dl += v(k) * powers(d.decay_index - d.decay_position->at(k)); // TODO: This could be stored as a vector -- might be faster w/o the loop
                }

                assert(not std::isnan(dl));

                // each (h,di) cell is written by exactly one thread, so no critical section is needed
                (*decayedLikelihood)(h,di) = dl;
            }
        }
    }

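    // A worked example (hypothetical numbers): with decay dc = 0.5, an item seen 4 positions
    // before the current decay_index gets weight powers(4) = 4^(-0.5) = 0.5, while an item at
    // age 1 gets 1^(-0.5) = 1 (and age 0 also gets weight 1, since powers(0) is left at 1).
    // Each entry of decayedLikelihood is therefore a recency-weighted sum of the per-item
    // log-likelihoods stored in LL.
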
    // Recompute the predictions P for each hypothesis on each data point.
    virtual void recompute_P(std::vector<HYP>& hypotheses, const data_t& human_data) = 0;

    // This uses hposterior (computed via this->compute_normalized_posterior()) to compute the
    // model predictions on the i'th human data point.
    virtual std::map<typename HYP::output_t, double> compute_model_predictions(const data_t& human_data, const size_t i, const Matrix& hposterior) const = 0;


    virtual const HYP& computeMAP(const size_t di, const Matrix& hposterior) const {
        // compute the MAP hypothesis at a given amount of data (column di of hposterior)
        int best_idx = 0;
        double best_score = -infinity;

        for(int h=0;h<hposterior.rows();h++) {
            if(hposterior(h,di) > best_score) {
                best_idx = h;
                best_score = hposterior(h,di);
            }
        }
        return which_hypotheses->at(best_idx);
    }

    // The chance log-probability of response r on human datum hd (i.e. of a random human response).
    virtual double human_chance_lp(const typename datum_t::output_t& r, const datum_t& hd) const {
        return log(hd.chance);
    }


    virtual double compute_prior() override {
        return this->prior = logA.compute_prior() +
                             alpha.compute_prior() +
//                           llt.compute_prior() +
                             //pt.compute_prior() +
                             decay.compute_prior();
    }

    // This returns a matrix hposterior[h,di] giving each hypothesis h's posterior at each human
    // data point di, normalized and converted to probability (not log) space.
    virtual Matrix compute_normalized_posterior() const {

        // the model's posterior
        // Do we need to normalize the prior here? No -- it's just a constant,
        // and that gets normalized away in the posterior.
        const auto hprior = this->hypothesis_prior();
        const auto hlikelihood = (*decayedLikelihood);
        Matrix hposterior = hlikelihood.colwise() + hprior;
        //Matrix hposterior = (*decayedLikelihood).colwise() + hprior;

        // now normalize each column and convert to probabilities
        #pragma omp parallel for
        for(int di=0;di<hposterior.cols();di++) {

            // here we normalize and convert to *probability* space
            const Vector& v = hposterior.col(di);
            const Vector lv = lognormalize(v).array().exp();
            // Oddly, the one-liner below does not work
            // (it compiles, but gives strange answers...)
            // const auto& lv = lognormalize(hposterior.col(di)).array().exp();

            #pragma omp critical
            hposterior.col(di) = lv;
        }

        return hposterior;
    }

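    // A worked example (hypothetical numbers): if a column holds unnormalized log scores
    // [0, log 3], lognormalize subtracts logsumexp = log 4 to give [log(1/4), log(3/4)], and
    // exp() then yields the probabilities [0.25, 0.75]. The strange answers from the commented
    // one-liner above are presumably an Eigen aliasing issue: lv must be materialized as a
    // concrete Vector before being written back into the very column it reads from.
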
    // This computes the likelihood of the human data.
    virtual double compute_likelihood(const data_t& human_data, const double breakout=-infinity) override {

        // check that this is the data we were constructed with
        if(which_data != std::addressof(human_data)) {
            CERR "*** You are computing likelihood on a dataset that the BaseGrammarHypothesis was not constructed with." ENDL
            CERR "    You must call set_hypotheses_and_data before calling this likelihood, but note that when you" ENDL
            CERR "    do that, it will need to recompute everything (which might take a while)." ENDL;
            assert(false);
        }

        // This needs a little explanation. If the types have been overridden, the code below can fail to
        // compile because, for instance, r.first won't be of the right type to index into model_predictions.
        // So this constexpr check removes that chunk of code at compile time when the types have been changed;
        // in its place we leave a runtime assertion failure, meaning you must override compute_likelihood
        // if you change these types.
        if constexpr(std::is_same<std::vector<std::pair<typename HYP::output_t,size_t>>, typename datum_t::response_t>::value) {

            const Matrix hposterior = this->compute_normalized_posterior();

            this->likelihood = 0.0; // summed over all of the human data

            // precompute these so we don't keep doing it
            const auto log_alpha = log(get_alpha());
            const auto log_1malpha = log(1.0-get_alpha());

            #pragma omp parallel for
            for(size_t i=0;i<human_data.size();i++) {

                const auto model_predictions = compute_model_predictions(human_data, i, hposterior);

                double ll = 0.0; // the log-likelihood of this datum's responses
                auto& di = human_data[i];
                for(const auto& [r,cnt] : di.responses) {
                    ll += cnt * logplusexp_full( log_1malpha + human_chance_lp(r,di),
                                                 log_alpha + log(get(model_predictions, r, 0.0)));
                }

                #pragma omp atomic
                this->likelihood += ll;
            }

            return this->likelihood;
        }
        else {
            assert(false && "*** If you use BaseGrammarHypothesis with non-default types, you need to override compute_likelihood so it does the right thing.");
            return -infinity; // unreachable, but keeps all control paths returning a value
        }
    }

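    // A worked example (hypothetical numbers): with alpha = 0.9, a chance probability of 0.25,
    // and a model prediction of 0.5 for response r, each of r's cnt responses contributes
    //   logplusexp_full(log(0.1) + log(0.25), log(0.9) + log(0.5)) = log(0.025 + 0.45) = log(0.475),
    // i.e. humans are modeled as responding from the posterior-weighted model with probability
    // alpha and at chance otherwise.
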
    [[nodiscard]] virtual this_t restart() const override {
        this_t out(*static_cast<const this_t*>(this)); // copy

        out.logA = logA.restart();

        out.set_alpha(alpha.restart());
        out.set_decay(decay.restart());
//      out.llt = llt.restart();
        //out.pt = pt.restart();

        return out;
    }

    // Propose to the hypothesis. This sometimes proposes to the grammar parameters (logA)
    // and sometimes to the other parameters (alpha, decay).
    [[nodiscard]] virtual std::optional<std::pair<this_t,double>> propose() const override {

        // TODO: Can probably speed this up by not making the copy if the proposal fails

        // make a copy
        this_t out(*static_cast<const this_t*>(this));

        if(flat_prior or flip(0.15)) { // if flat, we NEVER propose to logA

            double myfb = 0.0;
            auto which = random_nonempty_subset(2, 0.25);

            if(which.at(0)) {
                auto p = alpha.propose();
                if(not p) return {}; // Hmm, we could change this -- failed proposals could just be skipped here
                auto [ v, fb ] = p.value();
                out.set_alpha(v);
                myfb += fb;
            }

            if(which.at(1)) {
                auto p = decay.propose();
                if(not p) return {};
                auto [ v, fb ] = p.value();
                out.set_decay(v);
                myfb += fb;
            }

            return std::make_pair(out, myfb);
        }
        else {
            auto p = logA.propose();
            if(not p) return {};
            auto [ v, fb ] = p.value();
            out.logA = v;
            return std::make_pair(out, fb);
        }
    }

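    // Note on the returned double: as in other Fleet proposals, it is the forward-minus-backward
    // log proposal probability, log q(x'|x) - log q(x|x'), summed over whichever sub-proposals
    // fired, which the MCMC acceptance ratio needs for asymmetric proposals.
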
    // Compute a vector of priors (one per hypothesis) from the counts matrix C (hypotheses x rules).
    virtual Vector hypothesis_prior() const {

        if(flat_prior) {
            return Vector::Zero(C->rows());
        }

        // We might want this version, but if we normalize, the prior becomes underdetermined
        // because we can scale everything by a constant; on the other hand, without it the
        // prior isn't normalized, which is probably fine.
//      return lognormalize( (*C) * (-logA.value) / pt.get() );

        // The unnormalized version -- note that pt here also lets us scale to possibly weird values.
        //return (*C) * (-logA.value) / pt.get();

        return (*C) * (-logA.value);

        // One alternative is to have "pt" be the amount of held-out mass:
        //return lognormalize( (*C) * (-logA.value) - pt.get() );


        // This version does the rational-rules thing and requires that logA store the log of the A
        // values; it ends up giving kind of crazy values. NOTE: This version also constrains each NT
        // to sum to 1, which our general version above does not.

        // Vector out(nhypotheses()); // one for each hypothesis

        // get the marginal probability of the counts via a Dirichlet-multinomial
        //Vector allA = logA.value.array().exp(); // translate [-inf,inf] into [0,inf]

//      #pragma omp parallel for
//      for(auto i=0;i<myC.rows();i++) {
//
//          double lp = 0.0;
//          size_t offset = 0;
//          for(size_t nt=0;nt<grammar->count_nonterminals();nt++) { // each nonterminal in the grammar is a DM
//              size_t nrules = grammar->count_rules( (nonterminal_t) nt);
//              if(nrules > 1) { // don't need to do anything if there is only one rule (but must still increment offset)
//                  Vector a = eigenslice(allA,offset,nrules); // TODO: seqN doesn't seem to work with this eigen version
//                  Vector c = eigenslice(myC.row(i),offset,nrules);
//
//                  // This version does RR marginalization and requires us to use logA.value.array().exp() above.
//                  double n = a.sum(); assert(n > 0.0);
//                  double c0 = c.sum();
//                  if(c0 != 0.0) { // TODO: Check this...
//                      // NOTE: std::lgamma here is not thread safe, so we use mylgamma defined in Numerics
//                      lp += mylgamma(n+1) + mylgamma(c0) - mylgamma(n+c0)
//                            + (c.array() + a.array()).array().lgamma().sum()
//                            - (c.array()+1).array().lgamma().sum()
//                            - a.array().lgamma().sum();
//                  }
//              }
//              offset += nrules;
//          }
//
//          #pragma omp critical
//          out(i) = lp / temp; // NOTE: we use the temp before we lognormalize
//      }
    }

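    // A concrete check of the live return line above (hypothetical numbers): with
    // logA = [0.7, 0.0, 1.2] and C.row(h) = [2, 0, 1], hypothesis h gets unnormalized log prior
    //   -(2*0.7 + 0*0.0 + 1*1.2) = -2.6,
    // so hypotheses that use high-logA rules more often receive lower prior probability.
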
    virtual bool operator==(const this_t& h) const override {
        return (C == h.C and LL == h.LL and P == h.P) and
               (logA == h.logA) and
               (alpha == h.alpha) and
               (decay == h.decay);
    }

    // This returns a string for this hypothesis: a tidy (tab-separated) format with all the parameters.
    virtual std::string string(std::string prefix="") const override {
        // For now we just provide partial information
        //return "GrammarHypothesis["+str(this->posterior) + params.string() + ", " + logA.string() + "]";
        std::string out = "";

        // the -1 here is just to contrast with the nt printed below
        out += prefix + "-1\tposterior.score" +"\t"+ str(this->posterior) + "\n";
        out += prefix + "-1\tparameter.prior" +"\t"+ str(this->prior) + "\n";
        out += prefix + "-1\thuman.likelihood" +"\t"+ str(this->likelihood) + "\n";
        out += prefix + "-1\talpha" +"\t"+ str(get_alpha()) + "\n";
//      out += prefix + "-1\tllt" +"\t"+ str(get_llt()) + "\n";
//      out += prefix + "-1\tpt" +"\t"+ str(pt.get()) + "\n";
        out += prefix + "-1\tdecay" +"\t"+ str(get_decay()) + "\n";

        // now add the grammar operations
        size_t xi=0;
        for(auto& r : *grammar) {
            if(logA.can_propose[xi]) { // skip the things we set as effectively constant (but still increment xi)
                std::string rs = r.format;
                rs = std::regex_replace(rs, std::regex("\\%s"), "X");
                out += prefix + str(r.nt) + "\t" + QQ(rs) +"\t" + str(flat_prior ? 0.0 : logA(xi)) + "\n"; // untransformed (unlogged) value here
            }
            xi++;
        }
        out.erase(out.size()-1,1); // delete the final newline

        return out;
    }

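    // For illustration (hypothetical values), the tidy output looks roughly like:
    //   -1	posterior.score	-1524.3
    //   -1	alpha	0.92
    //   -1	decay	0.41
    //   0	"and(X,X)"	0.7
    // where the first column is the nonterminal (-1 for the global parameters) and the last
    // column is the untransformed logA value for that rule.
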
    // Need to override show() since print() would otherwise use a different format.
    virtual void show(std::string prefix="") override {
        print(string(prefix));
    }

    virtual size_t hash() const override {
        size_t output = logA.hash();
        hash_combine(output, alpha.hash(), decay.hash());
        return output;
    }

    virtual std::string serialize() const override { throw NotImplementedError(); }
    static this_t deserialize(const std::string& s) { throw NotImplementedError(); }

};