software/TRF-html/trf-model_8h_source.html

 // You may obtain a copy of the License at
 //
 //     http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.
 //
 // Copyright 2014-2015 Tsinghua University
 // Author: wb.th08@gmail.com (Bin Wang), ozj@tsinghua.edu.cn (Zhijian Ou)
 //
 // All h, cpp, cc, and script files (e.g. bat, sh, pl, py) should include the above
 // license declaration. Different coding languages may use different comment styles.


 #pragma once
 #include "trf-feature.h"
 #include "trf-alg.h"
 #include <omp.h>

 namespace trf
 {


     class Model;

     /// The forward-backward algorithms for the TRF model.
     ///
     /// Derives from Algfb and keeps a pointer to the Model it was built for.
     /// ClusterSum is only declared here; its definition lives outside this header.
     class AlgNode : public Algfb
     {
     private:
         Model *m_pModel; ///< the model handed to the constructor; this class declares no destructor, so it is not released here
         Seq m_seq;       ///< a sequence member (how it is used is not visible in this header)
     public:
         /// constructor
         /// @param p  the model stored in m_pModel
         AlgNode(Model *p)
             : m_pModel(p)
         {
         }
         /// Calculate the log probability of a cluster.
         /// @param pSeq    the sequence, given as an int buffer
         /// @param nLen    presumably the length of the sequence - TODO confirm against the definition
         /// @param nPos    presumably the position of the cluster - TODO confirm against the definition
         /// @param nOrder  presumably the order (size) of the cluster - TODO confirm against the definition
         virtual LogP ClusterSum(int *pSeq, int nLen, int nPos, int nOrder);
     };
     /// TRF model.
     ///
     /// Holds the feature table, the feature values, the length prior and the
     /// normalization constants, and declares the exact-calculation, sampling and
     /// AIS-normalization routines. Only the small inline members are defined in
     /// this header.
     ///
     /// NOTE(review): the destructor releases m_pFeat and m_AlgNode keeps a pointer
     /// back to its model, so a compiler-generated copy would release m_pFeat twice
     /// and leave the copied m_AlgNode pointing at the source object. Avoid copying
     /// a Model.
     class Model
     {
     public:
         Feat *m_pFeat;          ///< hash of all the features; released in the destructor
         Vec<PValue> m_value;    ///< the value of each feature

         int m_maxlen;           ///< the maximum length of the model, excluding <s> and </s>. The min-len = 1
         Vec<Prob> m_pi;         ///< the prior length distribution
         Vec<LogP> m_logz;       ///< the normalization constants log Z_l
         Vec<LogP> m_zeta;       ///< the estimated normalization constants, relative to length 1 (see SetZeta)

         Vocab *m_pVocab;        ///< the vocabulary passed to the constructor; not released by this class

         Mat<Prob> m_matLenJump; ///< [sample] used to propose a new length
         int m_maxSampleLen;     ///< [sample] the maximum sample length; 0 until assigned (presumably by Reset - TODO confirm)

     protected:
         AlgNode m_AlgNode;      ///< the forward-backward calculation node, bound to this model

     public:
         /// constructor: no features, max-len 0, all sampling counters cleared.
         /// @param pv  the vocabulary
         Model(Vocab *pv) :
             m_pFeat(NULL),
             m_maxlen(0),
             m_pVocab(pv),
             m_maxSampleLen(0), // previously left uninitialized
             m_AlgNode(this){
             m_nLenJumpAccTimes = 0;
             m_nLenJumpTotalTime = 0;
             m_nSampleHAccTimes = 0;
             m_nSampleHTotalTimes = 0;
         }
         /// constructor: same as above, then calls Reset(pv, maxlen).
         /// @param pv      the vocabulary
         /// @param maxlen  the maximum length forwarded to Reset
         Model(Vocab *pv, int maxlen) :
             m_pFeat(NULL),
             m_maxlen(0),
             m_pVocab(pv),
             m_maxSampleLen(0), // defined value in case Reset does not assign it
             m_AlgNode(this) {
             Reset(pv, maxlen);
             // the counters are cleared after Reset, as before
             m_nLenJumpAccTimes = 0;
             m_nLenJumpTotalTime = 0;
             m_nSampleHAccTimes = 0;
             m_nSampleHTotalTimes = 0;
         }
         /// destructor: releases the feature table.
         /// Virtual because the class is used as a polymorphic base
         /// (it has virtual members and derived classes), so deleting a derived
         /// object through a Model pointer must run the derived destructor.
         virtual ~Model()
         {
             SAFE_DELETE(m_pFeat);
         }
         /// Get max-len.
         int GetMaxLen() const { return m_maxlen; }
         /// Get Vocab.
         Vocab *GetVocab() const { return m_pVocab; }
         /// Get maximum order. Requires m_pFeat to be non-NULL (it is dereferenced unconditionally).
         int GetMaxOrder() const { return m_pFeat->GetMaxOrder(); }
         /// Get parameter number; 0 when no feature table is attached.
         int GetParamNum() const { return (m_pFeat) ? m_pFeat->GetNum() : 0; }
         /// Reset the model for the vocabulary pv and the maximum length maxlen (defined outside this header).
         void Reset(Vocab *pv, int maxlen);
         /// Set the parameters from the buffer pValue (presumably GetParamNum() values - TODO confirm).
         virtual void SetParam(PValue *pValue);
         /// Get the parameters into the buffer pValue (presumably GetParamNum() values - TODO confirm).
         void GetParam(PValue *pValue);
         /// Set the length distribution from the buffer pPi (presumably into m_pi - TODO confirm).
         void SetPi(Prob *pPi);
         /// Set updated zeta.
         ///
         /// Calls ExactNormalize(1) first, then for every length i in [1, m_maxlen]
         /// stores zeta relative to length 1 and derives log Z_i from it:
         ///     m_zeta[i] = pzeta[i] - pzeta[1],   m_logz[i] = m_zeta[i] + m_logz[1].
         /// @param pzeta  buffer read at indices 1..m_maxlen
         template <typename T>
         void SetZeta(T *pzeta)
         {
             ExactNormalize(1);
             for (int i = 1; i <= m_maxlen; i++) {
                 m_zeta[i] = static_cast<LogP>( pzeta[i] - pzeta[1] );
                 m_logz[i] = static_cast<LogP>( m_zeta[i] + m_logz[1] );
             }
         }
         /// Copy m_zeta[1..m_maxlen] into pzeta[1..m_maxlen], converting each value to T.
         /// Index 0 of pzeta is not written.
         template <typename T>
         void GetZeta(T *pzeta)
         {
             for (int i = 1; i <= m_maxlen; i++) {
                 pzeta[i] = static_cast<T>( m_zeta[i] );
             }
         }
         /// Get the log probability of a sequence.
         /// @param bNorm  presumably selects whether the result is normalized - TODO confirm
         LogP GetLogProb(Seq &seq, bool bNorm = true);
         /// Load the features from a corpus file, given a feature style and an order (defined outside this header).
         void LoadFromCorpus(const char *pcorpus, const char *pfeatstyle, int nOrder);
         /// Count the features of a sequence into pCount.
         /// @param dadd  presumably the amount added per feature occurrence - TODO confirm
         void FeatCount(Seq &seq, double *pCount, double dadd = 1.0);

         /// Read the model from the file pfilename (presumably a text format, cf. the disabled ReadB/WriteB - TODO confirm).
         void ReadT(const char *pfilename);
         /// Write the model to the file pfilename (presumably a text format - TODO confirm).
         void WriteT(const char *pfilename);
 //      void ReadB(const char *pfilename);
 //      /// Write Binary
 //      void WriteB(const char *pfilename);

         /************************************************************************/
         /* exact calculation functions                                          */
         /************************************************************************/
     public:
         /// Log value of the cluster of the given order at position nPos of seq.
         LogP ClusterSum(Seq &seq, int nPos, int nOrder);
         /// Exact normalization for the length nLen (SetZeta relies on the call with
         /// nLen = 1 before it reads m_logz[1]).
         virtual double ExactNormalize(int nLen);
         /// Exact normalization without a length argument (presumably for all lengths - TODO confirm).
         virtual void ExactNormalize();
         /// Get the expectations into pExp for the length nLen.
         void GetNodeExp(int nLen, double *pExp);
         /// Get the expectations into pExp.
         /// @param pLenProb  optional length probabilities; NULL by default
         void GetNodeExp(double *pExp, Prob *pLenProb = NULL);

         /************************************************************************/
         /* sampling functions                                                   */
         /************************************************************************/
     public:
         int m_nLenJumpAccTimes;   ///< length jump: the number of acceptances
         int m_nLenJumpTotalTime;  ///< length jump: the total number of jumps
         int m_nSampleHAccTimes;   ///< sample H: the number of acceptances
         int m_nSampleHTotalTimes; ///< sample H: the total number of proposals
         /// [sample] Sample a sequence, updating seq in place.
         void Sample(Seq &seq);
         /// [sample] Local jump; used together with ProposeC0 (see the note above SampleC).
         void LocalJump(Seq &seq);
         /// [sample] Markov move; virtual so that derived models can replace it.
         virtual void MarkovMove(Seq &seq);
         /// [sample] Propose a new length nNew given the old length nOld.
         /// Presumably returns the log proposal probability - TODO confirm.
         LogP ProposeLength(int nOld, int &nNew, bool bSample);
         /// [sample] Propose the class ci at position nPos without accepting it
         /// (see the note above SampleC).
         LogP ProposeC0(VocabID &ci, Seq &seq, int nPos, bool bSample);
         /// [sample] Fill logps with the proposal log probabilities of the classes at position nPos.
         void ProposeCProbs(VecShell<LogP> &logps, Seq &seq, int nPos);
         /* To reduce the computation cost, the following functions replace GetLogProb
            when sampling c_i at position i in ProposeCProbs and ProposeC0.
            They only consider the features that depend on c_i and are independent of w_i,
            i.e. they calculate the proposal probability without knowing w_i at position i.
         */
         LogP GetReducedModelForC(Seq &seq, int nPos);
         LogP GetReducedModelForW(Seq &seq, int nPos);
         LogP GetReducedModel(Seq &seq, int nPos);
         LogP GetMarginalProbOfC(Seq &seq, int nPos);
         /* The only difference from ProposeC0 is that
            SampleC accepts the class after proposing it,
            while ProposeC0 does not.
            ProposeC0 is used in the local jump. It cannot accept the proposed c0, as there is no initial value of c_i.
            SampleC is used in the Markov move.
         */
         void SampleC(Seq &seq, int nPos);
         /* If bSample = true, sample x[nPos]. Otherwise only calculate the conditional probability of the current x[nPos]. */
         LogP SampleX(Seq &seq, int nPos, bool bSample = true);
     public:
         /// AIS normalization for the length nLen.
         /// @param nChain  presumably the number of chains - TODO confirm
         /// @param nInter  presumably the number of intermediate distributions - TODO confirm
         LogP AISNormalize(int nLen, int nChain, int nInter);
         /// AIS normalization for the lengths nLenMin..nLenMax (bounds presumably inclusive - TODO confirm).
         void AISNormalize(int nLenMin, int nLenMax, int nChain, int nInter);
     };

     class Model_FastSample : public Model
     {
     public:
         int m_nMHtimes;
     public:
         Model_FastSample(Vocab *pv) :Model(pv) {
             m_nMHtimes = 1;
         }
         Model_FastSample(Vocab *pv, int maxlen) :Model(pv, maxlen) {
             m_nMHtimes = 1;
         }
         LogP ProposeW0(VocabID &wi, Seq &seq, int nPos, bool bSample = true)
         {
             Array<VocabID> *pXs = m_pVocab->GetWord(seq.x[class_layer][nPos]);
             Array<LogP> aLogps;

             VocabID nSaveX = seq.x[word_layer][nPos]; // save w[nPos]
             for (int i = 0; i < pXs->GetNum(); i++) {
                 seq.x[word_layer][nPos] = pXs->Get(i);

 //              LogP d = 0;
 //              Array<int> afeat;
 //              m_pFeat->Find(afeat, seq, nPos, 1);
 //              for (int i = 0; i < afeat.GetNum(); i++)
 //                  d += m_value[afeat[i]];
                 aLogps[i] = 1; //GetReducedModelForW(seq, nPos);
             }
             seq.x[word_layer][nPos] = nSaveX;
             LogLineNormalize(aLogps, pXs->GetNum());

             int idx;
             if (bSample) {
                 /* sample a value for x[nPos] */
                 idx = LogLineSampling(aLogps, pXs->GetNum());
                 wi = pXs->Get(idx);
             }
             else {
                 idx = pXs->Find(nSaveX); // find nSave in the array.
                 if (idx == -1) {
                     lout_error("Can't find the VocabID(" << nSaveX << ") in the array.\n"
                         << "This may beacuse word(" << nSaveX << ") doesnot belongs to class("
                         << seq.x[class_layer][nPos] << ")");
                 }
             }

             return aLogps[idx];
         }

         void ProposeCProbs(VecShell<LogP> &logps, Seq &seq, int nPos)
         {
             VocabID savecid = seq.x[class_layer][nPos];
             for (int cid = 0; cid < m_pVocab->GetClassNum(); cid++) {
                 seq.x[class_layer][nPos] = cid;
                 logps[cid] = 1;
             }
             seq.x[class_layer][nPos] = savecid;
             LogLineNormalize(logps.GetBuf(), m_pVocab->GetClassNum());
         }

         void MarkovMove(Seq &seq)
         {
             for (int i = 0; i < seq.GetLen(); i++)
                 SamplePos(seq, i);
         }
         void SamplePos(Seq &seq, int nPos)
         {
             for (int times = 0; times < m_nMHtimes; times++)
             {

                 VocabID old_c = seq.x[class_layer][nPos];
                 VocabID old_w = seq.x[word_layer][nPos];
                 LogP pold = GetReducedModel(seq, nPos);


                 VocabID prop_c = omp_nrand(0, m_pVocab->GetClassNum());
                 Array<VocabID> *pWords = m_pVocab->GetWord(prop_c);
                 int prop_w_id = omp_nrand(0, pWords->GetNum());
                 VocabID prop_w = pWords->Get(prop_w_id);

                 seq.x[class_layer][nPos] = prop_c;
                 seq.x[word_layer][nPos] = prop_w;
                 LogP pnew = GetReducedModel(seq, nPos);

                 LogP g_old = Prob2LogP(1.0 / m_pVocab->GetClassNum()) + Prob2LogP(1.0 / m_pVocab->GetWord(old_c)->GetNum());
                 LogP g_new = Prob2LogP(1.0 / m_pVocab->GetClassNum()) + Prob2LogP(1.0 / m_pVocab->GetWord(prop_c)->GetNum());
                 LogP acclogp = pnew + g_old - (pold + g_new);

                 if (Acceptable(LogP2Prob(acclogp))) {
                     m_nSampleHAccTimes++;
                     seq.x[class_layer][nPos] = prop_c;
                     seq.x[word_layer][nPos] = prop_w;
                 }
                 else {
                     seq.x[class_layer][nPos] = old_c;
                     seq.x[word_layer][nPos] = old_w;
                 }
                 m_nSampleHTotalTimes++;

                 lout_assert(seq.x[class_layer][nPos] == m_pVocab->GetClass(seq.x[word_layer][nPos]));
             }

 //          Vec<LogP> vlogps_c(m_pVocab->GetClassNum());
 //          ProposeCProbs(vlogps_c, seq, nPos);
 //          VocabID ci = seq.x[class_layer][nPos];
 //          VocabID C0 = LogLineSampling(vlogps_c.GetBuf(), vlogps_c.GetSize());
 //          LogP gci = vlogps_c[ci];
 //          LogP gc0 = vlogps_c[C0];
 //
 //          VocabID wi = seq.x[word_layer][nPos];
 //          VocabID w0;
 //          seq.x[class_layer][nPos] = ci;
 //          LogP gwi_ci = ProposeW0(wi, seq, nPos, false);
 //          seq.x[class_layer][nPos] = C0;
 //          LogP gw0_c0 = ProposeW0(w0, seq, nPos, true);
 //
 //          seq.x[class_layer][nPos] = ci;
 //          seq.x[word_layer][nPos] = wi;
 //          LogP pold = GetReducedModel(seq, nPos);
 //          seq.x[class_layer][nPos] = C0;
 //          seq.x[word_layer][nPos] = w0;
 //          LogP pnew = GetReducedModel(seq, nPos);
 //
 //          LogP acclogp = pnew + gci + gwi_ci - (pold + gc0 + gw0_c0);
 //          if (Acceptable(LogP2Prob(acclogp))) {
 //              m_nSampleHAccTimes++;
 //              seq.x[class_layer][nPos] = C0;
 //              seq.x[word_layer][nPos] = w0;
 //          }
 //          else {
 //              seq.x[class_layer][nPos] = ci;
 //              seq.x[word_layer][nPos] = wi;
 //          }
 //          m_nSampleHTotalTimes++;
         }
     };
 }
wb::Mat< Prob >

trf::Model::m_pi
Vec< Prob > m_pi
the prior length distribution
Definition: trf-model.h:58

trf::Model::GetParamNum
int GetParamNum() const
Get parameter number.
Definition: trf-model.h:106

trf::Prob
double Prob
Definition: trf-def.h:28

SAFE_DELETE
#define SAFE_DELETE(p)
memory release
Definition: wb-vector.h:49

wb::Vector::Get
T & Get(int i)
get the value at position i
Definition: wb-vector.h:99

trf::Model::Model
Model(Vocab *pv)
constructor
Definition: trf-model.h:72

WriteT
m WriteT(cfg_pathModelWrite)

trf::LogLineSampling
int LogLineSampling(const LogP *pdProbs, int nNum)
Definition: trf-def.cpp:62

trf::Model::Model
Model(Vocab *pv, int maxlen)
constructor
Definition: trf-model.h:83

trf::Model_FastSample::MarkovMove
void MarkovMove(Seq &seq)
[sample] Markov Move - perform the gibbs sampling
Definition: trf-model.h:276

trf::Feat::GetMaxOrder
int GetMaxOrder()
Get maximum order.
Definition: trf-feature.cpp:435

trf::Model::m_maxSampleLen
int m_maxSampleLen
[sample] the maximum sample length, default = m_maxlen + 2
Definition: trf-model.h:65

trf::VocabID
int VocabID
Definition: trf-vocab.h:23

wb::VecShell< LogP >

lout_error
#define lout_error(x)
Definition: wb-log.h:183

lout_assert
#define lout_assert(p)
Definition: wb-log.h:185

trf::Model_FastSample
TRF model, revise the sample method to speedup the MCMC.
Definition: trf-model.h:217

trf::Model::SetZeta
void SetZeta(T *pzeta)
Set updated zeta.
Definition: trf-model.h:117

trf::Algfb
Definition: trf-alg.h:34

trf::Prob2LogP
LogP Prob2LogP(Prob x)
Definition: trf-def.h:36

trf::PValue
double PValue
Definition: trf-def.h:26

trf::Model::m_nSampleHAccTimes
int m_nSampleHAccTimes
sample H the acceptance times
Definition: trf-model.h:169

trf::Model::GetZeta
void GetZeta(T *pzeta)
Definition: trf-model.h:126

trf::LogP
double LogP
Definition: trf-def.h:27

trf::Model_FastSample::Model_FastSample
Model_FastSample(Vocab *pv)
Definition: trf-model.h:222

trf::Seq::GetLen
int GetLen() const
Definition: trf-feature.h:71

trf::Model_FastSample::SamplePos
void SamplePos(Seq &seq, int nPos)
Definition: trf-model.h:281

trf::Model::m_nLenJumpAccTimes
int m_nLenJumpAccTimes
length jump: the number of acceptances
Definition: trf-model.h:167

trf::AlgNode::ClusterSum
virtual LogP ClusterSum(int *pSeq, int nLen, int nPos, int nOrder)
This function needs to be overridden in the derived class. Calculate the log probability of each cluster.
Definition: trf-model.cpp:22

trf::Seq
define a sequence including the word sequence and class sequence
Definition: trf-feature.h:41

wb::Vec< PValue >

trf::Model_FastSample::m_nMHtimes
int m_nMHtimes
Definition: trf-model.h:220

trf::Model_FastSample::ProposeW0
LogP ProposeW0(VocabID &wi, Seq &seq, int nPos, bool bSample=true)
Definition: trf-model.h:228

trf::Feat::GetNum
int GetNum() const
Get number.
Definition: trf-feature.h:200

trf::Model::GetMaxOrder
int GetMaxOrder() const
Get maximum order.
Definition: trf-model.h:104

trf::Model::m_maxlen
int m_maxlen
the maximum length of model, excluding <s> and </s>. The min-len = 1
Definition: trf-model.h:57

trf::Model
TRF model.
Definition: trf-model.h:51

wb::Array::Find
int Find(T t)
Find a value and return the position.
Definition: wb-vector.h:248

trf::Model::m_zeta
Vec< LogP > m_zeta
the estimated normalization constants  (fix  = 0)
Definition: trf-model.h:60

wb::VecShell::GetBuf
T * GetBuf() const
Definition: wb-mat.h:68

word_layer
#define word_layer
Definition: trf-feature.h:31

trf::Seq::x
Mat< VocabID > x
Definition: trf-feature.h:44

trf::Model::m_nLenJumpTotalTime
int m_nLenJumpTotalTime
total times of length jump
Definition: trf-model.h:168

trf::Acceptable
bool Acceptable(Prob prob)
Definition: trf-def.cpp:127

trf::Model::m_pFeat
Feat * m_pFeat
hash all the features
Definition: trf-model.h:54

trf::Model::m_pVocab
Vocab * m_pVocab
Definition: trf-model.h:62

trf::Vocab
Definition: trf-vocab.h:34

trf::Model::GetVocab
Vocab * GetVocab() const
Get Vocab.
Definition: trf-model.h:102

trf::Model::m_nSampleHTotalTimes
int m_nSampleHTotalTimes
Definition: trf-model.h:170

wb::Array::GetNum
int GetNum() const
Get Array number.
Definition: wb-vector.h:240

trf::LogLineNormalize
LogP LogLineNormalize(LogP *pdProbs, int nNum)
Definition: trf-def.cpp:53

trf::AlgNode::AlgNode
AlgNode(Model *p)
Definition: trf-model.h:44

trf::Model_FastSample::ProposeCProbs
void ProposeCProbs(VecShell< LogP > &logps, Seq &seq, int nPos)
Definition: trf-model.h:265

trf::Model_FastSample::Model_FastSample
Model_FastSample(Vocab *pv, int maxlen)
Definition: trf-model.h:225

trf::LogP2Prob
Prob LogP2Prob(LogP x)
Definition: trf-def.h:33

trf::Model::~Model
~Model()
destructor
Definition: trf-model.h:95

trf::Feat
includes all the feature tables
Definition: trf-feature.h:179

trf::omp_nrand
int omp_nrand(int nMin, int nMax)
get a random integer in [nMin, nMax-1]
Definition: trf-def.cpp:152

trf::AlgNode
the forward-backward algorithms for TRF model
Definition: trf-model.h:38

trf-feature.h

trf
Definition: trf-alg.cpp:20

trf-alg.h

trf::Model::m_logz
Vec< LogP > m_logz
the normalization constants log Z_l
Definition: trf-model.h:59

trf::Model::GetMaxLen
int GetMaxLen() const
Get max-len.
Definition: trf-model.h:100

trf::Model::m_AlgNode
AlgNode m_AlgNode
the forward-backward calculation each node
Definition: trf-model.h:68

class_layer
#define class_layer
Definition: trf-feature.h:32

trf::Model::m_value
Vec< PValue > m_value
the value for each features
Definition: trf-model.h:55

trf::Model::m_matLenJump
Mat< Prob > m_matLenJump
[sample] used to propose a new length
Definition: trf-model.h:64

wb::Array< VocabID >