12 h.
Reset(len, hlayer * hnode);
23 if (nPos + nOrder >
m_nLen) {
24 lout_error(
"[Seq] GetSubSeq: nPos+nOrder > nLen!!");
27 for (
int i = nPos; i < nPos + nOrder; i++) {
30 sub.
h[i - nPos] =
h[i];
39 if (
x.
x == s.
x.
x &&
h == s.
h)
45 for (
int i = 0; i <
h.
GetCol(); i++) {
46 for (
int j = 0; j <
m_nLen; j++) {
47 lout <<
h[j][i] <<
"\t";
55 ofstream ofile(file.
fp);
56 for (
int i = 0; i <
h.
GetCol(); i++) {
57 for (
int j = 0; j <
m_nLen; j++) {
58 ofile <<
h[j][i] <<
"\t";
73 m_m3dHH.Reset(
m_hlayer * m_hnode, m_hnode, 4);
74 m_matBias.Reset(
m_hlayer*m_hnode, 2);
82 pParam += m_pFeat->GetNum();
99 pParam += m_pFeat->GetNum();
117 double dfactor = 1.0;
120 for (
int i = 0; i < seq.
GetLen(); i++) {
121 logSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[i]], seq.
h[i]);
125 if (m_m3dCH.GetSize() > 0) {
126 for (
int i = 0; i < seq.
GetLen(); i++) {
127 logSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[i]], seq.
h[i]);
132 for (
int i = 0; i < seq.
GetLen() - 1; i++) {
133 logSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[i], seq.
h[i + 1]);
137 for (
int i = 0; i < seq.
GetLen(); i++) {
138 logSum += dfactor * SumVHWeight(m_matBias, seq.
h[i]);
143 int nLen = min(m_maxlen, seq.
GetLen());
151 File fout(pfilename,
"rt");
153 lout <<
"[Model]: Read(txt) from " << pfilename << endl;
156 fout.
Scanf(
"m_vocabsize=%d\n", &nVocabSize);
157 fout.
Scanf(
"m_maxlen=%d\n", &m_maxlen);
162 if (m_pVocab->GetSize() != nVocabSize) {
163 lout_error(
"[Model] ReadT: the input nVocabSize(" << nVocabSize <<
") != m_pVocab->GetSize(" << m_pVocab->GetSize() <<
")");
167 fout.
Scanf(
"m_pi=[ ");
168 for (
int i = 1; i <= m_maxlen; i++) {
169 fout.
Scanf(
"%lf ", &dValue);
173 fout.
Scanf(
"m_logz=[ ");
174 for (
int i = 1; i <= m_maxlen; i++) {
175 fout.
Scanf(
"%lf ", &dValue);
179 fout.
Scanf(
"m_zeta=[ ");
180 for (
int i = 1; i <= m_maxlen; i++) {
181 fout.
Scanf(
"%lf ", &dValue);
187 fout.
Scanf(
"featnum=%d\n", &nValue);
188 m_value.Reset(nValue);
192 m_pFeat->ReadT(fout, m_value.GetBuf());
200 while (pLine = fout.
GetLine()) {
203 String strLabel = strtok(pLine,
": \t");
204 pLine = strtok(NULL,
": \t");
205 if (strLabel ==
"m_matVH")
208 sscanf(pLine,
"(num=%d*%d)", &nRow, &nCol);
209 m_m3dVH.Reset(nRow, nCol, 2);
212 else if (strLabel ==
"m_matCH")
215 sscanf(pLine,
"(num=%d*%d)", &nRow, &nCol);
216 m_m3dCH.Reset(nRow, nCol, 2);
219 else if (strLabel ==
"m_matHH")
221 sscanf(pLine,
"(num=%d*%d)", &nRow, &nCol);
222 m_m3dHH.Reset(nRow, nCol, 4);
225 else if (strLabel ==
"m_matBias")
227 sscanf(pLine,
"(num=%d)", &nRow);
228 m_matBias.Reset(nRow, 2);
229 m_matBias.Read(fout);
235 File fout(pfilename,
"wt");
236 lout <<
"[Model] Write(txt) to " << pfilename << endl;
238 fout.
Print(
"m_vocabsize=%d\n", m_pVocab->GetSize());
239 fout.
Print(
"m_maxlen=%d\n", m_maxlen);
242 fout.
Print(
"m_pi=[ ");
243 for (
int i = 1; i <= m_maxlen; i++) {
244 fout.
Print(
"%f ", m_pi[i]);
247 fout.
Print(
"m_logz=[ ");
248 for (
int i = 1; i <= m_maxlen; i++) {
249 fout.
Print(
"%f ", m_logz[i]);
252 fout.
Print(
"m_zeta=[ ");
253 for (
int i = 1; i <= m_maxlen; i++) {
254 fout.
Print(
"%f ", m_zeta[i]);
258 fout.
Print(
"featnum=%d\n", m_pFeat->GetNum());
259 m_pFeat->WriteT(fout, m_value.GetBuf());
262 fout.
Print(
"m_matVH: (num=%d*%d)\n", m_m3dVH.GetXDim(), m_m3dVH.GetYDim());
266 fout.
Print(
"m_matCH: (num=%d*%d)\n", m_m3dCH.GetXDim(), m_m3dCH.GetYDim());
270 fout.
Print(
"m_matHH: (num=%d*%d)\n", m_m3dHH.GetXDim(), m_m3dHH.GetYDim());
274 fout.
Print(
"m_matBias: (num=%d)\n", m_matBias.GetRow());
275 m_matBias.Write(fout);
280 for (
int layer = 0; layer <
m_hlayer; layer++) {
289 logProb += FeatClusterSum(trfseq, 0, x.
GetSize());
292 int nLen = min(m_maxlen, x.
GetSize());
300 return FeatClusterSum(seq.
x, nPos, nOrder) + HiddenClusterSum(seq, nPos, nOrder);
311 double dfactor = 1.0;
314 LogSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[nPos]], seq.
h[nPos]);
316 if (nPos == seq.
GetLen() - nOrder) {
317 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
318 LogSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[i]], seq.
h[i]);
323 if (m_m3dCH.GetSize() > 0) {
324 LogSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[nPos]], seq.
h[nPos]);
326 if (nPos == seq.
GetLen() - nOrder) {
327 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
328 LogSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[i]], seq.
h[i]);
335 LogSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[nPos], seq.
h[nPos + 1]);
337 if (nPos == seq.
GetLen() - nOrder) {
338 for (
int i = nPos + 1; i < seq.
GetLen() - 1; i++)
339 LogSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[i], seq.
h[i + 1]);
344 LogSum += dfactor * SumVHWeight(m_matBias, seq.
h[nPos]);
346 if (nPos == seq.
GetLen() - nOrder) {
347 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
348 LogSum += dfactor * SumVHWeight(m_matBias, seq.
h[i]);
359 double dfactor = 1.0;
362 LogSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[nPos]], seq.
h[nPos], nlayer);
364 if (nPos == seq.
GetLen() - nOrder) {
365 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
366 LogSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[i]], seq.
h[i], nlayer);
371 if (m_m3dCH.GetSize() > 0) {
372 LogSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[nPos]], seq.
h[nPos], nlayer);
374 if (nPos == seq.
GetLen() - nOrder) {
375 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
376 LogSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[i]], seq.
h[i], nlayer);
383 LogSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[nPos], seq.
h[nPos + 1], nlayer);
385 if (nPos == seq.
GetLen() - nOrder) {
386 for (
int i = nPos + 1; i < seq.
GetLen() - 1; i++)
387 LogSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[i], seq.
h[i + 1], nlayer);
392 LogSum += dfactor * SumVHWeight(m_matBias, seq.
h[nPos], nlayer);
394 if (nPos == seq.
GetLen() - nOrder) {
395 for (
int i = nPos + 1; i < seq.
GetLen(); i++) {
396 LogSum += dfactor * SumVHWeight(m_matBias, seq.
h[i], nlayer);
405 int nMaxOrder = max(GetMaxOrder(), GetHiddenOrder());
406 int nIterDim = min(nMaxOrder, nLen);
414 for (
VocabID x = m_pVocab->IterBeg();
x <= m_pVocab->IterEnd();
x++) {
416 VocabID cid = m_pVocab->GetClass(
x);
417 xseq.
Set(&
x, 1, m_pVocab);
418 double d1 = FeatClusterSum(xseq, 0, 1);
423 d2 +=
trf::Log_Sum(m_matBias[k][0] + m_m3dVH[
x][k][0] + m_m3dCH[cid][k][0],
424 m_matBias[k][1] + m_m3dVH[
x][k][1] + m_m3dCH[cid][k][1]);
427 d2 +=
trf::Log_Sum(m_matBias[k][0] + m_m3dVH[
x][k][0], m_matBias[k][1] + m_m3dVH[
x][k][1]);
432 m_logz[nLen] = dLogSum;
435 int nEncoderLimit = GetEncodeNodeLimit();
437 m_nodeCal.ForwardBackward(nLen, nMaxOrder, nEncoderLimit);
439 m_logz[nLen] = m_nodeCal.GetLogSummation();
447 for (
int len = 1; len <= m_maxlen; len++) {
449 m_zeta[len] = m_logz[len] - m_logz[1];
457 if (nPos + sub.
GetLen() > nLen) {
458 lout_error(
"[Model] GetMarginalLogProb: nPos(" << nPos <<
")+nOrder(" << sub.
GetLen() <<
") > seq.len(" << nLen <<
")!!");
463 EncodeNode(nsub, sub);
465 LogP dSum = m_nodeCal.GetMarginalLogProb(nPos, nsub.GetBuf(), nsub.GetSize());
467 return (bNorm) ? dSum - m_logz[nLen] : dSum;
472 if (pLenProb == NULL)
473 pLenProb = m_pi.GetBuf();
477 double *p = expTemp.
GetBuf();
481 BufMap(p, featexp, VHexp, CHexp, HHexp, Bexp);
484 for (
int len = 1; len <= m_maxlen; len++) {
486 int nMaxOrder = max(GetMaxOrder(), GetHiddenOrder());
487 m_nodeCal.ForwardBackward(len, nMaxOrder, GetEncodeNodeLimit());
489 GetNodeExp(len, featexp, VHexp, CHexp, HHexp, Bexp);
494 for (
int i = 0; i < exp.
GetSize(); i++) {
495 exp[i] += pLenProb[len] * expTemp[i];
504 BufMap(pExp, featexp, VHexp, CHexp, HHexp, Bexp);
505 GetNodeExp(nLen, featexp, VHexp, CHexp, HHexp, Bexp);
519 double dfactor = 1.0;
522 int nClusterNum = nLen - m_nodeCal.m_nOrder + 1;
523 int nClusterDim = m_nodeCal.m_nOrder;
524 if (nClusterNum < 1) {
533 for (
int pos = 0; pos < nClusterNum; pos++) {
536 while (iter.Next()) {
537 DecodeNode(nseq, seq, pos, nClusterDim);
544 for (
int n = 1; n <= nClusterDim; n++) {
545 m_pFeat->
Find(afeat, seq.
x, pos, n);
547 for (
int i = 0; i < afeat.
GetNum(); i++) {
548 featexp[afeat[i]] += prob;
553 VHexp[
x][k][(int)(seq.
h[pos][k])] += dfactor * prob;
555 if (m_pVocab->GetClassNum() > 0) {
558 CHexp[c][k][(int)(seq.
h[pos][k])] += dfactor * prob;
561 if (nClusterDim > 1) {
562 for (
int l = 0; l <
m_hlayer; l++) {
563 for (
int a = 0; a <
m_hnode; a++) {
564 for (
int b = 0; b <
m_hnode; b++) {
565 HHexp[l*m_hnode + a][b][
HHMap(seq.
h[pos][l*m_hnode + a], seq.
h[pos + 1][l*m_hnode + b])] += dfactor * prob;
571 Bexp[k][(int)(seq.
h[pos][k])] += dfactor * prob;
578 if (pos == nClusterNum - 1) {
580 for (
int ii = 1; ii < nClusterDim; ii++) {
581 for (
int n = 1; n <= nClusterDim - ii; n++) {
582 m_pFeat->Find(afeat, seq.
x, pos + ii, n);
585 for (
int i = 0; i < afeat.
GetNum(); i++) {
586 featexp[afeat[i]] += prob;
589 for (
int ii = 1; ii < nClusterDim; ii++) {
592 VHexp[
x][k][seq.
h[pos + ii][k]] += dfactor * prob;
595 if (m_pVocab->GetClassNum() > 0) {
596 for (
int ii = 1; ii < nClusterDim; ii++) {
599 CHexp[c][k][seq.
h[pos + ii][k]] += dfactor * prob;
603 for (
int ii = 1; ii < nClusterDim - 1; ii++) {
604 for (
int l = 0; l <
m_hlayer; l++) {
605 for (
int a = 0; a <
m_hnode; a++) {
606 for (
int b = 0; b <
m_hnode; b++) {
607 HHexp[l*m_hnode + a][b][
HHMap(seq.
h[pos + ii][l*m_hnode + a], seq.
h[pos + ii + 1][l*m_hnode + b])] += dfactor * prob;
612 for (
int ii = 1; ii < nClusterDim; ii++) {
614 Bexp[k][seq.
h[pos + ii][k]] += dfactor * prob;
628 BufMap(pExp, featexp, VHexp, CHexp, HHexp, Bexp);
632 int nMaxOrder = GetHiddenOrder();
634 for (
int layer = 0; layer <
m_hlayer; layer++) {
641 GetLayerExp(fb, layer, VHexp, CHexp, HHexp, Bexp, logz);
657 int nClusterNum = nLen - fb.
m_nOrder + 1;
659 if (nClusterNum < 1) {
664 double dfactor = 1.0;
667 for (
int pos = 0; pos < nClusterNum; pos++) {
670 while (iter.Next()) {
671 DecodeLayer(hseq, h, nLayer, pos, nClusterDim);
676 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode+
m_hnode; k++) {
677 VHexp[
x][k][h[pos][k]] += dfactor * prob;
679 if (m_pVocab->GetClassNum() > 0) {
681 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode +
m_hnode; k++) {
682 CHexp[c][k][h[pos][k]] += dfactor * prob;
685 if (nClusterDim > 1) {
686 for (
int a = 0; a <
m_hnode; a++) {
687 for (
int b = 0; b <
m_hnode; b++) {
688 HHexp[nLayer*m_hnode + a][b][
HHMap(h[pos][nLayer*m_hnode + a], h[pos + 1][nLayer*m_hnode + b])] += dfactor * prob;
692 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode +
m_hnode; k++) {
693 Bexp[k][h[pos][k]] += dfactor * prob;
697 if (pos == nClusterNum - 1) {
698 for (
int ii = 1; ii < nClusterDim; ii++) {
700 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode +
m_hnode; k++) {
701 VHexp[
x][k][h[pos + ii][k]] += dfactor * prob;
703 if (m_pVocab->GetClassNum() > 0) {
705 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode +
m_hnode; k++) {
706 CHexp[c][k][h[pos + ii][k]] += dfactor * prob;
709 for (
int k = nLayer*m_hnode; k < nLayer*m_hnode +
m_hnode; k++) {
710 Bexp[k][h[pos + ii][k]] += dfactor * prob;
713 for (
int ii = 1; ii < nClusterDim - 1; ii++) {
714 for (
int a = 0; a <
m_hnode; a++) {
715 for (
int b = 0; b <
m_hnode; b++) {
716 HHexp[nLayer*m_hnode + a][b][
HHMap(h[pos + ii][nLayer*m_hnode + a], h[pos + ii + 1][nLayer*m_hnode + b])] += dfactor * prob;
732 int nOldLen = seq.
GetLen();
734 LogP j1 = ProposeLength(nOldLen, nNewLen,
true);
735 LogP j2 = ProposeLength(nNewLen, nOldLen,
false);
737 if (nNewLen == nOldLen)
741 if (nNewLen == nOldLen + 1) {
742 LogP logpold = GetLogProb(seq);
744 LogP Q = ProposeH0(seq.
h[nNewLen - 1], seq, nNewLen - 1,
true);
745 LogP R = ProposeC0(seq.
cseq()[nNewLen - 1], seq, nNewLen - 1,
true);
746 LogP G = SampleW(seq, nNewLen - 1);
747 LogP logpnew = GetLogProb(seq);
749 logpAcc = (j2 - j1) + logpnew - (logpold + Q + R + G);
751 else if (nNewLen == nOldLen - 1) {
752 LogP logpold = GetLogProb(seq);
753 LogP Q = ProposeH0(seq.
h[nOldLen - 1], seq, nOldLen - 1,
false);
754 LogP R = ProposeC0(seq.
cseq()[nOldLen - 1], seq, nOldLen - 1,
false);
755 LogP G = SampleW(seq, nOldLen - 1,
false);
758 LogP logpnew = GetLogProb(seq);
760 logpAcc = (j2 - j1) + logpnew + Q + R + G - logpold;
762 else if (nNewLen != nOldLen){
763 lout_error(
"[Model] Sample: nNewLen(" << nNewLen <<
") and nOldLen(" << nOldLen <<
")");
769 m_nLenJumpAccTimes++;
774 m_nLenJumpTotalTime++;
780 SampleHAndCGivenX(seq);
781 for (
int nPos = 0; nPos < seq.
GetLen(); nPos++) {
803 if (nPos + 1 > seq.
GetLen()) {
808 ProposeHProbs(logps, seq, nPos);
813 for (
int i = 0; i < logps.
GetSize(); i++) {
819 LogP resLogp = GetConditionalProbForH(hi, logps);
827 if (m_pVocab->GetClassNum() == 0) {
832 Vec<LogP> vlogps(m_pVocab->GetClassNum());
833 ProposeCProbs(vlogps, seq, nPos);
848 double dfactor = 1.0;
851 if (nPos - 1 >= 0 && nPos - 1 <= seq.
GetLen() - 1) {
852 for (
int l = 0; l <
m_hlayer; l++) {
853 for (
int i = 0; i <
m_hnode; i++) {
854 HValue curh = seq.
h[nPos - 1][l*m_hnode + i];
855 for (
int j = 0; j <
m_hnode; j++) {
856 matLogp.
Get(l*m_hnode + j, 0) += dfactor * m_m3dHH.Get(l*m_hnode + i, j,
HHMap(curh, 0));
857 matLogp.
Get(l*m_hnode + j, 1) += dfactor * m_m3dHH.Get(l*m_hnode + i, j,
HHMap(curh, 1));
862 if (nPos + 1 <= seq.
GetLen() - 1) {
863 for (
int l = 0; l <
m_hlayer; l++) {
864 for (
int i = 0; i <
m_hnode; i++) {
865 HValue curh = seq.
h[nPos + 1][l*m_hnode + i];
866 for (
int j = 0; j <
m_hnode; j++) {
867 matLogp.
Get(l*m_hnode + j, 0) += dfactor * m_m3dHH.Get(l*m_hnode + j, i,
HHMap(0, curh));
868 matLogp.
Get(l*m_hnode + j, 1) += dfactor * m_m3dHH.Get(l*m_hnode + j, i,
HHMap(1, curh));
876 matLogp[i][0] += dfactor * m_matBias[i][0];
877 matLogp[i][1] += dfactor * m_matBias[i][1];
880 if (bConsiderXandC) {
883 matLogp[i][0] += dfactor * m_m3dVH[seq.
wseq()[nPos]][i][0];
884 matLogp[i][1] += dfactor * m_m3dVH[seq.
wseq()[nPos]][i][1];
886 if (m_m3dCH.GetSize() > 0) {
889 matLogp[i][0] += dfactor * m_m3dCH[seq.
cseq()[nPos]][i][0];
890 matLogp[i][1] += dfactor * m_m3dCH[seq.
cseq()[nPos]][i][1];
900 logps[i] = matLogp[i][1] -
trf::Log_Sum(matLogp[i][1], matLogp[i][0]);
906 for (
int cid = 0; cid < m_pVocab->GetClassNum(); cid++) {
907 seq.
cseq()[nPos] = cid;
908 logps[cid] = GetReducedModelForC(seq, nPos);
910 seq.
cseq()[nPos] = savecid;
918 double dfactor = 1.0;
920 for (
int i = max(0, nPos - 1); i <= min(seq.
GetLen() - 2, nPos); i++) {
921 logSum += dfactor * SumHHWeight(m_m3dHH, seq.
h[i], seq.
h[i + 1]);
924 logSum += dfactor * SumVHWeight(m_matBias, seq.
h[nPos]);
934 double dfactor = 1.0;
935 if (m_m3dCH.GetSize() > 0) {
936 logSum += dfactor * SumVHWeight(m_m3dCH[seq.
cseq()[nPos]], seq.
h[nPos]);
947 double dfactor = 1.0;
948 logSum += dfactor * SumVHWeight(m_m3dVH[seq.
wseq()[nPos]], seq.
h[nPos]);
955 for (
int i = 0; i < hi.
GetSize(); i++) {
956 resLogp += (hi[i] == 0) ?
trf::Log_Sub(0, logps[i]) : logps[i];
968 for (
int i = 0; i < pXs->
GetNum(); i++) {
969 seq.
wseq()[nPos] = pXs->
Get(i);
972 resLogp =
trf::Log_Sum(resLogp, GetReducedModelForW(seq, nPos) + GetReducedModelForC(seq, nPos));
975 seq.
wseq()[nPos] = saveX;
981 if (m_pVocab->GetClassNum() == 0) {
987 Vec<LogP> vlogps_c(m_pVocab->GetClassNum());
988 ProposeCProbs(vlogps_c, seq, nPos);
991 LogP logpRi = vlogps_c[ci];
992 LogP logpR0 = vlogps_c[C0];
996 seq.
cseq()[nPos] = ci;
997 LogP Logp_ci = GetMarginalProbOfC(seq, nPos);
998 seq.
cseq()[nPos] = C0;
999 LogP Logp_C0 = GetMarginalProbOfC(seq, nPos);
1001 LogP acclogp = logpRi + Logp_C0 - (logpR0 + Logp_ci);
1003 m_nSampleHTotalTimes++;
1005 m_nSampleHAccTimes++;
1006 seq.
cseq()[nPos] = C0;
1009 seq.
cseq()[nPos] = ci;
1019 if (nPos >= seq.
GetLen()) {
1020 lout_error(
"[Model] SampleH: the nPos(" << nPos <<
") > the length of sequence(" << seq.
GetLen() <<
")");
1027 for (
int i = 0; i < pXs->GetNum(); i++) {
1028 seq.
wseq()[nPos] = pXs->Get(i);
1032 aLogps[i] = GetReducedModelForW(seq, nPos);
1040 seq.
wseq()[nPos] = pXs->Get(idx);
1043 idx = pXs->Find(nSaveX);
1044 seq.
wseq()[nPos] = nSaveX;
1046 lout_error(
"Can't find the VocabID(" << nSaveX <<
") in the array.\n" 1047 <<
"This may beacuse word(" << nSaveX <<
") doesnot belongs to class(" << seq.
cseq()[nPos] <<
")");
1055 LogP totallogProb = 0;
1061 for (
int nPos = 0; nPos < seq.
GetLen(); nPos++) {
1063 ProposeHProbs(vlogps_h, seq, nPos,
true);
1067 hsample.
Copy((*tagH)[nPos]);
1070 for (
int i = 0; i < hsample.
GetSize(); i++) {
1075 seq.
h[nPos] = hsample;
1077 LogP logprob = GetConditionalProbForH(hsample, vlogps_h);
1078 totallogProb += logprob;
1080 return totallogProb;
1093 for (
int i = 0; i < seq.
h.
GetRow(); i++) {
1094 for (
int k = 0; k < seq.
h.
GetCol(); k++) {
1095 seq.
h[i][k] = rand() % 2;
1104 for (
int i = 0; i < seq.
h.
GetRow(); i++) {
1105 for (
int k = 0; k < seq.
h.
GetCol(); k++) {
1106 seq.
h[i][k] = rand() % 2;
1113 int hnum = EncodeHidden(hi);
1115 return hnum * m_pVocab->GetSize() + xi;
1119 nDim = (nDim == -1) ? seq.
GetLen() - nPos : nDim;
1120 for (
int i = nPos; i < nPos + nDim; i++) {
1121 vn[i] = EncodeNode(seq.
wseq()[i], seq.
cseq()[i], seq.
h[i]);
1126 int hnum = n / m_pVocab->GetSize();
1128 xi = n % m_pVocab->GetSize();
1129 ci = m_pVocab->GetClass(xi);
1130 DecodeHidden(hnum, hi);
1134 nDim = (nDim == -1) ? vn.
GetSize() - nPos : nDim;
1135 for (
int i = nPos; i < nPos + nDim; i++) {
1136 DecodeNode(vn[i], seq.
wseq()[i], seq.
cseq()[i], seq.
h[i]);
1141 return GetEncodeHiddenLimit() * m_pVocab->GetSize();
1146 for (
int i = 0; i < hi.
GetSize(); i++) {
1147 hnum += (int)hi[i] * (1 << i);
1154 for (
int i = 0; i < hi.
GetSize(); i++) {
1161 nDim = (nDim == -1) ? vn.
GetSize() - nPos : nDim;
1162 for (
int i = nPos; i < nPos + nDim; i++) {
1163 DecodeHidden(vn[i], h[i]);
1176 nDim = (nDim == -1) ? vn.
GetSize() - nPos : nDim;
1177 for (
int i = nPos; i < nPos + nDim; i++) {
1178 DecodeHidden(vn[i], h[i].GetSub(layer*
m_hnode, m_hnode));
1192 HiddenFeatCount(seq, VHcount, CHcount, HHcount, Bcount, dadd);
1199 double dfactor = 1.0;
1201 for (
int i = 0; i < seq.
GetLen(); i++) {
1203 VHcount[seq.
wseq()[i]][k][seq.
h[i][k]] += dfactor * dadd;
1208 if (m_pVocab->GetClassNum() > 0) {
1209 for (
int i = 0; i < seq.
GetLen(); i++) {
1211 CHcount[seq.
cseq()[i]][k][seq.
h[i][k]] += dfactor * dadd;
1217 for (
int i = 0; i < seq.
GetLen() - 1; i++) {
1218 for (
int l = 0; l <
m_hlayer; l++) {
1219 for (
int a = 0; a <
m_hnode; a++) {
1220 for (
int b = 0; b <
m_hnode; b++) {
1221 HHcount.
Get(l * m_hnode + a, b,
HHMap(seq.
h.
Get(i, l*m_hnode + a), seq.
h.
Get(i + 1, l*m_hnode + b))) += dfactor * dadd;
1228 for (
int i = 0; i < seq.
GetLen(); i++) {
1230 Bcount[k][seq.
h[i][k]] += dfactor * dadd;
1239 BufMap(count.
GetBuf(), featcount, VHcount, CHcount, HHcount, Bcount);
1240 FeatCount(seq, featcount, VHcount, CHcount, HHcount, Bcount, dadd);
1246 for (
int i = 0; i < h.
GetSize(); i++) {
1247 dsum += m[i][(int)h[i]];
1255 for (
int k = 0; k <
m_hlayer; k++) {
1256 for (
int i = 0; i <
m_hnode; i++) {
1257 for (
int j = 0; j <
m_hnode; j++)
1259 dsum += m.
Get(k*m_hnode + i, j,
HHMap(h1[k*m_hnode + i], h2[k*m_hnode + j]));
1269 dsum += m[i][(int)h[i]];
1278 for (
int i = 0; i <
m_hnode; i++) {
1279 for (
int j = 0; j <
m_hnode; j++)
1281 dsum += m.
Get(k*m_hnode + i, j,
HHMap(h1[k*m_hnode + i], h2[k*m_hnode + j]));
1290 int nThread = omp_get_max_threads();
1291 Mat<double> m_matSampleLen(nThread, GetMaxLen() + 1);
1296 for (
int i = 0; i < nThread; i++) {
1305 for (
int t = 1; t <= tmax; t++) {
1306 m_matSampleLen.
Fill(0);
1307 m_vecSampleLen.
Fill(0);
1309 #pragma omp parallel for 1310 for (
int m = 0;
m < nMinibatch;
m++) {
1311 int tid = omp_get_thread_num();
1312 this->Sample(*aSeqs[tid]);
1313 int nLen = min(GetMaxLen(), aSeqs[tid]->
GetLen());
1314 m_matSampleLen[tid][nLen]++;
1318 for (
int i = 0; i < nThread; i++) {
1319 m_vecSampleLen += m_matSampleLen[i];
1321 m_vecSampleLen /= nMinibatch;
1326 gamma = 1.0 / pow(t, beta);
1329 gamma = 1.0 / (pow(t0, beta) + t - t0);
1333 for (
int i = 1; i <= GetMaxLen(); i++) {
1334 zeta[i] += min(zgap, gamma * m_vecSampleLen[i] / m_pi[i]);
1336 this->SetZeta(zeta.
GetBuf());
1345 int nParamsNumOfIntermediateModel = GetParamNum() - m_pFeat->GetNum();
1347 Vec<PValue> vParamsPn(nParamsNumOfIntermediateModel);
1348 Vec<PValue> vParamsP0(nParamsNumOfIntermediateModel);
1349 Vec<PValue> vParamsCur(nParamsNumOfIntermediateModel);
1361 vParamsPn.
Copy(vParamsP0);
1362 p = vParamsPn.
GetBuf() + m_m3dVH.GetSize() + m_m3dCH.GetSize();
1363 memset(p, 0,
sizeof(
PValue)*m_m3dHH.GetSize());
1367 for (
int nPos = 0; nPos < nLen; nPos++) {
1369 VocabID cid = m_pVocab->GetClass(xid);
1374 d2 +=
trf::Log_Sum(m_m3dVH[xid][k][0] + m_m3dCH[cid][k][0] + m_matBias[k][0], m_m3dVH[xid][k][1] + m_m3dCH[cid][k][1] + m_matBias[k][1]);
1377 d2 +=
trf::Log_Sum(m_m3dVH[xid][k][0] + m_matBias[k][0], m_m3dVH[xid][k][1] + m_matBias[k][1]);
1386 for (
int i = 0; i < aInterModel.
GetNum(); i++) {
1392 aInterModel[i]->SetPi(m_pi.GetBuf());
1393 aInterModel[i]->m_zeta.
Copy(m_zeta);
1394 aInterModel[i]->m_logz.
Copy(m_logz);
1395 lout_assert(aInterModel[i]->GetParamNum() == nParamsNumOfIntermediateModel);
1398 aLogWeight.
SetNum(nChain);
1403 for (
int k = 0; k < nChain; k++) {
1405 Model *pInterModel = aInterModel[tid];
1410 for (
int nPos = 0; nPos < seq.
GetLen(); nPos++) {
1412 VocabID cid = m_pVocab->GetClass(xid);
1416 curP[0] = m_m3dVH[xid][k][0] + m_m3dCH[cid][k][0] + m_matBias[k][0];
1417 curP[1] = m_m3dVH[xid][k][1] + m_m3dCH[cid][k][1] + m_matBias[k][1];
1420 curP[0] = m_m3dVH[xid][k][0] + m_matBias[k][0];
1421 curP[1] = m_m3dVH[xid][k][1] + m_matBias[k][1];
1434 for (
int t = nIntermediate - 1; t >= 0; t--) {
1438 for (
int i = 0; i < vParamsCur.
GetSize(); i++)
1439 vParamsCur[i] = vParamsP0[i] * (1 - beta) + vParamsPn[i] * beta;
1451 aLogWeight[k] = log_w;
1455 for (
int i = 0; i < aInterModel.
GetNum(); i++) {
1465 LogP logpx = FeatClusterSum(seq.
x, 0, nLen);
1467 return logprob + logpx;
1478 for (
int i = 0; i < num; i++) {
1479 SampleHAndCGivenX(seq);
1480 LogP curlogp = GetLogProb(seq,
true);
1481 if (curlogp > maxLogp) {
1497 m_seq.Reset(nLen, m_pModel->m_hlayer, m_pModel->m_hnode);
1498 m_pModel->DecodeNode(
VecShell<int>(pSeq, nLen), m_seq, nPos, nOrder);
1499 return m_pModel->ClusterSum(m_seq, nPos, nOrder);
1511 m_pModel->DecodeLayer(
VecShell<int>(pSeq, nLen), m_seq.h, m_nlayer, nPos, nOrder);
1512 return m_pModel->LayerClusterSum(m_seq, m_nlayer, nPos, nOrder);
virtual LogP SampleHAndCGivenX(Seq &seq, MatShell< HValue > *tagH=NULL)
[sample] sample h given x using gibbs sampling.
AlgLayer(Model *p, VecShell< VocabID > x, int nlayer)
void Copy(Seq &seq)
copy the sequence
T & Get(unsigned int i, unsigned int j)
void Copy(const Array< T > &array)
Copy the array to current array.
#define SAFE_DELETE(p)
memory release
LogP Log_Sub(LogP x, LogP y)
log[exp(x)-exp(y)]
int GetEncodeNodeLimit() const
The encoded integer size.
T & Get(int i)
get the value at position i
void LocalJump(Seq &seq)
[sample] Local Jump - sample a new length
int LogLineSampling(const LogP *pdProbs, int nNum)
int m_hnode
the number of hidden nodes
Seq GetSubSeq(int nPos, int nOrder)
Return the sub-sequence.
void Random(Vocab *pv)
Random.
void Reset(Vocab *pv, int maxlen)
reset, the maxlen is the length excluding the beg/end symbols.
virtual LogP ClusterSum(int *pSeq, int nLen, int nPos, int nOrder)
This function needs to be derived. Calculate the log probability of each cluster.
void Reset(int len, int hlayer, int hnode)
bool operator==(Seq &s)
If the two sequences are equal.
int m_nLen
the sequence length.
void ExactNormalize()
[exact] Exact normalization over all the lengths
LogP GetMarginalLogProb(int nLen, int nPos, Seq &sub, bool bNorm=true)
[exact] Exactly calculate the marginal probability at position 'nPos' and with order 'nOrder' ...
LogP GetLogProb_Gibbs(VecShell< VocabID > &x, int num=100)
sample the best hidden and calculate the joint probability.
LogP Log_Sum(LogP x, LogP y)
LogP HiddenClusterSum(Seq &seq, int nPos, int nOrder)
[exact] Calculate the logp in each cluster. Only consider the VH,CH,HH values, used in class AlgHidd...
LogP GetLogProb(Seq &seq, bool bNorm=true)
calculate the probability
void GetNodeExp(double *pExp, Prob *pLenProb=NULL)
[exact] sum_l { n_l/n * E_{p_l}[f] }: Exactly calculate the expectation over x and h ...
int m_nLen
multiple hidden matrix [position * (layer * hnode)]
T & Get(int x, int y, int z)
virtual void SetParam(PValue *pParam)
Set the parameters.
hidden-random-field model
void GetLayerExp(AlgLayer &fb, int nLayer, Mat3dShell< double > &VHexp, Mat3dShell< double > &CHexp, Mat3dShell< double > &HHexp, MatShell< double > &Bexp, LogP logz=0)
[exact] called in GetHiddenExp.
virtual void SetParam(PValue *pValue)
Set the parameters.
LogP GetReducedModelForC(Seq &seq, int nPos)
[sample] An unnormalized reduced model to sample class c_i.
virtual int Scanf(const char *p_pMessage,...)
scanf
void FeatCount(Seq &seq, VecShell< double > featcount, Mat3dShell< double > VHcount, Mat3dShell< double > CHcount, Mat3dShell< double > HHcount, MatShell< double > Bcount, double dadd=1)
Count the feature number in current sequence, and add to the result.
int GetEncodeHiddenLimit() const
The encoded integer size.
void Reset(int p_len)
reset only changes the len variable; it does not change the buffer size.
T * GetBuffer(int i=0) const
get the buffer pointer
LogP GetMarginalProbOfC(Seq &seq, int nPos)
[sample] Fixed h, given c_i, sum up the probabilities of x_i, i.e. P(c_i)
void SampleC(Seq &seq, int nPos)
[sample] Sample the c_i at position nPos given h_i without x_i.
virtual void Print(const char *p_pMessage,...)
print
int m_nOrder
the order, i.e. the node number at each cluster {x_1,x_2,...,x_n}
define a sequence including the word sequence and class sequence
LogP ProposeC0(VocabID &ci, Seq &seq, int nPos, bool bSample)
[sample] Propose the c_{i} at position i. Then return the propose probability R(c_i|h_i,c_{other})
void FeatCount(Seq &seq, double *pCount, double dadd=1.0)
Count the feature number in a sequence.
LogP ClusterSum(Seq &seq, int nPos, int nOrder)
[exact] Calculate the logP in each cluster. Only used for forward-backward algorithms ( class AlgNode...
int m_nTotalNum
total feature number
void ReadT(const char *pfilename)
Read Model.
int LineSampling(const Prob *pdProbs, int nNum)
LogP ProposeH0(VecShell< HValue > &hi, Seq &seq, int nPos, bool bSample)
[sample] Propose the h_{i} at position i. Then return the propose probability Q(h_i|h_{other}) ...
LogP GetReducedModelForC(Seq &seq, int nPos)
[sample] An unnormalized reduced model to sample class c_i, considering CH matrix(U) and class-ngram ...
int Find(T t)
Find a value and return the position.
LogP SampleW(Seq &seq, int nPos, bool bSample=true)
[sample] Sample the w_i at position nPos
void GetParam(PValue *pValue)
Get the parameter vector.
int GetEncodeLayerLimit() const
The encoded integer size of one layer.
void Set(Array< int > &aInt, Vocab *pv)
transform the word sequence (form file) to Seq
LogP ProposeLength(int nOld, int &nNew, bool bSample)
[sample] Propose the length, using the variable m_matLenJump
#define HRF_VALUE_SET(p, m)
void SetNum(int n)
Set Array number, to malloc enough memory.
virtual char * GetLine(bool bPrecent=false)
Read a line into the buffer.
bool Acceptable(Prob prob)
LogP GetLogSummation()
Get the summation over the sequence, corresponding to the log normalization constants 'logZ'...
void ProposeCProbs(VecShell< LogP > &logps, Seq &seq, int nPos)
[sample] Return the distribution of c_i at position nPos
void DecodeNode(int n, VocabID &xi, VocabID &ci, VecShell< HValue > &hi)
decode a integer to the x_i and h_i
void Clean()
Clean the array. Just set the top of array to -1 and do not release the memory.
void HiddenFeatCount(Seq &seq, Mat3dShell< double > VHcount, Mat3dShell< double > CHcount, Mat3dShell< double > HHcount, MatShell< double > Bcount, double dadd=1)
Count the hidden features.
int EncodeNode(VocabID xi, VocabID ci, VecShell< HValue > &hi)
encode the x_i and h_i at position i to a integer
Vocab * GetVocab() const
Get Vocab.
LogP ClusterSum(Seq &seq, int nPos, int nOrder)
Read Binary.
void PerformSAMS(int nMinibatch, int tmax, int t0, int beta, double zgap=10)
perform the SAMS to estimate the normalization constants zeta
LogP LayerClusterSum(Seq &seq, int nlayer, int nPos, int nOrder)
[exact] Calculate the logp in each cluster. Only consider the VH,CH,HH values on such layer ...
int GetNum() const
Get Array number.
void Reset(int row=0, int col=0)
void DecodeHidden(int n, VecShell< HValue > hi)
decode a integer to a hidden vector
VocabID * GetClassSeq()
get class sequence
int m_hlayer
the number of hidden layer
LogP LogLineNormalize(LogP *pdProbs, int nNum)
void ForwardBackward(int nLen, int nOrder, int nValueLimit)
forward-backward calculation
void MarkovMove(Seq &seq)
[sample] Markov Move - perform the gibbs sampling
double GetAISFactor(int t, int T)
Get the AIS intermediate factor beta_t.
VocabID * GetWordSeq()
get word sequence
Log lout
the definition is in wb-log.cpp
LogP FeatClusterSum(trf::Seq &x, int nPos, int nOrder)
[exact] Calculate the logp in each cluster. Only consider the feature values
void Fill(T m)
set all the values to m
void Reset(Vocab *pv, int hlayer, int hnode, int maxlen)
reset, the maxlen is the length excluding the beg/end symbols.
LogP GetMarginalLogProb(int nPos, int *pSubSeq, int nSubLen, double logz=0)
Get the marginal probability. 'logz' is the input of the log normalization constants.
void ProposeHProbs(VecShell< LogP > &logps, Seq &seq, int nPos, bool bConsiderXandC=false)
[sample] A reduced model considering only HHmat(W) and VHmat(M) and CHmat(U).
#define HRF_VALUE_GET(p, m)
void RandHidden(Seq &seq)
Random init the hidden variables.
void GetParam(PValue *pParam)
Get the parameter vector.
void Copy(MatShell< T > &m)
int EncodeHidden(VecShell< HValue > hi)
encode the hidden vector h_i to a integer
void DecodeLayer(VecShell< int > &vn, Mat< HValue > &h, int layer, int nPos=0, int nDim=-1)
decode several integers to a sequence
LogP GetReducedModelForW(Seq &seq, int nPos)
[sample] An unnormalized reduced model to sample word w_i, considering VH matrix(M) and word-ngram (l...
include all the feature table
PValue SumHHWeight(Mat3dShell< PValue > m, VecShell< HValue > h1, VecShell< HValue > h2)
virtual LogP ClusterSum(int *pSeq, int nLen, int nPos, int nOrder)
This function needs to be derived. Calculate the log probability of each cluster.
LogP GetLogProb_AIS(VecShell< VocabID > &x, int nChain=10, int nIntermediate=10000)
perform AIS to estimate the marginal probabilities
void RandSeq(Seq &seq, int nLen=-1)
Random init sequence, if nLen==-1, random the length also.
PValue SumVHWeight(MatShell< PValue > m, VecShell< HValue > h)
LogP GetConditionalProbForH(VecShell< HValue > &hi, VecShell< Prob > &probs)
[sample] using the logprobs returned by ProposeHProb to calculate the logprob of hi.
void Copy(VecShell< T > v)
LogP GetReducedModelForH(Seq &seq, int nPos)
[sample] An unnormalized reduced model. It only considers the HH matrix (W)
void GetHiddenExp(VecShell< int > x, double *pExp)
[exact] E_{p_l(h|x)}[f]: don't clean the pExp and directly add the new exp to pExp.
LogP GetLogProb(Seq &seq, bool bNorm=true)
calculate the probability
void Sample(Seq &seq)
[sample] Perform one trans-dimensional mixture sampling
LogP GetReducedModelForW(Seq &seq, int nPos)
[sample] An unnormalized reduced model to sample word w_i.
void WriteT(const char *pfilename)
Write Model.