void test_cst_matching_statistics(const Cst& cst, unsigned char* S2, typename Cst::size_type n2) { typedef typename Cst::size_type size_type; typedef typename Cst::node_type node_type; size_type cnt = 0; write_R_output("cst","mstats","begin",n2,cnt); size_type q = 0; // current match length size_type p2 = n2-1; // position in S2 size_type i = 0, j = cst.csa.size()-1; // \f$ \epsilon \f$ matches all suffixes of S1 while (p2+1 > 0) { size_type lb, rb; // perform backward search on interval \f$ [i,j] \f$ size_type size = algorithm::backward_search(cst.csa, i, j, S2[p2], lb, rb); if (size > 0) { q = q + 1; i = lb; j = rb; p2 = p2 - 1; } else if (i==0 and j == cst.csa.size()) { p2 = p2 -1; } else { // map interval to a node of the cst and calculate parent node_type p = cst.parent(cst.node(i, j)); q = cst.depth(p); // update match length i = cst.lb(p); // update left bound j = cst.rb(p); // update right bound } cnt += q; } write_R_output("cst","mstats","end",n2,cnt); }
//! Benchmark: advance the cst iterator `times` steps and sum the depth of every non-leaf node visited.
/*!
 * \param cst    Compressed suffix tree to traverse, starting at cst.begin().
 * \param times  Maximum number of iterator steps; clamped to
 *               2*cst.nodes()-cst.size().
 *               NOTE(review): presumably the total number of visits of a full
 *               traversal (inner nodes twice, leaves once) - confirm against
 *               the iterator's documentation.
 * \param output If true, additionally print for each non-leaf node its depth,
 *               its interval [lb,rb] and - when the depth is below 60 - the
 *               characters cst.edge(v, 1..depth) to std::cerr.
 *
 * The accumulated depth sum is passed to write_R_output together with the
 * (clamped) step count at the beginning and at the end of the run.
 */
void test_cst_dfs_iterator_and_depth(Cst& cst, typename Cst::size_type times=1000000, bool output=false)
{
    typedef typename Cst::size_type size_type;

    // Compute the cap once instead of evaluating the expression twice.
    const size_type max_steps = 2*cst.nodes()-cst.size();
    if (times > max_steps)
        times = max_steps;

    size_type cnt = 0;
    write_R_output("cst","dfs and depth","begin",times,cnt);

    typename Cst::const_iterator it = cst.begin();
    if (!output) {
        // Measurement loop without any printing.
        for (size_type step = 0; step < times; ++step, ++it) {
            if (!cst.is_leaf(*it))
                cnt += cst.depth(*it);
        }
    } else {
        for (size_type step = 0; step < times; ++step, ++it) {
            if (!cst.is_leaf(*it)) {
                size_type d = cst.depth(*it);
                std::cerr << d << "-[" << cst.lb(*it) << "," << cst.rb(*it) << "] ";
                if (d < 60) {
                    // Use a distinct, unsigned index: the original `int i`
                    // shadowed the outer loop counter and was compared
                    // against the unsigned depth.
                    for (size_type k = 1; k <= d; ++k)
                        std::cerr << cst.edge(*it, k);
                }
                std::cerr << std::endl;
                cnt += d;
            }
        }
    }
    write_R_output("cst","dfs and depth","end",times,cnt);
}