[irstlm] 65/126: improved info
Giulio Paci
giuliopaci-guest at moszumanska.debian.org
Tue May 17 07:46:45 UTC 2016
This is an automated email from the git hooks/post-receive script.
giuliopaci-guest pushed a commit to annotated tag adaptiveLM.v0.1
in repository irstlm.
commit 0341a16105bef3aa88eea5451299d9ecdb57ac7a
Author: Nicola Bertoldi <bertoldi at fbk.eu>
Date: Thu Sep 10 10:06:45 2015 +0200
improved info
---
src/context-dependent-evaluation.cpp | 45 +++++++++++++++++++++++++++++++++---
1 file changed, 42 insertions(+), 3 deletions(-)
diff --git a/src/context-dependent-evaluation.cpp b/src/context-dependent-evaluation.cpp
index 26302c1..4498e11 100644
--- a/src/context-dependent-evaluation.cpp
+++ b/src/context-dependent-evaluation.cpp
@@ -601,6 +601,18 @@ int main(int argc, char **argv)
double avgRank;
int tot_rank = 0;
+ //collect total occurrences of current word in the following intervals
+ // [1-1], [1-5], [1-10], [1-20], [1-50]
+ int Rank_histo[5];
+ int Rank_limit[5];
+ int max_rank = lmt->getDict()->size();
+
+ Rank_limit[0] = 1;
+ Rank_limit[1] = 0.05 * max_rank;
+ Rank_limit[2] = 0.10 * max_rank;
+ Rank_limit[3] = 0.20 * max_rank;
+ Rank_limit[4] = 0.50 * max_rank;
+
double bow;
int bol=0;
char *msp;
@@ -609,7 +621,7 @@ int main(int argc, char **argv)
// variables for storing sentence-based Rank Statistics
int sent_Nw=0,sent_Noov=0;
double sent_avgRank;
- int sent_tot_rank = 0;
+ int sent_tot_rank = 0;
std::fstream inptxt(testfile,std::ios::in);
@@ -781,13 +793,30 @@ int main(int argc, char **argv)
sent_tot_rank += current_rank;
tot_rank += current_rank;
+ if (current_rank <= Rank_limit[0]){
+ ++Rank_histo[0];
+ VERBOSE(1,"HERE 0 current_rank:" << current_rank << " Rank_limit[0]:" << Rank_limit[0] << std::endl);
+ }
+ if (current_rank <= Rank_limit[1]){
+ ++Rank_histo[1];
+ VERBOSE(1,"HERE 1 current_rank:" << current_rank << " Rank_limit[1]:" << Rank_limit[1] << std::endl);
+ }else if (current_rank <= Rank_limit[2]){
+ ++Rank_histo[1]; ++Rank_histo[2];
+ VERBOSE(1,"HERE 2 current_rank:" << current_rank << " Rank_limit[2]:" << Rank_limit[2] << std::endl);
+ }else if (current_rank <= Rank_limit[3]){
+ ++Rank_histo[1]; ++Rank_histo[2]; ++Rank_histo[3];
+ VERBOSE(1,"HERE 3 current_rank:" << current_rank << " Rank_limit[3]:" << Rank_limit[3] << std::endl);
+ }else if (current_rank <= Rank_limit[4]){
+ ++Rank_histo[1]; ++Rank_histo[2]; ++Rank_histo[3]; ++Rank_histo[4];
+ VERBOSE(1,"HERE 4 current_rank:" << current_rank << " Rank_limit[4]:" << Rank_limit[4] << std::endl);
+ }
}
}
if (sent_flag) {
VERBOSE(1," sent_tot_rank:" << sent_tot_rank << " sent_Nw:" << sent_Nw << std::endl);
- sent_avgRank = sent_tot_rank / sent_Nw;
+ sent_avgRank = ((double) sent_tot_rank) / sent_Nw;
std::cout << "%% sent_Nw=" << sent_Nw
<< " sent_avgRank=" << sent_avgRank
@@ -803,12 +832,22 @@ int main(int argc, char **argv)
}
}
- avgRank = tot_rank / Nw;
+ avgRank = ((double) tot_rank) / Nw;
std::cout << "%% Nw=" << Nw
<< " avgRank=" << avgRank
<< " Noov=" << Noov
<< " OOVrate=" << (float)Noov/Nw * 100.0 << "%";
+ std::cout << " Rank_[bst]=" << Rank_histo[0];
+ std::cout << " Rank_[ 5%]=" << Rank_histo[1];
+ std::cout << " Rank_[10%]=" << Rank_histo[2];
+ std::cout << " Rank_[20%]=" << Rank_histo[3];
+ std::cout << " Rank_[50%]=" << Rank_histo[4];
+ std::cout << " Rank_[bst]=" << (float)Rank_histo[0]/Nw * 100.0 << "%";
+ std::cout << " Rank_[ 5%]=" << (float)Rank_histo[1]/Nw * 100.0 << "%";
+ std::cout << " Rank_[10%]=" << (float)Rank_histo[2]/Nw * 100.0 << "%";
+ std::cout << " Rank_[20%]=" << (float)Rank_histo[3]/Nw * 100.0 << "%";
+ std::cout << " Rank_[50%]=" << (float)Rank_histo[4]/Nw * 100.0 << "%";
std::cout << std::endl;
std::cout.flush();
--
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/irstlm.git
More information about the debian-science-commits
mailing list