You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@joshua.apache.org by mj...@apache.org on 2016/09/17 13:36:11 UTC

[3/3] incubator-joshua git commit: fixed class LM test

fixed class LM test


Project: http://git-wip-us.apache.org/repos/asf/incubator-joshua/repo
Commit: http://git-wip-us.apache.org/repos/asf/incubator-joshua/commit/4cb838ce
Tree: http://git-wip-us.apache.org/repos/asf/incubator-joshua/tree/4cb838ce
Diff: http://git-wip-us.apache.org/repos/asf/incubator-joshua/diff/4cb838ce

Branch: refs/heads/7_confsystem
Commit: 4cb838ce704fb4ee2c3a75c00b73fd48539dc616
Parents: b6bf461
Author: Matt Post <po...@cs.jhu.edu>
Authored: Sat Sep 17 15:35:58 2016 +0200
Committer: Matt Post <po...@cs.jhu.edu>
Committed: Sat Sep 17 15:35:58 2016 +0200

----------------------------------------------------------------------
 .../joshua/decoder/cky/BnEnClassLMTest.conf     |  44 +
 .../joshua/decoder/cky/BnEnClassLMTest.gold     | 887 +++++++++++++++++++
 .../joshua/decoder/cky/BnEnDecodingTest.java    |   2 +-
 3 files changed, 932 insertions(+), 1 deletion(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/incubator-joshua/blob/4cb838ce/joshua-core/src/test/java/org/apache/joshua/decoder/cky/BnEnClassLMTest.conf
----------------------------------------------------------------------
diff --git a/joshua-core/src/test/java/org/apache/joshua/decoder/cky/BnEnClassLMTest.conf b/joshua-core/src/test/java/org/apache/joshua/decoder/cky/BnEnClassLMTest.conf
new file mode 100644
index 0000000..9cffd0d
--- /dev/null
+++ b/joshua-core/src/test/java/org/apache/joshua/decoder/cky/BnEnClassLMTest.conf
@@ -0,0 +1,44 @@
+mark_oovs = false
+default_non_terminal = X
+goalSymbol = GOAL
+pop_limit = 10
+use_unique_nbest = true
+top_n = 10
+output_format = "%c %s"
+
+feature_functions = [
+  { class = StateMinimizingLanguageModel, lm_type=kenlm, lm_order=5, lm_file=src/test/resources/bn-en/hiero/lm.gz }
+  { class = WordPenalty }
+  { class = OOVPenalty }
+  { class = StateMinimizingLanguageModel, lm_type=kenlm, lm_order=9, lm_file=src/test/resources/bn-en/hiero/class_lm_9gram.gz, class_map=src/test/resources/bn-en/hiero/class.map }
+]
+
+grammars = [
+  { class = TextGrammar, owner=pt, span_limit=12, path=src/test/resources/bn-en/hiero/grammar.gz }
+  { class = TextGrammar, owner=glue, span_limit=-1, path=src/test/resources/bn-en/hiero/glue-grammar }
+]
+
+weights = {
+  pt_15 = -0.5524863522177359
+  pt_14 = 0.32923261148678096
+  pt_16 = -0.23451595442127693
+  pt_11 = -0.25597137004462134
+  pt_10 = -0.2593091306160006
+  pt_13 = 0.36212061186692646
+  pt_12 = -0.3538894647790496
+  lm_0 = 1.2373676802179452
+  lm_1 = 1.2373676802179452
+  OOVPenalty = 1.0
+  WordPenalty = -3.6942747832593694
+  pt_9 = -0.8202511858619419
+  pt_8 = -0.9070737587091975
+  pt_5 = -0.19138972284064748
+  pt_4 = -0.03553113401320236
+  pt_7 = 0.9936312455671283
+  pt_6 = -0.3417994095521415
+  pt_1 = -0.7224581556224123
+  pt_0 = 2.4497429277910214
+  pt_3 = -0.33861043967238036
+  pt_2 = 0.31689069155153504
+  glue_0 = -1
+}