better default configuration for recaser

This commit is contained in:
Philipp Koehn 2015-03-11 17:52:30 +00:00
parent 1632c5f39d
commit 2ce45229f8
5 changed files with 40 additions and 25 deletions

View File

@ -527,9 +527,7 @@ decoder-settings = ""
#########################################################
## RECASER: restore case, this part only trains the model
[RECASING]
#decoder = $moses-bin-dir/moses
[RECASING] IGNORE
### training data
# raw input needs to be still tokenized,
@ -537,9 +535,14 @@ decoder-settings = ""
#
#tokenized = [LM:europarl:tokenized-corpus]
# recase-config =
### additional settings
#
recasing-settings = ""
#lm-training = $srilm-dir/ngram-count
decoder = $moses-bin-dir/moses
# already a trained recaser? point to config file
#recase-config =
#######################################################
## TRUECASER: train model to truecase corpora and input

View File

@ -546,9 +546,7 @@ decoder-settings = ""
#########################################################
## RECASER: restore case, this part only trains the model
[RECASING]
#decoder = $moses-bin-dir/moses
[RECASING] IGNORE
### training data
# raw input needs to be still tokenized,
@ -556,9 +554,14 @@ decoder-settings = ""
#
#tokenized = [LM:europarl:tokenized-corpus]
# recase-config =
### additional settings
#
recasing-settings = ""
#lm-training = $srilm-dir/ngram-count
decoder = $moses-bin-dir/moses
# already a trained recaser? point to config file
#recase-config =
#######################################################
## TRUECASER: train model to truecase corpora and input

View File

@ -528,9 +528,7 @@ decoder-settings = ""
#########################################################
## RECASER: restore case, this part only trains the model
[RECASING]
#decoder = $moses-bin-dir/moses
[RECASING] IGNORE
### training data
# raw input needs to be still tokenized,
@ -538,9 +536,14 @@ decoder-settings = ""
#
#tokenized = [LM:europarl:tokenized-corpus]
# recase-config =
### additional settings
#
recasing-settings = ""
#lm-training = $srilm-dir/ngram-count
decoder = $moses-bin-dir/moses
# already a trained recaser? point to config file
#recase-config =
#######################################################
## TRUECASER: train model to truecase corpora and input

View File

@ -532,9 +532,7 @@ decoder-settings = ""
#########################################################
## RECASER: restore case, this part only trains the model
[RECASING]
#decoder = $moses-bin-dir/moses
[RECASING] IGNORE
### training data
# raw input needs to be still tokenized,
@ -542,9 +540,14 @@ decoder-settings = ""
#
#tokenized = [LM:europarl:tokenized-corpus]
# recase-config =
### additional settings
#
recasing-settings = ""
#lm-training = $srilm-dir/ngram-count
decoder = $moses-bin-dir/moses
# already a trained recaser? point to config file
#recase-config =
#######################################################
## TRUECASER: train model to truecase corpora and input

View File

@ -510,9 +510,7 @@ decoder-settings = ""
#########################################################
## RECASER: restore case, this part only trains the model
[RECASING]
#decoder = $moses-bin-dir/moses
[RECASING] IGNORE
### training data
# raw input needs to be still tokenized,
@ -520,9 +518,14 @@ decoder-settings = ""
#
#tokenized = [LM:europarl:tokenized-corpus]
# recase-config =
### additional settings
#
recasing-settings = ""
#lm-training = $srilm-dir/ngram-count
decoder = $moses-bin-dir/moses
# already a trained recaser? point to config file
#recase-config =
#######################################################
## TRUECASER: train model to truecase corpora and input