-
Notifications
You must be signed in to change notification settings - Fork 8
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
1) use the last iteration of coordinate descent, 2) fix variational inference and Dirichlet priors, 3) less logging.
- Loading branch information
Waleed Ammar
committed
Apr 17, 2015
1 parent
08f08b7
commit 022ab61
Showing
7 changed files
with
199 additions
and
238 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,24 @@ | ||
import en-fi.tconf | ||
|
||
global { | ||
# Output directory: | ||
ducttape_output="/usr3/home/wammar/mt-systems/en-fi-exp000" | ||
|
||
# initial autoencoder params | ||
init_theta_fwd="" | ||
init_lambda_fwd="" | ||
init_theta_bwd="" | ||
init_lambda_bwd="" | ||
|
||
# general | ||
cores=16 | ||
|
||
# output prefix; important for concurrent runs (presumably must be unique per run -- TODO confirm) | ||
output_prefix="exp000" | ||
|
||
} | ||
|
||
plan Full { | ||
#reach AutoencoderAlignT2S | ||
reach Evaluate via (TuneOrTest: tune test) * (UseCustomLM: no) * (Aligner: giza) * (L2: point_o_one) * (DirichletAlpha: one_point_five) * (PrecomputedFeatures: dyer11) * (OptimizeLambdasFirst: yes) * (UseOtherAligners: yes) * (EmItercount: one) * (SymHeuristic: grow_diag_final_and ) * (MaxLambdaEpochCount: one) * (LambdaOptimizer: lbfgs sgd) * (ThetaOptimizer: em) | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,37 @@ | ||
global { | ||
|
||
train_corpus="/usr3/home/wammar/corpora/parallel/en-fi.short.en-fi" | ||
tune_corpus="/usr3/home/wammar/corpora/parallel/en-fi.wmt-dev" | ||
test_corpus="/usr3/home/wammar/corpora/parallel/en-fi.wmt-devtest" | ||
src_brown_clusters="/usr1/home/wammar/parallel/english/news-commentary10.cz-en.en.tok.brown80" | ||
tgt_brown_clusters="/usr3/home/wammar/brown-clusters/wmt_mono+parallel+dev+devtest-c100-p1.out/paths" | ||
|
||
# only specify when you want to reuse a previously built LM | ||
language_model="" | ||
# only use these two parameters if you want to build a language model; if you already have a built language model, specify "language_model=" instead | ||
lm_order=4 | ||
lm_data="/usr3/home/wammar/corpora/monolingual/finnish/wmt_mono+parallel+dev+devtest.tok" | ||
|
||
# tool paths | ||
cdec_dir="/home/wammar/cdec/" | ||
multeval="/home/wammar/git/multeval/multeval.sh" | ||
giza_bin="/opt/tools/mgizapp-0.7.2/bin" | ||
moses_train_script="/home/wammar/git/mosesdecoder/scripts/training/train-model.perl" | ||
mkcls_bin="/mal0/tools/mosesdecoder/bin/mkcls" | ||
wammar_utils_dir="/home/wammar/wammar-utils" | ||
alignment_with_openfst_dir="/home/wammar/online_em/alignment-with-openfst/" | ||
kenlm_dir="/home/wammar/git/kenlm" | ||
|
||
# aer | ||
conv_pharaoh_script="/home/wammar/alignment-with-openfst/data/hansards/conv-pharaoh.pl" | ||
aer_eval_script="" | ||
gold_alignment="" | ||
|
||
# other aligner outputs | ||
fwd_giza_alignments="" | ||
bwd_giza_alignments="" | ||
sym_giza_alignments="" | ||
fwd_fast_alignments="" | ||
bwd_fast_alignments="" | ||
sym_fast_alignments="" | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,23 @@ | ||
import en-fi-paths.tconf | ||
|
||
global { | ||
|
||
# UseCustomAlignment controls whether to retrain word alignment from the train_corpus, or just use | ||
# the alignments stored at the path given by 'alignment' | ||
alignment="/dev/null" | ||
|
||
# preprocess data | ||
tokenize_corpus="false" | ||
lowercase_corpus="false" | ||
max_sentence_length=0 | ||
|
||
# language specific | ||
src="en" | ||
tgt="fi" | ||
meteor_lang="english" | ||
|
||
# aer | ||
test_sents_count=0 | ||
|
||
} | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters