From dd220c6bd15c6d69bf4352722b0c9a93cb245e22 Mon Sep 17 00:00:00 2001 From: Brad Jascob <22728060+bjascob@users.noreply.github.com> Date: Sun, 21 Jan 2024 17:34:19 -0700 Subject: [PATCH] update generate_xfm config file --- configs/model_generate_xfm_t5_base_wTT.json | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/configs/model_generate_xfm_t5_base_wTT.json b/configs/model_generate_xfm_t5_base_wTT.json index e5961d9..bffae37 100644 --- a/configs/model_generate_xfm_t5_base_wTT.json +++ b/configs/model_generate_xfm_t5_base_wTT.json @@ -1,7 +1,7 @@ { "gen_args" : { "model_name_or_path" : "t5-base", - "corpus_dir" : "data/tdata_generate_xfm", + "corpus_dir" : "amrlib/data/tdata_generate_xfm", "train_fn" : "train.txt.features.nowiki.tdata", "eval_fn" : "dev.txt.features.nowiki", "eval_use_tense" : true, @@ -13,7 +13,7 @@ "max_in_len" : 512, "max_out_len" : 512, "max_train_graph_len" : 512, - "max_train_sent_len" : 90 + "max_train_sent_len" : 256 }, "tokenizer_args" : { @@ -21,10 +21,9 @@ }, "hf_args" : { - "output_dir" : "data/model_generate_xfm", + "output_dir" : "amrlib/data/model_generate_xfm", "save_strategy" : "epoch", "evaluation_strategy" : "epoch", - "bf16" : false, "group_by_length" : true, "do_train" : true, "do_eval" : true, @@ -36,7 +35,6 @@ "weight_decay" : 0.004, "learning_rate" : 1e-4, "max_grad_norm" : 1.0, - "warmup_steps" : 0, "seed" : 0 } }