Prepend `almond_` to seq2seq and paraphrase task names

2021-04-06 21:21:39 -07:00 · 2021-04-06 21:21:39 -07:00 · 29473aca3a
parent fe3f8b7824
commit 29473aca3a
2 changed files with 8 additions and 8 deletions
--- a/genienlp/tasks/almond_task.py
+++ b/genienlp/tasks/almond_task.py
@@ -469,12 +469,12 @@ class Almond(BaseAlmondTask):
                                preprocess=self.preprocess_field, lower=False)
-@register_task('natural_seq2seq')
+@register_task('almond_natural_seq2seq')
 class NaturalSeq2Seq(BaseAlmondTask):
    """
    The Almond sequence to sequence task where both sequences are natural language.
-    Paraphrasing and translation are examples of this task.
+    In this task entities (see ENTITY_REGEX) are not preprocessed in contrast to paraphrasing and translation tasks.
-    In this task entities (see ENTITY_REGEX) are not preprocessed in contrast to paraphrasing and translation tasks
+    Paraphrasing and translation inherit from this class.
    """
    @property
@@ -509,7 +509,7 @@ class NaturalSeq2Seq(BaseAlmondTask):
        return AlmondDataset.return_splits(path=os.path.join(root, 'almond'), make_example=self._make_example, **kwargs)
-@register_task('paraphrase')
+@register_task('almond_paraphrase')
 class Paraphrase(NaturalSeq2Seq):
    """The Almond paraphrasing task. Applies the necessary preprocessing for special tokens and case changes.
    Can be used at prediction and training time. Training is still experimental.
--- a/tests/test_paraphrasing.sh
+++ b/tests/test_paraphrasing.sh
@@ -4,18 +4,18 @@
 i=0
-# test natural_seq2seq and paraphrase tasks
+# test almond_natural_seq2seq and almond_paraphrase tasks
 for hparams in \
      "--model TransformerSeq2Seq --pretrained_model sshleifer/bart-tiny-random"; do
    # train
-    genienlp train --train_tasks natural_seq2seq --train_batch_tokens 50 --val_batch_size 50 --train_iterations 6 --preserve_case --save_every 2 --log_every 2 --val_every 2 --save $workdir/model_$i --data $SRCDIR/dataset/  $hparams --exist_ok --skip_cache --embeddings $EMBEDDING_DIR --no_commit
+    genienlp train --train_tasks almond_natural_seq2seq --train_batch_tokens 50 --val_batch_size 50 --train_iterations 6 --preserve_case --save_every 2 --log_every 2 --val_every 2 --save $workdir/model_$i --data $SRCDIR/dataset/  $hparams --exist_ok --skip_cache --embeddings $EMBEDDING_DIR --no_commit
    # greedy prediction
-    genienlp predict --tasks paraphrase --evaluate test --path $workdir/model_$i --overwrite --eval_dir $workdir/model_$i/eval_results/ --data $SRCDIR/dataset/ --embeddings $EMBEDDING_DIR --skip_cache
+    genienlp predict --tasks almond_paraphrase --evaluate test --path $workdir/model_$i --overwrite --eval_dir $workdir/model_$i/eval_results/ --data $SRCDIR/dataset/ --embeddings $EMBEDDING_DIR --skip_cache
    # check if result file exists
-    if test ! -f $workdir/model_$i/eval_results/test/paraphrase.tsv || test ! -f $workdir/model_$i/eval_results/test/paraphrase.results.json; then
+    if test ! -f $workdir/model_$i/eval_results/test/almond_paraphrase.tsv || test ! -f $workdir/model_$i/eval_results/test/almond_paraphrase.results.json; then
        echo "File not found!"
        exit 1
    fi