From 731a92b301a1f773753f87b123be437eaa951245 Mon Sep 17 00:00:00 2001
From: zqwerty <zhuq96@hotmail.com>
Date: Sun, 10 Apr 2022 13:32:01 +0800
Subject: [PATCH] add evaluation script call to t5/(nlu|dst)/*.sh run scripts

---
 convlab2/base_models/t5/dst/run_multiwoz21.sh               | 2 ++
 convlab2/base_models/t5/nlu/run_multiwoz21_user.sh          | 2 ++
 convlab2/base_models/t5/nlu/run_multiwoz21_user_context3.sh | 2 ++
 convlab2/base_models/t5/nlu/run_tm1_user.sh                 | 2 ++
 convlab2/base_models/t5/nlu/run_tm1_user_context3.sh        | 2 ++
 convlab2/base_models/t5/nlu/run_tm2_user.sh                 | 2 ++
 convlab2/base_models/t5/nlu/run_tm2_user_context3.sh        | 2 ++
 convlab2/base_models/t5/nlu/run_tm3_user.sh                 | 2 ++
 convlab2/base_models/t5/nlu/run_tm3_user_context3.sh        | 2 ++
 9 files changed, 18 insertions(+)

diff --git a/convlab2/base_models/t5/dst/run_multiwoz21.sh b/convlab2/base_models/t5/dst/run_multiwoz21.sh
index e7573e95..6d42380b 100644
--- a/convlab2/base_models/t5/dst/run_multiwoz21.sh
+++ b/convlab2/base_models/t5/dst/run_multiwoz21.sh
@@ -80,3 +80,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../dst/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_multiwoz21_user.sh b/convlab2/base_models/t5/nlu/run_multiwoz21_user.sh
index 4080a092..a9e9d6c5 100644
--- a/convlab2/base_models/t5/nlu/run_multiwoz21_user.sh
+++ b/convlab2/base_models/t5/nlu/run_multiwoz21_user.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_multiwoz21_user_context3.sh b/convlab2/base_models/t5/nlu/run_multiwoz21_user_context3.sh
index a8cbc9bd..e90e71d4 100644
--- a/convlab2/base_models/t5/nlu/run_multiwoz21_user_context3.sh
+++ b/convlab2/base_models/t5/nlu/run_multiwoz21_user_context3.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm1_user.sh b/convlab2/base_models/t5/nlu/run_tm1_user.sh
index 9faedd7f..5372441a 100644
--- a/convlab2/base_models/t5/nlu/run_tm1_user.sh
+++ b/convlab2/base_models/t5/nlu/run_tm1_user.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm1_user_context3.sh b/convlab2/base_models/t5/nlu/run_tm1_user_context3.sh
index bb6b55fe..65482a1f 100644
--- a/convlab2/base_models/t5/nlu/run_tm1_user_context3.sh
+++ b/convlab2/base_models/t5/nlu/run_tm1_user_context3.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm2_user.sh b/convlab2/base_models/t5/nlu/run_tm2_user.sh
index 728a8a94..84dc8b71 100644
--- a/convlab2/base_models/t5/nlu/run_tm2_user.sh
+++ b/convlab2/base_models/t5/nlu/run_tm2_user.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm2_user_context3.sh b/convlab2/base_models/t5/nlu/run_tm2_user_context3.sh
index 8ebb102d..abca0a60 100644
--- a/convlab2/base_models/t5/nlu/run_tm2_user_context3.sh
+++ b/convlab2/base_models/t5/nlu/run_tm2_user_context3.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm3_user.sh b/convlab2/base_models/t5/nlu/run_tm3_user.sh
index 0d775f7a..689a626c 100644
--- a/convlab2/base_models/t5/nlu/run_tm3_user.sh
+++ b/convlab2/base_models/t5/nlu/run_tm3_user.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
diff --git a/convlab2/base_models/t5/nlu/run_tm3_user_context3.sh b/convlab2/base_models/t5/nlu/run_tm3_user_context3.sh
index c8a4a9f6..e2ded66d 100644
--- a/convlab2/base_models/t5/nlu/run_tm3_user_context3.sh
+++ b/convlab2/base_models/t5/nlu/run_tm3_user_context3.sh
@@ -64,3 +64,5 @@ python -m torch.distributed.launch \
     --per_device_eval_batch_size ${per_device_eval_batch_size} \
 
 python merge_predict_res.py -d ${dataset_name} -s ${speaker} -c ${context_window_size} -p ${output_dir}/generated_predictions.json
+
+python ../../../nlu/evaluate_unified_datasets.py -p ${output_dir}/predictions.json
-- 
GitLab