- Preprocess the datasets to reformat the data for GPT-2 input.
python format_disambiguation_data.py \
--simmc_train_json="../../data/simmc2_dials_dstc10_train.json" \
--simmc_dev_json="../../data/simmc2_dials_dstc10_dev.json" \
--simmc_devtest_json="../../data/simmc2_dials_dstc10_devtest.json" \
--disambiguate_save_path="../../data/"
- Train and simultaneously test the baseline model.
./evaluate_mm_disambiguation_model.sh 0 5 4
- Preprocess the datasets to reformat the data for GPT-2 input.
cd model/mm_dst
./run_preprocess_gpt2.sh
- Train the baseline model.
./run_train_gpt2.sh
- Generate predictions for the `devtest` data.
./run_generate_gpt2.sh
The generation results are saved in the `/mm_dst/results` folder. Change `path_output` to the desired path accordingly.
- Evaluate predictions for the `devtest` data.
./run_evaluate_gpt2.sh