#!/bin/bash

# Data preparation for our framework: preprocessing the WoW and WoI datasets.
# The datasets can be downloaded through the following links:
#   WoW: https://parl.ai/projects/wizard_of_wikipedia/
#   WoI: https://parl.ai/projects/sea/
#
# Usage:
#   Run from the directory that contains tasks/knwl_dialo/ (all script paths
#   are resolved against the current working directory), with the variables
#   below exported in the environment.
#
# Required environment variables (each is forwarded verbatim to the matching
# command-line flag of tasks/knwl_dialo/preprocessing.py):
#   WOW_INPUT_FILE    --input_file  for process_wow_dataset (raw WoW data)
#   WOW_OUTPUT_FILE   --output_file for process_wow_dataset
#   WOI_INPUT_FILE    --input_file  for process_woi_dataset (raw WoI data)
#   WOI_OUTPUT_FILE   --output_file for process_woi_dataset
#   KNWL_TEST_FILE    --test_file   for get_knwl_gen_prompts
#   KNWL_TRAIN_FILE   --train_file  for get_knwl_gen_prompts
#   KNWL_MODEL_FILE   --model_file  for get_knwl_gen_prompts
#   KNWL_OUTPUT_FILE  --output_file for get_knwl_gen_prompts
#   KNWL_DATA_TYPE    --data_type   for get_knwl_gen_prompts
#                     (accepted values are defined by preprocessing.py, which
#                     is not part of this script; check it before running)
#   RESP_TRAIN_FILE   --train_file  for get_resp_gen_prompts
#   RESP_OUTPUT_FILE  --output_file for get_resp_gen_prompts

# Stop at the first failing step so later steps never run on missing or
# partial output from an earlier one.
set -euo pipefail

# Validate the whole configuration before doing any work, and report every
# missing variable at once rather than failing one at a time.
required_vars=(
  WOW_INPUT_FILE WOW_OUTPUT_FILE
  WOI_INPUT_FILE WOI_OUTPUT_FILE
  KNWL_TEST_FILE KNWL_TRAIN_FILE KNWL_MODEL_FILE KNWL_OUTPUT_FILE KNWL_DATA_TYPE
  RESP_TRAIN_FILE RESP_OUTPUT_FILE
)
missing=0
for var_name in "${required_vars[@]}"; do
  # ${!var_name:-} is an indirect lookup that stays safe under `set -u`.
  if [[ -z "${!var_name:-}" ]]; then
    printf 'error: %s must be set (see the header of this script)\n' \
      "${var_name}" >&2
    missing=1
  fi
done
(( missing == 0 )) || exit 1

DIR=$(pwd)
PREPROCESS="${DIR}/tasks/knwl_dialo/preprocessing.py"

mkdir -p -- "${DIR}/tasks/knwl_dialo/data"

# We provide the following script to process the raw data from Wizard of Wikipedia
python "${PREPROCESS}" \
  --func process_wow_dataset \
  --input_file "${WOW_INPUT_FILE}" \
  --output_file "${WOW_OUTPUT_FILE}"

# We provide the following script to process the raw data from Wizard of Internet
python "${PREPROCESS}" \
  --func process_woi_dataset \
  --input_file "${WOI_INPUT_FILE}" \
  --output_file "${WOI_OUTPUT_FILE}"

# Obtain the knowledge generation prompts
python "${PREPROCESS}" \
  --func get_knwl_gen_prompts \
  --test_file "${KNWL_TEST_FILE}" \
  --train_file "${KNWL_TRAIN_FILE}" \
  --model_file "${KNWL_MODEL_FILE}" \
  --output_file "${KNWL_OUTPUT_FILE}" \
  --data_type "${KNWL_DATA_TYPE}"

# Obtain the response generation prompts
python "${PREPROCESS}" \
  --func get_resp_gen_prompts \
  --train_file "${RESP_TRAIN_FILE}" \
  --output_file "${RESP_OUTPUT_FILE}"