From ed51bb1e8c1ffa1281c412a818734aee6c2146c7 Mon Sep 17 00:00:00 2001
From: Silei Xu
Date: Wed, 12 Jan 2022 14:36:34 -0800
Subject: [PATCH] Use synthetic data for dev when no dev data is provided

---
Notes:
    This text sits after the three-dash line, so it is commentary and not
    part of the commit message.

    everything/dev/agent.tsv and everything/dev/user.tsv are still listed
    as prerequisites of datadir/agent and datadir/user, so make still has
    to find (or build) them. The recipes take the split-train-eval branch
    only when `test -s` fails, i.e. when the dev file has zero size.

    Line breaks in this copy were restored from the hunk headers' line
    counts. Leading whitespace inside recipe lines was reconstructed (one
    tab, plus spaces on continuation lines) and may differ from the
    original file; apply with whitespace tolerance if a hunk is rejected.

 starter/custom/Makefile | 20 ++++++++++++++++----
 1 file changed, 16 insertions(+), 4 deletions(-)

diff --git a/starter/custom/Makefile b/starter/custom/Makefile
index 73f970d36..b8189f3da 100644
--- a/starter/custom/Makefile
+++ b/starter/custom/Makefile
@@ -246,8 +246,14 @@ everything/$(eval_set)/%.nlu.results: everything/models/%/best.pth everything/$(
 datadir/agent: everything/synthetic.agent.tsv everything/augmented.agent.tsv everything/dev/agent.tsv
 	mkdir -p $@
 	cp everything/synthetic.agent.tsv $@/
-	cp everything/augmented.agent.tsv $@/train.tsv ; \
-	cp everything/dev/agent.tsv $@/eval.tsv ; \
+	if test -s everything/dev/agent.tsv ; then \
+	  cp everything/augmented.agent.tsv $@/train.tsv ; \
+	  cp everything/dev/agent.tsv $@/eval.tsv ; \
+	else \
+	  $(genie) split-train-eval --train $@/train.tsv --eval $@/eval.tsv \
+	    --eval-probability 0.1 --split-strategy raw-sentence \
+	    --contextual --eval-on-synthetic everything/augmented.agent.tsv ; \
+	fi
 	touch $@
 
 datadir/nlg: everything/synthetic.agent.tsv everything/dev/agent.tsv
@@ -259,8 +265,14 @@ datadir/nlg: everything/synthetic.agent.tsv everything/dev/agent.tsv
 datadir/user: everything/synthetic.user.tsv everything/augmented.user.tsv everything/dev/user.tsv
 	mkdir -p $@
 	cp everything/synthetic.user.tsv $@/
-	cp everything/augmented.user.tsv $@/train.tsv ; \
-	cp everything/dev/user.tsv $@/eval.tsv ; \
+	if test -s everything/dev/user.tsv ; then \
+	  cp everything/augmented.user.tsv $@/train.tsv ; \
+	  cp everything/dev/user.tsv $@/eval.tsv ; \
+	else \
+	  $(genie) split-train-eval --train $@/train.tsv --eval $@/eval.tsv \
+	    --eval-probability 0.1 --split-strategy raw-sentence \
+	    --contextual --eval-on-synthetic everything/augmented.user.tsv ; \
+	fi
 	touch $@
 
 datadir/fewshot: everything/train/user.tsv everything/dev/user.tsv everything/train/agent.tsv everything/dev/agent.tsv