From 7b5c9920fb45de11e760d4e0fb2214797674bb56 Mon Sep 17 00:00:00 2001 From: Pavan Mandava Date: Wed, 30 Nov 2022 14:22:18 +0100 Subject: [PATCH] Spelling Corrections in slot-values, added rules --- data/prompt-learning/test/test.soloist.json | 30 +++++++++------------ utils/create_dataset.py | 3 ++- utils/regexner.rules | 2 ++ 3 files changed, 17 insertions(+), 18 deletions(-) diff --git a/data/prompt-learning/test/test.soloist.json b/data/prompt-learning/test/test.soloist.json index 2b06df9..0dafe5e 100644 --- a/data/prompt-learning/test/test.soloist.json +++ b/data/prompt-learning/test/test.soloist.json @@ -8159,7 +8159,7 @@ ], "values": [ "17:30", - "cambridge" + "cambridge punter" ], "belief_states": [ "destination = cambridge punter", @@ -8177,7 +8177,7 @@ ], "values": [ "17:30", - "cambridge", + "cambridge punter", "cambridge punter", "city stop restaurant" ], @@ -8199,7 +8199,7 @@ ], "values": [ "17:30", - "cambridge", + "cambridge punter", "cambridge punter", "city stop restaurant" ], @@ -8224,7 +8224,7 @@ ], "values": [ "17:30", - "cambridge", + "cambridge punter", "cambridge punter", "city stop restaurant" ], @@ -8251,7 +8251,7 @@ ], "values": [ "17:30", - "cambridge", + "cambridge punter", "cambridge punter", "city stop restaurant" ], @@ -12288,9 +12288,8 @@ "taxi" ], "values": [ - "arbury lodge", - "whale of a time", - "guesthouse" + "arbury lodge guesthouse", + "whale of a time" ], "belief_states": [ "destination = whale of a time", @@ -12308,9 +12307,8 @@ ], "values": [ "13:00", - "arbury lodge", - "whale of a time", - "guesthouse" + "arbury lodge guesthouse", + "whale of a time" ], "belief_states": [ "leave = 13:00", @@ -12331,9 +12329,8 @@ ], "values": [ "13:00", - "arbury lodge", - "whale of a time", - "guesthouse" + "arbury lodge guesthouse", + "whale of a time" ], "belief_states": [ "leave = 13:00", @@ -12357,9 +12354,8 @@ "values": [ "13:00", "fantastic", - "arbury lodge", - "whale of a time", - "guesthouse" + "arbury lodge guesthouse", + "whale of a time" ], "belief_states": [ "leave = 13:00", diff --git a/utils/create_dataset.py b/utils/create_dataset.py index 699503f..f1d3f89 100644 --- a/utils/create_dataset.py +++ b/utils/create_dataset.py @@ -41,7 +41,8 @@ CORRECTIONS = { "alexander": "alexander bed and breakfast", "ian hong house": "lan hong house", "saint catharines college": "saint catherines college", - "gandhi": "the gandhi" + "gandhi": "the gandhi", + "cambridge punte": "cambridge punter" } diff --git a/utils/regexner.rules b/utils/regexner.rules index 7509f21..2c2f5e7 100644 --- a/utils/regexner.rules +++ b/utils/regexner.rules @@ -203,6 +203,7 @@ bloomsbury restaurant PLACE graffiti PLACE el shaddia PLACE el shaddia guesthouse PLACE +arbury lodge guesthouse PLACE a and b guest house PLACE gonville hotel PLACE worth house PLACE @@ -233,6 +234,7 @@ travellers rest PLACE curry king PLACE pipasha restaurant PLACE cambridge punter PLACE +cambridge punte PLACE saigon city PLACE bedouin PLACE pizza express PLACE