@@ -13,6 +13,7 @@ from prompt_utils import get_value_based_prompt
 from prompt_utils import get_prompt_for_training
 from prompt_utils import TYPE_VALUE_BASED_PROMPT
 from prompt_utils import TYPE_INVERSE_PROMPT
+from prompt_utils import TYPE_PROMPT_ENSEMBLE, PROMPT_WEIGHT
 from metrics import PromptDSTEvaluator
 from datetime import datetime
@@ -42,6 +43,8 @@ def main():
                         help="Flag for enabling/disabling inverse prompt during training")
     parser.add_argument("--inverse_prompt_weight", default=0.1, type=float,
                         help="Weight to adjust the influence of Inverse Prompt, decimal (0,1)")
+    parser.add_argument("--with_prompt_ensemble", action="store_true",
+                        help="Flag for enabling/disabling prompt ensembling during training")
     parser.add_argument("--validation_file", default="", type=str,
                         help="Validation file for evaluating model after each epoch")
@@ -111,7 +114,8 @@ def main():
             for slot, value in item['belief_states']:
                 # train/generate using value-based prompt first
-                loss, gen_slot = train_prompting(history=history,
+                loss, gen_slot = train_prompting(args=args,
+                                                 history=history,
                                                  slot_value_pair=(slot, value),
                                                  prompt_type=TYPE_VALUE_BASED_PROMPT,
                                                  tokenizer=tokenizer,
@@ -124,7 +128,8 @@ def main():
                 generated_slot = gen_slot.strip().lower()
                 # train slot generation using inverse prompt
-                inv_loss, _ = train_prompting(history=history,
+                inv_loss, _ = train_prompting(args=args,
+                                              history=history,
                                               slot_value_pair=(generated_slot, value),
                                               prompt_type=TYPE_INVERSE_PROMPT,
                                               tokenizer=tokenizer,
@@ -231,7 +236,18 @@ def set_seed(args):
     torch.cuda.manual_seed_all(args.seed)
-def train_prompting(history, slot_value_pair, prompt_type, tokenizer, model, device):
+def train_prompting(args, history, slot_value_pair, prompt_type, tokenizer, model, device):
+    # slot_value_pair = (slot, value)
+    # use prompt ensemble when set in the args
+    if prompt_type is TYPE_VALUE_BASED_PROMPT and args.with_prompt_ensemble:
+        return train_prompt_ensemble(history=history,
+                                     slot_value_pair=slot_value_pair,
+                                     prompt_type=TYPE_PROMPT_ENSEMBLE,
+                                     tokenizer=tokenizer,
+                                     model=model,
+                                     device=device)
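+    # otherwise fall back to single-prompt training below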
     # get prompt for training based on "type"
     prompt = get_prompt_for_training(prompt_type, slot_value_pair)
@@ -271,6 +287,65 @@ def train_prompting(history, slot_value_pair, prompt_type, tokenizer, model, device):
     return loss, generated_word
+def train_prompt_ensemble(history, slot_value_pair, prompt_type, tokenizer, model, device):
+    # slot_value_pair = (slot, value)
+    # get list of prompts for training
+    prompts = get_prompt_for_training(prompt_type, slot_value_pair)
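+    # for TYPE_PROMPT_ENSEMBLE this is expected to return a list of prompt
+    # variants (one per ensemble member) rather than a single prompt string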
+    # accumulate the total loss across prompts
+    total_loss = None
+    gen_probs, gen_words = [], []
+    # iterate through each prompt
+    for prompt in prompts:
+        # combine history and prompt
+        input_prompt = history + prompt
+        # encode the history & prompt using tokenizer
+        encoded_prompt = tokenizer(input_prompt, return_tensors="pt")
+        encoded_prompt = encoded_prompt.to(device)
+        # get the last token id
+        # this could be a slot or value depending on prompt type
+        last_token = encoded_prompt['input_ids'][:, -1:]
+        last_token = last_token.to(device)
+        # model outputs
+        outputs = model(**encoded_prompt)
+        # get last token logits [-2 -> last but one position]
+        logits = outputs.logits[:, -2, :]
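+        # position -2 is used because the logits at position i predict the token at
+        # position i+1, so the last-but-one position scores the target last token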
+        # softmax probabilities
+        probs = torch.nn.functional.softmax(logits, dim=-1)
+        # last token generation probability
+        last_token_prob = torch.gather(probs, 1, last_token).squeeze(-1)
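+        # gather selects, per batch row, the probability assigned to the
+        # ground-truth last token id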
+        # weighted probability
+        token_prob = PROMPT_WEIGHT * last_token_prob
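+        # PROMPT_WEIGHT (imported from prompt_utils) scales every prompt's
+        # contribution to the ensemble loss by the same factor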
+        # loss is the negative log of the weighted probability
+        loss = torch.negative(torch.log(token_prob))
+        if total_loss is None:
+            total_loss = loss
+        else:
+            total_loss += loss
+        # generated slot
+        # find the token with the highest probability, this will be the generated word
+        gen_word_token = torch.argmax(logits, dim=-1)
+        gen_word_prob = torch.gather(probs, 1, gen_word_token[:, None]).squeeze(-1)
+        gen_word = tokenizer.decode(gen_word_token, skip_special_tokens=True).strip()
+        # add the generated word and probs to list
+        gen_probs.append(gen_word_prob)
+        gen_words.append(gen_word)
+    # across all prompts, keep the generated word with the highest probability
+    generated_word = gen_words[gen_probs.index(max(gen_probs))]
+    return total_loss, generated_word
 # Use this for generating next word (Validation after each epoch)
 def generate_slot_from_prompt(history, value, tokenizer, model, device):
     # get prompt for training based on "type"