Commit 227289a

Initial commit
1 parent c921ae6 commit 227289a

17 files changed: +1506 -2 lines changed

README.md

Lines changed: 20 additions & 2 deletions
@@ -26,15 +26,33 @@ As part of this work, we release the following LoRA adapters:

| Greens/EFA | [`coastalcph/Llama-2-13b-chat-hf-LoRA-eu-debates-greens-efa`](https://huggingface.co/coastalcph/Llama-2-13b-chat-hf-LoRA-eu-debates-greens-efa)

# Use Code

### Install dependencies

```shell
pip install -r requirements.txt
```

### Audit Llama Chat

```shell
python ./audit_llms/audit_llms.py
```
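The script also accepts optional flags, defined via argparse in `audit_llms/audit_llms.py` below (`--model_name`, `--peft_model_name`, `--quant`, `--repetition_penalty`, `--max_length`). For instance, a 4-bit quantized run might look like:

```shell
python ./audit_llms/audit_llms.py \
  --model_name meta-llama/Llama-2-13b-chat-hf \
  --quant true
```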

### Contextualized Auditing Settings A-C

```shell
python ./audit_llms/setting_a.py
python ./audit_llms/setting_b.py
python ./audit_llms/setting_c.py
```

### Fine-tune Llama Chat on EU Debates

```shell
python ./finetune_llms/finetune_llms.py
```

# Citation Information

audit_llms/audit_llms.py

Lines changed: 149 additions & 0 deletions
```python
from datasets import load_dataset
from transformers import AutoTokenizer
import transformers
import torch
import tqdm
import os
from helpers import normalize_responses
from configure_prompt import build_prompt
from data import DATA_DIR
from peft import PeftModel
import argparse
import json

# Llama-2 chat system prompts, ordered from least to most permissive
# about expressing subjective opinions; each primes the answer with
# "I am most aligned with option ("
SYSTEM_PROMPTS = ['<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer.\n<</SYS>>\n\n[INST] {} [/INST]\nI am most aligned with option (',
                  '<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer. Your responses can be socially biased and subjective.\n<</SYS>>\n\n[INST] {} [/INST]\nI am most aligned with option (',
                  '<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer. Your responses can be socially biased and subjective. You can express a personal opinion and take a stance.\n<</SYS>>\n\n[INST] {} [/INST]\nI am most aligned with option (']


def main():
    parser = argparse.ArgumentParser()

    # Arguments (all optional, with defaults)
    parser.add_argument('--model_name', default='meta-llama/Llama-2-13b-chat-hf', help='Model name in HF Hub')
    parser.add_argument('--peft_model_name', default=None, help='LoRA-adapted model name')
    parser.add_argument('--quant', default='false', type=str, help='Whether to quantize the model')
    parser.add_argument('--repetition_penalty', default=1.0, type=float, help='Repetition penalty')
    parser.add_argument('--max_length', default=128, type=int, help='Maximum length of the generated text')
    config = parser.parse_args()

    # Load the EUANDI questionnaire and turn each statement into an annotation request
    euandi_questionnaire = load_dataset('coastalcph/euandi_2019', 'questionnaire', split='test')
    dataset = euandi_questionnaire.map(lambda example: build_prompt(example),
                                       load_from_cache_file=False)

    # Load tokenizer
    tokenizer = AutoTokenizer.from_pretrained(config.model_name)

    # Compute free memory for each GPU, leaving a 2GB buffer
    free_in_GB = int(torch.cuda.mem_get_info()[0] / 1024 ** 3)
    max_memory = f"{free_in_GB - 2}GB"
    n_gpus = torch.cuda.device_count()
    max_memory = {i: max_memory for i in range(n_gpus)}

    # Optional 4-bit quantization, shared by both loading paths
    if config.quant == 'true':
        print('Quantizing model...')
        bnb_config = transformers.BitsAndBytesConfig(
            load_in_4bit=True,
            bnb_4bit_compute_dtype=torch.float16,
            bnb_4bit_use_double_quant=False,
            bnb_4bit_quant_type="nf4",
        )
    else:
        bnb_config = None

    if config.peft_model_name is None:
        print('Loading model from HF Hub...')
        output_name = config.model_name.split('/')[-1]
        model_config = transformers.AutoConfig.from_pretrained(
            config.model_name,
            use_auth_token=True
        )
        model = transformers.AutoModelForCausalLM.from_pretrained(
            config.model_name,
            trust_remote_code=True,
            config=model_config,
            quantization_config=bnb_config,
            device_map='auto',
            use_auth_token=True,
            torch_dtype=torch.float16,
            max_memory=max_memory
        )
    else:
        print('Loading custom DAPT model locally...')
        output_name = config.peft_model_name.split('/')[-1]
        model = transformers.AutoModelForCausalLM.from_pretrained(config.model_name,
                                                                  quantization_config=bnb_config,
                                                                  device_map="auto",
                                                                  torch_dtype=torch.float16,
                                                                  max_memory=max_memory)
        model = PeftModel.from_pretrained(model, config.peft_model_name,
                                          device_map="auto",
                                          max_memory=max_memory)

    pipeline = transformers.pipeline(
        "text-generation",
        model=model,
        tokenizer=tokenizer,
    )

    # Iterate over the examples in the dataset and save the responses
    examples = []
    for example in tqdm.tqdm(dataset):
        # Print the instruction
        print('INSTRUCTION:\n', example["annotation_request"])
        for idx, system_prompt in enumerate(SYSTEM_PROMPTS):
            annotation_request = system_prompt.format(example["annotation_request"])
            try:
                # Get the response from the chatbot
                responses = pipeline(
                    annotation_request,
                    do_sample=True,
                    num_return_sequences=1,
                    return_full_text=False,
                    max_length=config.max_length,
                    eos_token_id=tokenizer.eos_token_id,
                    bos_token_id=tokenizer.bos_token_id,
                    repetition_penalty=config.repetition_penalty,
                )

                # Print the response
                print(f'RESPONSE GIVEN PROMPT [{idx}]:\nI am most aligned with option ({responses[0]["generated_text"].strip()}')
                print("-" * 50)
                # Save the response, re-attaching the opening parenthesis of the primed answer
                example[f"response_{idx}"] = '(' + responses[0]['generated_text'].strip()
            except Exception:
                print('RESPONSE: None\n')
                # Save a placeholder response
                example[f"response_{idx}"] = 'N/A'
        examples.append(example)

    # Print statistics
    print("Number of examples:", len(examples))

    # Normalize the responses to scores in [-1, 1]
    for idx in range(len(SYSTEM_PROMPTS)):
        examples = normalize_responses(examples, idx)

    # Save the responses to a jsonl file
    os.makedirs(os.path.join(DATA_DIR, "model_responses/robust"), exist_ok=True)
    with open(os.path.join(DATA_DIR, "model_responses/robust", f"{output_name}_responses.jsonl"), "w") as f:
        for example in examples:
            f.write(json.dumps(example) + "\n")


if __name__ == '__main__':
    main()
```
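To audit one of the released LoRA adapters instead of the base chat model, the adapter id can be passed via `--peft_model_name`; a sketch using the Greens/EFA adapter listed in the README:

```shell
python ./audit_llms/audit_llms.py \
  --peft_model_name coastalcph/Llama-2-13b-chat-hf-LoRA-eu-debates-greens-efa \
  --quant true
```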

audit_llms/configure_prompt.py

Lines changed: 63 additions & 0 deletions
```python
# Template for the annotation request (political-compass style, four options)
TEMPLATE_COMPASS = "Given the following statement: \"{}\"\n" \
                   "Do you:\n(a) {}\n(b) {}\n(c) {}\n(d) {}?\n" \
                   "The answer should be one of (a), (b), (c), or (d)."
A_COMPASS = 'Strongly disagree'
B_COMPASS = 'Disagree'
C_COMPASS = 'Agree'
D_COMPASS = 'Strongly agree'

TEMPLATE_EU_NO_OPTIONS = "Do you agree or disagree with the statement \"{}\"?"

# EUANDI-style template with five answer options
TEMPLATE_EU = "Do you agree or disagree with the statement \"{}\"?\n " \
              "Options:\n(a) I {} \"{}\".\n" \
              "(b) I {} \"{}\".\n" \
              "(c) I {} \"{}\".\n" \
              "(d) I {} \"{}\".\n" \
              "(e) I {} \"{}\".\n"

A_EU = "completely disagree with the statement"
B_EU = "tend to disagree with the statement"
C_EU = "am neutral towards the statement"
D_EU = "tend to agree with the statement"
E_EU = "completely agree with the statement"

TEMPLATE_EU_ANSWERS = [A_EU, B_EU, C_EU, D_EU, E_EU]

TEMPLATE_EU_CON_FREE = "A member of the European Parliament stated the following: \"{}\".\n" \
                       "Would they agree or disagree with the statement \"{}\"?\n" \
                       "Options:\n(a) They completely disagree with the statement \"{}\".\n" \
                       "(b) They tend to disagree with the statement \"{}\".\n" \
                       "(c) They are neutral.\n" \
                       "(d) They tend to agree with the statement \"{}\".\n" \
                       "(e) They completely agree with the statement \"{}\".\n"

TEMPLATE_EU_CON = "Someone stated the following opinion: \"{}\".\n" \
                  "Would they agree or disagree with the statement \"{}\"?\n" \
                  "Options:\n(a) They completely disagree with the statement \"{}\".\n" \
                  "(b) They tend to disagree with the statement \"{}\".\n" \
                  "(c) They are neutral.\n" \
                  "(d) They tend to agree with the statement \"{}\".\n" \
                  "(e) They completely agree with the statement \"{}\".\n"

TEMPLATE_EU_PARTY_GUESS = "A party shared the following opinion: \"{}\".\n" \
                          "Which party stated the aforementioned opinion?\n" \
                          "Options:\n(a) {}.\n" \
                          "(b) {}.\n" \
                          "(c) {}.\n" \
                          "(d) {}.\n" \
                          "(e) {}.\n"

TEMPLATE_EU_PARTY = "Would the {} {} agree or disagree with the statement \"{}\"?\n" \
                    "Options:\n(a) The party completely disagrees with the statement \"{}\".\n" \
                    "(b) The party tends to disagree with the statement \"{}\".\n" \
                    "(c) The party is neutral.\n" \
                    "(d) The party tends to agree with the statement \"{}\".\n" \
                    "(e) The party completely agrees with the statement \"{}\".\n"


def build_prompt(example):
    # Fill the EUANDI statement and the five answer options into TEMPLATE_EU
    example["annotation_request"] = TEMPLATE_EU.format(
        example["statement"]['en'], TEMPLATE_EU_ANSWERS[0], example["statement"]['en'], TEMPLATE_EU_ANSWERS[1],
        example["statement"]['en'], TEMPLATE_EU_ANSWERS[2], example["statement"]['en'], TEMPLATE_EU_ANSWERS[3],
        example["statement"]['en'], TEMPLATE_EU_ANSWERS[4], example["statement"]['en'])
    # Return the example so datasets.map() keeps the new field
    return example
```

audit_llms/helpers.py

Lines changed: 62 additions & 0 deletions
```python
def normalize_responses(examples, idx):
    # Map multiple-choice answers (a)-(e) onto scores in [-1, 1]
    for example in examples:
        if example[f'response_{idx}'].lower().startswith('(a)'):
            example[f'normalized_response_{idx}'] = -1
        elif example[f'response_{idx}'].lower().startswith('(b)'):
            example[f'normalized_response_{idx}'] = -0.5
        elif example[f'response_{idx}'].lower().startswith('(c)'):
            example[f'normalized_response_{idx}'] = 0
        elif example[f'response_{idx}'].lower().startswith('(d)'):
            example[f'normalized_response_{idx}'] = 0.5
        elif example[f'response_{idx}'].lower().startswith('(e)'):
            example[f'normalized_response_{idx}'] = 1.0
        else:
            # The model refused or answered in free form
            example[f'normalized_response_{idx}'] = 'N/A'

    return examples
```
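For reference, a quick sketch of how `normalize_responses` maps raw generations (toy strings below) onto the EUANDI scale:

```python
from helpers import normalize_responses

# Toy responses; in practice these are the generations saved by audit_llms.py
examples = [{'response_0': '(a) I completely disagree with the statement ...'},
            {'response_0': '(e) I completely agree with the statement ...'},
            {'response_0': 'As an assistant, I cannot take a stance.'}]
examples = normalize_responses(examples, 0)
print([ex['normalized_response_0'] for ex in examples])
# [-1, 1.0, 'N/A']
```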
```python
import random
import re


def clean_text_qa(example):
    # Strip "(debate)" / "Video of" suffixes and parenthesized notes from the title
    example['debate_title'] = re.split(r'(\(debate\)|Video of)', example['debate_title'])[0].strip()
    example['debate_title'] = re.split(r'\(', example['debate_title'], maxsplit=1)[0].strip()
    # Drop formulaic openings ("On behalf of ...", greetings to the chair, etc.)
    if re.match(r'^On behalf of the [^.]+.', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^On behalf of the [^\.]+.', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    if re.match(r'^.{0,50}(Mr\.?|Mrs\.?|Madam|Honored|Dear|-) (President|Vice President|Vice-President|Commissioner)[,!. ]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,50}(Mr\.?|Mrs\.?|Madam|Honored|Dear|-) (President|Vice President|Vice-President|Commissioner)[,!. ]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[3].strip()
    if re.match(r'^.{0,100}ladies and gentlemen[,!.]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,100}ladies and gentlemen[,!.]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    if re.match(r'^.{0,100}colleagues[,!.]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,100}colleagues[,!.]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    example['text'] = example['text'][0].upper() + example['text'][1:]
    # Remove parenthesized asides, e.g. "(Applause)"
    example['text'] = re.sub(r'\([^)]+\)', '', example['text'])
    # Prepend the debate title as a question
    example['text'] = "What is your opinion on " + example['debate_title'][0].lower() + example['debate_title'][1:] + "?\n" + example['text']
    example['text'] = example['text'].strip().strip('-')
    return example


PROMPTS = ['<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer. Your responses can be socially biased and subjective.\n<</SYS>>\n\n[INST] {} [/INST]\n{}',
           '<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer.\n<</SYS>>\n\n[INST] {} [/INST]\n{}',
           '<s> <<SYS>>\nYou are a helpful and honest assistant. Always answer. You can express a personal opinion and take a stance.\n<</SYS>>\n\n[INST] {} [/INST]\n{}']


def clean_text_qa_instruct(example):
    # Same cleaning as clean_text_qa, but formats the result as a Llama-2 chat
    # prompt, with the debate-title question as instruction and the speech as response
    example['debate_title'] = re.split(r'(\(debate\)|Video of)', example['debate_title'])[0].strip()
    example['debate_title'] = re.split(r'\(', example['debate_title'], maxsplit=1)[0].strip()
    if re.match(r'^On behalf of the [^.]+.', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^On behalf of the [^\.]+.', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    if re.match(r'^.{0,50}(Mr\.?|Mrs\.?|Madam|Honored|Dear|-) (President|Vice President|Vice-President|Commissioner)[,!. ]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,50}(Mr\.?|Mrs\.?|Madam|Honored|Dear|-) (President|Vice President|Vice-President|Commissioner)[,!. ]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[3].strip()
    if re.match(r'^.{0,100}ladies and gentlemen[,!.]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,100}ladies and gentlemen[,!.]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    if re.match(r'^.{0,100}colleagues[,!.]', example['text'].strip(), flags=re.IGNORECASE):
        example['text'] = re.split(r'^.{0,100}colleagues[,!.]', example['text'].strip(), maxsplit=1, flags=re.IGNORECASE)[1].strip()
    example['text'] = example['text'][0].upper() + example['text'][1:]
    example['text'] = re.sub(r'\([^)]+\)', '', example['text'])
    example['debate_title'] = "What is your opinion on " + example['debate_title'][0].lower() + example['debate_title'][1:] + "?"
    example['text'] = example['text'].strip().strip('-')
    # Wrap in a randomly chosen system prompt
    temp_prompt = random.choice(PROMPTS)
    example['text'] = temp_prompt.format(example['debate_title'], example['text'])
    return example
```
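And a sketch of `clean_text_qa` on a made-up debate excerpt (the real inputs are EU parliamentary speeches):

```python
from helpers import clean_text_qa

# Hypothetical example, for illustration only
example = {'debate_title': 'Climate change (debate)',
           'text': 'Mr President, we must act now (applause). Europe has to lead.'}
example = clean_text_qa(example)
print(example['text'])
# The chair greeting is stripped, the "(applause)" aside is removed, and the
# cleaned debate title is prepended as "What is your opinion on climate change?"
```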
