From 2c72c4a4e3f54e3b8be6e37b14d013e86f09c94e Mon Sep 17 00:00:00 2001
From: David Joy <10147749+dmjoy@users.noreply.github.com>
Date: Fri, 29 Mar 2024 13:51:23 -0400
Subject: [PATCH 1/4] Fix maximization hybrid-kaleido rephrase2 config; set
 default to rephrase5

---
 .../hybrid_kaleido_soartech_high_vrd_rephrase2.yml          | 4 ++--
 .../lib/templates/kdma_descriptions_short_metrics_eval.yml  | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/adm_configs/metrics-evaluation/hybrid_kaleido_soartech_high_vrd_rephrase2.yml b/adm_configs/metrics-evaluation/hybrid_kaleido_soartech_high_vrd_rephrase2.yml
index f9b51a7f..764ff811 100644
--- a/adm_configs/metrics-evaluation/hybrid_kaleido_soartech_high_vrd_rephrase2.yml
+++ b/adm_configs/metrics-evaluation/hybrid_kaleido_soartech_high_vrd_rephrase2.yml
@@ -21,7 +21,7 @@ adm:
     answer_attempts: 5
 
 alignment_target_override:
-  id: maximization_low
+  id: maximization_high
   kdma_values:
     - kdma: maximization
-      value: 0.1
+      value: 0.9
diff --git a/align_system/algorithms/lib/templates/kdma_descriptions_short_metrics_eval.yml b/align_system/algorithms/lib/templates/kdma_descriptions_short_metrics_eval.yml
index 50e78279..8da7c2d1 100644
--- a/align_system/algorithms/lib/templates/kdma_descriptions_short_metrics_eval.yml
+++ b/align_system/algorithms/lib/templates/kdma_descriptions_short_metrics_eval.yml
@@ -5,5 +5,5 @@ MoralDesert:
 
 maximization:
   name: Maximization
-  description: Prioritize gathering the most information possible before acting on that information, but not at the detriment of casualties
+  description: Prioritize gathering information to take the most informed, life-saving actions
 vrd: Value

From 4e9de4e7a1717c524b44eb7228d7b1568fc6c16b Mon Sep 17 00:00:00 2001
From: David Joy <10147749+dmjoy@users.noreply.github.com>
Date: Thu, 4 Apr 2024 11:10:46 -0400
Subject: [PATCH 2/4] Apply Taylor's Kaleido fix for attention mask

---
 align_system/algorithms/lib/kaleido.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/align_system/algorithms/lib/kaleido.py b/align_system/algorithms/lib/kaleido.py
index 9bee9840..3b2a9f3f 100644
--- a/align_system/algorithms/lib/kaleido.py
+++ b/align_system/algorithms/lib/kaleido.py
@@ -488,10 +488,10 @@ def get_probs(self, inputs, batch_size=None):
             encoded_batch = self.tokenizer.batch_encode_plus(
                 inputs[inds].tolist(),
                 return_tensors='pt', padding=True, truncation=False, max_length=128,
-            ).to(self.device).input_ids
+            ).to(self.device)
             # batch_inputs = encoded_batch[i*batch_size:(i+1)*batch_size]
             # Run through model, get last logits
-            logits_batch = self.model(input_ids=encoded_batch, labels=self.get_dummy(encoded_batch)).logits[:, -1, :].detach().cpu()
+            logits_batch = self.model(input_ids=encoded_batch.input_ids, attention_mask=encoded_batch.attention_mask, labels=self.get_dummy(encoded_batch.input_ids)).logits[:, -1, :].detach().cpu()
             logits.append(logits_batch)
 
         # concatenate logits
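A note on the attention-mask fix in PATCH 2/4: `batch_encode_plus(..., padding=True)` pads every sequence to the longest one in the batch, and unless the attention mask is passed through, the model attends to those pad tokens, so the final-position logits for a given input shift depending on what it happens to be batched with. A minimal sketch of the failure mode follows; it uses `google/flan-t5-small` as a stand-in for the actual Kaleido checkpoint and a one-token dummy decoder input in place of Kaleido's `get_dummy`, so those specifics are illustrative assumptions rather than the project's API:

    import torch
    from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

    tokenizer = AutoTokenizer.from_pretrained('google/flan-t5-small')
    model = AutoModelForSeq2SeqLM.from_pretrained('google/flan-t5-small')

    encoded = tokenizer.batch_encode_plus(
        ['a short input',
         'a much longer input that forces the short one to be padded'],
        return_tensors='pt', padding=True)

    # One decoder start token per example, standing in for get_dummy()
    dummy = torch.full((encoded.input_ids.shape[0], 1),
                       model.config.decoder_start_token_id)

    # Without the mask, pad tokens are attended to: the short example's
    # logits depend on how much padding the batch forced onto it
    without_mask = model(input_ids=encoded.input_ids,
                         decoder_input_ids=dummy).logits[:, -1, :]

    # With the mask, pad positions are ignored and each example's logits
    # match what encoding it on its own would give
    with_mask = model(input_ids=encoded.input_ids,
                      attention_mask=encoded.attention_mask,
                      decoder_input_ids=dummy).logits[:, -1, :]

    print(torch.allclose(without_mask, with_mask))  # typically False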
From 3b3ea298229759ed360d493dd4ae0fb2fcb079a8 Mon Sep 17 00:00:00 2001
From: David Joy <10147749+dmjoy@users.noreply.github.com>
Date: Tue, 16 Apr 2024 19:56:21 -0400
Subject: [PATCH 3/4] Fix some non-determinism in choice ordering for Kaleido

---
 align_system/algorithms/kaleido_adm.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/align_system/algorithms/kaleido_adm.py b/align_system/algorithms/kaleido_adm.py
index d5cebe5c..c86598c4 100644
--- a/align_system/algorithms/kaleido_adm.py
+++ b/align_system/algorithms/kaleido_adm.py
@@ -102,7 +102,7 @@ def estimate_kdma_values(self,
 
         rows = []
         for choice in choices:
-            other_choices_str = ', '.join(['"{}"'.format(c) for c in (set(choices) - {choice})])
+            other_choices_str = ', '.join(['"{}"'.format(c) for c in choices if c != choice])
             choice_prompt = format_template(
                 prompt_template,
                 allow_extraneous=True,
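A note on the ordering fix in PATCH 3/4: iterating over `set(choices) - {choice}` yields the remaining choices in hash order, and Python salts string hashes per process (see PYTHONHASHSEED), so the "other choices" portion of the prompt could be assembled in a different order from run to run, changing the model's input and therefore its output. The list comprehension preserves the original choice order. A small self-contained illustration (the choice strings here are made up):

    choices = ['apply tourniquet', 'check airway', 'administer morphine']

    for choice in choices:
        # Old behavior: order depends on the per-process string-hash seed,
        # so this string can differ between runs of the same program
        unstable = ', '.join(['"{}"'.format(c) for c in (set(choices) - {choice})])

        # Fixed behavior: always follows the order of the choices list
        stable = ', '.join(['"{}"'.format(c) for c in choices if c != choice])
        print(stable)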
From 0618a62bb5f8b3f3a6ead73108af3208772d6721 Mon Sep 17 00:00:00 2001
From: David Joy <10147749+dmjoy@users.noreply.github.com>
Date: Wed, 24 Apr 2024 12:24:48 -0400
Subject: [PATCH 4/4] Add do_sample arg for single kdma adm; update changelog
 and version

---
 CHANGELOG.md                                   | 13 ++++++++++++-
 .../algorithms/llama_2_single_kdma_adm.py      | 15 +++++++++++----
 pyproject.toml                                 |  2 +-
 3 files changed, 24 insertions(+), 6 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index d96cbfda..6427892b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -3,13 +3,24 @@
 This changelog follows the specifications detailed in:
 [Keep a Changelog](https://keepachangelog.com/en/1.0.0/).
 This project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html),
 although we have not yet reached a `1.0.0` release.
 
-## Unreleased
+## 0.3.3
 
 ### Changed
 
 * Modified the prompt for PulseTaggingADM. Also removed duplicated inference call within `identify_tag_color` method. Additionally, removed duplicated RED tag in-context example and replaced with missing BLACK tag example.
+* Changed default maximization prompt for Kaleido
+
+### Fixed
+
+* Applied attention-mask fixes for Kaleido provided by UWash
+* Fixed an "other choice" ordering issue in Kaleido ADM
+
+### Added
+
+* Added an additional parsing guard in Llama2SingleKDMAADM
+* Added do_sample as an init kwarg for Llama2SingleKDMAADM (set to False for deterministic, temperature-0 behavior)
 
 ## 0.3.2
 
diff --git a/align_system/algorithms/llama_2_single_kdma_adm.py b/align_system/algorithms/llama_2_single_kdma_adm.py
index 3e1412d2..22082fb4 100644
--- a/align_system/algorithms/llama_2_single_kdma_adm.py
+++ b/align_system/algorithms/llama_2_single_kdma_adm.py
@@ -109,10 +109,11 @@ def to_probabilities(logits):
 
 
 class Llama2SingleKDMAADM(AlignedDecisionMaker):
-    def __init__(self, device='cuda', hf_model='meta-llama/Llama-2-7b-chat-hf', precision='full', temperature=0.7, **kwargs):
+    def __init__(self, device='cuda', hf_model='meta-llama/Llama-2-7b-chat-hf', precision='full', temperature=0.7, do_sample=True, **kwargs):
         self.device = device
         self.hf_model = hf_model
         self.temperature = temperature
+        self.do_sample = do_sample
         self.chat_template = kwargs.get('chat_template', None)
 
         assert precision in ['full', 'half'], "precision must be either 'full' or 'half'."
@@ -297,7 +298,13 @@ def respond_to_dialog(self, dialog, prefix=None):
         if self.device != 'auto':
             prompt_tokens = prompt_tokens.to(self.device)
 
-        outputs = self.model.generate(prompt_tokens, return_dict_in_generate=True, output_scores=True, max_new_tokens=512, temperature=self.temperature, do_sample=True)
+        outputs = self.model.generate(
+            prompt_tokens,
+            return_dict_in_generate=True,
+            output_scores=True,
+            max_new_tokens=512,
+            temperature=self.temperature,
+            do_sample=self.do_sample)
 
         # Print the generated model output
         generated_output = self.tokenizer.decode(outputs.sequences[0][prompt_length:])
@@ -347,8 +354,8 @@ def respond_to_dialogs_batched(self, dialogs, prefixes=None):
             return_dict_in_generate=True,
             output_scores=True,
             max_new_tokens=512,
-            temperature=self.temperature
-        )
+            temperature=self.temperature,
+            do_sample=self.do_sample)
 
         # Split the sequences based on prompt lengths
         split_outputs = torch.split(outputs.sequences, 1, dim=0)
diff --git a/pyproject.toml b/pyproject.toml
index 6763e198..a1f66a44 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "align-system"
-version = "0.3.2"
+version = "0.3.3"
 description = ""
 authors = ["David Joy <10147749+dmjoy@users.noreply.github.com>"]
 readme = "README.md"
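A usage note on PATCH 4/4: with `do_sample=False`, Hugging Face's `generate` falls back to greedy decoding (with the default `num_beams=1`), so sampling parameters such as `temperature` are ignored and repeated runs over the same input produce identical output; that is the "temperature 0" behavior the changelog refers to. A construction sketch (keyword values other than `do_sample` are simply the defaults from the signature above):

    from align_system.algorithms.llama_2_single_kdma_adm import Llama2SingleKDMAADM

    # Deterministic configuration: greedy decoding, reproducible outputs
    adm = Llama2SingleKDMAADM(
        device='cuda',
        hf_model='meta-llama/Llama-2-7b-chat-hf',
        precision='full',
        do_sample=False)  # generate() ignores temperature when not sampling

    # Previous (stochastic) behavior: sample with temperature 0.7
    sampling_adm = Llama2SingleKDMAADM(device='cuda', temperature=0.7, do_sample=True)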