From 5ef2fc6a14c859224d1b509aac2806f1b262347e Mon Sep 17 00:00:00 2001
From: wjdghks950
Date: Sun, 30 Jun 2024 19:43:18 -0500
Subject: [PATCH 1/5] Add setup script

---
 setup.py | 9 +++++++++
 1 file changed, 9 insertions(+)
 create mode 100644 setup.py

diff --git a/setup.py b/setup.py
new file mode 100644
index 00000000..f2537614
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,9 @@
+# align-system/setup.py
+from setuptools import setup, find_packages
+
+setup(
+    name='align_system',
+    version='0.1',
+    packages=find_packages(),
+    install_requires=[],
+)
\ No newline at end of file

From 7c60b1160e6cdebce0559fe7a006b16f32fbece0 Mon Sep 17 00:00:00 2001
From: wjdghks950
Date: Mon, 1 Jul 2024 02:41:09 -0500
Subject: [PATCH 2/5] Add CodeActAgentADM to REGISTERED_ADMS

---
 align_system/algorithms/adms.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/align_system/algorithms/adms.py b/align_system/algorithms/adms.py
index 2608bdee..fa404eb8 100644
--- a/align_system/algorithms/adms.py
+++ b/align_system/algorithms/adms.py
@@ -1,12 +1,14 @@
 from align_system.algorithms.kaleido_adm import KaleidoADM
 from align_system.algorithms.llama_2_single_kdma_adm import Llama2SingleKDMAADM
 from align_system.algorithms.hybrid_kaleido_adm import HybridKaleidoADM
+from align_system.algorithms.codeact_agent_adm import CodeActAgentADM
 from align_system.algorithms.random_adm import RandomADM
 from align_system.algorithms.oracle_adm import OracleADM
 
 REGISTERED_ADMS = {
     'KaleidoADM': KaleidoADM,
     'HybridKaleidoADM': HybridKaleidoADM,
     'CodeActAgentADM': CodeActAgentADM,
     'SingleKDMAADM': Llama2SingleKDMAADM,
     'RandomADM': RandomADM,
     'OracleADM': OracleADM,
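For context, REGISTERED_ADMS is the lookup table that lets a run configuration select an ADM implementation by name. A minimal sketch of that dispatch pattern, assuming a plain dict config with hypothetical keys 'adm_name' and 'adm_init_kwargs' (not the project's actual config schema):

    from align_system.algorithms.adms import REGISTERED_ADMS

    def instantiate_adm(config):
        # Resolve the ADM class by its registered name; fail fast on unknown names.
        adm_name = config['adm_name']  # e.g. 'CodeActAgentADM'
        if adm_name not in REGISTERED_ADMS:
            raise KeyError(
                f"Unknown ADM '{adm_name}'; registered: {sorted(REGISTERED_ADMS)}")
        # Any remaining options are passed through as constructor kwargs.
        return REGISTERED_ADMS[adm_name](**config.get('adm_init_kwargs', {}))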
From 3446b221867c4e35e349dac8e03e2640b5ad1245 Mon Sep 17 00:00:00 2001
From: wjdghks950
Date: Mon, 1 Jul 2024 02:42:08 -0500
Subject: [PATCH 3/5] Add TODO in __call__ for refactoring

---
 align_system/algorithms/codeact_agent_adm.py | 207 +++++++++++++++++++
 1 file changed, 207 insertions(+)
 create mode 100644 align_system/algorithms/codeact_agent_adm.py

diff --git a/align_system/algorithms/codeact_agent_adm.py b/align_system/algorithms/codeact_agent_adm.py
new file mode 100644
index 00000000..62baf35a
--- /dev/null
+++ b/align_system/algorithms/codeact_agent_adm.py
@@ -0,0 +1,207 @@
+import json
+import re
+import random
+import os
+import pathlib
+import numpy as np
+import torch
+
+from jinja2.exceptions import TemplateError
+
+from rich.highlighter import JSONHighlighter
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+from align_system.utils import logging
+from align_system.algorithms.abstracts import AlignedDecisionMaker
+from align_system.similarity_measures import build_force_choice_func
+
+
+log = logging.getLogger(__name__)
+JSON_HIGHLIGHTER = JSONHighlighter()
+
+
+kdmas = {
+    'basic_knowledge',
+    'fairness',
+    'protocol_focus',
+    'time_pressure',
+    'risk_aversion',
+    'utilitarianism',
+    'mission',
+    'denial',
+    'moral_deservingness',
+    'lives_saved',
+    'continuation_of_care',
+    'maximization'
+}
+
+kdma_remapping = {
+    'basicknowledge': 'basic_knowledge',
+    'protocolfocus': 'protocol_focus',
+    'riskaversion': 'risk_aversion',
+    'moraldeservingness': 'moral_deservingness',
+    'continuationofcare': 'continuation_of_care',
+    'livesaved': 'lives_saved',
+    'timepressure': 'time_pressure',
+}
+
+
+default_system_messages_path = os.path.join(
+    pathlib.Path(__file__).parent.absolute(), '..',
+    'prompt_engineering/single_kdma_adm_system_messges')
+
+chat_template_path = os.path.join(
+    pathlib.Path(__file__).parent.absolute(), '..',
+    'prompt_engineering/chat_templates')
+
+
+def load_system_message(alignment=None,
+                        system_messages_path=default_system_messages_path):
+    if alignment is None:
+        file_name = 'baseline.txt'
+    else:
+        sorted_kdmas = sorted(alignment.keys())
+
+        alignment_string = '-'.join(
+            '{}-{}'.format(alignment[k], kdma_remapping.get(k, k))
+            for k in sorted_kdmas)
+
+        file_name = f'{alignment_string}.txt'
+
+    with open(os.path.join(system_messages_path, file_name), 'r') as f:
+        system_message = f.read()
+    return system_message
+
+
+STANDARD_MULTIPLE_CHOICE_JSON_FORMAT = "{\"Reasoning\": \"<reasoning>\", \"Answer\": <answer index>}\\n"

+TREATMENT_MULTIPLE_CHOICE_JSON_FORMAT = "{\"Reasoning\": \"<reasoning>\", \"Answer\": <answer index>, \"Location\": \"<treatment location>\"}\\n"

+TAGGING_MULTIPLE_CHOICE_JSON_FORMAT = "{\"Reasoning\": \"<reasoning>\", \"Answer\": <answer index>, \"Tag\": \"<triage tag>\"}\\n"
+
+
+class CodeActAgentADM(AlignedDecisionMaker):
+
+    def __init__(self,
+                 device: str = 'cuda',
+                 hf_model: str = 'xingyaoww/CodeActAgent-Mistral-7b-v0.1',
+                 precision: str = 'full',
+                 temperature: float = 0.7,
+                 do_sample: bool = True,
+                 **kwargs):
+
+        self.device = device
+        self.hf_model = hf_model
+        self.temperature = temperature
+        self.do_sample = do_sample
+        self.chat_template = kwargs.get('chat_template', None)
+
+        assert precision in ['full', 'half'], "precision must be either 'full' or 'half'."
+        self.precision = torch.float32 if precision == 'full' else torch.float16
+
+        self.model = None
+        self.tokenizer = None
+
+    def load_model(self, model=None, tokenizer=None):
+        assert (model is None) == (tokenizer is None), "model and tokenizer must both be None or both be not None."
+        if model is not None:
+            print('Loading model and tokenizer from provided objects.')
+            self.model = model
+            self.tokenizer = tokenizer
+        else:
+            print('Loading model:', self.hf_model)
+            if self.device == 'auto':
+                self.model = AutoModelForCausalLM.from_pretrained(self.hf_model, torch_dtype=self.precision, device_map='auto')
+            else:
+                self.model = AutoModelForCausalLM.from_pretrained(self.hf_model, torch_dtype=self.precision)
+                self.model = self.model.to(self.device)
+
+            self.tokenizer = AutoTokenizer.from_pretrained(self.hf_model)
+
+        if self.chat_template is not None:
+            with open(os.path.join(chat_template_path, self.chat_template), 'r') as f:
+                self.tokenizer.chat_template = f.read().replace('    ', '').replace('\n', '')
+
+    def __call__(self, sample, target_kdma_values, **kwargs):
+
+        # TODO: Refactor the following code to fit the CodeAct agent.
+        # Refer to 'align-system/align_system/algorithms/llama_2_single_kdma_adm.py' for related methods and detailed implementations.
+
+        prompt = sample['scenario']
+        if sample['state'] is not None:
+            prompt += f'\n{sample["state"]}'
+
+        if 'retriever' in kwargs:
+            # retriever_prompt = "How would you treat the following injuries: {}".format(prompt)
+            retriever_prompt = "{} {}".format(prompt, sample['probe'])
+
+            retriever = kwargs['retriever']
+            retrieved_nodes = retriever.retrieve(retriever_prompt)
+
+            if 'summarizer' in kwargs:
+                summarizer = kwargs['summarizer']
+                summary = summarizer.synthesize(retriever_prompt, nodes=retrieved_nodes)
+
+                log.explain("[bold] ** Retrieval Summary ** [/bold]",
+                            extra={"markup": True})
+                log.explain(summary)
+
+                prompt += "\n#############\n{}\n#############".format(summary)
+            else:
+                prompt += "\n#############\n{}\n#############".format(
+                    "\n#############\n".join(n.text for n in retrieved_nodes))
+
+            prompt += f'\nGiven the scenario and documentation above, {sample["probe"]}'
+        else:
+            prompt += f'\n{sample["probe"]}'
+
+        choices = sample['choices']
+
+        labels = kwargs.get('labels', {})
+
+        alignment_target = None
+        if target_kdma_values is not None and len(target_kdma_values) > 0:
+            # Get the first key of the first non-empty label
+            target_kdma = next(iter(next(iter(filter(lambda x: len(x) > 0, labels)))))
+
+            for label in labels:
+                assert len(label) == 0 or (target_kdma in label and len(label) == 1), f'All labels must have the same KDMA: labels={labels}'
+
+            alignment_target = {
+                target_kdma: target_kdma_values[target_kdma]
+            }
+
+        reasoning, answer_idx, responses, inference_pairs = self.run_aligned_decision_maker_with_voting(
+            prompt,
+            choices,
+            alignment_target,
+            n_positive_samples=kwargs.get('n_positive_samples', 5),
+            n_negative_samples=kwargs.get('n_negative_samples', 5),
+            baseline=kwargs.get('baseline', False),
+            shuffle=kwargs.get('shuffle', False)
+        )
+
+        raw_data = {
+            'params': {
+                'model': self.hf_model,
+                'temperature': self.temperature,
+                'n_positive_samples': kwargs.get('n_positive_samples', 5),
+                'n_negative_samples': kwargs.get('n_negative_samples', 5),
+                'baseline': kwargs.get('baseline', False),
+                'shuffle': kwargs.get('shuffle', False),
+            },
+            'inference_pairs': inference_pairs
+        }
+
+        return {
+            'choice': int(answer_idx),
+            'info': {
+                'reasoning': reasoning,
+                'responses': responses,
+                'raw_data': raw_data,
+            }
+        }
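To make load_system_message's file-naming convention concrete, here is a small self-contained sketch that mirrors its logic (the alignment targets are invented for illustration; the remapping dict is excerpted from the module above):

    kdma_remapping = {'riskaversion': 'risk_aversion'}  # excerpt

    def system_message_filename(alignment=None):
        # Mirrors load_system_message: no alignment falls back to the baseline prompt.
        if alignment is None:
            return 'baseline.txt'
        # Sort KDMA keys, remap shorthand names, join '{value}-{name}' pairs with '-'.
        parts = ('{}-{}'.format(alignment[k], kdma_remapping.get(k, k))
                 for k in sorted(alignment))
        return '-'.join(parts) + '.txt'

    assert system_message_filename() == 'baseline.txt'
    assert system_message_filename({'riskaversion': 8}) == '8-risk_aversion.txt'
    assert system_message_filename({'riskaversion': 8, 'mission': 3}) == '3-mission-8-risk_aversion.txt'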
{sample["probe"]}' + else: + prompt += f'\n{sample["probe"]}' + + choices = sample['choices'] + + labels = kwargs.get('labels', {}) + + alignment_target = None + if target_kdma_values is not None and len(target_kdma_values) > 0: + target_kdma = next(iter(next(iter(filter(lambda x: len(x) > 0, labels))))) # get the frist key of the first label that is not empty + + for label in labels: + assert len(label) == 0 or (target_kdma in label and len(label) == 1), f'All labels must have the same KDMA: labels={labels}' + + alignment_target = { + target_kdma: target_kdma_values[target_kdma] + } + + reasoning, answer_idx, responses, inference_pairs = self.run_aligned_decision_maker_with_voting( + prompt, + choices, + alignment_target, + n_positive_samples=kwargs.get('n_positive_samples', 5), + n_negative_samples=kwargs.get('n_negative_samples', 5), + baseline=kwargs.get('baseline', False), + shuffle=kwargs.get('shuffle', False) + ) + + raw_data = { + 'params': { + 'model': self.hf_model, + 'temperature': self.temperature, + 'n_positive_samples': kwargs.get('n_positive_samples', 5), + 'n_negative_samples': kwargs.get('n_negative_samples', 5), + 'baseline': kwargs.get('baseline', False), + 'shuffle': kwargs.get('shuffle', False), + }, + 'inference_pairs': inference_pairs + } + + return { + 'choice': int(answer_idx), + 'info': { + 'reasoning': reasoning, + 'responses': responses, + 'raw_data': raw_data, + } + } + + From 8b88d76e897c711ebfc95ec1609f72e7a2d43b48 Mon Sep 17 00:00:00 2001 From: Qingyun Wang Date: Thu, 4 Jul 2024 17:56:52 -0500 Subject: [PATCH 4/5] copy all necessary code --- align_system/algorithms/codeact_agent_adm.py | 47 ++++++++++++++++++++ 1 file changed, 47 insertions(+) diff --git a/align_system/algorithms/codeact_agent_adm.py b/align_system/algorithms/codeact_agent_adm.py index 62baf35a..33ccfedf 100644 --- a/align_system/algorithms/codeact_agent_adm.py +++ b/align_system/algorithms/codeact_agent_adm.py @@ -123,6 +123,53 @@ def load_model(self, model=None, tokenizer=None): with open(os.path.join(chat_template_path, self.chat_template), 'r') as f: self.tokenizer.chat_template = f.read().replace(' ', '').replace('\n', '') + def run_aligned_decision_maker_with_voting( + self, prompt, choices, alignment_target, n_positive_samples=5, n_negative_samples=5, baseline=False, shuffle=False): + responses, inference_pairs = self.aligned_decision_maker( + prompt, + choices, + alignment_target, + baseline=baseline, + n_positive_samples=n_positive_samples, + n_negative_sampels=n_negative_samples, + shuffle=shuffle + ) + + try: + choice_scores = Llama2SingleKDMAADM.calculate_votes(responses, choices) + except Exception as e: + log.warning(f"Error calculating votes: {e}") + choice_scores = [None] * len(choices) + + log.debug("[bold]*RESPONSES*[bold]", extra={"markup": True}) + for i, ip in enumerate(inference_pairs): + log.debug("[bold]*response {}*[bold]".format(i+1), + extra={"markup": True}) + log.debug(ip['output']) + + log.explain("[bold]*CHOICE SCORES*[/bold]", + extra={"markup": True}) + log.explain("\n".join([f"{c}: {s}" for c, s in zip(choices, choice_scores)])) + + results = { + 'prompt': prompt, + 'choice_scores': choice_scores, + 'responses': responses, + } + + answer_idx = int(np.argmax(results['choice_scores'])) + reasoning = None + + for r in responses: + assert r['answer_idx'] is not None + assert int(r['answer_idx']) < len(r['shuffle_indecies']) + + if r['shuffle_indecies'][int(r['answer_idx'])] == answer_idx: + reasoning = r['reasoning'] + break + + return reasoning, answer_idx, 
From fbaa1a8c8b87d718620348ebb5eaa8e97404d4f3 Mon Sep 17 00:00:00 2001
From: Qingyun Wang
Date: Thu, 4 Jul 2024 17:57:00 -0500
Subject: [PATCH 5/5] update

---
 align_system/algorithms/codeact_agent_adm.py | 39 +++++++++++++++++++-
 1 file changed, 38 insertions(+), 1 deletion(-)

diff --git a/align_system/algorithms/codeact_agent_adm.py b/align_system/algorithms/codeact_agent_adm.py
index 33ccfedf..ff5fcbf3 100644
--- a/align_system/algorithms/codeact_agent_adm.py
+++ b/align_system/algorithms/codeact_agent_adm.py
@@ -122,6 +122,43 @@ def load_model(self, model=None, tokenizer=None):
         if self.chat_template is not None:
             with open(os.path.join(chat_template_path, self.chat_template), 'r') as f:
                 self.tokenizer.chat_template = f.read().replace('    ', '').replace('\n', '')
+
+    @staticmethod
+    def calculate_votes(responses, choices):
+        choice_votes = [0] * len(choices)
+        for response in responses:
+            answer_idx = response['answer_idx']
+            if answer_idx is None:
+                continue
+
+            try:
+                answer_idx = int(answer_idx)
+            except ValueError:
+                continue
+
+            if answer_idx >= len(choices):
+                continue
+
+            # Map the answer back to the original (unshuffled) choice order
+            if 'shuffle_indecies' in response:
+                answer_idx = response['shuffle_indecies'][int(answer_idx)]
+
+            aligned = response['aligned']
+
+            if aligned:
+                # An aligned sample casts a full vote for its chosen answer
+                choice_votes[answer_idx] += 1
+            else:
+                # A negative sample penalizes its chosen answer and spreads
+                # a small boost across the alternatives
+                for i in range(len(choices)):
+                    if i != answer_idx:
+                        choice_votes[i] += 1 / len(choices)
+                    else:
+                        choice_votes[i] -= 1 / len(choices)
+
+        # Shift scores by the minimum (the epsilon keeps the total nonzero
+        # when all votes are equal), then normalize so the scores sum to 1
+        min_score = min(choice_votes) + 1e-6
+        choice_votes = [score - min_score for score in choice_votes]
+        total = sum(choice_votes)
+        choice_votes = [round(score / total, 6) for score in choice_votes]
+
+        return choice_votes
 
     def run_aligned_decision_maker_with_voting(
             self, prompt, choices, alignment_target, n_positive_samples=5, n_negative_samples=5, baseline=False, shuffle=False):
@@ -136,7 +173,7 @@ def run_aligned_decision_maker_with_voting(
         )
 
         try:
-            choice_scores = Llama2SingleKDMAADM.calculate_votes(responses, choices)
+            choice_scores = CodeActAgentADM.calculate_votes(responses, choices)
         except Exception as e:
             log.warning(f"Error calculating votes: {e}")
             choice_scores = [None] * len(choices)
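As a quick sanity check on the voting arithmetic, here is a usage sketch of calculate_votes with invented responses and choice strings (one aligned vote for choice 1, one negative sample that picked choice 0):

    from align_system.algorithms.codeact_agent_adm import CodeActAgentADM

    responses = [
        {'answer_idx': '1', 'aligned': True},   # full vote for choice 1
        {'answer_idx': '0', 'aligned': False},  # penalizes choice 0, boosts the rest
    ]
    choices = ['Apply tourniquet', 'Check airway', 'Tag and move on']

    scores = CodeActAgentADM.calculate_votes(responses, choices)
    # Scores are shifted and normalized so they sum to (approximately) 1;
    # choice 1 collects both the aligned vote and the negative sample's boost.
    assert max(range(len(scores)), key=lambda i: scores[i]) == 1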