ChicagoHAI · itea1001 · Mar 13, 2025 · Mar 18, 2025 · Mar 24, 2025 · Mar 25, 2025
diff --git a/hypogenic/algorithm/generation/__init__.py b/hypogenic/algorithm/generation/__init__.py
@@ -3,5 +3,5 @@
 generation_register = Register("generation")
 
 from .base import Generation
-from .default import DefaultGeneration
+from .default import DefaultGeneration, DefaultGenerationContinuous
 from . import utils
diff --git a/hypogenic/algorithm/generation/base.py b/hypogenic/algorithm/generation/base.py
@@ -188,3 +188,92 @@ def make_hypotheses_bank(
             new_generated_hypotheses[hyp].set_example(ex)
 
         return new_generated_hypotheses
+
+'''
+    def make_hypotheses_bank_continuous(
+        self,
+        example_indices,
+        current_sample,
+        alpha,
+        hypotheses_list: List[str],
+        cache_seed=None,
+        max_concurrent=3,
+        **generate_kwargs
+    ):
+        """
+        not actually used, just in case
+        """
+        """
+        Based on hypotheses generated by the LM, create new hypotheses_bank.
+
+        Parameters:
+            example_indices: the indices of examples being used to generate hypotheses
+            current_sample: the current sample in data which the algorithm is on
+            num_hypotheses_generate: the number of hypotheses that we expect our repsonse to generate
+            hypotheses: a list of hypotheses generated by the LM
+            alpha: eploration constant in hypogenic reward funciton
+            cache_seed: If `None`, will not use cache, otherwise will use cache with corresponding seed number
+            max_concurrent: the maximum number of concurrent requests to make to the API
+
+        Returns:
+            new_generated_hypotheses: A dictionary containing all newly generated hypotheses. The keys are the hypotheses and the values are the Summary Information class
+        """
+        idx_hyp_pair = []
+        new_generated_hypotheses = {}
+
+        for hyp in hypotheses_list:
+            new_generated_hypotheses[hyp] = SummaryInformation(
+                hypothesis=hyp, acc=0, num_visits=0, reward=0, correct_examples=[]
+            )
+
+            for index in example_indices:
+                idx_hyp_pair.append((index, {hyp: new_generated_hypotheses[hyp]}))
+
+        # ----------------------------------------------------------------------
+        # We try to predict the ground truth labels
+        # ----------------------------------------------------------------------
+        preds, labels = self.inference_class.batched_predict(
+            self.train_data,
+            idx_hyp_pair,
+            cache_seed=cache_seed,
+            max_concurrent=max_concurrent,
+            **generate_kwargs
+        )
+        preds, labels = preds[::-1], labels[::-1]
+
+        # ----------------------------------------------------------------------
+        # Finding the accuracy and the correct examples for each hypothesis
+        # ----------------------------------------------------------------------
+        for hyp in hypotheses_list:
+            correct = 0
+            ex = []
+
+            loss = 0.0
+            for index in example_indices:
+                prediction, actual_label = preds.pop(-1), labels.pop(-1)
+                if isinstance(prediction, str):
+                    if prediction == "other":
+                        prediction = -1
+                    else:
+                        prediction = float(prediction)
+                if isinstance(actual_label, str):
+                    actual_label = float(actual_label)
+                loss += (prediction - actual_label) ** 2
+            loss = loss / len(example_indices)
+            acc = 1.0 / (1.0 + loss)
+
+            # print(f"acc = {acc} for hypothesis: {hyp}")
+
+            new_generated_hypotheses[hyp].set_accuracy(acc)
+            new_generated_hypotheses[hyp].set_num_visits(len(example_indices))
+
+            # hypogenic reward
+            reward = acc + alpha * math.sqrt(
+                math.log(current_sample) / len(example_indices)
+            )
+
+            new_generated_hypotheses[hyp].set_reward(reward)
+            new_generated_hypotheses[hyp].set_example(ex)
+
+        return new_generated_hypotheses
+'''
diff --git a/hypogenic/algorithm/generation/default.py b/hypogenic/algorithm/generation/default.py
@@ -155,3 +155,247 @@ def batched_hypothesis_generation(
             max_concurrent=max_concurrent,
             **generate_kwargs,
         )
+
+@generation_register.register("default_continuous")
+class DefaultGenerationContinuous(Generation):
+    """
+    Add on extra functionality to the generation fucntion - we consider this
+    the "default" task.
+    """
+
+    def __init__(
+        self,
+        api,
+        # reward_a,
+        # reward_b,
+        prompt_class: BasePrompt,
+        inference_class: Inference,
+        task: BaseTask,
+    ):
+        """
+        Parameters:
+            api: the language model that you're using, which may or may not be local
+            prompt_class: let's us know how the prompt is going to look
+            inference_class: gives us a way to predict labels for accuracy sake
+            task: determines the goal to accomplish
+        """
+        super().__init__(api, prompt_class, inference_class, task)
+        # self.reward_a = reward_a
+        # self.reward_b = reward_b
+
+    # ------------------------------------------------------------------------ #
+    #                                                                          #
+    # ------------------------------------------------------------------------ #
+    # BATCH INITLALIZE HYPOTHESES                                              #
+    # ------------------------------------------------------------------------ #
+    #                                                                          #
+    # ------------------------------------------------------------------------ #
+    def batched_initialize_hypotheses(
+        self,
+        num_init,
+        init_batch_size,
+        init_hypotheses_per_batch,
+        cache_seed=None,
+        max_concurrent=3,
+        **generate_kwargs,
+    ):
+        """
+        Batches the process of making new hypotheses
+
+        Parameters:
+            num_init: the total amount of examples you want to use for initialize hypotheses
+            init_batch size: the number of examples that will be used to generate these hypotheses
+            init_hypotheses_per_batch: the amount of hypotheses that you want to generate per btach
+            cache_seed: If `None`, will not use cache, otherwise will use cache with corresponding seed number
+            max_concurrent: the maximum amount of concurrent calls to the API
+
+        Returns:
+            hypotheses_bank: A dictionary with keys as hypotheses and the values as the Summary Information class
+        """
+        # ----------------------------------------------------------------------
+        # Finding batch size and confirming that it works
+        # ----------------------------------------------------------------------
+        assert (
+            num_init % init_batch_size == 0
+        ), "Number of initial examples must be divisible by the batch size"
+        num_batches = num_init // init_batch_size
+        prompt_inputs = []
+
+        # ----------------------------------------------------------------------
+        # Making the batch of the responses that will be used in the batch generation
+        # ----------------------------------------------------------------------
+        for i in range(num_batches):
+            example_indices = list(
+                range(i * init_batch_size, (i + 1) * init_batch_size)
+            )
+            # TODO: need copy()?
+            example_bank = (
+                self.train_data.loc[list(example_indices)].copy().reset_index(drop=True)
+            )
+            prompt_inputs.append(
+                self.prompt_class.batched_generation(
+                    example_bank, init_hypotheses_per_batch
+                )
+            )
+        responses = self.api.batched_generate(
+            prompt_inputs,
+            cache_seed=cache_seed,
+            max_concurrent=max_concurrent,
+            **generate_kwargs,
+        )
+
+        hypotheses_list = list(
+            set(
+                [
+                    hyp
+                    for response in responses
+                    for hyp in extract_hypotheses(response, init_hypotheses_per_batch)
+                ]
+            )
+        )
+
+        return hypotheses_list
+
+    def make_hypotheses_bank(
+        self,
+        example_indices,
+        current_sample,
+        alpha,
+        hypotheses_list: List[str],
+        cache_seed=None,
+        max_concurrent=3,
+        **generate_kwargs
+    ):
+        """
+        override make_hypotheses_bank for continuous value prediction
+        """
+        """
+        Based on hypotheses generated by the LM, create new hypotheses_bank.
+
+        Parameters:
+            example_indices: the indices of examples being used to generate hypotheses
+            current_sample: the current sample in data which the algorithm is on
+            num_hypotheses_generate: the number of hypotheses that we expect our repsonse to generate
+            hypotheses: a list of hypotheses generated by the LM
+            alpha: eploration constant in hypogenic reward funciton
+            cache_seed: If `None`, will not use cache, otherwise will use cache with corresponding seed number
+            max_concurrent: the maximum number of concurrent requests to make to the API
+
+        Returns:
+            new_generated_hypotheses: A dictionary containing all newly generated hypotheses. The keys are the hypotheses and the values are the Summary Information class
+        """
+        idx_hyp_pair = []
+        new_generated_hypotheses = {}
+
+        for hyp in hypotheses_list:
+            new_generated_hypotheses[hyp] = SummaryInformation(
+                hypothesis=hyp, acc=0, num_visits=0, reward=0, correct_examples=[]
+            )
+
+            for index in example_indices:
+                idx_hyp_pair.append((index, {hyp: new_generated_hypotheses[hyp]}))
+
+        # ----------------------------------------------------------------------
+        # We try to predict the ground truth labels
+        # ----------------------------------------------------------------------
+        preds, labels = self.inference_class.batched_predict(
+            self.train_data,
+            idx_hyp_pair,
+            cache_seed=cache_seed,
+            max_concurrent=max_concurrent,
+            **generate_kwargs
+        )
+        preds, labels = preds[::-1], labels[::-1]
+
+        # ----------------------------------------------------------------------
+        # Finding the accuracy and the correct examples for each hypothesis
+        # ----------------------------------------------------------------------
+
+        # ----------------------------------------------------------------------
+        # New reward = -MSE + exploration
+        # ----------------------------------------------------------------------
+
+        for hyp in hypotheses_list:
+            ex = []
+
+            acc = 0.0
+            for index in example_indices:
+                prediction, actual_label = preds.pop(-1), labels.pop(-1)
+                if isinstance(prediction, str):
+                    if prediction in ["other", "unknown"]:
+                        prediction = self.task.y_mu
+                    else:
+                        prediction = float(prediction)
+                if isinstance(actual_label, str):
+                    actual_label = float(actual_label)
+                # normalize pred and label
+
+                prediction = (prediction - self.task.y_min) / (self.task.y_max - self.task.y_min)
+                actual_label = (actual_label - self.task.y_min) / (self.task.y_max - self.task.y_min)
+
+                acc += float(- (actual_label - prediction) ** 2)
+            acc = acc / len(example_indices)
+
+            print(f"acc = {acc} for hypothesis: {hyp}")
+
+            new_generated_hypotheses[hyp].set_accuracy(acc)
+            new_generated_hypotheses[hyp].set_num_visits(len(example_indices))
+
+            # hypogenic reward
+            reward = acc + alpha * math.sqrt(
+                math.log(current_sample) / len(example_indices)
+            )
+
+            new_generated_hypotheses[hyp].set_reward(reward)
+            new_generated_hypotheses[hyp].set_example(ex)
+
+        return new_generated_hypotheses
+
+
+    # ------------------------------------------------------------------------ #
+    #                                                                          #
+    # ------------------------------------------------------------------------ #
+    # BATCHED_HYPOTHESIS GENERATION                                            #
+    # ------------------------------------------------------------------------ #
+    #                                                                          #
+    # ------------------------------------------------------------------------ #
+    def batched_hypothesis_generation(
+        self,
+        example_ids,
+        current_sample,
+        num_hypotheses_generate: int,
+        alpha: float,
+        cache_seed=None,
+        max_concurrent=3,
+        **generate_kwargs,
+    ):
+        """
+        Generates new hypotheses for the given examples
+
+        Parameters:
+            example_ids: The ids of the examples for which hypotheses need to be generated
+            current_sample: the current sample in data which the algorithm is on
+            num_hypotheses_generate: the number of hypotheses that we expect our response to generate
+            alpha: eploration constant in hypogenic reward funciton
+            cache_seed: If `None`, will not use cache, otherwise will use cache with corresponding seed number
+            max_concurrent: The maximum number of concurrent requests
+
+        Returns:
+            hypotheses_bank: A dictionary with keys as hypotheses and the values as the Summary Information class
+        """
+        new_hypotheses = self.batched_hyp_list_generation(
+            example_ids,
+            num_hypotheses_generate,
+            cache_seed=cache_seed,
+            **generate_kwargs,
+        )
+
+        return self.make_hypotheses_bank(
+            example_ids,
+            current_sample,
+            alpha,
+            new_hypotheses,
+            cache_seed=cache_seed,
+            max_concurrent=max_concurrent,
+            **generate_kwargs,
+        )
diff --git a/hypogenic/algorithm/summary_information.py b/hypogenic/algorithm/summary_information.py
@@ -60,12 +60,19 @@ def update_info_if_useful(self, current_example, alpha):
     def update_useful_examples(self, example, label):
         self.correct_examples.append((example, label))
 
-    # In the update function, if it got the ith smample wrong, adjust accuracy accordinly
+    # In the update function, if it got the ith sample wrong, adjust accuracy accordinly
     def update_info_if_not_useful(self, current_example, alpha):
         self.acc = (self.acc * self.num_visits) / (self.num_visits + 1)
         self.num_visits += 1
         self.update_reward(alpha, current_example)
 
+    def update_info_continuous(self, current_example, alpha, diff_value,):
+        self.acc = self.acc * self.num_visits
+        self.acc += float(- (diff_value ** 2))
+        self.num_visits += 1
+        self.acc = self.acc / self.num_visits
+        self.update_reward(alpha, current_example)
+
     def __reduce__(self):
         return (self.__class__, (-1, self.acc, self.reward, self.num_visits))
 

diff --git a/hypogenic/algorithm/update/__init__.py b/hypogenic/algorithm/update/__init__.py
@@ -3,5 +3,5 @@
 update_register = Register("update")
 
 from .base import Update
-from .default import DefaultUpdate
+from .default import DefaultUpdate, DefaultUpdateContinuous
 from .sampling import SamplingUpdate