Skip to content

Commit 5055403

Browse files
committed
add alpha / beta parameters for weighting, verbose output, don't save results automatically to file
1 parent 6aed7a1 commit 5055403

File tree

2 files changed

+105
-47
lines changed

2 files changed

+105
-47
lines changed

chebifier/ensemble/base_ensemble.py

Lines changed: 57 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
11
import importlib
2-
import os
32
import time
43
from pathlib import Path
54
from typing import Union
@@ -24,8 +23,9 @@ class BaseEnsemble:
2423
def __init__(
2524
self,
2625
model_configs: Union[str, Path, dict, None] = None,
27-
chebi_version: int = 241,
2826
resolve_inconsistencies: bool = True,
27+
verbose_output: bool = False,
28+
use_confidence: bool = True,
2929
):
3030
# Deferred Import: To avoid circular import error
3131
from chebifier.model_registry import MODEL_TYPES
@@ -48,6 +48,8 @@ def __init__(
4848
model_registry = yaml.safe_load(f)
4949

5050
processed_configs = process_config(config, model_registry)
51+
self.verbose_output = verbose_output
52+
self.use_confidence = use_confidence
5153

5254
self.chebi_graph = load_chebi_graph()
5355
self.disjoint_files = get_disjoint_files()
@@ -92,7 +94,8 @@ def gather_predictions(self, smiles_list):
9294
if logits_for_smiles is not None:
9395
for cls in logits_for_smiles:
9496
predicted_classes.add(cls)
95-
print(f"Sorting predictions from {len(model_predictions)} models...")
97+
if self.verbose_output:
98+
print(f"Sorting predictions from {len(model_predictions)} models...")
9699
predicted_classes = sorted(list(predicted_classes))
97100
predicted_classes_dict = {cls: i for i, cls in enumerate(predicted_classes)}
98101
ordered_logits = (
@@ -114,7 +117,11 @@ def gather_predictions(self, smiles_list):
114117
return ordered_logits, predicted_classes
115118

116119
def consolidate_predictions(
117-
self, predictions, classwise_weights, predicted_classes, **kwargs
120+
self,
121+
predictions,
122+
classwise_weights,
123+
return_intermediate_results=False,
124+
**kwargs,
118125
):
119126
"""
120127
Aggregates predictions from multiple models using weighted majority voting.
@@ -137,7 +144,9 @@ def consolidate_predictions(
137144
predictions < self.positive_prediction_threshold
138145
) & valid_predictions
139146

140-
if "use_confidence" in kwargs and kwargs["use_confidence"]:
147+
# if use_confidence is passed in kwargs, it overrides the ensemble setting
148+
use_confidence = kwargs.get("use_confidence", self.use_confidence)
149+
if use_confidence:
141150
confidence = 2 * torch.abs(
142151
predictions.nan_to_num() - self.positive_prediction_threshold
143152
)
@@ -164,10 +173,27 @@ def consolidate_predictions(
164173

165174
# Determine which classes to include for each SMILES
166175
net_score = positive_sum - negative_sum # Shape: (num_smiles, num_classes)
176+
if return_intermediate_results:
177+
return (
178+
net_score,
179+
has_valid_predictions,
180+
{
181+
"positive_mask": positive_mask,
182+
"negative_mask": negative_mask,
183+
"confidence": confidence,
184+
"positive_sum": positive_sum,
185+
"negative_sum": negative_sum,
186+
},
187+
)
188+
189+
return net_score, has_valid_predictions
167190

191+
def apply_inconsistency_resolution(
192+
self, net_score, class_names, has_valid_predictions
193+
):
194+
# todo - this could be more elegant
168195
# Smooth predictions
169196
start_time = time.perf_counter()
170-
class_names = list(predicted_classes.keys())
171197
if self.smoother is not None:
172198
self.smoother.set_label_names(class_names)
173199
smooth_net_score = self.smoother(net_score)
@@ -179,7 +205,8 @@ def consolidate_predictions(
179205
net_score > 0
180206
) & has_valid_predictions # Shape: (num_smiles, num_classes)
181207
end_time = time.perf_counter()
182-
print(f"Prediction smoothing took {end_time - start_time:.2f} seconds")
208+
if self.verbose_output:
209+
print(f"Prediction smoothing took {end_time - start_time:.2f} seconds")
183210

184211
complete_failure = torch.all(~has_valid_predictions, dim=1)
185212
return class_decisions, complete_failure
@@ -192,38 +219,28 @@ def calculate_classwise_weights(self, predicted_classes):
192219
return positive_weights, negative_weights
193220

194221
def predict_smiles_list(
195-
self, smiles_list, load_preds_if_possible=False, **kwargs
222+
self, smiles_list, return_intermediate_results=False, **kwargs
196223
) -> list:
197-
preds_file = f"predictions_by_model_{'_'.join(model.model_name for model in self.models)}.pt"
198-
predicted_classes_file = f"predicted_classes_{'_'.join(model.model_name for model in self.models)}.txt"
199-
if not load_preds_if_possible or not os.path.isfile(preds_file):
200-
ordered_predictions, predicted_classes = self.gather_predictions(
201-
smiles_list
202-
)
203-
if len(predicted_classes) == 0:
204-
print(
205-
"Warning: No classes have been predicted for the given SMILES list."
224+
ordered_predictions, predicted_classes = self.gather_predictions(smiles_list)
225+
if len(predicted_classes) == 0:
226+
print("Warning: No classes have been predicted for the given SMILES list.")
227+
predicted_classes = {cls: i for i, cls in enumerate(predicted_classes)}
228+
229+
classwise_weights = self.calculate_classwise_weights(predicted_classes)
230+
if return_intermediate_results:
231+
net_score, has_valid_predictions, intermediate_results_dict = (
232+
self.consolidate_predictions(
233+
ordered_predictions,
234+
classwise_weights,
235+
return_intermediate_results=return_intermediate_results,
206236
)
207-
# save predictions
208-
if load_preds_if_possible:
209-
torch.save(ordered_predictions, preds_file)
210-
with open(predicted_classes_file, "w") as f:
211-
for cls in predicted_classes:
212-
f.write(f"{cls}\n")
213-
predicted_classes = {cls: i for i, cls in enumerate(predicted_classes)}
237+
)
214238
else:
215-
print(
216-
f"Loading predictions from {preds_file} and label indexes from {predicted_classes_file}"
239+
net_score, has_valid_predictions = self.consolidate_predictions(
240+
ordered_predictions, classwise_weights
217241
)
218-
ordered_predictions = torch.load(preds_file)
219-
with open(predicted_classes_file, "r") as f:
220-
predicted_classes = {
221-
line.strip(): i for i, line in enumerate(f.readlines())
222-
}
223-
224-
classwise_weights = self.calculate_classwise_weights(predicted_classes)
225-
class_decisions, is_failure = self.consolidate_predictions(
226-
ordered_predictions, classwise_weights, predicted_classes, **kwargs
242+
class_decisions, is_failure = self.apply_inconsistency_resolution(
243+
net_score, list(predicted_classes.keys()), has_valid_predictions
227244
)
228245

229246
class_names = list(predicted_classes.keys())
@@ -239,6 +256,11 @@ def predict_smiles_list(
239256
)
240257
for i, failure in zip(class_decisions, is_failure)
241258
]
259+
if return_intermediate_results:
260+
intermediate_results_dict["predicted_classes"] = predicted_classes
261+
intermediate_results_dict["classwise_weights"] = classwise_weights
262+
intermediate_results_dict["net_score"] = net_score
263+
return result, intermediate_results_dict
242264

243265
return result
244266

chebifier/ensemble/weighted_majority_ensemble.py

Lines changed: 48 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,21 @@
44

55

66
class WMVwithPPVNPVEnsemble(BaseEnsemble):
7+
8+
def __init__(
9+
self, config_path=None, weighting_strength=0.5, weighting_exponent=1.0, **kwargs
10+
):
11+
"""WMV ensemble that weights models based on their class-wise positive / negative predictive values. For each class, the weight is calculated as:
12+
weight = weighting_strength * PPV + (1 - weighting_strength)
13+
where PPV is the class-specific positive predictive value of the model on the validation set
14+
or (if the prediction is negative):
15+
weight = weighting_strength * NPV + (1 - weighting_strength)
16+
where NPV is the class-specific negative predictive value of the model on the validation set.
17+
"""
18+
super().__init__(config_path, **kwargs)
19+
self.weighting_strength = weighting_strength
20+
self.weighting_exponent = weighting_exponent
21+
722
def calculate_classwise_weights(self, predicted_classes):
823
"""
924
Given the positions of predicted classes in the predictions tensor, assign weights to each class. The
@@ -18,21 +33,40 @@ def calculate_classwise_weights(self, predicted_classes):
1833
if model.classwise_weights is None:
1934
continue
2035
for cls, weights in model.classwise_weights.items():
21-
positive_weights[predicted_classes[cls], j] *= weights["PPV"]
22-
negative_weights[predicted_classes[cls], j] *= weights["NPV"]
36+
positive_weights[predicted_classes[cls], j] *= (
37+
weights["PPV"] * self.weighting_strength
38+
+ (1 - self.weighting_strength)
39+
) ** self.weighting_exponent
40+
negative_weights[predicted_classes[cls], j] *= (
41+
weights["NPV"] * self.weighting_strength
42+
+ (1 - self.weighting_strength)
43+
) ** self.weighting_exponent
2344

24-
print(
25-
"Calculated model weightings. The averages for positive / negative weights are:"
26-
)
27-
for i, model in enumerate(self.models):
45+
if self.verbose_output:
2846
print(
29-
f"{model.model_name}: {positive_weights[:, i].mean().item():.3f} / {negative_weights[:, i].mean().item():.3f}"
47+
"Calculated model weightings. The averages for positive / negative weights are:"
3048
)
49+
for i, model in enumerate(self.models):
50+
print(
51+
f"{model.model_name}: {positive_weights[:, i].mean().item():.3f} / {negative_weights[:, i].mean().item():.3f}"
52+
)
3153

3254
return positive_weights, negative_weights
3355

3456

3557
class WMVwithF1Ensemble(BaseEnsemble):
58+
59+
def __init__(
60+
self, config_path=None, weighting_strength=0.5, weighting_exponent=1.0, **kwargs
61+
):
62+
"""WMV ensemble that weights models based on their class-wise F1 scores. For each class, the weight is calculated as:
63+
weight = model_weight * (weighting_strength * F1 + (1 - weighting_strength))
64+
where F1 is the class-specific F1 score ("trust") of the model on the validation set.
65+
"""
66+
super().__init__(config_path, **kwargs)
67+
self.weighting_strength = weighting_strength
68+
self.weighting_exponent = weighting_exponent
69+
3670
def calculate_classwise_weights(self, predicted_classes):
3771
"""
3872
Given the positions of predicted classes in the predictions tensor, assign weights to each class. The
@@ -52,10 +86,12 @@ def calculate_classwise_weights(self, predicted_classes):
5286
* weights["TP"]
5387
/ (2 * weights["TP"] + weights["FP"] + weights["FN"])
5488
)
55-
weights_by_cls[predicted_classes[cls], j] *= 1 + f1
56-
57-
print("Calculated model weightings. The average weights are:")
58-
for i, model in enumerate(self.models):
59-
print(f"{model.model_name}: {weights_by_cls[:, i].mean().item():.3f}")
89+
weights_by_cls[predicted_classes[cls], j] *= (
90+
self.weighting_strength * f1 + 1 - self.weighting_strength
91+
) ** self.weighting_exponent
92+
if self.verbose_output:
93+
print("Calculated model weightings. The average weights are:")
94+
for i, model in enumerate(self.models):
95+
print(f"{model.model_name}: {weights_by_cls[:, i].mean().item():.3f}")
6096

6197
return weights_by_cls, weights_by_cls

0 commit comments

Comments (0)