Primal: reactivate before_solve_mip

2025-12-06 01:18:52 -06:00 · 2021-03-31 12:07:58 -05:00
parent fe7bad885c
commit db2f426140
7 changed files with 133 additions and 102 deletions
--- a/miplearn/benchmark.py
+++ b/miplearn/benchmark.py
@@ -10,7 +10,8 @@ import pandas as pd

 from miplearn.instance import Instance
 from miplearn.solvers.learning import LearningSolver
-from miplearn.types import LearningSolveStats
+
+logger = logging.getLogger(__name__)


 class BenchmarkRunner:
@@ -110,6 +111,7 @@ class BenchmarkRunner:

        """
        for (solver_name, solver) in self.solvers.items():
+            logger.debug(f"Fitting {solver_name}...")
            solver.fit(instances)

    def _silence_miplearn_logger(self) -> None:
--- a/miplearn/classifiers/init.py
+++ b/miplearn/classifiers/init.py
@@ -34,7 +34,11 @@ class Classifier(ABC):
        """
        assert isinstance(x_train, np.ndarray)
        assert isinstance(y_train, np.ndarray)
-        assert x_train.dtype in [np.float16, np.float32, np.float64]
+        assert x_train.dtype in [
+            np.float16,
+            np.float32,
+            np.float64,
+        ], f"x_train.dtype shoule be float. Found {x_train.dtype} instead."
        assert y_train.dtype == np.bool8
        assert len(x_train.shape) == 2
        assert len(y_train.shape) == 2
@@ -67,7 +71,10 @@ class Classifier(ABC):
        assert isinstance(x_test, np.ndarray)
        assert len(x_test.shape) == 2
        (n_samples, n_features_x) = x_test.shape
-        assert n_features_x == self.n_features
+        assert n_features_x == self.n_features, (
+            f"Test and training data have different number of "
+            f"features: {n_features_x} != {self.n_features}"
+        )
        return np.ndarray([])


--- a/miplearn/components/primal.py
+++ b/miplearn/components/primal.py
@@ -24,11 +24,9 @@ from miplearn.classifiers.adaptive import AdaptiveClassifier
 from miplearn.classifiers.threshold import MinPrecisionThreshold, Threshold
 from miplearn.components import classifier_evaluation_dict
 from miplearn.components.component import Component
-from miplearn.extractors import InstanceIterator
 from miplearn.instance import Instance
 from miplearn.types import (
    TrainingSample,
-    VarIndex,
    Solution,
    LearningSolveStats,
    Features,
@@ -70,30 +68,33 @@ class PrimalSolutionComponent(Component):
        self._n_one = 0

    def before_solve_mip(self, solver, instance, model):
-        pass
-        # if len(self.thresholds) > 0:
-        #     logger.info("Predicting primal solution...")
-        #     solution = self.predict(instance)
-        #
-        #     # Collect prediction statistics
-        #     self._n_free = 0
-        #     self._n_zero = 0
-        #     self._n_one = 0
-        #     for (var, var_dict) in solution.items():
-        #         for (idx, value) in var_dict.items():
-        #             if value is None:
-        #                 self._n_free += 1
-        #             else:
-        #                 if value < 0.5:
-        #                     self._n_zero += 1
-        #                 else:
-        #                     self._n_one += 1
-        #
-        #     # Provide solution to the solver
-        #     if self.mode == "heuristic":
-        #         solver.internal_solver.fix(solution)
-        #     else:
-        #         solver.internal_solver.set_warm_start(solution)
+        if len(self.thresholds) > 0:
+            logger.info("Predicting primal solution...")
+            solution = self.predict(instance.features, instance.training_data[-1])
+
+            # Collect prediction statistics
+            self._n_free = 0
+            self._n_zero = 0
+            self._n_one = 0
+            for (var, var_dict) in solution.items():
+                for (idx, value) in var_dict.items():
+                    if value is None:
+                        self._n_free += 1
+                    else:
+                        if value < 0.5:
+                            self._n_zero += 1
+                        else:
+                            self._n_one += 1
+            logger.info(
+                f"Predicted: {self._n_free} free, {self._n_zero} fix-zero, "
+                f"{self._n_one} fix-one"
+            )
+
+            # Provide solution to the solver
+            if self.mode == "heuristic":
+                solver.internal_solver.fix(solution)
+            else:
+                solver.internal_solver.set_warm_start(solution)

    def after_solve_mip(
        self,
@@ -120,27 +121,29 @@ class PrimalSolutionComponent(Component):
            self.classifiers[category] = clf
            self.thresholds[category] = thr

-    def predict(self, instance: Instance) -> Solution:
-        assert len(instance.training_data) > 0
-        sample = instance.training_data[-1]
-
+    def predict(
+        self,
+        features: Features,
+        sample: TrainingSample,
+    ) -> Solution:
        # Initialize empty solution
        solution: Solution = {}
-        for (var_name, var_dict) in instance.features["Variables"].items():
+        for (var_name, var_dict) in features["Variables"].items():
            solution[var_name] = {}
            for idx in var_dict.keys():
                solution[var_name][idx] = None

        # Compute y_pred
-        x = self.x_sample(instance.features, sample)
+        x = self.x_sample(features, sample)
        y_pred = {}
        for category in x.keys():
            assert category in self.classifiers, (
                f"Classifier for category {category} has not been trained. "
                f"Please call component.fit before component.predict."
            )
-            proba = self.classifiers[category].predict_proba(x[category])
-            thr = self.thresholds[category].predict(x[category])
+            xc = np.array(x[category])
+            proba = self.classifiers[category].predict_proba(xc)
+            thr = self.thresholds[category].predict(xc)
            y_pred[category] = np.vstack(
                [
                    proba[:, 0] > thr[0],
@@ -150,7 +153,7 @@ class PrimalSolutionComponent(Component):

        # Convert y_pred into solution
        category_offset: Dict[Hashable, int] = {cat: 0 for cat in x.keys()}
-        for (var_name, var_dict) in instance.features["Variables"].items():
+        for (var_name, var_dict) in features["Variables"].items():
            for (idx, var_features) in var_dict.items():
                category = var_features["Category"]
                offset = category_offset[category]
@@ -250,8 +253,9 @@ class PrimalSolutionComponent(Component):
                if category not in x.keys():
                    x[category] = []
                    y[category] = []
-                f = var_features["User features"]
-                assert f is not None
+                f: List[float] = []
+                assert var_features["User features"] is not None
+                f += var_features["User features"]
                if "LP solution" in sample and sample["LP solution"] is not None:
                    lp_value = sample["LP solution"][var_name][idx]
                    if lp_value is not None:
--- a/miplearn/problems/tsp.py
+++ b/miplearn/problems/tsp.py
@@ -157,10 +157,10 @@ class TravelingSalesmanInstance(Instance):
        return model

    def get_instance_features(self):
-        return [1]
+        return [0.0]

    def get_variable_features(self, var_name, index):
-        return [1]
+        return [0.0]

    def get_variable_category(self, var_name, index):
        return index
--- a/miplearn/solvers/learning.py
+++ b/miplearn/solvers/learning.py
@@ -373,25 +373,28 @@ class LearningSolver:
            The list is the same you would obtain by calling
            `[solver.solve(p) for p in instances]`
        """
-        self.internal_solver = None
-        self._silence_miplearn_logger()
-        _GLOBAL[0].solver = self
-        _GLOBAL[0].output_filenames = output_filenames
-        _GLOBAL[0].instances = instances
-        _GLOBAL[0].discard_outputs = discard_outputs
-        results = p_map(
-            _parallel_solve,
-            list(range(len(instances))),
-            num_cpus=n_jobs,
-            desc=label,
-        )
-        results = [r for r in results if r[0]]
-        stats = []
-        for (idx, (s, instance)) in enumerate(results):
-            stats.append(s)
-            instances[idx] = instance
-        self._restore_miplearn_logger()
-        return stats
+        if n_jobs == 1:
+            return [self.solve(p) for p in instances]
+        else:
+            self.internal_solver = None
+            self._silence_miplearn_logger()
+            _GLOBAL[0].solver = self
+            _GLOBAL[0].output_filenames = output_filenames
+            _GLOBAL[0].instances = instances
+            _GLOBAL[0].discard_outputs = discard_outputs
+            results = p_map(
+                _parallel_solve,
+                list(range(len(instances))),
+                num_cpus=n_jobs,
+                desc=label,
+            )
+            results = [r for r in results if r[0]]
+            stats = []
+            for (idx, (s, instance)) in enumerate(results):
+                stats.append(s)
+                instances[idx] = instance
+            self._restore_miplearn_logger()
+            return stats

    def fit(self, training_instances: Union[List[str], List[Instance]]) -> None:
        if len(training_instances) == 0: