MIPLearn/miplearn/components/primal.py

#  MIPLearn: Extensible Framework for Learning-Enhanced Mixed-Integer Optimization
#  Copyright (C) 2020-2021, UChicago Argonne, LLC. All rights reserved.
#  Released under the modified BSD license. See COPYING.md for more details.

import logging
from typing import Dict, List, Any, TYPE_CHECKING, Tuple, Optional

import numpy as np
from overrides import overrides

from miplearn.classifiers import Classifier
from miplearn.classifiers.adaptive import AdaptiveClassifier
from miplearn.classifiers.threshold import MinPrecisionThreshold, Threshold
from miplearn.components import classifier_evaluation_dict
from miplearn.components.component import Component
from miplearn.features.sample import Sample
from miplearn.instance.base import Instance
from miplearn.types import (
    LearningSolveStats,
    Category,
    Solution,
)
from miplearn.features.sample import Hdf5Sample
from p_tqdm import p_map
from tqdm.auto import tqdm

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# LearningSolver is imported only while type checking. In the code visible
# here it is referenced solely through a string annotation, so no runtime
# import is required.
if TYPE_CHECKING:
    from miplearn.solvers.learning import LearningSolver


class PrimalSolutionComponent(Component):
    """
    A component that predicts the optimal primal values for the binary decision
    variables.

    In exact mode, predicted primal solutions are provided to the solver as MIP
    starts. In heuristic mode, this component fixes the decision variables to their
    predicted values.
    """

    def __init__(
        self,
        classifier: Classifier = AdaptiveClassifier(),
        mode: str = "exact",
        threshold: Threshold = MinPrecisionThreshold([0.99, 0.99]),
    ) -> None:
        """
        Create an untrained component.

        Parameters
        ----------
        classifier
            Prototype classifier. It is stored unchanged; fitting works on
            clones of it, one per category.
        mode
            Either "exact" or "heuristic".
        threshold
            Prototype threshold. It is stored unchanged; fitting works on
            clones of it, one per category.

        Note that the default prototypes are created once, when the function
        is defined, and are therefore shared by every component that relies on
        the defaults.
        """
        # Validate the arguments before storing anything.
        assert isinstance(classifier, Classifier)
        assert isinstance(threshold, Threshold)
        assert mode in ("exact", "heuristic")

        # Prototypes from which the per-category models are cloned.
        self.classifier_prototype = classifier
        self.threshold_prototype = threshold
        self.mode = mode

        # Fitted models, keyed by variable category. Empty until fitted.
        self.classifiers: Dict[Category, Classifier] = {}
        self.thresholds: Dict[Category, Threshold] = {}

    @overrides
    def before_solve_mip(
        self,
        solver: "LearningSolver",
        instance: Instance,
        model: Any,
        stats: LearningSolveStats,
        sample: Sample,
    ) -> None:
        """
        Predict a primal solution for the sample and pass it to the solver.

        If no classifier has been fitted, only a log message is emitted.
        Otherwise the predicted solution is given to the internal solver,
        through `fix` in heuristic mode and through `set_warm_start` in any
        other mode. The number of variables predicted as free (no prediction),
        zero and one is written to `stats`.
        """
        logger.info("Predicting primal solution...")

        # Nothing to predict with until the component has been fitted.
        if not self.classifiers:
            logger.info("Classifiers not fitted. Skipping.")
            return

        # Predict the solution and provide it to the solver.
        solution = self.sample_predict(sample)
        assert solver.internal_solver is not None
        if self.mode == "heuristic":
            solver.internal_solver.fix(solution)
        else:
            solver.internal_solver.set_warm_start(solution)

        # Count how many variables fall into each prediction bucket.
        stats["Primal: Free"] = stats["Primal: Zero"] = stats["Primal: One"] = 0
        for value in solution.values():
            if value is None:
                stats["Primal: Free"] += 1
            elif value < 0.5:
                stats["Primal: Zero"] += 1
            else:
                stats["Primal: One"] += 1
        logger.info(
            f"Predicted: free: {stats['Primal: Free']}, "
            f"zero: {stats['Primal: Zero']}, "
            f"one: {stats['Primal: One']}"
        )

    def sample_predict(self, sample: Sample) -> Solution:
        var_names = sample.get_array("static_var_names")
        var_categories = sample.get_array("static_var_categories")
        var_types = sample.get_array("static_var_types")
        assert var_names is not None
        assert var_categories is not None
        assert var_types is not None

        # Compute y_pred
        x, _ = self.sample_xy(None, sample)
        y_pred = {}
        for category in x.keys():
            assert category in self.classifiers, (
                f"Classifier for category {category} has not been trained. "
                f"Please call component.fit before component.predict."
            )
            xc = np.array(x[category])
            proba = self.classifiers[category].predict_proba(xc)
            thr = self.thresholds[category].predict(xc)
            y_pred[category] = np.vstack(
                [
                    proba[:, 0] >= thr[0],
                    proba[:, 1] >= thr[1],
                ]
            ).T

        # Convert y_pred into solution
        solution: Solution = {v: None for v in var_names}
        category_offset: Dict[Category, int] = {cat: 0 for cat in x.keys()}
        for (i, var_name) in enumerate(var_names):
            if var_types[i] != b"B":
                continue
            category = var_categories[i]
            if category not in category_offset:
                continue
            offset = category_offset[category]
            category_offset[category] += 1
            if y_pred[category][offset, 0]:
                solution[var_name] = 0.0
            if y_pred[category][offset, 1]:
                solution[var_name] = 1.0

        return solution

    @overrides
    def sample_xy(
        self,
        _: Optional[Instance],
        sample: Sample,
    ) -> Tuple[Dict[Category, List[List[float]]], Dict[Category, List[List[float]]]]:
        x: Dict = {}
        y: Dict = {}
        instance_features = sample.get_array("static_instance_features")
        mip_var_values = sample.get_array("mip_var_values")
        lp_var_values = sample.get_array("lp_var_values")
        var_features = sample.get_array("lp_var_features")
        var_names = sample.get_array("static_var_names")
        var_types = sample.get_array("static_var_types")
        var_categories = sample.get_array("static_var_categories")
        if var_features is None:
            var_features = sample.get_array("static_var_features")
        assert instance_features is not None
        assert var_features is not None
        assert var_names is not None
        assert var_types is not None
        assert var_categories is not None

        for (i, var_name) in enumerate(var_names):
            # Skip non-binary variables
            if var_types[i] != b"B":
                continue

            # Initialize categories
            category = var_categories[i]
            if len(category) == 0:
                continue
            if category not in x.keys():
                x[category] = []
                y[category] = []

            # Features
            features = list(instance_features)
            features.extend(var_features[i])
            if lp_var_values is not None:
                features.extend(lp_var_values)
            x[category].append(features)

            # Labels
            if mip_var_values is not None:
                opt_value = mip_var_values[i]
                assert opt_value is not None
                y[category].append([opt_value < 0.5, opt_value >= 0.5])
        return x, y

    @overrides
    def sample_evaluate(
        self,
        _: Optional[Instance],
        sample: Sample,
    ) -> Dict[str, Dict[str, float]]:
        """
        Compare the predicted solution of a sample against its stored MIP
        solution.

        Returns a dictionary with two entries, "0" and "1", each built by
        `classifier_evaluation_dict` from the true/false positive/negative
        counts of the corresponding prediction. A variable counts as a
        positive for "1" when its predicted value is above 0.5 and as a
        positive for "0" when it has any other non-None predicted value.
        Variables without a prediction are negatives for both.
        """
        mip_var_values = sample.get_array("mip_var_values")
        var_names = sample.get_array("static_var_names")
        assert mip_var_values is not None
        assert var_names is not None

        actual = {name: mip_var_values[i] for (i, name) in enumerate(var_names)}
        predicted = self.sample_predict(sample)

        # Partition the variables by their actual value.
        vars_all = set(actual)
        actual_one = {name for (name, value) in actual.items() if value > 0.5}
        actual_zero = vars_all - actual_one

        # Partition the variables that received a prediction.
        decided = {
            name: predicted[name] for name in actual if predicted[name] is not None
        }
        pred_one = {name for (name, value) in decided.items() if value > 0.5}
        pred_zero = set(decided) - pred_one

        def confusion(pred_positive, actual_positive, actual_negative):
            # Everything not predicted positive is a predicted negative.
            pred_negative = vars_all - pred_positive
            return classifier_evaluation_dict(
                tp=len(pred_positive & actual_positive),
                tn=len(pred_negative & actual_negative),
                fp=len(pred_positive & actual_negative),
                fn=len(pred_negative & actual_positive),
            )

        return {
            "0": confusion(pred_zero, actual_zero, actual_one),
            "1": confusion(pred_one, actual_one, actual_zero),
        }

    @overrides
    def fit_xy(
        self,
        x: Dict[Category, np.ndarray],
        y: Dict[Category, np.ndarray],
        progress: bool = False,
    ) -> None:
        """
        Fit one classifier and one threshold per category.

        For every category in `x`, fresh clones of the classifier and
        threshold prototypes are fitted on that category's features and
        labels, and then stored in `self.classifiers` and `self.thresholds`,
        replacing any previous entry for the category.
        """
        categories = tqdm(x.keys(), desc="fit", disable=not progress)
        for category in categories:
            classifier = self.classifier_prototype.clone()
            threshold = self.threshold_prototype.clone()
            features, labels = x[category], y[category]
            classifier.fit(features, labels)
            # The threshold is fitted against the already-trained classifier.
            threshold.fit(classifier, features, labels)
            self.classifiers[category] = classifier
            self.thresholds[category] = threshold

    # ------------------------------------------------------------------------------------------------------------------
    # NEW API
    # ------------------------------------------------------------------------------------------------------------------

    def fit(
        self,
        x: Dict[Category, np.ndarray],
        y: Dict[Category, np.ndarray],
        progress: bool = False,
    ) -> None:
        """
        Train the component, one category at a time.

        Each category found in `x` gets its own clone of the classifier
        prototype and of the threshold prototype. Both are fitted on
        `x[category]` and `y[category]` and stored under that category. A
        progress bar is shown when `progress` is true.
        """
        for category in tqdm(x.keys(), desc="fit", disable=not progress):
            clf_clone = self.classifier_prototype.clone()
            thr_clone = self.threshold_prototype.clone()
            x_cat = x[category]
            y_cat = y[category]
            clf_clone.fit(x_cat, y_cat)
            # The threshold needs the trained classifier to be fitted.
            thr_clone.fit(clf_clone, x_cat, y_cat)
            self.classifiers[category] = clf_clone
            self.thresholds[category] = thr_clone

    def predict(self, x):
        y_pred = {}
        for category in x.keys():
            assert category in self.classifiers, (
                f"Classifier for category {category} has not been trained. "
                f"Please call component.fit before component.predict."
            )
            xc = np.array(x[category])
            proba = self.classifiers[category].predict_proba(xc)
            thr = self.thresholds[category].predict(xc)
            y_pred[category] = np.vstack(
                [
                    proba[:, 0] >= thr[0],
                    proba[:, 1] >= thr[1],
                ]
            ).T
        return y_pred

    @staticmethod
    def extract(
        filenames: List[str],
        progress: bool = False,
    ):
        """
        Read training data from HDF5 sample files and group it by category.

        For every file, the arrays "lp_var_features", "mip_var_values",
        "static_var_types" and "static_var_categories" are read; all four
        must be present. Each variable contributes one feature row (its row of
        "lp_var_features") and one label row `[value < 0.5, value >= 0.5]`.

        Parameters
        ----------
        filenames
            Paths of the sample files to read.
        progress
            If true, show progress bars while reading and while grouping.

        Returns
        -------
        A pair `(x_dict, y_dict)` mapping each category to a 2D array of
        feature rows and a 2D boolean array of label rows, respectively. Both
        dictionaries are empty if no variables were read.
        """
        features_per_file, labels_per_file, categories = [], [], []

        # Read data
        for filename in tqdm(
            filenames,
            desc="extract (1/2)",
            disable=not progress,
        ):
            with Hdf5Sample(filename, mode="r") as sample:
                mip_var_values = sample.get_array("mip_var_values")
                var_features = sample.get_array("lp_var_features")
                var_types = sample.get_array("static_var_types")
                var_categories = sample.get_array("static_var_categories")
                assert mip_var_values is not None
                assert var_features is not None
                # NOTE(review): var_types is only checked for presence here;
                # non-binary variables and variables with an empty category
                # are not filtered out -- confirm whether that is intended.
                assert var_types is not None
                assert var_categories is not None
                features_per_file.append(var_features)
                # One label row per variable: [is zero, is one].
                # Assumes mip_var_values is one-dimensional -- TODO confirm.
                labels_per_file.append(
                    np.column_stack(
                        [
                            mip_var_values < 0.5,
                            mip_var_values >= 0.5,
                        ]
                    )
                )
                categories.extend(var_categories)

        # Nothing was read (no files, or files without variables); there is
        # nothing to stack or split.
        if not categories:
            return {}, {}

        # Convert to numpy arrays
        x = np.vstack(features_per_file)
        y = np.vstack(labels_per_file)
        cat = np.array(categories)

        # Sort data by categories; a stable sort keeps the original relative
        # order of the rows within each category.
        pi = np.argsort(cat, kind="stable")
        x = x[pi]
        y = y[pi]
        cat = cat[pi]

        # Split categories: rows of one category are now contiguous, so each
        # category is the slice between two consecutive change points.
        x_dict = {}
        y_dict = {}
        start = 0
        for end in tqdm(
            range(len(cat) + 1),
            desc="extract (2/2)",
            disable=not progress,
        ):
            if (end >= len(cat)) or (cat[start] != cat[end]):
                x_dict[cat[start]] = x[start:end, :]
                y_dict[cat[start]] = y[start:end, :]
                start = end

        return x_dict, y_dict