@@ -5,16 +5,18 @@
 import numpy as np

 __all__ = ['get_metrics',
-           'tabulate_metrics']
+           'compute_metrics',
+           'tabulate_metrics',
+           'MetricCollection']


 class RPrecision:
-    def __init__(self, top_k: int) -> None:
+    def __init__(self, top_k: int):
         self.top_k = top_k
         self.score = 0
         self.num_sample = 0

-    def update(self, preds: np.ndarray, target: np.ndarray) -> None:
+    def update(self, preds: np.ndarray, target: np.ndarray):
         assert preds.shape == target.shape  # (batch_size, num_classes)
         top_k_ind = np.argpartition(preds, -self.top_k)[:, -self.top_k:]
         num_relevant = np.take_along_axis(
@@ -28,14 +30,21 @@ def update(self, preds: np.ndarray, target: np.ndarray) -> None:
     def compute(self) -> float:
         return self.score / self.num_sample

+    def reset(self):
+        self.score = 0
+        self.num_sample = 0
+

 class Precision:
-    def __init__(self, num_classes: int, average: str, top_k: int) -> None:
+    def __init__(self, num_classes: int, average: str, top_k: int):
+        if average != 'samples':
+            raise ValueError('unsupported average')
+
         self.top_k = top_k
         self.score = 0
         self.num_sample = 0

-    def update(self, preds: np.ndarray, target: np.ndarray) -> None:
+    def update(self, preds: np.ndarray, target: np.ndarray):
         assert preds.shape == target.shape  # (batch_size, num_classes)
         top_k_ind = np.argpartition(preds, -self.top_k)[:, -self.top_k:]
         num_relevant = np.take_along_axis(target, top_k_ind, -1).sum()
@@ -45,25 +54,28 @@ def update(self, preds: np.ndarray, target: np.ndarray) -> None:
     def compute(self) -> float:
         return self.score / self.num_sample

+    def reset(self):
+        self.score = 0
+        self.num_sample = 0
+

 class F1:
-    def __init__(self, num_classes: int, metric_threshold: float, average: str, multiclass=False) -> None:
+    def __init__(self, num_classes: int, average: str, multiclass=False):
         self.num_classes = num_classes
-        self.metric_threshold = metric_threshold
         if average not in {'macro', 'micro', 'another-macro'}:
             raise ValueError('unsupported average')
         self.average = average
         self.multiclass = multiclass
         self.tp = self.fp = self.fn = 0

-    def update(self, preds: np.ndarray, target: np.ndarray) -> None:
+    def update(self, preds: np.ndarray, target: np.ndarray):
         assert preds.shape == target.shape  # (batch_size, num_classes)
         if self.multiclass:
             max_idx = np.argmax(preds, axis=1).reshape(-1, 1)
             preds = np.zeros(preds.shape)
             np.put_along_axis(preds, max_idx, 1, axis=1)
         else:
-            preds = preds > self.metric_threshold
+            preds = preds > 0
         self.tp += np.logical_and(target == 1, preds == 1).sum(axis=0)
         self.fn += np.logical_and(target == 1, preds == 0).sum(axis=0)
         self.fp += np.logical_and(target == 0, preds == 1).sum(axis=0)
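
With this change, decision values are thresholded at zero instead of at a configurable metric_threshold. A minimal sketch of the F1 class under that convention (made-up arrays; assumes F1 from this module is in scope):

import numpy as np

# Two instances, three classes; decision values > 0 count as positive.
f1 = F1(num_classes=3, average='macro', multiclass=False)
preds = np.array([[0.5, -0.2, 0.1],
                  [-0.3, 0.8, -0.1]])
target = np.array([[1, 0, 0],
                   [0, 1, 1]])
f1.update(preds, target)
print(f1.compute())  # macro-averaged F1 over the three classes
f1.reset()           # clears the accumulated tp/fp/fn counts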
@@ -88,34 +100,58 @@ def compute(self) -> float:
         np.seterr(**prev_settings)
         return score

+    def reset(self):
+        self.tp = self.fp = self.fn = 0
+

 class MetricCollection(dict):
-    def __init__(self, metrics) -> None:
+    """A collection of metrics created by get_metrics.
+    MetricCollection computes metric values in two steps. First, batches of
+    decision values and labels are added with update(). After all instances have been
+    added, compute() computes the metric values from the accumulated batches.
+    """
+
+    def __init__(self, metrics):
         self.metrics = metrics

-    def update(self, preds: np.ndarray, target: np.ndarray) -> None:
+    def update(self, preds: np.ndarray, target: np.ndarray):
+        """Adds a batch of decision values and labels.
+
+        Args:
+            preds (np.ndarray): A matrix of decision values with dimensions number of instances * number of classes.
+            target (np.ndarray): A 0/1 matrix of labels with dimensions number of instances * number of classes.
+        """
         assert preds.shape == target.shape  # (batch_size, num_classes)
         for metric in self.metrics.values():
             metric.update(preds, target)

     def compute(self) -> dict[str, float]:
+        """Computes the metrics from the accumulated batches of decision values and labels.
+
+        Returns:
+            dict[str, float]: A dictionary of metric values.
+        """
         ret = {}
         for name, metric in self.metrics.items():
             ret[name] = metric.compute()
         return ret

+    def reset(self):
+        """Clears the accumulated batches of decision values and labels.
+        """
+        for metric in self.metrics.values():
+            metric.reset()
+

-def get_metrics(metric_threshold: float,
-                monitor_metrics: list[str],
+def get_metrics(monitor_metrics: list[str],
                 num_classes: int,
                 multiclass: bool = False
                 ) -> MetricCollection:
     """Get a collection of metrics by their names.
+    See MetricCollection for more details.

     Args:
-        metric_threshold (float): The decision value threshold over which a
-            label is predicted as positive.
-        monitor_metrics (list[str]): A list metric names.
+        monitor_metrics (list[str]): A list of metric names.
         num_classes (int): The number of classes.
         multiclass (bool, optional): Enable multiclass mode. Defaults to False.

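The two-step interface documented above looks like this in use; a minimal sketch with made-up batches, assuming get_metrics (added below) is in scope:

import numpy as np

# Accumulate batches, then compute; reset() clears state for reuse.
collection = get_metrics(['Macro-F1', 'RP@2'], num_classes=4)
batches = [  # hypothetical (decision values, labels) batches
    (np.array([[0.2, -0.1, 0.7, -0.3]]), np.array([[1, 0, 1, 0]])),
    (np.array([[-0.5, 0.4, -0.2, 0.6]]), np.array([[0, 1, 0, 1]])),
]
for preds, target in batches:
    collection.update(preds, target)
print(collection.compute())  # {'Macro-F1': ..., 'RP@2': ...}
collection.reset()           # start over for the next evaluation
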
@@ -132,19 +168,54 @@ def get_metrics(metric_threshold: float,
         elif re.match('RP@\d+', metric):
             metrics[metric] = RPrecision(top_k=int(metric[3:]))
         elif metric in {'Another-Macro-F1', 'Macro-F1', 'Micro-F1'}:
-            metrics[metric] = F1(num_classes, metric_threshold,
+            metrics[metric] = F1(num_classes,
                                  average=metric[:-3].lower(),
                                  multiclass=multiclass)
         else:
-            raise ValueError(f'Invalid metric: {metric}')
+            raise ValueError(f'invalid metric: {metric}')

     return MetricCollection(metrics)


+def compute_metrics(preds: np.ndarray,
+                    target: np.ndarray,
+                    monitor_metrics: list[str],
+                    multiclass: bool = False
+                    ) -> dict[str, float]:
+    """Compute metrics with decision values and labels.
+    See get_metrics and MetricCollection if decision values and labels are too
+    large to hold in memory.
+
+
+    Args:
+        preds (np.ndarray): A matrix of decision values with dimensions number of instances * number of classes.
+        target (np.ndarray): A 0/1 matrix of labels with dimensions number of instances * number of classes.
+        monitor_metrics (list[str]): A list of metric names.
+        multiclass (bool, optional): Enable multiclass mode. Defaults to False.
+
+    Returns:
+        dict[str, float]: A dictionary of metric values.
+    """
+    assert preds.shape == target.shape
+
+    metric = get_metrics(monitor_metrics, preds.shape[1], multiclass)
+    metric.update(preds, target)
+    return metric.compute()
+
+
 def tabulate_metrics(metric_dict: dict[str, float], split: str) -> str:
+    """Convert a dictionary of metric values into a pretty formatted string for printing.
+
+    Args:
+        metric_dict (dict[str, float]): A dictionary of metric values.
+        split (str): Name of the data split.
+
+    Returns:
+        str: Pretty formatted string.
+    """
     msg = f'====== {split} dataset evaluation result =======\n'
     header = '|'.join([f'{k:^18}' for k in metric_dict.keys()])
-    values = '|'.join([f'{x * 100:^18.4f}' if isinstance(x, (np.floating,
+    values = '|'.join([f'{x:^18.4f}' if isinstance(x, (np.floating,
                        float)) else f'{x:^18}' for x in metric_dict.values()])
     msg += f"|{header}|\n|{'-----------------:|' * len(metric_dict)}\n|{values}|\n"
     return msg
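
End to end, the new one-shot path combines compute_metrics with tabulate_metrics; a minimal sketch with made-up data, assuming both functions are in scope:

import numpy as np

# One-shot evaluation: compute_metrics wraps the get_metrics/update/compute sequence.
preds = np.array([[0.9, -0.2, 0.4, -0.7, 0.1],
                  [-0.3, 0.6, -0.1, 0.8, -0.5]])
target = np.array([[1, 0, 1, 0, 0],
                   [0, 1, 0, 1, 0]])
results = compute_metrics(preds, target, ['Micro-F1', 'Macro-F1', 'RP@1'])
print(tabulate_metrics(results, 'test'))  # formatted table for the 'test' split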