clarena.metrics.cl_loss API documentation

CLLoss( save_dir: str, test_loss_cls_csv_name: str = 'loss_cls.csv', test_loss_cls_matrix_plot_name: str | None = None, test_ave_loss_cls_plot_name: str | None = None) View Source

45    def __init__(
46        self,
47        save_dir: str,
48        test_loss_cls_csv_name: str = "loss_cls.csv",
49        test_loss_cls_matrix_plot_name: str | None = None,
50        test_ave_loss_cls_plot_name: str | None = None,
51    ) -> None:
52        r"""
53        **Args:**
54        - **save_dir** (`str`): The directory where data and figures of metrics will be saved. Better inside the output folder.
55        - **test_loss_cls_csv_name** (`str`): file name to save classification loss matrix and average classification loss as a CSV file.
56        - **test_loss_cls_matrix_plot_name** (`str` | `None`): file name to save classification loss matrix plot. If `None`, no file will be saved.
57        - **test_ave_loss_cls_plot_name** (`str` | `None`): file name to save average classification loss as curve plot over different training tasks. If `None`, no file will be saved.
58        """
59        super().__init__(save_dir=save_dir)
60
61        self.test_loss_cls_csv_path: str = os.path.join(
62            save_dir, test_loss_cls_csv_name
63        )
64        r"""The path to save test classification loss matrix and average classification loss CSV file."""
65        if test_loss_cls_matrix_plot_name:
66            self.test_loss_cls_matrix_plot_path: str = os.path.join(
67                save_dir, test_loss_cls_matrix_plot_name
68            )
69            r"""The path to save test classification loss matrix plot."""
70        if test_ave_loss_cls_plot_name:
71            self.test_ave_loss_cls_plot_path: str = os.path.join(
72                save_dir, test_ave_loss_cls_plot_name
73            )
74            r"""The path to save test average classification loss curve plot."""
75
76        # training accumulated metrics
77        self.loss_cls_training_epoch: MeanMetricBatch
78        r"""Classification loss of training epoch. Accumulated and calculated from the training batches. See [here](https://pengxiang-wang.com/posts/continual-learning-metrics.html#sec-performance-of-training-epoch) for details. """
79        self.loss_training_epoch: MeanMetricBatch
80        r"""Total loss of training epoch. Accumulated and calculated from the training batches. See [here](https://pengxiang-wang.com/posts/continual-learning-metrics.html#sec-performance-of-training-epoch) for details. """
81
82        # validation accumulated metrics
83        self.loss_cls_val: MeanMetricBatch
84        r"""Validation classification loss of the model after training epoch. Accumulated and calculated from the validation batches. See [here](https://pengxiang-wang.com/posts/continual-learning-metrics.html#sec-validation-performace) for details. """
85
86        # test accumulated metrics
87        self.loss_cls_test: dict[int, MeanMetricBatch]
88        r"""Test classification loss of the current model (`self.task_id`) on current and previous tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics. It is the last row of the lower triangular matrix. See [here](https://pengxiang-wang.com/posts/continual-learning-metrics.html#sec-test-performance-of-previous-tasks) for details. """
89
90        # task ID control
91        self.task_id: int
92        r"""Task ID counter indicating which task is being processed. Self updated during the task loop. Valid from 1 to `cl_dataset.num_tasks`."""

Args:

save_dir (str): The directory where data and figures of metrics will be saved. Better inside the output folder.
test_loss_cls_csv_name (str): file name to save classification loss matrix and average classification loss as a CSV file.
test_loss_cls_matrix_plot_name (str | None): file name to save classification loss matrix plot. If None, no file will be saved.
test_ave_loss_cls_plot_name (str | None): file name to save average classification loss as curve plot over different training tasks. If None, no file will be saved.

test_loss_cls_csv_path: str

The path to save test classification loss matrix and average classification loss CSV file.

loss_cls_training_epoch: clarena.utils.metrics.MeanMetricBatch

Classification loss of training epoch. Accumulated and calculated from the training batches. See here for details.

loss_training_epoch: clarena.utils.metrics.MeanMetricBatch

Total loss of training epoch. Accumulated and calculated from the training batches. See here for details.

loss_cls_val: clarena.utils.metrics.MeanMetricBatch

Validation classification loss of the model after training epoch. Accumulated and calculated from the validation batches. See here for details.

loss_cls_test: dict[int, clarena.utils.metrics.MeanMetricBatch]

Test classification loss of the current model (self.task_id) on current and previous tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics. It is the last row of the lower triangular matrix. See here for details.

task_id: int

Task ID counter indicating which task is being processed. Self updated during the task loop. Valid from 1 to cl_dataset.num_tasks.

@rank_zero_only

def on_fit_start( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm) -> None: View Source

 94    @rank_zero_only
 95    def on_fit_start(self, trainer: Trainer, pl_module: CLAlgorithm) -> None:
 96        r"""Initialize training and validation metrics."""
 97
 98        # set the current task_id from the `CLAlgorithm` object
 99        self.task_id = pl_module.task_id
100
101        # get the device to put the metrics on the same device
102        device = pl_module.device
103
104        # initialize training metrics
105        self.loss_cls_training_epoch = MeanMetricBatch().to(device)
106        self.loss_training_epoch = MeanMetricBatch().to(device)
107
108        # initialize validation metrics
109        self.loss_cls_val = MeanMetricBatch().to(device)

Initialize training and validation metrics.

@rank_zero_only

def on_train_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int) -> None: View Source

111    @rank_zero_only
112    def on_train_batch_end(
113        self,
114        trainer: Trainer,
115        pl_module: CLAlgorithm,
116        outputs: dict[str, Any],
117        batch: Any,
118        batch_idx: int,
119    ) -> None:
120        r"""Record training metrics from training batch, log metrics of training batch and accumulated metrics of the epoch to Lightning loggers.
121
122        **Args:**
123        - **outputs** (`dict[str, Any]`): the outputs of the training step, the returns of the `training_step()` method in the `CLAlgorithm`.
124        - **batch** (`Any`): the training data batch.
125        """
126        # get the batch size
127        batch_size = len(batch)
128
129        # get training metrics values of current training batch from the outputs of the `training_step()`
130        loss_cls_batch = outputs["loss_cls"]
131        loss_batch = outputs["loss"]
132
133        # update accumulated training metrics to calculate training metrics of the epoch
134        self.loss_cls_training_epoch.update(loss_cls_batch, batch_size)
135        self.loss_training_epoch.update(loss_batch, batch_size)
136
137        # log training metrics of current training batch to Lightning loggers
138        pl_module.log(
139            f"task_{self.task_id}/train/loss_cls_batch", loss_cls_batch, prog_bar=True
140        )
141        pl_module.log(
142            f"task_{self.task_id}/train/loss_batch", loss_batch, prog_bar=True
143        )
144
145        # log accumulated training metrics till this training batch to Lightning loggers
146        pl_module.log(
147            f"task_{self.task_id}/train/loss_cls",
148            self.loss_cls_training_epoch.compute(),
149            prog_bar=True,
150        )
151        pl_module.log(
152            f"task_{self.task_id}/train/loss",
153            self.loss_training_epoch.compute(),
154            prog_bar=True,
155        )

Record training metrics from training batch, log metrics of training batch and accumulated metrics of the epoch to Lightning loggers.

Args:

outputs (dict[str, Any]): the outputs of the training step, the returns of the training_step() method in the CLAlgorithm.
batch (Any): the training data batch.

@rank_zero_only

def on_train_epoch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm) -> None: View Source

157    @rank_zero_only
158    def on_train_epoch_end(
159        self,
160        trainer: Trainer,
161        pl_module: CLAlgorithm,
162    ) -> None:
163        r"""Log metrics of training epoch to plot learning curves and reset the metrics accumulation at the end of training epoch."""
164
165        # log the accumulated and computed metrics of the epoch to Lightning loggers, specially for plotting learning curves
166        pl_module.log(
167            f"task_{self.task_id}/learning_curve/train/loss_cls",
168            self.loss_cls_training_epoch.compute(),
169            on_epoch=True,
170            prog_bar=True,
171        )
172
173        # reset the metrics of training epoch as there are more epochs to go and not only one epoch like in the validation and test
174        self.loss_cls_training_epoch.reset()
175        self.loss_training_epoch.reset()

Log metrics of training epoch to plot learning curves and reset the metrics accumulation at the end of training epoch.

@rank_zero_only

def on_validation_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int) -> None: View Source

177    @rank_zero_only
178    def on_validation_batch_end(
179        self,
180        trainer: Trainer,
181        pl_module: CLAlgorithm,
182        outputs: dict[str, Any],
183        batch: Any,
184        batch_idx: int,
185    ) -> None:
186        r"""Accumulating metrics from validation batch. We don't need to log and monitor the metrics of validation batches.
187
188        **Args:**
189        - **outputs** (`dict[str, Any]`): the outputs of the validation step, which is the returns of the `validation_step()` method in the `CLAlgorithm`.
190        - **batch** (`Any`): the validation data batch.
191        """
192
193        # get the batch size
194        batch_size = len(batch)
195
196        # get the metrics values of the batch from the outputs
197        loss_cls_batch = outputs["loss_cls"]
198
199        # update the accumulated metrics in order to calculate the validation metrics
200        self.loss_cls_val.update(loss_cls_batch, batch_size)

Accumulating metrics from validation batch. We don't need to log and monitor the metrics of validation batches.

Args:

outputs (dict[str, Any]): the outputs of the validation step, which is the returns of the validation_step() method in the CLAlgorithm.
batch (Any): the validation data batch.

@rank_zero_only

def on_validation_epoch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm) -> None: View Source

202    @rank_zero_only
203    def on_validation_epoch_end(
204        self,
205        trainer: Trainer,
206        pl_module: CLAlgorithm,
207    ) -> None:
208        r"""Log validation metrics to plot learning curves."""
209
210        # log the accumulated and computed metrics of the epoch to Lightning loggers, specially for plotting learning curves
211        pl_module.log(
212            f"task_{self.task_id}/learning_curve/val/loss_cls",
213            self.loss_cls_val.compute(),
214            on_epoch=True,
215            prog_bar=True,
216        )

Log validation metrics to plot learning curves.

@rank_zero_only

def on_test_start( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm) -> None: View Source

218    @rank_zero_only
219    def on_test_start(
220        self,
221        trainer: Trainer,
222        pl_module: CLAlgorithm,
223    ) -> None:
224        r"""Initialize the metrics for testing each seen task in the beginning of a task's testing."""
225
226        # set the current task_id again (double checking) from the `CLAlgorithm` object
227        self.task_id = pl_module.task_id
228
229        # get the device to put the metrics on the same device
230        device = pl_module.device
231
232        # initialize test metrics for current and previous tasks
233        self.loss_cls_test = {
234            task_id: MeanMetricBatch().to(device)
235            for task_id in pl_module.processed_task_ids
236        }

Initialize the metrics for testing each seen task in the beginning of a task's testing.

@rank_zero_only

def on_test_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int, dataloader_idx: int = 0) -> None: View Source

238    @rank_zero_only
239    def on_test_batch_end(
240        self,
241        trainer: Trainer,
242        pl_module: CLAlgorithm,
243        outputs: dict[str, Any],
244        batch: Any,
245        batch_idx: int,
246        dataloader_idx: int = 0,
247    ) -> None:
248        r"""Accumulating metrics from test batch. We don't need to log and monitor the metrics of test batches.
249
250        **Args:**
251        - **outputs** (`dict[str, Any]`): the outputs of the test step, which is the returns of the `test_step()` method in the `CLAlgorithm`.
252        - **batch** (`Any`): the test data batch.
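253        - **dataloader_idx** (`int`): the index of the test dataloader, which is mapped to the ID of the seen task being tested by `pl_module.get_test_task_id_from_dataloader_idx()`. A default value of 0 is given; otherwise the LightningModule will raise a `RuntimeError`.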
254        """
255
256        # get the batch size
257        batch_size = len(batch)
258
259        test_task_id = pl_module.get_test_task_id_from_dataloader_idx(dataloader_idx)
260
261        # get the metrics values of the batch from the outputs
262        loss_cls_batch = outputs["loss_cls"]
263
264        # update the accumulated metrics in order to calculate the metrics of the epoch
265        self.loss_cls_test[test_task_id].update(loss_cls_batch, batch_size)

Accumulating metrics from test batch. We don't need to log and monitor the metrics of test batches.

Args:

outputs (dict[str, Any]): the outputs of the test step, which is the returns of the test_step() method in the CLAlgorithm.
batch (Any): the test data batch.
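dataloader_idx (int): the index of the test dataloader, which is mapped to the ID of the seen task being tested by pl_module.get_test_task_id_from_dataloader_idx(). A default value of 0 is given; otherwise the LightningModule will raise a RuntimeError.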

@rank_zero_only

def on_test_epoch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.cl_algorithms.CLAlgorithm) -> None: View Source

267    @rank_zero_only
268    def on_test_epoch_end(
269        self,
270        trainer: Trainer,
271        pl_module: CLAlgorithm,
272    ) -> None:
273        r"""Save and plot test metrics at the end of test."""
274
275        # save (update) the test metrics to CSV files
276        self.update_test_loss_cls_to_csv(
277            after_training_task_id=self.task_id,
278            csv_path=self.test_loss_cls_csv_path,
279        )
280
281        # plot the test metrics
282        if hasattr(self, "test_loss_cls_matrix_plot_path"):
283            self.plot_test_loss_cls_matrix_from_csv(
284                csv_path=self.test_loss_cls_csv_path,
285                plot_path=self.test_loss_cls_matrix_plot_path,
286            )
287        if hasattr(self, "test_ave_loss_cls_plot_path"):
288            self.plot_test_ave_loss_cls_curve_from_csv(
289                csv_path=self.test_loss_cls_csv_path,
290                plot_path=self.test_ave_loss_cls_plot_path,
291            )

Save and plot test metrics at the end of test.

def update_test_loss_cls_to_csv(self, after_training_task_id: int, csv_path: str) -> None: View Source

293    def update_test_loss_cls_to_csv(
294        self,
295        after_training_task_id: int,
296        csv_path: str,
297    ) -> None:
298        """Append the test classification loss metrics of seen tasks as the last line of an existing CSV file. A new file will be created if it does not exist.
299
300        **Args:**
301        - **after_training_task_id** (`int`): the task ID after training.
302        - **csv_path** (`str`): the path of the CSV file to save the test metrics to. E.g. './outputs/expr_name/1970-01-01_00-00-00/results/loss_cls.csv'.
303        """
304        processed_task_ids = list(self.loss_cls_test.keys())
305        fieldnames = ["after_training_task", "average_classification_loss"] + [
306            f"test_on_task_{task_id}" for task_id in processed_task_ids
307        ]
308
309        new_line = {
310            "after_training_task": after_training_task_id
311        }  # construct the first column
312
313        # write to the columns and calculate the average classification loss over tasks at the same time
314        average_classification_loss_over_tasks = MeanMetric().to(
315            device=next(iter(self.loss_cls_test.values())).device
316        )
317        for task_id in processed_task_ids:
318            loss_cls = self.loss_cls_test[task_id].compute().item()
319            new_line[f"test_on_task_{task_id}"] = loss_cls
320            average_classification_loss_over_tasks(loss_cls)
321        new_line["average_classification_loss"] = (
322            average_classification_loss_over_tasks.compute().item()
323        )
324
325        # write to the csv file
326        is_first = not os.path.exists(csv_path)
327        if not is_first:
328            with open(csv_path, "r", encoding="utf-8") as file:
329                lines = file.readlines()
330                del lines[0]
331        # write header
332        with open(csv_path, "w", encoding="utf-8") as file:
333            writer = csv.DictWriter(file, fieldnames=fieldnames)
334            writer.writeheader()
335        # write metrics
336        with open(csv_path, "a", encoding="utf-8") as file:
337            if not is_first:
338                file.writelines(lines)  # write the previous lines
339            writer = csv.DictWriter(file, fieldnames=fieldnames)
340            writer.writerow(new_line)

Append the test classification loss metrics of seen tasks as the last line of an existing CSV file. A new file will be created if it does not exist.

Args:

after_training_task_id (int): the task ID after training.
csv_path (str): the path of the CSV file to save the test metrics to. E.g. './outputs/expr_name/1970-01-01_00-00-00/results/loss_cls.csv'.

def plot_test_loss_cls_matrix_from_csv(self, csv_path: str, plot_path: str) -> None: View Source

342    def plot_test_loss_cls_matrix_from_csv(self, csv_path: str, plot_path: str) -> None:
343        """Plot the test classification loss matrix from saved CSV file and save the plot to the designated directory.
344
345        **Args:**
346        - **csv_path** (`str`): the path to the CSV file where `update_test_loss_cls_to_csv()` saved the test classification loss metric.
347        - **plot_path** (`str`): the path to save plot. Better same as the output directory of the experiment. E.g. './outputs/expr_name/1970-01-01_00-00-00/loss_cls_matrix.png'.
348        """
349        data = pd.read_csv(csv_path)
350        processed_task_ids = [
351            int(col.replace("test_on_task_", ""))
352            for col in data.columns
353            if col.startswith("test_on_task_")
354        ]
355
356        # Get all columns that start with "test_on_task_"
357        test_task_cols = [
358            col for col in data.columns if col.startswith("test_on_task_")
359        ]
360        num_tasks = len(processed_task_ids)
361        num_rows = len(data)
362
363        # Build the loss matrix
364        loss_matrix = data[test_task_cols].values
365
366        fig, ax = plt.subplots(
367            figsize=(2 * num_tasks, 2 * num_rows)
368        )  # adaptive figure size
369
370        cax = ax.imshow(
371            loss_matrix,
372            interpolation="nearest",
373            cmap="Greens",
374            aspect="auto",
375        )
376
377        colorbar = fig.colorbar(cax)
378        yticks = colorbar.ax.get_yticks()
379        colorbar.ax.set_yticks(yticks)
380        colorbar.ax.set_yticklabels(
381            [f"{tick:.2f}" for tick in yticks], fontsize=10 + num_tasks
382        )
383
384        # Annotate each cell
385        for r in range(num_rows):
386            for c in range(r + 1):
387                ax.text(
388                    c,
389                    r,
390                    f"{loss_matrix[r, c]:.3f}",
391                    ha="center",
392                    va="center",
393                    color="black",
394                    fontsize=10 + num_tasks,
395                )
396
397        ax.set_xticks(range(num_tasks))
398        ax.set_yticks(range(num_rows))
399        ax.set_xticklabels(processed_task_ids, fontsize=10 + num_tasks)
400        ax.set_yticklabels(
401            data["after_training_task"].astype(int).tolist(), fontsize=10 + num_tasks
402        )
403
404        # Labeling the axes
405        ax.set_xlabel("Testing on task τ", fontsize=10 + num_tasks)
406        ax.set_ylabel("After training task t", fontsize=10 + num_tasks)
407        fig.tight_layout()
408        fig.savefig(plot_path)
409        plt.close(fig)

Plot the test classification loss matrix from saved CSV file and save the plot to the designated directory.

Args:

csv_path (str): the path to the CSV file where update_test_loss_cls_to_csv() saved the test classification loss metric.
plot_path (str): the path to save plot. Better same as the output directory of the experiment. E.g. './outputs/expr_name/1970-01-01_00-00-00/loss_cls_matrix.png'.

def plot_test_ave_loss_cls_curve_from_csv(self, csv_path: str, plot_path: str) -> None: View Source

411    def plot_test_ave_loss_cls_curve_from_csv(
412        self, csv_path: str, plot_path: str
413    ) -> None:
414        """Plot the test average classification loss curve over different training tasks from saved CSV file and save the plot to the designated directory.
415
416        **Args:**
417        - **csv_path** (`str`): the path to the CSV file where `update_test_loss_cls_to_csv()` saved the test classification loss metric.
418        - **plot_path** (`str`): the path to save plot. Better same as the output directory of the experiment. E.g. './outputs/expr_name/1970-01-01_00-00-00/ave_loss_cls.png'.
419        """
420        data = pd.read_csv(csv_path)
421        after_training_tasks = data["after_training_task"].astype(int).tolist()
422
423        # plot the average classification loss curve over different training tasks
424        fig, ax = plt.subplots(figsize=(16, 9))
425        ax.plot(
426            after_training_tasks,
427            data["average_classification_loss"],
428            marker="o",
429            linewidth=2,
430        )
431        ax.set_xlabel("After training task $t$", fontsize=16)
432        ax.set_ylabel("Average Classification Loss", fontsize=16)
433        ax.grid(True)
434        xticks = after_training_tasks
435        yticks = [i * 0.05 for i in range(21)]
436        ax.set_xticks(xticks)
437        ax.set_yticks(yticks)
438        ax.set_xticklabels(xticks, fontsize=16)
439        ax.set_yticklabels([f"{tick:.2f}" for tick in yticks], fontsize=16)
440        fig.savefig(plot_path)
441        plt.close(fig)

Plot the test average classification loss curve over different training tasks from saved CSV file and save the plot to the designated directory.

Args:

csv_path (str): the path to the CSV file where update_test_loss_cls_to_csv() saved the test classification loss metric.
plot_path (str): the path to save plot. Better same as the output directory of the experiment. E.g. './outputs/expr_name/1970-01-01_00-00-00/ave_loss_cls.png'.