clarena.metrics.mtl_acc

The submodule in metrics for MTLAccuracy.

  1r"""
  2The submodule in `metrics` for `MTLAccuracy`.
  3"""
  4
  5__all__ = ["MTLAccuracy"]
  6
  7import csv
  8import logging
  9import os
 10from typing import Any
 11
 12import pandas as pd
 13from lightning import Trainer
 14from matplotlib import pyplot as plt
 15from torchmetrics import MeanMetric
 16
 17from clarena.metrics import MetricCallback
 18from clarena.mtl_algorithms import MTLAlgorithm
 19from clarena.utils.metrics import MeanMetricBatch
 20
 21# always get logger for built-in logging in each module
 22pylogger = logging.getLogger(__name__)
 23
 24
 25class MTLAccuracy(MetricCallback):
 26    r"""Provides all actions that are related to MTL accuracy metrics, which include:
 27
 28    - Defining, initializing and recording accuracy metric.
 29    - Logging training and validation accuracy metric to Lightning loggers in real time.
 30    - Saving test accuracy metric to files.
 31    - Visualizing test accuracy metric as plots.
 32
 33    The callback is able to produce the following outputs:
 34
 35    - CSV files for test accuracy of all tasks and average accuracy.
 36    - Bar charts for test accuracy of all tasks.
 37    """
 38
 39    def __init__(
 40        self,
 41        save_dir: str,
 42        test_acc_csv_name: str = "acc.csv",
 43        test_acc_plot_name: str | None = None,
 44    ) -> None:
 45        r"""
 46        **Args:**
 47        - **save_dir** (`str`): The directory where data and figures of metrics will be saved. Better inside the output folder.
 48        - **test_acc_csv_name** (`str`): file name to save test accuracy of all tasks and average accuracy as CSV file.
 49        - **test_acc_plot_name** (`str` | `None`): file name to save accuracy plot. If `None`, no file will be saved.
 50        """
 51        super().__init__(save_dir=save_dir)
 52
 53        # paths
 54        self.test_acc_csv_path: str = os.path.join(save_dir, test_acc_csv_name)
 55        r"""The path to save test accuracy of all tasks and average accuracy CSV file."""
 56        if test_acc_plot_name:
 57            self.test_acc_plot_path: str = os.path.join(save_dir, test_acc_plot_name)
 58            r"""The path to save test accuracy plot."""
 59
 60        # training accumulated metrics
 61        self.acc_training_epoch: MeanMetricBatch
 62        r"""Classification accuracy of training epoch. Accumulated and calculated from the training batches. """
 63
 64        # validation accumulated metrics
 65        self.acc_val: dict[int, MeanMetricBatch] = {}
 66        r"""Validation classification accuracy of the model after training epoch. Accumulated and calculated from the validation batches. Keys are task IDs and values are the corresponding metrics."""
 67
 68        # test accumulated metrics
 69        self.acc_test: dict[int, MeanMetricBatch] = {}
 70        r"""Test classification accuracy of all tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics."""
 71
 72    def on_fit_start(self, trainer: Trainer, pl_module: MTLAlgorithm) -> None:
 73        r"""Initialize training and validation metrics."""
 74
 75        # initialize training metrics
 76        self.acc_training_epoch = MeanMetricBatch()
 77
 78        # initialize validation metrics
 79        self.acc_val = {
 80            task_id: MeanMetricBatch() for task_id in trainer.datamodule.train_tasks
 81        }
 82
 83    def on_train_batch_end(
 84        self,
 85        trainer: Trainer,
 86        pl_module: MTLAlgorithm,
 87        outputs: dict[str, Any],
 88        batch: Any,
 89        batch_idx: int,
 90    ) -> None:
 91        r"""Record training metrics from the training batch and log both the batch metrics and the accumulated epoch metrics to Lightning loggers.
 92
 93        **Args:**
 94        - **outputs** (`dict[str, Any]`): the outputs of the training step, i.e. the return value of the `training_step()` method in the `MTLAlgorithm`.
 95        - **batch** (`Any`): the training data batch.
 96        """
 97        # get the batch size
 98        batch_size = len(batch)
 99
100        # get training metrics values of current training batch from the outputs of the `training_step()`
101        acc_batch = outputs["acc"]
102
103        # update accumulated training metrics to calculate training metrics of the epoch
104        self.acc_training_epoch.update(acc_batch, batch_size)
105
106        # log training metrics of current training batch to Lightning loggers
107        pl_module.log("train/acc_batch", acc_batch, prog_bar=True)
108
109        # log accumulated training metrics till this training batch to Lightning loggers
110        pl_module.log(
111            "task/train/acc",
112            self.acc_training_epoch.compute(),
113            prog_bar=True,
114        )
115
116    def on_train_epoch_end(
117        self,
118        trainer: Trainer,
119        pl_module: MTLAlgorithm,
120    ) -> None:
121        r"""Reset the accumulated training metrics at the end of the training epoch."""
122
123        # reset the metrics of training epoch as there are more epochs to go and not only one epoch like in the validation and test
124        self.acc_training_epoch.reset()
125
126    def on_validation_batch_end(
127        self,
128        trainer: Trainer,
129        pl_module: MTLAlgorithm,
130        outputs: dict[str, Any],
131        batch: Any,
132        batch_idx: int,
133        dataloader_idx: int = 0,
134    ) -> None:
135        r"""Accumulate metrics from the validation batch. There is no need to log or monitor the metrics of individual validation batches.
136
137        **Args:**
138        - **outputs** (`dict[str, Any]`): the outputs of the validation step, i.e. the return value of the `validation_step()` method in the `MTLAlgorithm`.
139        - **batch** (`Any`): the validation data batch.
140        - **dataloader_idx** (`int`): the task ID of the validation dataloader. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
141        """
142
143        # get the batch size
144        batch_size = len(batch)
145
146        val_task_id = pl_module.get_val_task_id_from_dataloader_idx(dataloader_idx)
147
148        # get the metrics values of the batch from the outputs
149        acc_batch = outputs["acc"]
150
151        # update the accumulated metrics in order to calculate the validation metrics
152        self.acc_val[val_task_id].update(acc_batch, batch_size)
153
154    def on_test_start(
155        self,
156        trainer: Trainer,
157        pl_module: MTLAlgorithm,
158    ) -> None:
159        r"""Initialize the test metrics for all evaluation tasks at the beginning of testing."""
160
161        # initialize test metrics for all evaluation tasks
162        self.acc_test = {
163            task_id: MeanMetricBatch() for task_id in trainer.datamodule.eval_tasks
164        }
165
166    def on_test_batch_end(
167        self,
168        trainer: Trainer,
169        pl_module: MTLAlgorithm,
170        outputs: dict[str, Any],
171        batch: Any,
172        batch_idx: int,
173        dataloader_idx: int = 0,
174    ) -> None:
175        r"""Accumulate metrics from the test batch. There is no need to log or monitor the metrics of individual test batches.
176
177        **Args:**
178        - **outputs** (`dict[str, Any]`): the outputs of the test step, i.e. the return value of the `test_step()` method in the `MTLAlgorithm`.
179        - **batch** (`Any`): the test data batch.
180        - **dataloader_idx** (`int`): the task ID of the task to be tested. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
181        """
182
183        # get the batch size
184        batch_size = len(batch)
185
186        test_task_id = pl_module.get_test_task_id_from_dataloader_idx(dataloader_idx)
187
188        # get the metrics values of the batch from the outputs
189        acc_batch = outputs["acc"]
190
191        # update the accumulated metrics in order to calculate the metrics of the epoch
192        self.acc_test[test_task_id].update(acc_batch, batch_size)
193
194    def on_test_epoch_end(
195        self,
196        trainer: Trainer,
197        pl_module: MTLAlgorithm,
198    ) -> None:
199        r"""Save and plot test metrics at the end of test."""
200
201        # save (update) the test metrics to CSV files
202        self.save_test_acc_to_csv(
203            csv_path=self.test_acc_csv_path,
204        )
205
206        # plot the test metrics
207        if hasattr(self, "test_acc_plot_path"):
208            self.plot_test_acc_from_csv(
209                csv_path=self.test_acc_csv_path,
210                plot_path=self.test_acc_plot_path,
211            )
212
213    def save_test_acc_to_csv(
214        self,
215        csv_path: str,
216    ) -> None:
217        r"""Save the test accuracy metrics of all tasks in multi-task learning to a CSV file.
218
219        **Args:**
220        - **csv_path** (`str`): the path to save the test metrics to, e.g. './outputs/expr_name/1970-01-01_00-00-00/results/acc.csv'.
221        """
222        all_task_ids = list(self.acc_test.keys())
223        fieldnames = ["average_accuracy"] + [
224            f"test_on_task_{task_id}" for task_id in all_task_ids
225        ]
226        new_line = {}
227
228        # construct the columns and calculate the average accuracy over tasks at the same time
229        average_accuracy_over_tasks = MeanMetric().to(
230            device=next(iter(self.acc_test.values())).device
231        )
232        for task_id in all_task_ids:
233            acc = self.acc_test[task_id].compute().item()
234            new_line[f"test_on_task_{task_id}"] = acc
235            average_accuracy_over_tasks(acc)
236        new_line["average_accuracy"] = average_accuracy_over_tasks.compute().item()
237
238        # write
239        with open(csv_path, "w", encoding="utf-8") as file:
240            writer = csv.DictWriter(file, fieldnames=fieldnames)
241            writer.writeheader()
242            writer.writerow(new_line)
243
244    def plot_test_acc_from_csv(self, csv_path: str, plot_path: str) -> None:
245        """Plot the test accuracy bar chart of all tasks in multi-task learning from the saved CSV file and save the plot to the designated directory.
246
247        **Args:**
248        - **csv_path** (`str`): the path to the CSV file where `save_test_acc_to_csv()` saved the test accuracy metrics.
249        - **plot_path** (`str`): the path to save the plot to, preferably inside the output directory of the experiment, e.g. './outputs/expr_name/1970-01-01_00-00-00/acc.png'.
250        """
251        data = pd.read_csv(csv_path)
252
253        # extract all accuracy columns including average
254        all_columns = data.columns.tolist()
255        task_ids = list(range(len(all_columns)))  # assign index-based positions
256        labels = [
257            (
258                col.replace("test_on_task_", "Task ")
259                if "test_on_task_" in col
260                else "Average"
261            )
262            for col in all_columns
263        ]
264        accuracies = data.iloc[0][all_columns].values
265
266        # plot the accuracy bar chart over tasks
267        fig, ax = plt.subplots(figsize=(16, 9))
268        ax.bar(
269            task_ids,
270            accuracies,
271            color="skyblue",
272            edgecolor="black",
273        )
274        ax.set_xlabel("Task", fontsize=16)
275        ax.set_ylabel("Accuracy", fontsize=16)
276        ax.grid(True)
277        ax.set_xticks(task_ids)
278        ax.set_xticklabels(labels, rotation=45, ha="right", fontsize=14)
279        ax.set_yticks([i * 0.05 for i in range(21)])
280        ax.set_yticklabels(
281            [f"{tick:.2f}" for tick in [i * 0.05 for i in range(21)]], fontsize=14
282        )
283        fig.tight_layout()
284        fig.savefig(plot_path)
285        plt.close(fig)
class MTLAccuracy(clarena.metrics.base.MetricCallback):
 26class MTLAccuracy(MetricCallback):
 27    r"""Provides all actions that are related to MTL accuracy metrics, which include:
 28
 29    - Defining, initializing and recording accuracy metric.
 30    - Logging training and validation accuracy metric to Lightning loggers in real time.
 31    - Saving test accuracy metric to files.
 32    - Visualizing test accuracy metric as plots.
 33
 34    The callback is able to produce the following outputs:
 35
 36    - CSV files for test accuracy of all tasks and average accuracy.
 37    - Bar charts for test accuracy of all tasks.
 38    """
 39
 40    def __init__(
 41        self,
 42        save_dir: str,
 43        test_acc_csv_name: str = "acc.csv",
 44        test_acc_plot_name: str | None = None,
 45    ) -> None:
 46        r"""
 47        **Args:**
 48        - **save_dir** (`str`): The directory where data and figures of metrics will be saved. Better inside the output folder.
 49        - **test_acc_csv_name** (`str`): file name to save test accuracy of all tasks and average accuracy as CSV file.
 50        - **test_acc_plot_name** (`str` | `None`): file name to save accuracy plot. If `None`, no file will be saved.
 51        """
 52        super().__init__(save_dir=save_dir)
 53
 54        # paths
 55        self.test_acc_csv_path: str = os.path.join(save_dir, test_acc_csv_name)
 56        r"""The path to save test accuracy of all tasks and average accuracy CSV file."""
 57        if test_acc_plot_name:
 58            self.test_acc_plot_path: str = os.path.join(save_dir, test_acc_plot_name)
 59            r"""The path to save test accuracy plot."""
 60
 61        # training accumulated metrics
 62        self.acc_training_epoch: MeanMetricBatch
 63        r"""Classification accuracy of training epoch. Accumulated and calculated from the training batches. """
 64
 65        # validation accumulated metrics
 66        self.acc_val: dict[int, MeanMetricBatch] = {}
 67        r"""Validation classification accuracy of the model after training epoch. Accumulated and calculated from the validation batches. Keys are task IDs and values are the corresponding metrics."""
 68
 69        # test accumulated metrics
 70        self.acc_test: dict[int, MeanMetricBatch] = {}
 71        r"""Test classification accuracy of all tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics."""
 72
 73    def on_fit_start(self, trainer: Trainer, pl_module: MTLAlgorithm) -> None:
 74        r"""Initialize training and validation metrics."""
 75
 76        # initialize training metrics
 77        self.acc_training_epoch = MeanMetricBatch()
 78
 79        # initialize validation metrics
 80        self.acc_val = {
 81            task_id: MeanMetricBatch() for task_id in trainer.datamodule.train_tasks
 82        }
 83
 84    def on_train_batch_end(
 85        self,
 86        trainer: Trainer,
 87        pl_module: MTLAlgorithm,
 88        outputs: dict[str, Any],
 89        batch: Any,
 90        batch_idx: int,
 91    ) -> None:
 92        r"""Record training metrics from the training batch and log both the batch metrics and the accumulated epoch metrics to Lightning loggers.
 93
 94        **Args:**
 95        - **outputs** (`dict[str, Any]`): the outputs of the training step, i.e. the return value of the `training_step()` method in the `MTLAlgorithm`.
 96        - **batch** (`Any`): the training data batch.
 97        """
 98        # get the batch size
 99        batch_size = len(batch)
100
101        # get training metrics values of current training batch from the outputs of the `training_step()`
102        acc_batch = outputs["acc"]
103
104        # update accumulated training metrics to calculate training metrics of the epoch
105        self.acc_training_epoch.update(acc_batch, batch_size)
106
107        # log training metrics of current training batch to Lightning loggers
108        pl_module.log("train/acc_batch", acc_batch, prog_bar=True)
109
110        # log accumulated training metrics till this training batch to Lightning loggers
111        pl_module.log(
112            "task/train/acc",
113            self.acc_training_epoch.compute(),
114            prog_bar=True,
115        )
116
117    def on_train_epoch_end(
118        self,
119        trainer: Trainer,
120        pl_module: MTLAlgorithm,
121    ) -> None:
122        r"""Reset the accumulated training metrics at the end of the training epoch."""
123
124        # reset the metrics of training epoch as there are more epochs to go and not only one epoch like in the validation and test
125        self.acc_training_epoch.reset()
126
127    def on_validation_batch_end(
128        self,
129        trainer: Trainer,
130        pl_module: MTLAlgorithm,
131        outputs: dict[str, Any],
132        batch: Any,
133        batch_idx: int,
134        dataloader_idx: int = 0,
135    ) -> None:
136        r"""Accumulate metrics from the validation batch. There is no need to log or monitor the metrics of individual validation batches.
137
138        **Args:**
139        - **outputs** (`dict[str, Any]`): the outputs of the validation step, i.e. the return value of the `validation_step()` method in the `MTLAlgorithm`.
140        - **batch** (`Any`): the validation data batch.
141        - **dataloader_idx** (`int`): the task ID of the validation dataloader. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
142        """
143
144        # get the batch size
145        batch_size = len(batch)
146
147        val_task_id = pl_module.get_val_task_id_from_dataloader_idx(dataloader_idx)
148
149        # get the metrics values of the batch from the outputs
150        acc_batch = outputs["acc"]
151
152        # update the accumulated metrics in order to calculate the validation metrics
153        self.acc_val[val_task_id].update(acc_batch, batch_size)
154
155    def on_test_start(
156        self,
157        trainer: Trainer,
158        pl_module: MTLAlgorithm,
159    ) -> None:
160        r"""Initialize the test metrics for all evaluation tasks at the beginning of testing."""
161
162        # initialize test metrics for all evaluation tasks
163        self.acc_test = {
164            task_id: MeanMetricBatch() for task_id in trainer.datamodule.eval_tasks
165        }
166
167    def on_test_batch_end(
168        self,
169        trainer: Trainer,
170        pl_module: MTLAlgorithm,
171        outputs: dict[str, Any],
172        batch: Any,
173        batch_idx: int,
174        dataloader_idx: int = 0,
175    ) -> None:
176        r"""Accumulate metrics from the test batch. There is no need to log or monitor the metrics of individual test batches.
177
178        **Args:**
179        - **outputs** (`dict[str, Any]`): the outputs of the test step, i.e. the return value of the `test_step()` method in the `MTLAlgorithm`.
180        - **batch** (`Any`): the test data batch.
181        - **dataloader_idx** (`int`): the task ID of the task to be tested. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
182        """
183
184        # get the batch size
185        batch_size = len(batch)
186
187        test_task_id = pl_module.get_test_task_id_from_dataloader_idx(dataloader_idx)
188
189        # get the metrics values of the batch from the outputs
190        acc_batch = outputs["acc"]
191
192        # update the accumulated metrics in order to calculate the metrics of the epoch
193        self.acc_test[test_task_id].update(acc_batch, batch_size)
194
195    def on_test_epoch_end(
196        self,
197        trainer: Trainer,
198        pl_module: MTLAlgorithm,
199    ) -> None:
200        r"""Save and plot test metrics at the end of test."""
201
202        # save (update) the test metrics to CSV files
203        self.save_test_acc_to_csv(
204            csv_path=self.test_acc_csv_path,
205        )
206
207        # plot the test metrics
208        if hasattr(self, "test_acc_plot_path"):
209            self.plot_test_acc_from_csv(
210                csv_path=self.test_acc_csv_path,
211                plot_path=self.test_acc_plot_path,
212            )
213
214    def save_test_acc_to_csv(
215        self,
216        csv_path: str,
217    ) -> None:
218        r"""Save the test accuracy metrics of all tasks in multi-task learning to a CSV file.
219
220        **Args:**
221        - **csv_path** (`str`): the path to save the test metrics to, e.g. './outputs/expr_name/1970-01-01_00-00-00/results/acc.csv'.
222        """
223        all_task_ids = list(self.acc_test.keys())
224        fieldnames = ["average_accuracy"] + [
225            f"test_on_task_{task_id}" for task_id in all_task_ids
226        ]
227        new_line = {}
228
229        # construct the columns and calculate the average accuracy over tasks at the same time
230        average_accuracy_over_tasks = MeanMetric().to(
231            device=next(iter(self.acc_test.values())).device
232        )
233        for task_id in all_task_ids:
234            acc = self.acc_test[task_id].compute().item()
235            new_line[f"test_on_task_{task_id}"] = acc
236            average_accuracy_over_tasks(acc)
237        new_line["average_accuracy"] = average_accuracy_over_tasks.compute().item()
238
239        # write
240        with open(csv_path, "w", encoding="utf-8") as file:
241            writer = csv.DictWriter(file, fieldnames=fieldnames)
242            writer.writeheader()
243            writer.writerow(new_line)
244
245    def plot_test_acc_from_csv(self, csv_path: str, plot_path: str) -> None:
246        """Plot the test accuracy bar chart of all tasks in multi-task learning from the saved CSV file and save the plot to the designated directory.
247
248        **Args:**
249        - **csv_path** (`str`): the path to the CSV file where `save_test_acc_to_csv()` saved the test accuracy metrics.
250        - **plot_path** (`str`): the path to save the plot to, preferably inside the output directory of the experiment, e.g. './outputs/expr_name/1970-01-01_00-00-00/acc.png'.
251        """
252        data = pd.read_csv(csv_path)
253
254        # extract all accuracy columns including average
255        all_columns = data.columns.tolist()
256        task_ids = list(range(len(all_columns)))  # assign index-based positions
257        labels = [
258            (
259                col.replace("test_on_task_", "Task ")
260                if "test_on_task_" in col
261                else "Average"
262            )
263            for col in all_columns
264        ]
265        accuracies = data.iloc[0][all_columns].values
266
267        # plot the accuracy bar chart over tasks
268        fig, ax = plt.subplots(figsize=(16, 9))
269        ax.bar(
270            task_ids,
271            accuracies,
272            color="skyblue",
273            edgecolor="black",
274        )
275        ax.set_xlabel("Task", fontsize=16)
276        ax.set_ylabel("Accuracy", fontsize=16)
277        ax.grid(True)
278        ax.set_xticks(task_ids)
279        ax.set_xticklabels(labels, rotation=45, ha="right", fontsize=14)
280        ax.set_yticks([i * 0.05 for i in range(21)])
281        ax.set_yticklabels(
282            [f"{tick:.2f}" for tick in [i * 0.05 for i in range(21)]], fontsize=14
283        )
284        fig.tight_layout()
285        fig.savefig(plot_path)
286        plt.close(fig)

Provides all actions that are related to MTL accuracy metrics, which include:

  • Defining, initializing and recording accuracy metric.
  • Logging training and validation accuracy metric to Lightning loggers in real time.
  • Saving test accuracy metric to files.
  • Visualizing test accuracy metric as plots.

The callback is able to produce the following outputs:

  • CSV files for test accuracy of all tasks and average accuracy.
  • Bar charts for test accuracy of all tasks.
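
A minimal usage sketch is shown below. The `model`, `datamodule`, and output paths are hypothetical placeholders (an `MTLAlgorithm` and a multi-task datamodule are assumed), and the import path assumes the class is re-exported from `clarena.metrics`; CLArena experiments may wire the callback up differently, e.g. via configuration files.

    from lightning import Trainer

    from clarena.metrics import MTLAccuracy

    # collect accuracy during fit, then save the CSV and bar chart after test
    acc_metric = MTLAccuracy(
        save_dir="./outputs/expr_name/1970-01-01_00-00-00/results",
        test_acc_csv_name="acc.csv",
        test_acc_plot_name="acc.png",  # pass None to skip the plot
    )

    trainer = Trainer(max_epochs=10, callbacks=[acc_metric])
    trainer.fit(model, datamodule=datamodule)
    trainer.test(model, datamodule=datamodule)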
MTLAccuracy( save_dir: str, test_acc_csv_name: str = 'acc.csv', test_acc_plot_name: str | None = None)
40    def __init__(
41        self,
42        save_dir: str,
43        test_acc_csv_name: str = "acc.csv",
44        test_acc_plot_name: str | None = None,
45    ) -> None:
46        r"""
47        **Args:**
48        - **save_dir** (`str`): The directory where data and figures of metrics will be saved. Better inside the output folder.
49        - **test_acc_csv_name** (`str`): file name to save test accuracy of all tasks and average accuracy as CSV file.
50        - **test_acc_plot_name** (`str` | `None`): file name to save accuracy plot. If `None`, no file will be saved.
51        """
52        super().__init__(save_dir=save_dir)
53
54        # paths
55        self.test_acc_csv_path: str = os.path.join(save_dir, test_acc_csv_name)
56        r"""The path to save test accuracy of all tasks and average accuracy CSV file."""
57        if test_acc_plot_name:
58            self.test_acc_plot_path: str = os.path.join(save_dir, test_acc_plot_name)
59            r"""The path to save test accuracy plot."""
60
61        # training accumulated metrics
62        self.acc_training_epoch: MeanMetricBatch
63        r"""Classification accuracy of training epoch. Accumulated and calculated from the training batches. """
64
65        # validation accumulated metrics
66        self.acc_val: dict[int, MeanMetricBatch] = {}
67        r"""Validation classification accuracy of the model after training epoch. Accumulated and calculated from the validation batches. Keys are task IDs and values are the corresponding metrics."""
68
69        # test accumulated metrics
70        self.acc_test: dict[int, MeanMetricBatch] = {}
71        r"""Test classification accuracy of all tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics."""

Args:

  • save_dir (str): The directory where data and figures of metrics will be saved. Better inside the output folder.
  • test_acc_csv_name (str): file name to save test accuracy of all tasks and average accuracy as CSV file.
  • test_acc_plot_name (str | None): file name to save accuracy plot. If None, no file will be saved.
test_acc_csv_path: str

The path to save test accuracy of all tasks and average accuracy CSV file.

Classification accuracy of training epoch. Accumulated and calculated from the training batches.

Validation classification accuracy of the model after training epoch. Accumulated and calculated from the validation batches. Keys are task IDs and values are the corresponding metrics.

Test classification accuracy of all tasks. Accumulated and calculated from the test batches. Keys are task IDs and values are the corresponding metrics.

def on_fit_start( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm) -> None:
73    def on_fit_start(self, trainer: Trainer, pl_module: MTLAlgorithm) -> None:
74        r"""Initialize training and validation metrics."""
75
76        # initialize training metrics
77        self.acc_training_epoch = MeanMetricBatch()
78
79        # initialize validation metrics
80        self.acc_val = {
81            task_id: MeanMetricBatch() for task_id in trainer.datamodule.train_tasks
82        }

Initialize training and validation metrics.
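
`MeanMetricBatch` comes from `clarena.utils.metrics` and its implementation is not shown on this page. Judging from how this callback uses it (`update(value, batch_size)`, `compute()`, `reset()`), it behaves like a batch-size-weighted running mean. A rough, illustrative stand-in (not the actual CLArena implementation):

    import torch
    from torchmetrics import Metric

    class WeightedRunningMean(Metric):
        """Illustrative stand-in for MeanMetricBatch: a mean weighted by batch size."""

        def __init__(self) -> None:
            super().__init__()
            self.add_state("total", default=torch.tensor(0.0), dist_reduce_fx="sum")
            self.add_state("count", default=torch.tensor(0.0), dist_reduce_fx="sum")

        def update(self, value: torch.Tensor, batch_size: int) -> None:
            # weight each batch's value by the number of samples it contains
            self.total += value * batch_size
            self.count += batch_size

        def compute(self) -> torch.Tensor:
            return self.total / self.count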

def on_train_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int) -> None:
 84    def on_train_batch_end(
 85        self,
 86        trainer: Trainer,
 87        pl_module: MTLAlgorithm,
 88        outputs: dict[str, Any],
 89        batch: Any,
 90        batch_idx: int,
 91    ) -> None:
 92        r"""Record training metrics from the training batch and log both the batch metrics and the accumulated epoch metrics to Lightning loggers.
 93
 94        **Args:**
 95        - **outputs** (`dict[str, Any]`): the outputs of the training step, i.e. the return value of the `training_step()` method in the `MTLAlgorithm`.
 96        - **batch** (`Any`): the training data batch.
 97        """
 98        # get the batch size
 99        batch_size = len(batch)
100
101        # get training metrics values of current training batch from the outputs of the `training_step()`
102        acc_batch = outputs["acc"]
103
104        # update accumulated training metrics to calculate training metrics of the epoch
105        self.acc_training_epoch.update(acc_batch, batch_size)
106
107        # log training metrics of current training batch to Lightning loggers
108        pl_module.log("train/acc_batch", acc_batch, prog_bar=True)
109
110        # log accumulated training metrics till this training batch to Lightning loggers
111        pl_module.log(
112            "task/train/acc",
113            self.acc_training_epoch.compute(),
114            prog_bar=True,
115        )

Record training metrics from the training batch and log both the batch metrics and the accumulated epoch metrics to Lightning loggers.

Args:

  • outputs (dict[str, Any]): the outputs of the training step, i.e. the return value of the training_step() method in the MTLAlgorithm.
  • batch (Any): the training data batch.
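
The logged `task/train/acc` value is therefore a running, batch-size-weighted mean of the per-batch accuracies seen so far in the epoch. A small illustration with made-up numbers:

    # (acc_batch, batch_size) for two batches of different sizes
    batches = [(0.90, 64), (0.80, 32)]

    weighted_sum = sum(acc * n for acc, n in batches)
    n_samples = sum(n for _, n in batches)
    print(weighted_sum / n_samples)  # ~0.867, not the unweighted mean 0.85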
def on_train_epoch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm) -> None:
117    def on_train_epoch_end(
118        self,
119        trainer: Trainer,
120        pl_module: MTLAlgorithm,
121    ) -> None:
122        r"""Reset the accumulated training metrics at the end of the training epoch."""
123
124        # reset the metrics of training epoch as there are more epochs to go and not only one epoch like in the validation and test
125        self.acc_training_epoch.reset()

Reset the accumulated training metrics at the end of the training epoch.

def on_validation_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int, dataloader_idx: int = 0) -> None:
127    def on_validation_batch_end(
128        self,
129        trainer: Trainer,
130        pl_module: MTLAlgorithm,
131        outputs: dict[str, Any],
132        batch: Any,
133        batch_idx: int,
134        dataloader_idx: int = 0,
135    ) -> None:
136        r"""Accumulate metrics from the validation batch. There is no need to log or monitor the metrics of individual validation batches.
137
138        **Args:**
139        - **outputs** (`dict[str, Any]`): the outputs of the validation step, i.e. the return value of the `validation_step()` method in the `MTLAlgorithm`.
140        - **batch** (`Any`): the validation data batch.
141        - **dataloader_idx** (`int`): the task ID of the validation dataloader. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
142        """
143
144        # get the batch size
145        batch_size = len(batch)
146
147        val_task_id = pl_module.get_val_task_id_from_dataloader_idx(dataloader_idx)
148
149        # get the metrics values of the batch from the outputs
150        acc_batch = outputs["acc"]
151
152        # update the accumulated metrics in order to calculate the validation metrics
153        self.acc_val[val_task_id].update(acc_batch, batch_size)

Accumulate metrics from the validation batch. There is no need to log or monitor the metrics of individual validation batches.

Args:

  • outputs (dict[str, Any]): the outputs of the validation step, i.e. the return value of the validation_step() method in the MTLAlgorithm.
  • batch (Any): the validation data batch.
  • dataloader_idx (int): the task ID of the validation dataloader. A default value of 0 is given, otherwise the LightningModule will raise a RuntimeError.
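
The mapping from `dataloader_idx` back to a task ID is delegated to `pl_module.get_val_task_id_from_dataloader_idx()`, whose implementation is not part of this page. A plausible sketch, assuming the validation dataloaders are built in the order of the datamodule's `train_tasks` (an assumption, not the confirmed CLArena behaviour):

    def get_val_task_id_from_dataloader_idx(self, dataloader_idx: int) -> int:
        # hypothetical: task IDs in the order the validation dataloaders were created
        val_task_ids = list(self.trainer.datamodule.train_tasks)
        return val_task_ids[dataloader_idx]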
def on_test_start( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm) -> None:
155    def on_test_start(
156        self,
157        trainer: Trainer,
158        pl_module: MTLAlgorithm,
159    ) -> None:
160        r"""Initialize the test metrics for all evaluation tasks at the beginning of testing."""
161
162        # initialize test metrics for all evaluation tasks
163        self.acc_test = {
164            task_id: MeanMetricBatch() for task_id in trainer.datamodule.eval_tasks
165        }

Initialize the test metrics for all evaluation tasks at the beginning of testing.

def on_test_batch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm, outputs: dict[str, typing.Any], batch: Any, batch_idx: int, dataloader_idx: int = 0) -> None:
167    def on_test_batch_end(
168        self,
169        trainer: Trainer,
170        pl_module: MTLAlgorithm,
171        outputs: dict[str, Any],
172        batch: Any,
173        batch_idx: int,
174        dataloader_idx: int = 0,
175    ) -> None:
176        r"""Accumulate metrics from the test batch. There is no need to log or monitor the metrics of individual test batches.
177
178        **Args:**
179        - **outputs** (`dict[str, Any]`): the outputs of the test step, i.e. the return value of the `test_step()` method in the `MTLAlgorithm`.
180        - **batch** (`Any`): the test data batch.
181        - **dataloader_idx** (`int`): the task ID of the task to be tested. A default value of 0 is given, otherwise the LightningModule will raise a `RuntimeError`.
182        """
183
184        # get the batch size
185        batch_size = len(batch)
186
187        test_task_id = pl_module.get_test_task_id_from_dataloader_idx(dataloader_idx)
188
189        # get the metrics values of the batch from the outputs
190        acc_batch = outputs["acc"]
191
192        # update the accumulated metrics in order to calculate the metrics of the epoch
193        self.acc_test[test_task_id].update(acc_batch, batch_size)

Accumulate metrics from the test batch. There is no need to log or monitor the metrics of individual test batches.

Args:

  • outputs (dict[str, Any]): the outputs of the test step, i.e. the return value of the test_step() method in the MTLAlgorithm.
  • batch (Any): the test data batch.
  • dataloader_idx (int): the task ID of the task to be tested. A default value of 0 is given, otherwise the LightningModule will raise a RuntimeError.
def on_test_epoch_end( self, trainer: lightning.pytorch.trainer.trainer.Trainer, pl_module: clarena.mtl_algorithms.MTLAlgorithm) -> None:
195    def on_test_epoch_end(
196        self,
197        trainer: Trainer,
198        pl_module: MTLAlgorithm,
199    ) -> None:
200        r"""Save and plot test metrics at the end of test."""
201
202        # save (update) the test metrics to CSV files
203        self.save_test_acc_to_csv(
204            csv_path=self.test_acc_csv_path,
205        )
206
207        # plot the test metrics
208        if hasattr(self, "test_acc_plot_path"):
209            self.plot_test_acc_from_csv(
210                csv_path=self.test_acc_csv_path,
211                plot_path=self.test_acc_plot_path,
212            )

Save and plot test metrics at the end of test.

def save_test_acc_to_csv(self, csv_path: str) -> None:
214    def save_test_acc_to_csv(
215        self,
216        csv_path: str,
217    ) -> None:
218        r"""Save the test accuracy metrics of all tasks in multi-task learning to a CSV file.
219
220        **Args:**
221        - **csv_path** (`str`): the path to save the test metrics to, e.g. './outputs/expr_name/1970-01-01_00-00-00/results/acc.csv'.
222        """
223        all_task_ids = list(self.acc_test.keys())
224        fieldnames = ["average_accuracy"] + [
225            f"test_on_task_{task_id}" for task_id in all_task_ids
226        ]
227        new_line = {}
228
229        # construct the columns and calculate the average accuracy over tasks at the same time
230        average_accuracy_over_tasks = MeanMetric().to(
231            device=next(iter(self.acc_test.values())).device
232        )
233        for task_id in all_task_ids:
234            acc = self.acc_test[task_id].compute().item()
235            new_line[f"test_on_task_{task_id}"] = acc
236            average_accuracy_over_tasks(acc)
237        new_line["average_accuracy"] = average_accuracy_over_tasks.compute().item()
238
239        # write
240        with open(csv_path, "w", encoding="utf-8") as file:
241            writer = csv.DictWriter(file, fieldnames=fieldnames)
242            writer.writeheader()
243            writer.writerow(new_line)

Save the test accuracy metrics of all tasks in multi-task learning to a CSV file.

Args:

  • csv_path (str): the path to save the test metrics to, e.g. './outputs/expr_name/1970-01-01_00-00-00/results/acc.csv'.
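
With the fieldnames built above, the saved file contains a single header row followed by one data row. An illustrative layout for three tasks (the accuracy values are made up):

    average_accuracy,test_on_task_1,test_on_task_2,test_on_task_3
    0.87,0.91,0.85,0.85

Because the file is opened in write mode, rerunning the test overwrites any previous results at the same path.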
def plot_test_acc_from_csv(self, csv_path: str, plot_path: str) -> None:
245    def plot_test_acc_from_csv(self, csv_path: str, plot_path: str) -> None:
246        """Plot the test accuracy bar chart of all tasks in multi-task learning from the saved CSV file and save the plot to the designated directory.
247
248        **Args:**
249        - **csv_path** (`str`): the path to the CSV file where `save_test_acc_to_csv()` saved the test accuracy metrics.
250        - **plot_path** (`str`): the path to save the plot to, preferably inside the output directory of the experiment, e.g. './outputs/expr_name/1970-01-01_00-00-00/acc.png'.
251        """
252        data = pd.read_csv(csv_path)
253
254        # extract all accuracy columns including average
255        all_columns = data.columns.tolist()
256        task_ids = list(range(len(all_columns)))  # assign index-based positions
257        labels = [
258            (
259                col.replace("test_on_task_", "Task ")
260                if "test_on_task_" in col
261                else "Average"
262            )
263            for col in all_columns
264        ]
265        accuracies = data.iloc[0][all_columns].values
266
267        # plot the accuracy bar chart over tasks
268        fig, ax = plt.subplots(figsize=(16, 9))
269        ax.bar(
270            task_ids,
271            accuracies,
272            color="skyblue",
273            edgecolor="black",
274        )
275        ax.set_xlabel("Task", fontsize=16)
276        ax.set_ylabel("Accuracy", fontsize=16)
277        ax.grid(True)
278        ax.set_xticks(task_ids)
279        ax.set_xticklabels(labels, rotation=45, ha="right", fontsize=14)
280        ax.set_yticks([i * 0.05 for i in range(21)])
281        ax.set_yticklabels(
282            [f"{tick:.2f}" for tick in [i * 0.05 for i in range(21)]], fontsize=14
283        )
284        fig.tight_layout()
285        fig.savefig(plot_path)
286        plt.close(fig)

Plot the test accuracy bar chart of all tasks in multi-task learning from the saved CSV file and save the plot to the designated directory.

Args:

  • csv_path (str): the path to the CSV file where save_test_acc_to_csv() saved the test accuracy metrics.
  • plot_path (str): the path to save the plot to, preferably inside the output directory of the experiment, e.g. './outputs/expr_name/1970-01-01_00-00-00/acc.png'.
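
Because this method only reads the CSV from disk, it can also be called on its own to regenerate the figure from previously saved results; the paths below are hypothetical:

    metric = MTLAccuracy(save_dir="./outputs/expr_name/1970-01-01_00-00-00/results")
    metric.plot_test_acc_from_csv(
        csv_path="./outputs/expr_name/1970-01-01_00-00-00/results/acc.csv",
        plot_path="./outputs/expr_name/1970-01-01_00-00-00/results/acc.png",
    )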