Source code for torchgeo.datamodules.fair1m
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License.
"""FAIR1M datamodule."""
from typing import Any
from ..datasets import FAIR1M
from .geo import NonGeoDataModule
from .utils import dataset_split
class FAIR1MDataModule(NonGeoDataModule):
    """Data module that serves the FAIR1M dataset as train/val/test subsets.

    A single :class:`~torchgeo.datasets.FAIR1M` dataset is instantiated and
    then partitioned with ``dataset_split`` according to the configured
    validation and test shares.

    .. versionadded:: 0.2
    """

    def __init__(
        self,
        batch_size: int = 64,
        num_workers: int = 0,
        val_split_pct: float = 0.2,
        test_split_pct: float = 0.2,
        **kwargs: Any,
    ) -> None:
        """Create a FAIR1MDataModule.

        Args:
            batch_size: Number of samples in each mini-batch.
            num_workers: Number of worker processes used for data loading.
            val_split_pct: Share of the dataset held out for validation
                (forwarded to ``dataset_split`` as ``val_pct``).
            test_split_pct: Share of the dataset held out for testing
                (forwarded to ``dataset_split`` as ``test_pct``).
            **kwargs: Extra keyword arguments handed on to
                :class:`~torchgeo.datasets.FAIR1M`.
        """
        super().__init__(FAIR1M, batch_size, num_workers, **kwargs)

        # Kept on the instance so that ``setup`` can perform the split later.
        self.test_split_pct = test_split_pct
        self.val_split_pct = val_split_pct

    def setup(self, stage: str) -> None:
        """Build the dataset and partition it into train/val/test subsets.

        The same split is performed for every stage; ``stage`` itself is not
        consulted here.

        Args:
            stage: Either 'fit', 'validate', 'test', or 'predict'.
        """
        # ``self.kwargs`` is presumably populated by the base-class
        # constructor from the ``**kwargs`` given to ``__init__`` -- confirm
        # against NonGeoDataModule.
        self.dataset = FAIR1M(**self.kwargs)

        subsets = dataset_split(
            self.dataset,
            val_pct=self.val_split_pct,
            test_pct=self.test_split_pct,
        )
        self.train_dataset, self.val_dataset, self.test_dataset = subsets