Source code for torchgeo.datamodules.cloud_cover
# Copyright (c) TorchGeo Contributors. All rights reserved.
# Licensed under the MIT License.
"""Cloud Cover Detection Challenge datamodule."""
from typing import Any
import torch
from torch.utils.data import random_split
from ..datasets import CloudCoverDetection
from .geo import NonGeoDataModule
[docs]
class CloudCoverDetectionDataModule(NonGeoDataModule):
"""LightningDataModule implementation for Cloud Cover Detection.
Splits the training split into train/val subsets using ``val_split_pct``.
.. versionadded:: 0.9
"""
mean = torch.tensor(0.0)
std = torch.tensor(10000.0)
[docs]
def __init__(
self,
batch_size: int = 64,
num_workers: int = 0,
val_split_pct: float = 0.2,
**kwargs: Any,
) -> None:
"""Initialize a new CloudCoverDetectionDataModule instance.
Args:
batch_size: Size of each mini-batch.
num_workers: Number of workers for parallel data loading.
val_split_pct: Percentage of the training data to reserve for validation.
**kwargs: Additional keyword arguments passed to
:class:`~torchgeo.datasets.CloudCoverDetection`.
"""
super().__init__(CloudCoverDetection, batch_size, num_workers, **kwargs)
self.val_split_pct = val_split_pct
[docs]
def setup(self, stage: str) -> None:
"""Set up datasets.
Args:
stage: Either 'fit', 'validate', 'test', or 'predict'.
"""
if stage in ['fit', 'validate']:
self.dataset = CloudCoverDetection(split='train', **self.kwargs)
generator = torch.Generator().manual_seed(0)
self.train_dataset, self.val_dataset = random_split(
self.dataset, [1 - self.val_split_pct, self.val_split_pct], generator
)
if stage in ['test']:
self.test_dataset = CloudCoverDetection(split='test', **self.kwargs)