# FFCV guide
## Introduction
FFCV is a library that helps increase the training speed of deep learning models. Training commonly follows a simple cycle:
- the CPU loads the batch from the disk
- the batch gets moved to the CUDA device
- the CUDA device runs the computation
This can easily become a bottleneck if either the CPU or the disk is too slow. FFCV solves this problem by first storing the dataset in an optimized format and then using asynchronous preloading to remove any possible bottlenecks.
This guide presents some tips and insights on how to use FFCV efficiently. The focus lies on improving the performance of model training on the HPC, as dataloading bottlenecks commonly occur in the HPC environment, e.g. due to slow disk speeds (such as on the NFS file system), underutilized parallelism or inefficient memory usage.
## Installation
This guide includes a small, fully contained example project in the `example` directory, but integrating FFCV into a larger project works the same way.
### Prerequisites
- A conda runtime. On the HPC this can be loaded using `module purge && module load python/3.10-anaconda` (`module purge` first unloads all modules, such as the default Python 3.8 module, then loads the Anaconda runtime)
- Around 10 GB of storage for installing the required packages (by default conda installs them in `$HOME`, but the location can be changed)
### Installation with Pip
Unfortunately, pip cannot be used to install FFCV. Since pip only supports the installation of Python packages (contrary to conda), it cannot install all necessary dependencies for FFCV (such as opencv, ffmpeg and jpeg_turbo).
### Installation with Conda
Since these (C++) libraries are not preinstalled, we have to use conda to install them.
The file `environment.yml` describes an environment with all required dependencies; create it by calling `conda env create --name ffcv-guide --file environment.yml`. Don't forget to activate the environment afterwards using `conda activate ffcv-guide`.
## Setup FFCV
As mentioned before, FFCV works by storing the dataset in a custom format (so-called `.beton` files). This turns thousands of small files (typical for image datasets like ImageNet-1k) into a single large file. When creating the `.beton` file, the user can set a compression ratio as well as a maximum resolution.
### Generating the `.beton` files
The script `write_ffcv.py` already contains example methods for writing CIFAR-10 and ImageNet. As you can see, we load the dataset as usual using the `torchvision.datasets` module, but instead of putting it directly into a `DataLoader` we use the `DatasetWriter` to optimize and save it to disk.
If you take a look at the source code of `write_cifar10`, you will see that we save the images in an `RGBImageField` and the labels in an `IntField`. These two classes are essentially the only way to control how the dataset file is generated. For RGB images we can set a maximum resolution, which should definitely be done, as some images can be as large as 4288x2848, which interferes with the optimized compression and storage. You can also choose a so-called `write_mode` (a complete writer call is sketched after the list below), which is one of:
- `raw`: save all images uncompressed
- `jpg`: save all images as JPEG with the desired `jpeg_quality`
- `proportion`: save each image with probability `compress_probability` as JPEG with the desired `jpeg_quality`, otherwise raw
- `smart`: save images larger than `smart_threshold` bytes as JPEG with the desired `jpeg_quality`, otherwise raw
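As a minimal sketch of how these pieces fit together (the dataset root and output path here are hypothetical; the real ones are set in `write_ffcv.py` and the shell script):

```python
import torchvision
from ffcv.fields import IntField, RGBImageField
from ffcv.writer import DatasetWriter

# Hypothetical dataset root and output path
dataset = torchvision.datasets.CIFAR10(root="./data", train=True, download=True)

writer = DatasetWriter("./cifar10_train.beton", {
    # max_resolution caps the stored image size; write_mode selects one of the strategies above
    "image": RGBImageField(max_resolution=32, write_mode="raw"),
    "label": IntField(),
})
writer.from_indexed_dataset(dataset)  # iterate the dataset and write the .beton file
```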
As this process can take quite some time, we should not run it on a communication/head node of the HPC. The `tinyfat` cluster is perfect for sequential processing like this script.
The example script `write_ffcv.sh` generates optimized files for a randomized subset of ImageNet (100,000 images) as well as the full CIFAR-10 dataset (50,000 images).
In this case you don't have to worry about downloading the datasets first, as we use the versions of ImageNet and CIFAR-10 that are already publicly hosted on the HPC (see the `imagenet_data_dir` and `cifar_data_dir` constants in the shell script).
As usual, the job script can be started with the command `sbatch ./example/write_ffcv.sh`.
When the job is done, the generated files are copied to the vault (`$HPCVAULT/ffcv/`).
This process can take a while: the last few measured runs averaged around 15,000 items per minute. Fortunately, this only has to be done once.
The larger the dataset, the more efficiently you can store it:

- `cifar10_full`
  - without FFCV: 178 MB
  - with FFCV (no compression, `max_resolution = 32`): 394 MB
- `imagenet_small`
  - without FFCV: no real reference
  - with FFCV (`max_resolution = 384`, `jpeg_quality = 50%`, `compress_probability = 90%`): 11 GB
- `imagenet_full`
  - without FFCV: 140 GB train, 6.4 GB val
  - with FFCV (`max_resolution = 384`, `jpeg_quality = 40%`, `compress_probability = 95%`): ~30 GB
The parameters have been chosen based on available research. For example, this paper shows that a JPEG quality of roughly 40-50% is the threshold range for keeping the loss low while training a network.
## Loading the dataset
Now we will define the functions to load the dataset. Like before, the functions are defined in `example/data.py`.
Generally we start by defining the pipelines, which are similar to transforms in PyTorch:
```python
import numpy as np
from typing import List
from ffcv.fields.decoders import IntDecoder, RandomResizedCropRGBImageDecoder
from ffcv.pipeline.operation import Operation
from ffcv.transforms import NormalizeImage, Squeeze, ToDevice, ToTensor, ToTorchImage

# image_size, device, CIFAR_MEAN and CIFAR_STD are defined earlier in example/data.py
image_pipeline: List[Operation] = [
    RandomResizedCropRGBImageDecoder((image_size, image_size)),  # load the image at the desired resolution
    ToTensor(),  # convert from numpy array to PyTorch tensor
    ToDevice(device, non_blocking=True),  # move the tensor to the device
    ToTorchImage(channels_last=True),  # change to PyTorch image format (B x C x H x W), stored channels-last
    NormalizeImage(CIFAR_MEAN, CIFAR_STD, type=np.dtype(np.float16)),  # normalize and set floating point precision
]
label_pipeline: List[Operation] = [
    IntDecoder(),  # decode the label as a numpy array
    ToTensor(),
    ToDevice(device),
    Squeeze(),  # remove "empty" dimensions (dims of size 1)
]
pipelines = {"image": image_pipeline, "label": label_pipeline}
```
Note that it is still possible to use torchvision transforms. However, for the best performance one should use the optimized FFCV transforms; most torchvision transforms have an equivalent in the library.
The next step is to define the `Loader`:
```python
from ffcv.loader import Loader, OrderOption

ordering = OrderOption.QUASI_RANDOM
loader = Loader(
    path,  # path to the .beton file to load (we usually have one file per split)
    batch_size=batch_size,
    num_workers=NUM_WORKERS,
    order=ordering,  # RANDOM (uniform sampling, requires the entire dataset in RAM), QUASI_RANDOM (faster, non-uniform sampling, works on large datasets) or SEQUENTIAL
    drop_last=True,  # drop the last incomplete batch
    pipelines=pipelines,
    os_cache=False,  # only set to True for small datasets that fit in system RAM
)
```
## Training with FFCV
Now that we have the optimized files, we can load them, put them into a PyTorch-compatible `DataLoader` (FFCV just calls it `Loader`) and start training.
In the example `run_ffcv` we define functions for building the `Loader`. Some other optimizations, like automatic mixed precision and efficient gradient zeroing, are also included in the example.
When it comes to the training loop, the main difference to vanilla PyTorch is that we don't have to move the data to the GPU manually. Code like:
```python
for batch in dataloader:
    images = batch[0].to(device=device, non_blocking=True)
    labels = batch[1].to(device=device)
```
is no longer required. Even with `non_blocking=True`, these operations cause serious delays and idle time on the GPU. By replacing the code with `for images, labels in dataloader: ...`, we let the dataloader take care of placing the next batches in GPU memory. A sketch of the resulting loop is shown below.
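As a minimal sketch of the resulting training step (assuming a `model`, `criterion` and `optimizer` already exist, with a float16 AMP setup as in the example; the names are illustrative, not the exact code from `run_ffcv`):

```python
import torch

scaler = torch.cuda.amp.GradScaler()  # scales the loss to avoid float16 gradient underflow
for images, labels in loader:  # batches arrive already placed on the GPU
    optimizer.zero_grad(set_to_none=True)  # cheaper than writing zeros into the gradient buffers
    with torch.autocast(device_type="cuda", dtype=torch.float16):
        loss = criterion(model(images), labels)
    scaler.scale(loss).backward()
    scaler.step(optimizer)
    scaler.update()
```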
One other thing you need to be wary of is the memory format. The `ToTorchImage` operation results in a tensor in the "channels last" memory format. To avoid memory issues, one should set the same format for the network:
```python
import torch
import torchvision

model = torchvision.models.resnet18()
model = model.to(device=torch.device("cuda"), memory_format=torch.channels_last)
```
When it comes to training on the HPC, we use `run_ffcv.sh`. Since we are now running the training, the `tinygpu` cluster is used. The script specifically requests A100 GPUs, as there were some problems with AMP on the other (Turing) GPUs (2080 Ti).
To avoid frequent and slow reads from the NFS filesystem, we copy the required `.beton` files to the node-local `$TMPDIR` before starting the training.
## Metrics
Using the example project from this repository, I will show some metrics and compare them to vanilla PyTorch dataloading. **TODO**
## Caveats
### Data Types
To save GPU memory while training, we often use 16-bit instead of 32-bit floats. The lower precision rarely affects model performance, but we can fit almost twice as many parameters on the GPU.
PyTorch has a collection of different float types (most commonly `torch.bfloat16` is used, as it offers the best balance between precision and value range).
When loading with FFCV, the data is initially represented as NumPy `ndarray`s, which are of course incompatible with PyTorch tensors as well as torchvision transforms.
To avoid type issues, a pipeline (just a list of transforms) should be ordered as follows (a sketch follows the list):

1. An FFCV decoder (such as `RandomResizedCropRGBImageDecoder`)
2. FFCV transforms (such as `RandomHorizontalFlip` or `Cutout`)
3. The necessary operations `ToTensor`, `ToDevice` and `ToTorchImage`
4. Now that the data is a PyTorch tensor, one of the following options to set the datatype:
   - `Convert(dtype)`: `dtype` can be a numpy or torch type
   - `NormalizeImage(mean, std, type)`: `type` must be a numpy type; most numpy types have a PyTorch equivalent that the resulting tensor is automatically converted to
5. Torchvision transforms (optional)
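As a hedged sketch of this ordering (the 224x224 size and the mean/std values are illustrative; FFCV decodes images in the 0-255 range, so the normalization constants are scaled accordingly):

```python
import torch
import torchvision.transforms as tvt
from ffcv.fields.decoders import RandomResizedCropRGBImageDecoder
from ffcv.transforms import Convert, RandomHorizontalFlip, ToDevice, ToTensor, ToTorchImage

MEAN = [125.307, 122.961, 113.8575]  # illustrative values on the 0-255 scale
STD = [51.5865, 50.847, 51.255]

image_pipeline = [
    RandomResizedCropRGBImageDecoder((224, 224)),       # 1. FFCV decoder
    RandomHorizontalFlip(),                             # 2. FFCV transforms
    ToTensor(),                                         # 3. necessary operations
    ToDevice(torch.device("cuda"), non_blocking=True),
    ToTorchImage(),
    Convert(torch.float16),                             # 4. set the datatype
    tvt.Normalize(MEAN, STD),                           # 5. torchvision transforms
]
```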
### Other Notes on performance
#### AMP
Use `bfloat16`. **TODO**
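As a minimal sketch of the idea (assuming `model`, `criterion`, `optimizer`, `images` and `labels` exist; `bfloat16` autocast requires an Ampere GPU such as the A100):

```python
import torch

with torch.autocast(device_type="cuda", dtype=torch.bfloat16):
    loss = criterion(model(images), labels)
loss.backward()  # no GradScaler needed: bfloat16 keeps float32's exponent range
optimizer.step()
```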
#### Memory Format
Use `channels_last` together with AMP. **TODO**
## Notes
Most of the information in this guide comes from the original paper, the official website and personal experience. At the time of writing, the documentation was incomplete, so some information was retrieved by reading the source code.
The examples should cover most necessary topics, but you can also find another example of integrating FFCV into a larger project in this repo.