342 changes: 342 additions & 0 deletions oatomobile/baselines/torch/cil/tune.py
@@ -0,0 +1,342 @@
# Copyright 2020 The OATomobile Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Trains the behavioural cloning agent's model on expert demonstrations."""

import os
from typing import Mapping

import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import tqdm
from absl import app
from absl import flags
from absl import logging
from ray import tune

from oatomobile.baselines.torch.cil.model import BehaviouralModel
from oatomobile.datasets.carla import CARLADataset
from oatomobile.torch import types
from oatomobile.torch.loggers import TensorBoardLogger
from oatomobile.torch.savers import Checkpointer
from oatomobile.utils.loggers import WandBLogger

logging.set_verbosity(logging.DEBUG)
FLAGS = flags.FLAGS
flags.DEFINE_string(
name="dataset_dir",
default=None,
help="The full path to the processed dataset.",
)
flags.DEFINE_string(
name="output_dir",
default=None,
help="The full path to the output directory (for logs, ckpts).",
)
flags.DEFINE_list(
name="batch_size",
default=[32, 64, 128, 256, 512, 1024],
help="The batch size used for training the neural network.",
)
flags.DEFINE_list(
name="num_epochs",
default=[1024],
help="The number of training epochs for the neural network.",
)
flags.DEFINE_integer(
name="save_model_frequency",
default=4,
help="The number epochs between saves of the model.",
)
flags.DEFINE_list(
name="learning_rate",
default=[1e-1, 1e-2, 1e-3, 1e-4, 1e-5],
help="The ADAM learning rate.",
)
flags.DEFINE_integer(
name="num_timesteps_to_keep",
default=4,
help="The numbers of time-steps to keep from the target, with downsampling.",
)
flags.DEFINE_list(
name="weight_decay",
default=[0.0, 1e-2, 1e-3],
help="The L2 penalty (regularization) coefficient.",
)
flags.DEFINE_bool(
name="clip_gradients",
default=False,
help="If True it clips the gradients norm to 1.0.",
)
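
# Example invocation (a sketch; the paths below are placeholders):
#   python -m oatomobile.baselines.torch.cil.tune \
#     --dataset_dir=/path/to/processed/dataset \
#     --output_dir=/path/to/output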


def main(config):

# Parses config arguments.
dataset_dir = config["dataset_dir"]
output_dir = config["output_dir"]
save_model_frequency = config["save_model_frequency"]
num_timesteps_to_keep = config["num_timesteps_to_keep"]
clip_gradients = config["clip_gradients"]

# Parses the Ray Tune search-space arguments.
batch_size = config["batch_size"]
num_epochs = config["num_epochs"]
learning_rate = config["learning_rate"]
weight_decay = config["weight_decay"]
noise_level = config["noise_level"]  # Part of the search space; not used further in this function.

# Determines device, accelerator.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") # pylint: disable=no-member

# Creates the necessary output directory.
os.makedirs(output_dir, exist_ok=True)
log_dir = os.path.join(output_dir, "logs")
os.makedirs(log_dir, exist_ok=True)
ckpt_dir = os.path.join(output_dir, "ckpts")
os.makedirs(ckpt_dir, exist_ok=True)

# Initializes the model and its optimizer.
output_shape = [num_timesteps_to_keep, 2]
model = BehaviouralModel(output_shape=output_shape).to(device)
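# `reduction="none"` keeps the per-element L1 terms so they can be summed over
# time-steps and coordinates, then averaged over the batch (see `train_step` below).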
criterion = nn.L1Loss(reduction="none")
optimizer = optim.Adam(
model.parameters(),
lr=learning_rate,
weight_decay=weight_decay,
)
writer = TensorBoardLogger(log_dir=log_dir)
checkpointer = Checkpointer(model=model, ckpt_dir=ckpt_dir)

def transform(batch: Mapping[str, types.Array]) -> Mapping[str, torch.Tensor]:
"""Preprocesses a batch for the model.

Args:
batch: (keyword arguments) The raw batch variables.

Returns:
The processed batch.
"""
# Sends tensors to `device`.
batch = {key: tensor.to(device) for (key, tensor) in batch.items()}
# Preprocesses batch for the model.
batch = model.transform(batch)
return batch

# Sets up the datasets and the dataloaders.
modalities = (
"lidar",
"is_at_traffic_light",
"traffic_light_state",
"player_future",
"velocity",
)
dataset_train = CARLADataset.as_torch(
dataset_dir=os.path.join(dataset_dir, "train"),
modalities=modalities,
mode=True,
)
dataloader_train = torch.utils.data.DataLoader(
dataset_train,
batch_size=batch_size,
shuffle=True,
num_workers=2,
)
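# The validation loader below uses a larger batch size; since evaluation runs
# without gradients, more samples typically fit per forward pass.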
dataset_val = CARLADataset.as_torch(
dataset_dir=os.path.join(dataset_dir, "val"),
modalities=modalities,
mode=True,
)
dataloader_val = torch.utils.data.DataLoader(
dataset_val,
batch_size=batch_size * 5,
shuffle=True,
num_workers=2,
)

def train_step(
model: BehaviouralModel,
optimizer: optim.Optimizer,
batch: Mapping[str, torch.Tensor],
clip: bool = False,
) -> torch.Tensor:
"""Performs a single gradient-descent optimisation step."""
# Resets optimizer's gradients.
optimizer.zero_grad()
# Forward pass from the model.
predictions = model(**batch)
# Calculates loss.
loss = criterion(predictions, batch["player_future"][..., :2])
loss = torch.sum(loss, dim=[-2, -1]) # pylint: disable=no-member
loss = torch.mean(loss, dim=0) # pylint: disable=no-member
# Backward pass.
loss.backward()
# Clips the gradient norm.
if clip:
torch.nn.utils.clip_grad_norm_(model.parameters(), 1.0)
# Performs a gradient descent step.
optimizer.step()
return loss

def train_epoch(
model: BehaviouralModel,
optimizer: optim.Optimizer,
dataloader: torch.utils.data.DataLoader,
) -> torch.Tensor:
"""Performs an epoch of gradient descent optimization on `dataloader`."""
model.train()
loss = 0.0
with tqdm.tqdm(dataloader) as pbar:
for batch in pbar:
# Prepares the batch.
batch = transform(batch)
# Performs a gradient-descent step.
loss += train_step(model, optimizer, batch, clip=clip_gradients)
# Reports the running loss to Ray Tune.
tune.report(loss=loss)
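# Note: at this point `loss` is the running sum of per-batch losses (a scalar
# tensor), so the value reported to Tune accumulates within the epoch.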

return loss / len(dataloader)

def evaluate_step(
model: BehaviouralModel,
batch: Mapping[str, torch.Tensor],
) -> torch.Tensor:
"""Evaluates `model` on a `batch`."""
# Forward pass from the model.
predictions = model(**batch)
# Calculates loss on mini-batch.
loss = criterion(predictions, batch["player_future"][..., :2])
loss = torch.sum(loss, dim=[-2, -1]) # pylint: disable=no-member
loss = torch.mean(loss, dim=0) # pylint: disable=no-member
return loss

def evaluate_epoch(
model: BehaviouralModel,
dataloader: torch.utils.data.DataLoader,
) -> torch.Tensor:
"""Performs an evaluation of the `model` on the `dataloader."""
model.eval()
loss = 0.0
with tqdm.tqdm(dataloader) as pbar:
for batch in pbar:
# Prepares the batch.
batch = transform(batch)
# Accumulates the loss over the dataset.
with torch.no_grad():
loss += evaluate_step(model, batch)
# Reports the running evaluation loss to Ray Tune.
tune.report(eval_loss=loss)

return loss / len(dataloader)

def write(
model: BehaviouralModel,
dataloader: torch.utils.data.DataLoader,
writer: TensorBoardLogger,
split: str,
loss: torch.Tensor,
epoch: int,
) -> None:
"""Visualises model performance on `TensorBoard`."""
# Gets a sample from the dataset.
batch = next(iter(dataloader))
# Prepares the batch.
batch = transform(batch)
# Generates predictions.
with torch.no_grad():
predictions = model(**batch)
# Logs on `TensorBoard`.
writer.log(
split=split,
loss=loss.detach().cpu().numpy().item(),
overhead_features=batch["visual_features"].detach().cpu().numpy()[:8],
predictions=predictions.detach().cpu().numpy()[:8],
ground_truth=batch["player_future"].detach().cpu().numpy()[:8],
global_step=epoch,
)

with tqdm.tqdm(range(num_epochs)) as pbar_epoch:
for epoch in pbar_epoch:
# Trains model on whole training dataset, and writes on `TensorBoard`.
loss_train = train_epoch(model, optimizer, dataloader_train)
write(model, dataloader_train, writer, "train", loss_train, epoch)

# Evaluates model on whole validation dataset, and writes on `TensorBoard`.
loss_val = evaluate_epoch(model, dataloader_val)
write(model, dataloader_val, writer, "val", loss_val, epoch)

# Checkpoints model weights.
if epoch % save_model_frequency == 0:
checkpointer.save(epoch)

# Updates progress bar description.
pbar_epoch.set_description("TL: {:.2f} | VL: {:.2f}".format(
loss_train.detach().cpu().numpy().item(),
loss_val.detach().cpu().numpy().item(),
))


def run_experiments(argv):
# For debugging purposes.
logging.debug(argv)
logging.debug(FLAGS)

# Parses command line arguments.
dataset_dir = FLAGS.dataset_dir
output_dir = FLAGS.output_dir
# `DEFINE_list` flags arrive as strings when set on the command line, so cast explicitly.
batch_size = [int(x) for x in FLAGS.batch_size]
num_epochs = [int(x) for x in FLAGS.num_epochs]
learning_rate = [float(x) for x in FLAGS.learning_rate]
save_model_frequency = FLAGS.save_model_frequency
num_timesteps_to_keep = FLAGS.num_timesteps_to_keep
weight_decay = [float(x) for x in FLAGS.weight_decay]
clip_gradients = FLAGS.clip_gradients
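# Noise levels are hard-coded here rather than exposed as a command-line flag.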
noise_level = [1e-1, 1e-2, 1e-3]

analysis = tune.run(
main,
loggers=[WandBLogger],
num_samples=1,
resources_per_trial={
'gpu': torch.cuda.device_count(),
},
config={
"monitor": True,
"wandb": {
"project": "oatomobile",
"monitor_gym": True,
},
"dataset_dir": dataset_dir,
"output_dir": output_dir,
"save_model_frequency": save_model_frequency,
"num_timesteps_to_keep": num_timesteps_to_keep,
"clip_gradients": clip_gradients,
"batch_size": tune.grid_search(batch_size),
"num_epochs": tune.grid_search(num_epochs),
"learning_rate": tune.grid_search(learning_rate),
"weight_decay": tune.grid_search(weight_decay),
"noise_level": tune.grid_search(noise_level),
},
)

print("Best config: ", analysis.get_best_config(metric="loss"))


if __name__ == "__main__":
flags.mark_flag_as_required("dataset_dir")
flags.mark_flag_as_required("output_dir")
flags.mark_flag_as_required("num_epochs")
app.run(run_experiments)
2 changes: 1 addition & 1 deletion oatomobile/baselines/torch/dim/train.py
@@ -12,7 +12,7 @@
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Trains the deep imitative model on expert demostrations."""
"""Trains the deep imitative model on expert demonstrations."""

import os
from typing import Mapping