Commit 53bcc538 authored by Wes Brown

Fix shuffling and use provided context size on CLI.

parent 6c1a2d67
@@ -263,6 +263,7 @@ train_config = {
     "amp": args.amp,
     "loss_scale": args.loss_scale,
     "eval_every": args.eval_every,
+    "context_size": args.context_size,
 }
 torch.manual_seed(train_config["seed"])
 bs = train_config["bs"]
@@ -303,13 +304,14 @@ else:
 # TODO: Add load, add evals, add FP16 AMP, and Data Parallel, outputting hidden
 # states from the get_logits function.
 print(opt.curr_step)
-train_dataset = dataset.ShardedDataset(2049, train_config["data_path"])
+train_dataset = dataset.ShardedDataset(train_config["context_size"],
+                                       train_config["data_path"])
 if last_cp:
     train_dataset.skip = opt.curr_step * bs * gas
 train_loader = data.DataLoader(train_dataset,
                                batch_size=bs * gas,
-                               shuffle=False,
+                               shuffle=True,
                                num_workers=0)
 wandb.init(project="hypernetwork-tests",
            name=train_config["run_name"],
...
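
The second hunk assumes the script's CLI already exposes a --context_size flag; its definition sits outside this diff. A minimal, hypothetical argparse sketch consistent with the change might look like the following, where the flag name and default are assumptions (2049 presumably being a 2048-token context plus one extra token for shifted next-token targets):

import argparse

parser = argparse.ArgumentParser()
# Hypothetical flag assumed by this commit; the default mirrors the
# previously hard-coded 2049 (presumably 2048 context tokens plus one
# extra token for the shifted next-token targets).
parser.add_argument("--context_size", type=int, default=2049,
                    help="Sequence length passed to ShardedDataset.")
args = parser.parse_args()

One interaction worth noting: the resume path keeps train_dataset.skip = opt.curr_step * bs * gas (completed steps times batch size times what is presumably the gradient-accumulation count), which only skips the exact samples consumed before the checkpoint if the shuffled order is reproducible across runs; here that rests on the torch.manual_seed(train_config["seed"]) call earlier in the script, since DataLoader's default random sampler seeds itself from the global torch RNG when no explicit generator is supplied.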