Commit e5c824e

invite students to try
1 parent d223cb2 commit e5c824e

File tree

2 files changed: +5 −1 lines changed


README.md

Lines changed: 2 additions & 0 deletions

````diff
@@ -47,6 +47,8 @@ Then
 $ python train.py
 ```
 
+To record some of your experiments, just invoke `wandb login` first before modifying the training script
+
 ## Citations
 
 ```bibtex
````

train.py

Lines changed: 3 additions & 1 deletion

```diff
@@ -29,7 +29,7 @@
 
 PROJECT_NAME = 'native-sparse-attention'
 RUN_NAME = 'baseline' if not USE_SPARSE_ATTN else 'sparse-attn'
-WANDB_ONLINE = False # turn this on to pipe experiment to cloud
+WANDB_ONLINE = True # turn this on to pipe experiment to cloud
 
 # helpers
 
@@ -153,6 +153,7 @@ def __getitem__(self, index):
 
     (loss / GRAD_ACCUM_EVERY).backward()
 
+    wandb.log(dict(loss = loss.item()), step = i)
     print(f"training loss: {loss.item():.3f}")
 
     torch.nn.utils.clip_grad_norm_(model.parameters(), 0.5)
@@ -166,6 +167,7 @@ def __getitem__(self, index):
    valid_data = next(val_loader)
 
    loss = model(valid_data, return_loss = True)
+   wandb.log(dict(valid_loss = loss.item()), step = i)
    print(f"validation loss: {loss.item():.3f}")
 
    if i % GENERATE_EVERY == 0:
```
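
For context, the `wandb.log` calls added in this diff assume `wandb.init` was already called earlier in the script. A minimal sketch of that pattern follows; the `wandb_mode` helper and the `mode` mapping are illustrative assumptions, not part of this commit — only the `WANDB_ONLINE` toggle and the two `wandb.log` calls appear in the diff above:

```python
# Sketch of how a WANDB_ONLINE toggle typically feeds wandb.init.
# Assumption: this helper is for illustration; the actual wiring in
# train.py is not shown in this diff.
WANDB_ONLINE = True

def wandb_mode(online: bool) -> str:
    # wandb.init accepts mode = 'online' (sync to the cloud) or
    # mode = 'offline' (log locally, sync later with `wandb sync`)
    return 'online' if online else 'offline'

# import wandb
# wandb.init(project = PROJECT_NAME, name = RUN_NAME, mode = wandb_mode(WANDB_ONLINE))
#
# ...then, inside the training loop, as in the diff above:
# wandb.log(dict(loss = loss.item()), step = i)
```

Passing the same `step = i` to both the training and validation `wandb.log` calls keeps the two loss curves aligned on one x-axis in the dashboard.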
