Fix: move model to device before calculating loss
@@ -425,6 +425,7 @@
"\n",
"torch.manual_seed(123)\n",
"model = GPTModel(GPT_CONFIG_124M)\n",
+ "model.to(device)\n",
"loss = calc_loss_batch(input_batch, target_batch, model, device)\n",
"loss.backward()"