Merge pull request #173 from rasbt/device-setting

Fix device setting
2025-10-03 03:57:46 +00:00 · 2024-05-22 18:59:58 -04:00 · 2024-05-22 18:59:58 -04:00 · 9587b58cf7
commit 9587b58cf7
parent 7a2a157844 86f6c2df43
1 changed file with 1 addition and 5 deletions
--- a/ch06/01_main-chapter-code/gpt-class-finetune.py
+++ b/ch06/01_main-chapter-code/gpt-class-finetune.py
@@ -350,9 +350,7 @@ if __name__ == "__main__":
        }
        model = GPTModel(BASE_CONFIG)
        model.eval()
-
        device = "cpu"
-        model.to(device)

    # Code as it is used in the main chapter
    else:
@@ -380,10 +378,7 @@ if __name__ == "__main__":

        model = GPTModel(BASE_CONFIG)
        load_weights_into_gpt(model, params)
-        model.eval()
-
        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-        model.to(device)

    ########################################
    # Modify and pretrained model
@@ -396,6 +391,7 @@ if __name__ == "__main__":

    num_classes = 2
    model.out_head = torch.nn.Linear(in_features=BASE_CONFIG["emb_dim"], out_features=num_classes)
+    model.to(device)

    for param in model.trf_blocks[-1].parameters():
        param.requires_grad = True