From f03f545a17fb5ebbf0987d9916df9d0a6709eb8f Mon Sep 17 00:00:00 2001 From: rasbt Date: Fri, 1 Nov 2024 16:47:12 -0500 Subject: [PATCH] Note about warm-up steps --- appendix-D/01_main-chapter-code/appendix-D.ipynb | 12 ++++++++++-- 1 file changed, 10 insertions(+), 2 deletions(-) diff --git a/appendix-D/01_main-chapter-code/appendix-D.ipynb b/appendix-D/01_main-chapter-code/appendix-D.ipynb index a157b71..8b28e67 100644 --- a/appendix-D/01_main-chapter-code/appendix-D.ipynb +++ b/appendix-D/01_main-chapter-code/appendix-D.ipynb @@ -203,7 +203,7 @@ "id": "5bf3a8da-abc4-4b80-a5d8-f1cc1c7cc5f3", "metadata": {}, "source": [ - "- Typically, the number of warmup steps is between 0.1% to 10% of the total number of steps\n", + "- Typically, the number of warmup steps is between 0.1% and 20% of the total number of steps\n", "- We can compute the increment as the difference between the `peak_lr` and `initial_lr` divided by the number of warmup steps" ] }, @@ -227,6 +227,14 @@ "print(warmup_steps)" ] }, + { + "cell_type": "markdown", + "id": "4b6bbdc8-0104-459e-a7ed-b08be8578709", + "metadata": {}, + "source": [ + "- Note that the print book accidentally includes a leftover code line, `warmup_steps = 20`, which is not used and can be safely ignored" + ] + }, { "cell_type": "code", "execution_count": 6, @@ -809,7 +817,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.4" + "version": "3.10.6" } }, "nbformat": 4,