diff --git a/appendix-E/01_main-chapter-code/appendix-E.ipynb b/appendix-E/01_main-chapter-code/appendix-E.ipynb index 70464c1..24080c9 100644 --- a/appendix-E/01_main-chapter-code/appendix-E.ipynb +++ b/appendix-E/01_main-chapter-code/appendix-E.ipynb @@ -207,9 +207,8 @@ "\n", "try:\n", " download_and_unzip_spam_data(url, zip_path, extracted_path, data_file_path)\n", - "except urllib.error.HTTPError:\n", - " print(\"UCI Machine Learning Repository (https://archive.ics.uci.edu)\"\n", - " \" temporary unavailable. Using backup URL.\")\n", + "except (urllib.error.HTTPError, urllib.error.URLError, TimeoutError) as e:\n", + " print(f\"Primary URL failed: {e}. Trying backup URL...\")\n", " url = \"https://f001.backblazeb2.com/file/LLMs-from-scratch/sms%2Bspam%2Bcollection.zip\"\n", " download_and_unzip_spam_data(url, zip_path, extracted_path, data_file_path)\n", "\n", diff --git a/ch06/01_main-chapter-code/ch06.ipynb b/ch06/01_main-chapter-code/ch06.ipynb index 9e14ce6..669e75d 100644 --- a/ch06/01_main-chapter-code/ch06.ipynb +++ b/ch06/01_main-chapter-code/ch06.ipynb @@ -217,9 +217,8 @@ "\n", "try:\n", " download_and_unzip_spam_data(url, zip_path, extracted_path, data_file_path)\n", - "except urllib.error.HTTPError:\n", - " print(\"UCI Machine Learning Repository (https://archive.ics.uci.edu)\"\n", - " \" temporary unavailable. Using backup URL.\")\n", + "except (urllib.error.HTTPError, urllib.error.URLError, TimeoutError) as e:\n", + " print(f\"Primary URL failed: {e}. Trying backup URL...\")\n", " url = \"https://f001.backblazeb2.com/file/LLMs-from-scratch/sms%2Bspam%2Bcollection.zip\"\n", " download_and_unzip_spam_data(url, zip_path, extracted_path, data_file_path) " ] diff --git a/ch06/01_main-chapter-code/gpt_class_finetune.py b/ch06/01_main-chapter-code/gpt_class_finetune.py index 0f17d4b..8e925dd 100644 --- a/ch06/01_main-chapter-code/gpt_class_finetune.py +++ b/ch06/01_main-chapter-code/gpt_class_finetune.py @@ -280,7 +280,8 @@ if __name__ == "__main__": download_and_unzip_spam_data( url, zip_path, extracted_path, data_file_path, test_mode=args.test_mode ) - except urllib.error.HTTPError: + except (urllib.error.HTTPError, urllib.error.URLError, TimeoutError) as e: + print(f"Primary URL failed: {e}. Trying backup URL...") backup_url = "https://f001.backblazeb2.com/file/LLMs-from-scratch/sms%2Bspam%2Bcollection.zip" download_and_unzip_spam_data( backup_url, zip_path, extracted_path, data_file_path, test_mode=args.test_mode diff --git a/ch06/02_bonus_additional-experiments/additional_experiments.py b/ch06/02_bonus_additional-experiments/additional_experiments.py index 28c3c09..a85b932 100644 --- a/ch06/02_bonus_additional-experiments/additional_experiments.py +++ b/ch06/02_bonus_additional-experiments/additional_experiments.py @@ -605,7 +605,8 @@ if __name__ == "__main__": if not all_exist: try: download_and_unzip(url, zip_path, extract_to, new_file_path) - except urllib.error.HTTPError: + except (urllib.error.HTTPError, urllib.error.URLError, TimeoutError) as e: + print(f"Primary URL failed: {e}. Trying backup URL...") backup_url = "https://f001.backblazeb2.com/file/LLMs-from-scratch/sms%2Bspam%2Bcollection.zip" download_and_unzip(backup_url, zip_path, extract_to, new_file_path) create_dataset_csvs(new_file_path) diff --git a/ch06/03_bonus_imdb-classification/train_bert_hf_spam.py b/ch06/03_bonus_imdb-classification/train_bert_hf_spam.py index 603fb1c..72fbd1a 100644 --- a/ch06/03_bonus_imdb-classification/train_bert_hf_spam.py +++ b/ch06/03_bonus_imdb-classification/train_bert_hf_spam.py @@ -412,7 +412,8 @@ if __name__ == "__main__": if not all_exist: try: download_and_unzip(url, zip_path, extract_to, new_file_path) - except urllib.error.HTTPError: + except (urllib.error.HTTPError, urllib.error.URLError, TimeoutError) as e: + print(f"Primary URL failed: {e}. Trying backup URL...") backup_url = "https://f001.backblazeb2.com/file/LLMs-from-scratch/sms%2Bspam%2Bcollection.zip" download_and_unzip(backup_url, zip_path, extract_to, new_file_path) create_dataset_csvs(new_file_path)