Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							a060f923d3 
							
						 
					 
					
						
						
							
							Merge pull request  #32  from rasbt/hparam  
						
						 
						
						... 
						
						
						
						Add hparam tuning script 
						
						
					 
					
						2024-02-27 08:52:01 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							87a743076d 
							
						 
					 
					
						
						
							
							hparam tuning script  
						
						 
						
						
						
						
					 
					
						2024-02-27 08:51:03 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							f6266c3756 
							
						 
					 
					
						
						
							
							improve code comments  
						
						 
						
						
						
						
					 
					
						2024-02-27 06:40:35 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Rayed Bin Wahed 
							
						 
					 
					
						
						
						
						
							
						
						
							45a10dd823 
							
						 
					 
					
						
						
							
							Add devcontainer starter doc  
						
						 
						
						
						
						
					 
					
						2024-02-27 13:04:06 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Rayed Bin Wahed 
							
						 
					 
					
						
						
						
						
							
						
						
							fa7e659eb3 
							
						 
					 
					
						
						
							
							Add devcontainer  
						
						 
						
						
						
						
					 
					
						2024-02-26 22:29:27 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							78ed2e35bc 
							
						 
					 
					
						
						
							
							Add requirements.txt to main repo  
						
						 
						
						
						
						
					 
					
						2024-02-25 13:32:30 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							3debb2f0df 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-02-25 13:31:32 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							3f186ab072 
							
						 
					 
					
						
						
							
							use .shape instead of .size() for consistency  
						
						 
						
						
						
						
					 
					
						2024-02-25 08:47:25 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							cdcd73ba7f 
							
						 
					 
					
						
						
							
							drop_last=True  
						
						 
						
						
						
						
					 
					
						2024-02-25 07:23:38 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							6243726ab3 
							
						 
					 
					
						
						
							
							rename to dataloader v1  
						
						 
						
						
						
						
					 
					
						2024-02-24 07:48:18 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							4e68649f16 
							
						 
					 
					
						
						
							
							comment update  
						
						 
						
						
						
						
					 
					
						2024-02-24 06:52:17 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							f057156181 
							
						 
					 
					
						
						
							
							use smaller number of tokens to emphasize next token prediction goal  
						
						 
						
						
						
						
					 
					
						2024-02-15 20:09:20 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							557ddfc684 
							
						 
					 
					
						
						
							
							make a new example for shortcut connections  
						
						 
						
						
						
						
					 
					
						2024-02-15 19:34:12 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							250e6306e2 
							
						 
					 
					
						
						
							
							use attn_scores from sec 3.4 instead of 3.3  
						
						 
						
						
						
						
					 
					
						2024-02-14 20:23:59 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							231a854ae7 
							
						 
					 
					
						
						
							
							use less ambiguous var name  
						
						 
						
						
						
						
					 
					
						2024-02-13 07:05:37 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							320f63829f 
							
						 
					 
					
						
						
							
							Merge pull request  #29  from Intelligence-Manifesto/patch-5  
						
						 
						
						... 
						
						
						
						**step 2** 
						
						
					 
					
						2024-02-12 07:34:37 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							6a09e7b03a 
							
						 
					 
					
						
						
							
							**step 2**  
						
						 
						
						... 
						
						
						
						step 2: According to the context, the formatting here should be **step 2**. 
Additionally, it seems that there is a lack of text description for step 1 in this section, as other sections are all labeled with steps 1, 2, 3 in order, clearly indicating the steps. 
						
						
					 
					
						2024-02-12 18:32:28 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							1d6f2c9084 
							
						 
					 
					
						
						
							
							rearrange exercise order  
						
						 
						
						
						
						
					 
					
						2024-02-11 14:46:05 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							79d90d8147 
							
						 
					 
					
						
						
							
							Merge pull request  #28  from rasbt/ch4-exercise-solutions  
						
						 
						
						... 
						
						
						
						Add chapter 4 exercise solutions 
						
						
					 
					
						2024-02-11 11:52:18 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							fe332006de 
							
						 
					 
					
						
						
							
							ch4 exercise solutions  
						
						 
						
						
						
						
					 
					
						2024-02-11 11:51:39 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							103f7826ad 
							
						 
					 
					
						
						
							
							use same iter to make figs consistent  
						
						 
						
						
						
						
					 
					
						2024-02-11 09:12:52 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							352b83d225 
							
						 
					 
					
						
						
							
							make softmax explicit  
						
						 
						
						
						
						
					 
					
						2024-02-11 08:42:21 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							7d86023fc4 
							
						 
					 
					
						
						
							
							make softmax explicit  
						
						 
						
						
						
						
					 
					
						2024-02-11 08:41:45 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							5840b4b5f8 
							
						 
					 
					
						
						
							
							update name of last section  
						
						 
						
						
						
						
					 
					
						2024-02-11 07:35:07 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							e0b6fdbc53 
							
						 
					 
					
						
						
							
							Merge pull request  #27  from Intelligence-Manifesto/patch-4  
						
						 
						
						... 
						
						
						
						12 -> 21 
						
						
					 
					
						2024-02-11 07:31:06 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							1278615c25 
							
						 
					 
					
						
						
							
							12 -> 21  
						
						 
						
						... 
						
						
						
						12 -> 21 
						
						
					 
					
						2024-02-11 14:17:55 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							baa8617921 
							
						 
					 
					
						
						
							
							variable name fix  
						
						 
						
						
						
						
					 
					
						2024-02-10 17:53:54 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							496b52f842 
							
						 
					 
					
						
						
							
							format the other GPT architecture sizes  
						
						 
						
						
						
						
					 
					
						2024-02-10 17:47:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							40477c55b3 
							
						 
					 
					
						
						
							
							add missing ex sol to table  
						
						 
						
						
						
						
					 
					
						2024-02-10 10:13:21 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							10aa2d099d 
							
						 
					 
					
						
						
							
							add print statements for illustration purposes  
						
						 
						
						
						
						
					 
					
						2024-02-10 10:10:14 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							cc459b6b5a 
							
						 
					 
					
						
						
							
							Merge branch 'main' of  https://github.com/rasbt/LLMs-from-scratch  
						
						 
						
						
						
						
					 
					
						2024-02-08 20:17:01 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							5d1d8ce511 
							
						 
					 
					
						
						
							
							add shape information for clarity  
						
						 
						
						
						
						
					 
					
						2024-02-08 20:16:54 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							24d71784e2 
							
						 
					 
					
						
						
							
							Merge pull request  #26  from Intelligence-Manifesto/patch-3  
						
						 
						
						... 
						
						
						
						if -> in 
						
						
					 
					
						2024-02-08 17:19:29 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							a61583e31e 
							
						 
					 
					
						
						
							
							if -> in  
						
						 
						
						... 
						
						
						
						if -> in 
						
						
					 
					
						2024-02-09 04:18:07 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							55ced1d95e 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-02-06 07:38:52 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							3a5fc79b38 
							
						 
					 
					
						
						
							
							add and update readme files  
						
						 
						
						
						
						
					 
					
						2024-02-05 06:51:58 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							2b38b63a7a 
							
						 
					 
					
						
						
							
							move overview up  
						
						 
						
						
						
						
					 
					
						2024-02-04 15:57:03 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							bb50de7210 
							
						 
					 
					
						
						
							
							adjust figure width  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:12:11 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							1653f6953a 
							
						 
					 
					
						
						
							
							adjust figure width  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:09:36 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							f2fe1d0d85 
							
						 
					 
					
						
						
							
							Merge pull request  #24  from rasbt/ch04  
						
						 
						
						... 
						
						
						
						add chapter 4 code 
						
						
					 
					
						2024-02-04 10:06:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							b86cc682f0 
							
						 
					 
					
						
						
							
							update links in readme  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:05:55 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							ec312e581b 
							
						 
					 
					
						
						
							
							add chapter 4 code  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:02:05 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							16b30ccd5c 
							
						 
					 
					
						
						
							
							set stride equal to max len  
						
						 
						
						
						
						
					 
					
						2024-02-03 08:50:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							b9974da94d 
							
						 
					 
					
						
						
							
							Merge pull request  #22  from Intelligence-Manifesto/patch-2  
						
						 
						
						... 
						
						
						
						missing single quotes 
						
						
					 
					
						2024-02-03 08:46:40 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							78ab68b4d3 
							
						 
					 
					
						
						
							
							missing single quotes  
						
						 
						
						... 
						
						
						
						missing single quotes 
						
						
					 
					
						2024-02-03 03:41:31 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							d261abce4c 
							
						 
					 
					
						
						
							
							add forward pass  
						
						 
						
						
						
						
					 
					
						2024-01-31 08:00:19 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							fcb13fd636 
							
						 
					 
					
						
						
							
							add code backbone ch04  
						
						 
						
						
						
						
					 
					
						2024-01-29 08:14:23 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							3002777dd2 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-01-28 18:41:02 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							c4803bb91a 
							
						 
					 
					
						
						
							
							add libmamba  
						
						 
						
						
						
						
					 
					
						2024-01-28 12:47:29 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							22442b7012 
							
						 
					 
					
						
						
							
							use torch.softmax instead of F.softmax  
						
						 
						
						
						
						
					 
					
						2024-01-28 12:25:49 -06:00