rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							250e6306e2 
							
						 
					 
					
						
						
							
							use attn_scores from sec 3.4 instead of 3.3  
						
						 
						
						
						
						
					 
					
						2024-02-14 20:23:59 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							231a854ae7 
							
						 
					 
					
						
						
							
							use less ambiguous var name  
						
						 
						
						
						
						
					 
					
						2024-02-13 07:05:37 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							320f63829f 
							
						 
					 
					
						
						
							
							Merge pull request  #29  from Intelligence-Manifesto/patch-5  
						
						 
						
						... 
						
						
						
						**step 2** 
						
						
					 
					
						2024-02-12 07:34:37 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							6a09e7b03a 
							
						 
					 
					
						
						
							
							**step 2**  
						
						 
						
						... 
						
						
						
						step 2: According to the context, the formatting here should be **step 2**. 
Additionally, it seems that there is a lack of text description for step 1 in this section, as other sections are all labeled with steps 1, 2, 3 in order, clearly indicating the steps. 
						
						
					 
					
						2024-02-12 18:32:28 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							1d6f2c9084 
							
						 
					 
					
						
						
							
							rearrange exercise order  
						
						 
						
						
						
						
					 
					
						2024-02-11 14:46:05 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							79d90d8147 
							
						 
					 
					
						
						
							
							Merge pull request  #28  from rasbt/ch4-exercise-solutions  
						
						 
						
						... 
						
						
						
						Add chapter 4 exercise solutions 
						
						
					 
					
						2024-02-11 11:52:18 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							fe332006de 
							
						 
					 
					
						
						
							
							ch4 exercise solutions  
						
						 
						
						
						
						
					 
					
						2024-02-11 11:51:39 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							103f7826ad 
							
						 
					 
					
						
						
							
							use same iter to make figs consistent  
						
						 
						
						
						
						
					 
					
						2024-02-11 09:12:52 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							352b83d225 
							
						 
					 
					
						
						
							
							make softmax explicit  
						
						 
						
						
						
						
					 
					
						2024-02-11 08:42:21 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							7d86023fc4 
							
						 
					 
					
						
						
							
							make softmax explicit  
						
						 
						
						
						
						
					 
					
						2024-02-11 08:41:45 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							5840b4b5f8 
							
						 
					 
					
						
						
							
							update name of last section  
						
						 
						
						
						
						
					 
					
						2024-02-11 07:35:07 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							e0b6fdbc53 
							
						 
					 
					
						
						
							
							Merge pull request  #27  from Intelligence-Manifesto/patch-4  
						
						 
						
						... 
						
						
						
						12 -> 21 
						
						
					 
					
						2024-02-11 07:31:06 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							1278615c25 
							
						 
					 
					
						
						
							
							12 -> 21  
						
						 
						
						... 
						
						
						
						12 -> 21 
						
						
					 
					
						2024-02-11 14:17:55 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							baa8617921 
							
						 
					 
					
						
						
							
							variable name fix  
						
						 
						
						
						
						
					 
					
						2024-02-10 17:53:54 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							496b52f842 
							
						 
					 
					
						
						
							
							format the other GPT architecture sizes  
						
						 
						
						
						
						
					 
					
						2024-02-10 17:47:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							40477c55b3 
							
						 
					 
					
						
						
							
							add missing ex sol to table  
						
						 
						
						
						
						
					 
					
						2024-02-10 10:13:21 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							10aa2d099d 
							
						 
					 
					
						
						
							
							add print statements for illustration purposes  
						
						 
						
						
						
						
					 
					
						2024-02-10 10:10:14 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							cc459b6b5a 
							
						 
					 
					
						
						
							
							Merge branch 'main' of  https://github.com/rasbt/LLMs-from-scratch  
						
						 
						
						
						
						
					 
					
						2024-02-08 20:17:01 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							5d1d8ce511 
							
						 
					 
					
						
						
							
							add shape information for clarity  
						
						 
						
						
						
						
					 
					
						2024-02-08 20:16:54 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							24d71784e2 
							
						 
					 
					
						
						
							
							Merge pull request  #26  from Intelligence-Manifesto/patch-3  
						
						 
						
						... 
						
						
						
						if -> in 
						
						
					 
					
						2024-02-08 17:19:29 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							a61583e31e 
							
						 
					 
					
						
						
							
							if -> in  
						
						 
						
						... 
						
						
						
						if -> in 
						
						
					 
					
						2024-02-09 04:18:07 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							55ced1d95e 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-02-06 07:38:52 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							3a5fc79b38 
							
						 
					 
					
						
						
							
							add and update readme files  
						
						 
						
						
						
						
					 
					
						2024-02-05 06:51:58 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							2b38b63a7a 
							
						 
					 
					
						
						
							
							move overview up  
						
						 
						
						
						
						
					 
					
						2024-02-04 15:57:03 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							bb50de7210 
							
						 
					 
					
						
						
							
							adjust figure width  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:12:11 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							1653f6953a 
							
						 
					 
					
						
						
							
							adjust figure width  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:09:36 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							f2fe1d0d85 
							
						 
					 
					
						
						
							
							Merge pull request  #24  from rasbt/ch04  
						
						 
						
						... 
						
						
						
						add chapter 4 code 
						
						
					 
					
						2024-02-04 10:06:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							b86cc682f0 
							
						 
					 
					
						
						
							
							update links in readme  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:05:55 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							ec312e581b 
							
						 
					 
					
						
						
							
							add chapter 4 code  
						
						 
						
						
						
						
					 
					
						2024-02-04 10:02:05 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							16b30ccd5c 
							
						 
					 
					
						
						
							
							set stride equal to max len  
						
						 
						
						
						
						
					 
					
						2024-02-03 08:50:56 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							b9974da94d 
							
						 
					 
					
						
						
							
							Merge pull request  #22  from Intelligence-Manifesto/patch-2  
						
						 
						
						... 
						
						
						
						missing single quotes 
						
						
					 
					
						2024-02-03 08:46:40 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							78ab68b4d3 
							
						 
					 
					
						
						
							
							missing single quotes  
						
						 
						
						... 
						
						
						
						missing single quotes 
						
						
					 
					
						2024-02-03 03:41:31 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							d261abce4c 
							
						 
					 
					
						
						
							
							add forward pass  
						
						 
						
						
						
						
					 
					
						2024-01-31 08:00:19 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							fcb13fd636 
							
						 
					 
					
						
						
							
							add code backbone ch04  
						
						 
						
						
						
						
					 
					
						2024-01-29 08:14:23 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							3002777dd2 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-01-28 18:41:02 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							c4803bb91a 
							
						 
					 
					
						
						
							
							add libmamba  
						
						 
						
						
						
						
					 
					
						2024-01-28 12:47:29 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							22442b7012 
							
						 
					 
					
						
						
							
							use torch.softmax instead of F.softmax  
						
						 
						
						
						
						
					 
					
						2024-01-28 12:25:49 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							eb142491b2 
							
						 
					 
					
						
						
							
							Merge pull request  #20  from eltociear/patch-1  
						
						 
						
						... 
						
						
						
						Update bpe_openai_gpt2.py 
						
						
					 
					
						2024-01-28 09:07:49 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Ikko Eltociear Ashimine 
							
						 
					 
					
						
						
						
						
							
						
						
							3a3a4ac1f1 
							
						 
					 
					
						
						
							
							Update bpe_openai_gpt2.py  
						
						 
						
						... 
						
						
						
						signficant -> significant 
						
						
					 
					
						2024-01-28 23:26:23 +09:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							f6e80a376d 
							
						 
					 
					
						
						
							
							Fix link  
						
						 
						
						
						
						
					 
					
						2024-01-26 20:30:20 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							04c113c54f 
							
						 
					 
					
						
						
							
							Merge pull request  #19  from Intelligence-Manifesto/patch-1  
						
						 
						
						... 
						
						
						
						a repetition of the word "by" 
						
						
					 
					
						2024-01-25 17:41:49 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Intelligence-Manifesto 
							
						 
					 
					
						
						
						
						
							
						
						
							004d6a2af9 
							
						 
					 
					
						
						
							
							a repetition of the word "by"  
						
						 
						
						... 
						
						
						
						"The Verdict by by Edith Wharton" contains a repetition of the word "by." The correct form should be "The Verdict by Edith Wharton." 
						
						
					 
					
						2024-01-26 00:43:57 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							0eab244f00 
							
						 
					 
					
						
						
							
							add full toc  
						
						 
						
						
						
						
					 
					
						2024-01-24 07:09:35 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							f27c9e6135 
							
						 
					 
					
						
						
							
							rename create_dataloader to create_dataloader_v1  
						
						 
						
						
						
						
					 
					
						2024-01-24 07:02:05 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							f6896d17ef 
							
						 
					 
					
						
						
							
							image resizing  
						
						 
						
						
						
						
					 
					
						2024-01-21 20:25:34 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							4c45c37c51 
							
						 
					 
					
						
						
							
							Update README.md  
						
						 
						
						
						
						
					 
					
						2024-01-21 20:17:32 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							f2b034df66 
							
						 
					 
					
						
						
							
							Merge pull request  #17  from rasbt/package-install  
						
						 
						
						... 
						
						
						
						additional package installation info 
						
						
					 
					
						2024-01-21 20:16:59 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							fdfa39eb71 
							
						 
					 
					
						
						
							
							additional package installation info  
						
						 
						
						
						
						
					 
					
						2024-01-21 20:16:19 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								rasbt 
							
						 
					 
					
						
						
						
						
							
						
						
							8860e16e05 
							
						 
					 
					
						
						
							
							<|endoftext|> token in dataset v1  
						
						 
						
						
						
						
					 
					
						2024-01-21 12:03:04 -06:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Sebastian Raschka 
							
						 
					 
					
						
						
						
						
							
						
						
							b1923a3075 
							
						 
					 
					
						
						
							
							Fix links  
						
						 
						
						
						
						
					 
					
						2024-01-19 21:00:20 -06:00