mirror of
				https://github.com/rasbt/LLMs-from-scratch.git
				synced 2025-10-30 17:29:59 +00:00 
			
		
		
		
	Fix incorrect indentation (#536)
This commit is contained in:
		
							parent
							
								
									18dd8ab633
								
							
						
					
					
						commit
						0a5214b804
					
				| @ -382,7 +382,7 @@ | ||||
|   }, | ||||
|   { | ||||
|    "cell_type": "code", | ||||
|    "execution_count": 4, | ||||
|    "execution_count": null, | ||||
|    "id": "3e4a15ec-2667-4f56-b7c1-34e8071b621d", | ||||
|    "metadata": {}, | ||||
|    "outputs": [], | ||||
| @ -499,7 +499,7 @@ | ||||
|     "            if lines and lines[0].startswith(\"#\"):\n", | ||||
|     "                lines = lines[1:]\n", | ||||
|     "\n", | ||||
|     "            for rank, line in enumerate(lines):\n", | ||||
|     "            for line in lines:\n", | ||||
|     "                pair = tuple(line.strip().split())\n", | ||||
|     "                if len(pair) == 2:\n", | ||||
|     "                    token1, token2 = pair\n", | ||||
| @ -511,10 +511,10 @@ | ||||
|     "                            merged_token_id = self.inverse_vocab[merged_token]\n", | ||||
|     "                            self.bpe_merges[(token_id1, token_id2)] = merged_token_id\n", | ||||
|     "                        # print(f\"Loaded merge: '{token1}' + '{token2}' -> '{merged_token}' (ID: {merged_token_id})\")\n", | ||||
|     "                        else:\n", | ||||
|     "                            print(f\"Merged token '{merged_token}' not found in vocab. Skipping.\")\n", | ||||
|     "                    else:\n", | ||||
|     "                        print(f\"Merged token '{merged_token}' not found in vocab. Skipping.\")\n", | ||||
|     "                else:\n", | ||||
|     "                    print(f\"Skipping pair {pair} as one of the tokens is not in the vocabulary.\")\n", | ||||
|     "                        print(f\"Skipping pair {pair} as one of the tokens is not in the vocabulary.\")\n", | ||||
|     "\n", | ||||
|     "    def encode(self, text):\n", | ||||
|     "        \"\"\"\n", | ||||
|  | ||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user
	 Kasen
						Kasen