mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2025-12-03 10:30:50 +00:00
main push to sync github ruleset
This commit is contained in:
parent
8f3e5b024d
commit
1412b139f2
@ -80,7 +80,7 @@ def test_tokenizer_training(imported_module, verdict_file):
|
||||
BPETokenizerSimple = getattr(imported_module, "BPETokenizerSimple", None)
|
||||
tokenizer = BPETokenizerSimple()
|
||||
|
||||
with open(verdict_file, "r", encoding="utf-8") as f: # added ../01_main-chapter-code/
|
||||
with open(verdict_file, "r", encoding="utf-8") as f: # added ../01_main-chapter-code/
|
||||
text = f.read()
|
||||
|
||||
tokenizer.train(text, vocab_size=1000, allowed_special={"<|endoftext|>"})
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user