mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2025-11-15 01:24:48 +00:00
cosmetics
This commit is contained in:
parent
244593ce01
commit
3328b29521
@ -312,10 +312,10 @@ def load_weights_into_gpt(gpt, params):
|
|||||||
|
|
||||||
def text_to_token_ids(text, tokenizer):
|
def text_to_token_ids(text, tokenizer):
|
||||||
encoded = tokenizer.encode(text, allowed_special={'<|endoftext|>'})
|
encoded = tokenizer.encode(text, allowed_special={'<|endoftext|>'})
|
||||||
encoded_tensor = torch.tensor(encoded).unsqueeze(0) # add batch dimension
|
encoded_tensor = torch.tensor(encoded).unsqueeze(0) # add batch dimension
|
||||||
return encoded_tensor
|
return encoded_tensor
|
||||||
|
|
||||||
|
|
||||||
def token_ids_to_text(token_ids, tokenizer):
|
def token_ids_to_text(token_ids, tokenizer):
|
||||||
flat = token_ids.squeeze(0) # remove batch dimension
|
flat = token_ids.squeeze(0) # remove batch dimension
|
||||||
return tokenizer.decode(flat.tolist())
|
return tokenizer.decode(flat.tolist())
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user