cosmetics

This commit is contained in:
Sebastian Raschka 2024-05-05 08:15:46 -05:00 committed by GitHub
parent 244593ce01
commit 3328b29521

View File

@@ -312,10 +312,10 @@ def load_weights_into_gpt(gpt, params):
def text_to_token_ids(text, tokenizer):
    """Encode *text* into a batched tensor of token ids.

    Args:
        text: The string to tokenize.
        tokenizer: Any object exposing ``encode(text, allowed_special=...)``
            that returns a sequence of integer token ids.

    Returns:
        An integer tensor with a leading batch dimension of size 1,
        i.e. shape ``(1, num_tokens)``.
    """
    # '<|endoftext|>' is passed as an allowed special token so the tokenizer
    # accepts it when it appears literally in the input text.
    encoded = tokenizer.encode(text, allowed_special={'<|endoftext|>'})
    # Pin the dtype: torch.tensor([]) would otherwise default to float32,
    # which is not a valid token-id dtype for an empty encoding.
    encoded_tensor = torch.tensor(encoded, dtype=torch.long).unsqueeze(0)  # add batch dimension
    return encoded_tensor
def token_ids_to_text(token_ids, tokenizer):
    """Decode a batched tensor of token ids back into text.

    Args:
        token_ids: A tensor of token ids; a leading dimension of size 1
            (the batch dimension) is dropped before decoding.
        tokenizer: Any object exposing ``decode(list_of_ids)``.

    Returns:
        Whatever ``tokenizer.decode`` returns for the flattened id list
        (presumably the decoded string).
    """
    flat = token_ids.squeeze(0)  # remove batch dimension
    return tokenizer.decode(flat.tolist())