mirror of
https://github.com/allenai/olmocr.git
synced 2025-08-18 05:42:28 +00:00
Merge branch 'main' of https://github.com/allenai/pdelfin
This commit is contained in:
commit
aa59d38a5b
@@ -20,7 +20,13 @@ def main():
|
||||
|
||||
print("Training dataset........")
|
||||
print(train_dataset)
|
||||
print(train_dataset[0])
|
||||
|
||||
train_example = train_dataset[0]
|
||||
print(train_example)
|
||||
print({(x, y.shape) for x,y in train_example.items()})
|
||||
print("\nTokens")
|
||||
print(processor.tokenizer.batch_decode(train_example["input_ids"]))
|
||||
|
||||
print("\n\n")
|
||||
|
||||
print("Validation dataset........")
|
||||
|
@@ -37,6 +37,7 @@ class MolmoProcessorTest(unittest.TestCase):
|
||||
print(inputs)
|
||||
|
||||
print("\nShapes")
|
||||
# {('input_ids', torch.Size([1, 589])), ('images', torch.Size([1, 5, 576, 588])), ('image_masks', torch.Size([1, 5, 576])), ('image_input_idx', torch.Size([1, 5, 144]))}
|
||||
print({(x, y.shape) for x,y in inputs.items()})
|
||||
|
||||
print("\nTokens")
|
||||
|
Loading…
x
Reference in New Issue
Block a user