mirror of
https://github.com/allenai/olmocr.git
synced 2025-12-15 01:03:23 +00:00
Doing some debugging
This commit is contained in:
parent
201fec3ad9
commit
01469af463
@ -20,7 +20,13 @@ def main():
|
|||||||
|
|
||||||
print("Training dataset........")
|
print("Training dataset........")
|
||||||
print(train_dataset)
|
print(train_dataset)
|
||||||
print(train_dataset[0])
|
|
||||||
|
train_example = train_dataset[0]
|
||||||
|
print(train_example)
|
||||||
|
print({(x, y.shape) for x,y in train_example.items()})
|
||||||
|
print("\nTokens")
|
||||||
|
print(processor.tokenizer.batch_decode(train_example["input_ids"]))
|
||||||
|
|
||||||
print("\n\n")
|
print("\n\n")
|
||||||
|
|
||||||
print("Validation dataset........")
|
print("Validation dataset........")
|
||||||
|
|||||||
@ -37,6 +37,7 @@ class MolmoProcessorTest(unittest.TestCase):
|
|||||||
print(inputs)
|
print(inputs)
|
||||||
|
|
||||||
print("\nShapes")
|
print("\nShapes")
|
||||||
|
# {('input_ids', torch.Size([1, 589])), ('images', torch.Size([1, 5, 576, 588])), ('image_masks', torch.Size([1, 5, 576])), ('image_input_idx', torch.Size([1, 5, 144]))}
|
||||||
print({(x, y.shape) for x,y in inputs.items()})
|
print({(x, y.shape) for x,y in inputs.items()})
|
||||||
|
|
||||||
print("\nTokens")
|
print("\nTokens")
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user