Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							69c33abfcc
							
						
					 | 
					
						
						
							
							Trying to keep queue loaded more
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-15 18:44:45 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							7c98673972
							
						
					 | 
					
						
						
							
							Pipeline fixes for OMP_NUM_THREADS
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-15 18:30:00 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							b9238b8638
							
						
					 | 
					
						
						
							
							Fix for floaty amount
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 22:27:26 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							618777c17e
							
						
					 | 
					
						
						
							
							Bump version to v0.3.2 for release
						
						
						
						
						
						
							
 v0.3.2
						
					 | 
					
						2025-08-14 20:58:11 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							5532493ec8
							
						
					 | 
					
						
						
							
							Pipeline should be improved to limit CPU usage on page renders
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 20:57:57 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							3a36ee239d
							
						
					 | 
					
						
						
							
							Cleanup
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 20:13:52 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							a863d04e6e
							
						
					 | 
					
						
						
							
							Cleanup page rendering cpu limits
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 20:11:26 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							482030f286
							
						
					 | 
					
						
						
							
							Script to process batch outputs
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 19:54:29 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							53c0e57e4a
							
						
					 | 
					
						
						
							
							openai batch data writer
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 19:40:36 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							6d2c1a646a
							
						
					 | 
					
						
						
							
							Olmocr mix to batch format
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 18:24:47 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							2049abd8ff
							
						
					 | 
					
						
						
							
							prompt stuff
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 18:08:43 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							807257f43a
							
						
					 | 
					
						
						
							
							Better prompts
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 18:04:47 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							1f50a6b6bd
							
						
					 | 
					
						
						
							
							Trying out some new prompts
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 17:44:56 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							0dd4fe83f4
							
						
					 | 
					
						
						
							
							Bump version to v0.3.1 for release
						
						
						
						
						
						
							
 v0.3.1
						
					 | 
					
						2025-08-14 16:52:35 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							7e8f9e43d8
							
						
					 | 
					
						
						
							
							New version
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:50:49 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							7a36c98e26
							
						
					 | 
					
						
						
							
							Merge branch 'main' into jakep/new_data
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:45:00 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							0a8cd93c0a
							
						
					 | 
					
						
						
							
							Better queue management again
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:37:11 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							38679243d7
							
						
					 | 
					
						
						
							
							Removing extra files
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:17:59 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							dc5c45e144
							
						
					 | 
					
						
						
							
							Deps
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:10:29 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							7b3b93589d
							
						
					 | 
					
						
						
							
							VLLM bump
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:08:45 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							4431b4886f
							
						
					 | 
					
						
						
							
							Better tracking of semaphore release on bigger jobs
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-14 16:05:21 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							4efd3f5d9e
							
						
					 | 
					
						
						
							
							AI2 Internal budgeting
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 22:16:18 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							9f8df232b6
							
						
					 | 
					
						
						
							
							Readme updates
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 22:03:03 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							36ca700669
							
						
					 | 
					
						
						
							
							Bump version to v0.3.0 for release
						
						
						
						
						
						
							
 v0.3.0
						
					 | 
					
						2025-08-13 21:41:30 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							3e5351c028
							
						
					 | 
					
						
						
							
							version bump
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 21:41:22 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
							
							
						
						
						
							
						
						
							894c617ea4
							
						
					 | 
					
						
						
							
							Merge pull request #303 from allenai/jakep/olmocr_v03
						
						
						
						
						
						
						
						olmOCR v.0.3.0 
						
						
							
						
					 | 
					
						2025-08-13 14:39:54 -07:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							463cef7ea2
							
						
					 | 
					
						
						
							
							New default model
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 20:57:15 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							e86267a01c
							
						
					 | 
					
						
						
							
							Making local results directory properly
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 20:40:04 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							11302feb8c
							
						
					 | 
					
						
						
							
							Move open cv2 import only into experimental data loader class
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 20:28:31 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							93411a80a0
							
						
					 | 
					
						
						
							
							Lint fixes
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 20:21:04 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							05330150ad
							
						
					 | 
					
						
						
							
							New work queue code is cleaner
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 20:20:27 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							9a8fa335ae
							
						
					 | 
					
						
						
							
							One more scheme to try
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 18:21:58 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							ffb0c6abc5
							
						
					 | 
					
						
						
							
							Adding some more quant schemes
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 18:00:38 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							b921922f25
							
						
					 | 
					
						
						
							
							Cleaning up some pipeline logs
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-13 17:39:02 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							332a818614
							
						
					 | 
					
						
						
							
							useless config
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-12 17:31:19 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							b873d66dae
							
						
					 | 
					
						
						
							
							resumable
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-12 16:35:21 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							98d457c502
							
						
					 | 
					
						
						
							
							2epoch config fix
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-11 22:21:55 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							b80f48ec38
							
						
					 | 
					
						
						
							
							Needs a safety identifier...
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-11 19:49:12 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							fd5217a8da
							
						
					 | 
					
						
						
							
							Gpt 5 runner
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-07 20:08:28 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							387e7947c4
							
						
					 | 
					
						
						
							
							Another 2 epoch run
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-06 22:39:09 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							2a3c534a84
							
						
					 | 
					
						
						
							
							2 epoch resumable config
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-06 22:38:38 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							c7a533c945
							
						
					 | 
					
						
						
							
							Sorting data loader samples to maintain consistency between runs
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-06 21:46:13 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							2fca448105
							
						
					 | 
					
						
						
							
							Using new budget code
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-06 16:31:08 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							e664dc5f36
							
						
					 | 
					
						
						
							
							typo
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 19:43:11 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							8b8c6bb837
							
						
					 | 
					
						
						
							
							Cleaning up some training requirements installation steps
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 19:42:46 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							c9b8088bc6
							
						
					 | 
					
						
						
							
							Adding some preempt flags
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 18:00:46 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							8b7006d75d
							
						
					 | 
					
						
						
							
							One more thing to try
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 17:38:59 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							51ec1d34b2
							
						
					 | 
					
						
						
							
							Adding a bigger config with augments
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 17:38:00 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							8b595b63ec
							
						
					 | 
					
						
						
							
							Adding a decent augmentations pipeline
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 17:37:02 +00:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Jake Poznanski
							
						 
					 | 
					
						
						
						
						
							
						
						
							7dca33db60
							
						
					 | 
					
						
						
							
							Getting things ready for a bit more augmentation
						
						
						
						
						
						
							
						
					 | 
					
						2025-08-05 16:34:46 +00:00 | 
					
					
						
						
							
							
							
						
					 |