mirror of
				https://github.com/allenai/olmocr.git
				synced 2025-10-31 10:04:26 +00:00 
			
		
		
		
	Stop everything on a Nan
This commit is contained in:
		
							parent
							
								
									eac3b10c3f
								
							
						
					
					
						commit
						2f1664f3d7
					
				| @ -532,6 +532,10 @@ async def sglang_server_task(args, semaphore): | |||||||
|         nonlocal last_running_req, last_queue_req, can_release_automatically, last_semaphore_release |         nonlocal last_running_req, last_queue_req, can_release_automatically, last_semaphore_release | ||||||
|         sglang_logger.info(line) |         sglang_logger.info(line) | ||||||
| 
 | 
 | ||||||
|  |         if "Detected errors during sampling" in line: | ||||||
|  |             logger.error("Cannot continue, sampling errors detected, model is probably corrupt") | ||||||
|  |             sys.exit(1) | ||||||
|  | 
 | ||||||
|         match = re.search(r'#running-req: (\d+)', line) |         match = re.search(r'#running-req: (\d+)', line) | ||||||
|         if match: |         if match: | ||||||
|             last_running_req = int(match.group(1)) |             last_running_req = int(match.group(1)) | ||||||
| @ -721,7 +725,7 @@ async def main(): | |||||||
|     # Beaker/job running stuff |     # Beaker/job running stuff | ||||||
|     parser.add_argument('--beaker', action='store_true', help='Submit this job to beaker instead of running locally') |     parser.add_argument('--beaker', action='store_true', help='Submit this job to beaker instead of running locally') | ||||||
|     parser.add_argument('--beaker_workspace', help='Beaker workspace to submit to', default='ai2/pdelfin') |     parser.add_argument('--beaker_workspace', help='Beaker workspace to submit to', default='ai2/pdelfin') | ||||||
|     parser.add_argument('--beaker_cluster', help='Beaker clusters you want to run on', default=["ai2/jupiter-cirrascale-2", "ai2/pluto-cirrascale", "ai2/saturn-cirrascale"]) |     parser.add_argument('--beaker_cluster', help='Beaker clusters you want to run on', default=["ai2/jupiter-cirrascale-2", "ai2/pluto-cirrascale", "ai2/saturn-cirrascale", "ai2/augusta-google-1"]) | ||||||
|     parser.add_argument('--beaker_gpus', type=int, default=1, help="Number of gpu replicas to run") |     parser.add_argument('--beaker_gpus', type=int, default=1, help="Number of gpu replicas to run") | ||||||
|     parser.add_argument('--beaker_priority', type=str, default="normal", help="Beaker priority level for the job") |     parser.add_argument('--beaker_priority', type=str, default="normal", help="Beaker priority level for the job") | ||||||
|     args = parser.parse_args() |     args = parser.parse_args() | ||||||
|  | |||||||
| @ -2,7 +2,7 @@ _MAJOR = "0" | |||||||
| _MINOR = "1" | _MINOR = "1" | ||||||
| # On main and in a nightly release the patch should be one ahead of the last | # On main and in a nightly release the patch should be one ahead of the last | ||||||
| # released build. | # released build. | ||||||
| _PATCH = "23" | _PATCH = "24" | ||||||
| # This is mainly for nightly builds which have the suffix ".dev$DATE". See | # This is mainly for nightly builds which have the suffix ".dev$DATE". See | ||||||
| # https://semver.org/#is-v123-a-semantic-version for the semantics. | # https://semver.org/#is-v123-a-semantic-version for the semantics. | ||||||
| _SUFFIX = "" | _SUFFIX = "" | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user
	 Jake Poznanski
						Jake Poznanski