mirror of
				https://github.com/allenai/olmocr.git
				synced 2025-10-31 10:04:26 +00:00 
			
		
		
		
	Pipeline fixes for OMP_NUM_THREADS
This commit is contained in:
		
							parent
							
								
									b9238b8638
								
							
						
					
					
						commit
						7c98673972
					
				| @ -611,6 +611,9 @@ async def vllm_server_task(model_name_or_path, args, semaphore, unknown_args=Non | |||||||
|         *cmd, |         *cmd, | ||||||
|         stdout=asyncio.subprocess.PIPE, |         stdout=asyncio.subprocess.PIPE, | ||||||
|         stderr=asyncio.subprocess.PIPE, |         stderr=asyncio.subprocess.PIPE, | ||||||
|  | 
 | ||||||
|  |         # OMP_NUM_THREADS needs to be 1, otherwise you could have contention if you are running multiple copies of olmOCR on a machine with several GPUS | ||||||
|  |         env={**os.environ, "OMP_NUM_THREADS": "1"},  | ||||||
|     ) |     ) | ||||||
| 
 | 
 | ||||||
|     # Ensure the subprocess is terminated on exit |     # Ensure the subprocess is terminated on exit | ||||||
| @ -643,7 +646,7 @@ async def vllm_server_task(model_name_or_path, args, semaphore, unknown_args=Non | |||||||
|         if match := re.search(r"Running: (\d+)", line): |         if match := re.search(r"Running: (\d+)", line): | ||||||
|             current_running = int(match.group(1)) |             current_running = int(match.group(1)) | ||||||
|             # Check for negative derivative (decrease in running requests), to not overload VLLM |             # Check for negative derivative (decrease in running requests), to not overload VLLM | ||||||
|             if current_running < last_running_req: |             if current_running < last_running_req and not running_reqs_decreased: | ||||||
|                 running_reqs_decreased = True |                 running_reqs_decreased = True | ||||||
|                 logger.info(f"Running requests decreased: {last_running_req} -> {current_running}") |                 logger.info(f"Running requests decreased: {last_running_req} -> {current_running}") | ||||||
|             last_running_req = current_running |             last_running_req = current_running | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user
	 Jake Poznanski
						Jake Poznanski