mirror of
https://github.com/allenai/olmocr.git
synced 2025-11-03 03:25:22 +00:00
Hopefully a cleaner pipeline
This commit is contained in:
parent
b4c5913772
commit
ce32ceb83f
@ -669,6 +669,10 @@ async def vllm_server_task(model_name_or_path, args, semaphore):
|
||||
except asyncio.CancelledError:
|
||||
logger.info("Got cancellation request for VLLM server")
|
||||
proc.terminate()
|
||||
try:
|
||||
await asyncio.wait_for(proc.wait(), timeout=10.0)
|
||||
except asyncio.TimeoutError:
|
||||
logger.warning("VLLM server did not terminate within 10 seconds")
|
||||
raise
|
||||
|
||||
timeout_task.cancel()
|
||||
@ -1209,6 +1213,9 @@ async def main():
|
||||
vllm_server.cancel()
|
||||
metrics_task.cancel()
|
||||
|
||||
# Wait for cancelled tasks to complete
|
||||
await asyncio.gather(vllm_server, metrics_task, return_exceptions=True)
|
||||
|
||||
# Output final metrics summary
|
||||
metrics_summary = metrics.get_metrics_summary()
|
||||
logger.info("=" * 80)
|
||||
@ -1233,7 +1240,8 @@ async def main():
|
||||
)
|
||||
|
||||
# Output finished_on_attempt statistics
|
||||
logger.info("\nPages finished by attempt number:")
|
||||
logger.info("")
|
||||
logger.info("Pages finished by attempt number:")
|
||||
total_finished = sum(total_metrics.get(f"finished_on_attempt_{i}", 0) for i in range(args.max_page_retries))
|
||||
cumulative = 0
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user