mirror of
https://github.com/allenai/olmocr.git
synced 2025-06-27 04:00:02 +00:00
added dtype functionality
This commit is contained in:
parent
c8a5361d1b
commit
316d0af1cd
@ -574,6 +574,7 @@ async def vllm_server_task(model_name_or_path, args, semaphore):
|
||||
"--disable-log-requests",
|
||||
"--uvicorn-log-level", "warning",
|
||||
"--served-model-name", "Qwen/Qwen2-VL-7B-Instruct",
|
||||
"--dtype", args.dtype,
|
||||
]
|
||||
cmd.extend(mem_fraction_arg)
|
||||
|
||||
@ -986,6 +987,7 @@ async def main():
|
||||
help="List of paths where you can find the model to convert this pdf. You can specify several different paths here, and the script will try to use the one which is fastest to access",
|
||||
default="allenai/olmOCR-7B-0225-preview",
|
||||
)
|
||||
parser.add_argument("--dtype", type=str, default="bfloat16", help="Data type for model weights")
|
||||
parser.add_argument("--model_max_context", type=int, default="8192", help="Maximum context length that the model was fine tuned under")
|
||||
parser.add_argument("--model_chat_template", type=str, default="qwen2-vl", help="Chat template to pass to vllm server")
|
||||
parser.add_argument("--target_longest_image_dim", type=int, help="Dimension on longest side to use for rendering the pdf pages", default=1024)
|
||||
|
Loading…
x
Reference in New Issue
Block a user