You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
parser.add_argument("--gpu-memory-utilization", type=float, help="Fraction of VRAM vLLM may pre-allocate for KV-cache ""(passed through to vllm serve).")
1019
-
parser.add_argument("--max_model_len", type=int, help="Upper bound (tokens) vLLM will allocate KV-cache for; ""passed through to vllm serve as --max-model-len.",)
1022
+
parser.add_argument(
1023
+
"--max_model_len",
1024
+
type=int,
1025
+
help="Upper bound (tokens) vLLM will allocate KV-cache for; ""passed through to vllm serve as --max-model-len.",
1026
+
)
1020
1027
1021
1028
parser.add_argument("--model_max_context", type=int, default="8192", help="Maximum context length that the model was fine tuned under")
1022
1029
parser.add_argument("--target_longest_image_dim", type=int, help="Dimension on longest side to use for rendering the pdf pages", default=1288)
@@ -1041,7 +1048,7 @@ async def main():
1041
1048
logger.info(
1042
1049
"If you run out of GPU memory during start-up or get 'KV cache is larger than available memory' errors, retry with lower values, e.g. --gpu_memory_utilization 0.80 --max_model_len 16384"
1043
1050
)
1044
-
1051
+
1045
1052
global workspace_s3, pdf_s3
1046
1053
# set the global BASE_SERVER_PORT from args
1047
1054
global BASE_SERVER_PORT
@@ -1227,12 +1234,12 @@ async def main():
1227
1234
1228
1235
# Output finished_on_attempt statistics
1229
1236
logger.info("\nPages finished by attempt number:")
f"Attached is one page of a document that you must process. "
113
-
f"Just return the plain text representation of this document as if you were reading it naturally. Convert equations to LateX and tables to markdown.\n"
114
-
f"Return your output as markdown, with a front matter section on top specifying values for the primary_language, is_rotation_valid, rotation_correction, is_table, and is_diagram parameters."
112
+
"Attached is one page of a document that you must process. "
113
+
"Just return the plain text representation of this document as if you were reading it naturally. Convert equations to LateX and tables to markdown.\n"
114
+
"Return your output as markdown, with a front matter section on top specifying values for the primary_language, is_rotation_valid, rotation_correction, is_table, and is_diagram parameters."
0 commit comments