Skip to content

Commit afb3a20

Browse files
Try to allocate more GPU memory
Signed-off-by: ChenTaoyu-SJTU <[email protected]>
1 parent 488aaba commit afb3a20

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

benchmarks/scripts/run_accuracy.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@
7373

7474
def run_accuracy_unimodal(queue, model, dataset):
7575
try:
76-
model_args = f"pretrained={model},max_model_len=4096,dtype=auto,tensor_parallel_size=2,gpu_memory_utilization=0.6"
76+
model_args = f"pretrained={model},max_model_len=4096,dtype=auto,tensor_parallel_size=2,gpu_memory_utilization=0.85"
7777
results = lm_eval.simple_evaluate(
7878
model="vllm",
7979
model_args=model_args,

0 commit comments

Comments
 (0)