Skip to content

Commit

Permalink
Add fixme
Browse files Browse the repository at this point in the history
  • Loading branch information
jeejeelee committed Oct 22, 2024
1 parent 07c415d commit e59c8e4
Showing 1 changed file with 11 additions and 9 deletions.
20 changes: 11 additions & 9 deletions tests/lora/test_long_context.py
Original file line number Diff line number Diff line change
Expand Up @@ -108,15 +108,17 @@ def lora_llm(long_context_infos):
for info in long_context_infos.values()
]

llm = vllm.LLM("meta-llama/Llama-2-13b-chat-hf",
enable_lora=True,
max_num_seqs=16,
max_loras=2,
long_lora_scaling_factors=tuple(scaling_factors),
max_num_batched_tokens=4096 * 8,
tensor_parallel_size=4,
disable_async_output_proc=True,
distributed_executor_backend="mp")
llm = vllm.LLM(
"meta-llama/Llama-2-13b-chat-hf",
enable_lora=True,
max_num_seqs=16,
max_loras=2,
long_lora_scaling_factors=tuple(scaling_factors),
max_num_batched_tokens=4096 * 8,
tensor_parallel_size=4,
# FIXME enable async output processor
disable_async_output_proc=True,
distributed_executor_backend="mp")
yield llm
del llm

Expand Down

0 comments on commit e59c8e4

Please sign in to comment.