mirror of
https://github.com/tcsenpai/agenticSeek.git
synced 2025-06-05 02:25:27 +00:00
Server: set GPU memory utilization (gpu_memory_utilization) for vLLM
This commit is contained in:
parent
9a1b2b93f6
commit
ed2a9cc204
@ -51,6 +51,7 @@ class Vllm(GeneratorLLM):
|
||||
sampling_params = SamplingParams(
|
||||
temperature=0.7,
|
||||
max_tokens=512,
|
||||
gpu_memory_utilization=0.5,
|
||||
stream=True # Enable streaming
|
||||
)
|
||||
outputs = self.llm.generate(prompt, sampling_params, use_tqdm=False)
|
||||
|
Loading…
x
Reference in New Issue
Block a user