mirror of
https://github.com/tcsenpai/agenticSeek.git
synced 2025-06-06 11:05:26 +00:00
server gpu percentage for vllm
This commit is contained in:
parent
9a1b2b93f6
commit
ed2a9cc204
@ -51,6 +51,7 @@ class Vllm(GeneratorLLM):
|
|||||||
sampling_params = SamplingParams(
|
sampling_params = SamplingParams(
|
||||||
temperature=0.7,
|
temperature=0.7,
|
||||||
max_tokens=512,
|
max_tokens=512,
|
||||||
|
gpu_memory_utilization=0.5,
|
||||||
stream=True # Enable streaming
|
stream=True # Enable streaming
|
||||||
)
|
)
|
||||||
outputs = self.llm.generate(prompt, sampling_params, use_tqdm=False)
|
outputs = self.llm.generate(prompt, sampling_params, use_tqdm=False)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user