Merge pull request #6855 from oobabooga/dev

Merge dev branch
This commit is contained in:
oobabooga 2025-04-19 01:53:11 -03:00 committed by GitHub
commit b1495d52e5
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -250,7 +250,6 @@ class LlamaServer:
 "--ctx-size", str(shared.args.n_ctx),
 "--n-gpu-layers", str(shared.args.n_gpu_layers),
 "--batch-size", str(shared.args.batch_size),
-"--rope-freq-base", str(shared.args.rope_freq_base),
 "--port", str(self.port),
 ]
@@ -276,6 +275,8 @@ class LlamaServer:
 cmd += ["--cache-type-k", shared.args.cache_type, "--cache-type-v", shared.args.cache_type]
 if shared.args.compress_pos_emb != 1:
 cmd += ["--rope-freq-scale", str(1.0 / shared.args.compress_pos_emb)]
+if shared.args.rope_freq_base > 0:
+cmd += ["--rope-freq-base", str(shared.args.rope_freq_base)]
 # Start the server with pipes for output
 self.process = subprocess.Popen(