mirror of
https://github.com/nold360/hive-apps
synced 2025-01-03 12:11:16 +00:00
feat(localai): single backend
This commit is contained in:
parent
9d65db50c3
commit
346b6acadb
1 changed file with 7 additions and 2 deletions
|
@@ -8,9 +8,14 @@ deployment:
|
||||||
runtimeClassName: nvidia
|
runtimeClassName: nvidia
|
||||||
|
|
||||||
env:
|
env:
|
||||||
# threads: 16
|
threads: 16
|
||||||
context_size: 2048
|
context_size: 4096
|
||||||
DEBUG: "true"
|
DEBUG: "true"
|
||||||
|
#
|
||||||
|
SINGLE_ACTIVE_BACKEND: "true"
|
||||||
|
PYTHON_GRPC_MAX_WORKERS: "1"
|
||||||
|
LLAMACPP_PARALLEL: "1"
|
||||||
|
PARALLEL_REQUESTS: "false"
|
||||||
|
|
||||||
## Specify a different bind address (defaults to ":8080")
|
## Specify a different bind address (defaults to ":8080")
|
||||||
# ADDRESS=127.0.0.1:8080
|
# ADDRESS=127.0.0.1:8080
|
||||||
|
|
Loading…
Reference in a new issue