mirror of
https://github.com/nold360/hive-apps
synced 2024-12-22 13:01:21 +00:00
feat(localai): single backend
This commit is contained in:
parent
9d65db50c3
commit
346b6acadb
1 changed file with 7 additions and 2 deletions
|
@@ -8,9 +8,14 @@ deployment:
|
|||
runtimeClassName: nvidia
|
||||
|
||||
env:
|
||||
# threads: 16
|
||||
context_size: 2048
|
||||
threads: 16
|
||||
context_size: 4096
|
||||
DEBUG: "true"
|
||||
#
|
||||
SINGLE_ACTIVE_BACKEND: "true"
|
||||
PYTHON_GRPC_MAX_WORKERS: "1"
|
||||
LLAMACPP_PARALLEL: "1"
|
||||
PARALLEL_REQUESTS: "false"
|
||||
|
||||
## Specify a different bind address (defaults to ":8080")
|
||||
# ADDRESS=127.0.0.1:8080
|
||||
|
|
Loading…
Reference in a new issue