# hive-apps/projects/ai/values/localai.yaml

# Replica count handed to the chart; a single instance is configured.
replicaCount: 1

# Deployment settings: main container image, its `env` map, the models path,
# the helper images and the image pull behaviour.
deployment:
  image: quay.io/go-skynet/local-ai:master-ffmpeg-core
  # Active settings. Presumably rendered as container environment variables by
  # the chart -- confirm against the chart templates.
  env:
    threads: 16
    context_size: 2048
    DEBUG: "true"

    # The commented-out examples below are written in dotenv form (KEY=value).
    # To enable one, add it to this map in YAML form instead (KEY: "value").

    ## Specify a different bind address (defaults to ":8080")
    # ADDRESS=127.0.0.1:8080

    ## Define galleries.
    ## Models available to install will be visible in `/models/available`
    #GALLERIES=[{"name":"model-gallery", "url":"github:go-skynet/model-gallery/index.yaml"}, {"url": "github:go-skynet/model-gallery/huggingface.yaml","name":"huggingface"}]

    ## Default path for models
    #MODELS_PATH=/models

    ## Enable debug mode (already set above via `DEBUG: "true"`)
    #DEBUG=true

    ## Disables COMPEL (Lets Stable Diffuser work, uncomment if you plan on using it)
    # COMPEL=0

    ## Enable/Disable single backend (useful if only one GPU is available)
    # SINGLE_ACTIVE_BACKEND=true

    ## Specify a build type. Available: cublas, openblas, clblas.
    #BUILD_TYPE=cublas

    ## Uncomment and set to true to enable rebuilding from source
    # REBUILD=true

    ## Enable go tags, available: stablediffusion, tts
    ## stablediffusion: image generation with stablediffusion
    ## tts: enables text-to-speech with go-piper
    ## (requires REBUILD=true)
    #
    #GO_TAGS=tts

    ## Path where to store generated images
    # IMAGE_PATH=/tmp

    ## Specify a default upload limit in MB (whisper)
    # UPLOAD_LIMIT

    # HUGGINGFACEHUB_API_TOKEN=Token here

  modelsPath: "/models"
  download_model:
    # To use a cloud-provided image (e.g. from AWS), specify it like: 1234356789.dkr.ecr.us-REGION-X.amazonaws.com/busybox
    image: busybox
  prompt_templates:
    # To use a cloud-provided image (e.g. from AWS), specify it like: 1234356789.dkr.ecr.us-REGION-X.amazonaws.com/busybox
    image: busybox
  # NOTE(review): the top-level `image.pullPolicy` at the end of this file is
  # IfNotPresent -- confirm which of the two keys the chart actually reads.
  pullPolicy: Always
  # No pull secrets configured; add entries in the form shown below.
  imagePullSecrets: []
    # - name: secret-names
    # - name: secret-names

# Resource constraints: only a memory limit is set here; no CPU limit and no
# requests are defined in this file.
resources:
  limits:
    memory: 64Gi

# Prompt templates, keyed by file name: each key of this map becomes the name
# of a prompt template file. The map is intentionally empty.
#
# Example entry:
#
#   ggml-gpt4all-j.tmpl: |
#     The prompt below is a question to answer, a task to complete, or a conversation to respond to; decide which and write an appropriate response.
#     ### Prompt:
#     {{.Input}}
#     ### Response:
promptTemplates: {}

# Models fetched at runtime, plus the storage they are kept on.
models:
  # When true, models are downloaded again even if they already exist.
  forceDownload: false

  # Download sources, one entry per model.
  # The file name at the end of each URL becomes the name of the loaded model.
  list:
    - url: 'https://gpt4all.io/models/ggml-gpt4all-j.bin'
      # Optional credentials for the download:
      # basicAuth: base64EncodedCredentials

  # Persistent volume claim settings: 100Gi, ReadWriteOnce, storage class "ssd".
  persistence:
    pvc:
      enabled: true
      size: 100Gi
      accessModes:
        - ReadWriteOnce
      storageClass: 'ssd'

# Service settings: type ClusterIP, port 80.
service:
  type: ClusterIP
  port: 80

# Ingress for host `ai.dc`, using the "ingress-internal" class.
ingress:
  enabled: true
  className: "ingress-internal"
  annotations:
    # Issuer referenced for the certificate stored in the TLS secret below.
    cert-manager.io/cluster-issuer: vault-issuer
    # Request body size setting for the nginx ingress, set to 100m.
    nginx.ingress.kubernetes.io/proxy-body-size: 100m
  hosts:
    - host: ai.dc
      paths:
        - path: /
          pathType: ImplementationSpecific
  # TLS for the same host; the certificate lives in the `localai-tls` secret.
  tls:
    - secretName: localai-tls
      hosts:
        - ai.dc

# Top-level image settings; only the pull policy is set here.
# NOTE(review): `deployment.pullPolicy` earlier in this file is Always, which
# disagrees with this value -- confirm which key the chart reads and align them.
image:
  pullPolicy: IfNotPresent
add: localai stuff 2023-12-25 20:46:48 +00:00			`replicaCount: 1`

			`deployment:`
fix(localai): threads 2023-12-27 11:35:17 +00:00			`image: quay.io/go-skynet/local-ai:master-ffmpeg-core`
add: localai stuff 2023-12-25 20:46:48 +00:00			`env:`
fix(localai): threads 2023-12-27 11:35:17 +00:00			`threads: 16`
feat(localai): increased chunks to 2048 2023-12-28 11:21:22 +00:00			`context_size: 2048`
add: localai stuff 2023-12-25 20:46:48 +00:00			`DEBUG: "true"`
add(localai): default env values for later usage 2023-12-26 06:09:54 +00:00
			`## Specify a different bind address (defaults to ":8080")`
			`# ADDRESS=127.0.0.1:8080`

			`## Define galleries.`
			## models will to install will be visible in `/models/available`
			`#GALLERIES=[{"name":"model-gallery", "url":"github:go-skynet/model-gallery/index.yaml"}, {"url": "github:go-skynet/model-gallery/huggingface.yaml","name":"huggingface"}]`

			`## Default path for models`
			`#MODELS_PATH=/models`

			`## Enable debug mode`
			`#DEBUG=true`

			`## Disables COMPEL (Lets Stable Diffuser work, uncomment if you plan on using it)`
			`# COMPEL=0`

			`## Enable/Disable single backend (useful if only one GPU is available)`
			`# SINGLE_ACTIVE_BACKEND=true`

			`## Specify a build type. Available: cublas, openblas, clblas.`
			`#BUILD_TYPE=cublas`

			`## Uncomment and set to true to enable rebuilding from source`
			`# REBUILD=true`

			`## Enable go tags, available: stablediffusion, tts`
			`## stablediffusion: image generation with stablediffusion`
			`## tts: enables text-to-speech with go-piper`
			`## (requires REBUILD=true)`
			`#`
			`#GO_TAGS=tts`

			`## Path where to store generated images`
			`# IMAGE_PATH=/tmp`

			`## Specify a default upload limit in MB (whisper)`
			`# UPLOAD_LIMIT`

			`# HUGGINGFACEHUB_API_TOKEN=Token here`

add: localai stuff 2023-12-25 20:46:48 +00:00			`modelsPath: "/models"`
			`download_model:`
			`# To use cloud provided (eg AWS) image, provide it like: 1234356789.dkr.ecr.us-REGION-X.amazonaws.com/busybox`
			`image: busybox`
			`prompt_templates:`
			`# To use cloud provided (eg AWS) image, provide it like: 1234356789.dkr.ecr.us-REGION-X.amazonaws.com/busybox`
			`image: busybox`
			`pullPolicy: Always`
			`imagePullSecrets: []`
			`# - name: secret-names`

fix(localai): threads 2023-12-27 11:35:17 +00:00			`resources:`
			`limits:`
			`memory: 64Gi`

add: localai stuff 2023-12-25 20:46:48 +00:00			`# Note: the keys of this map will be the names of the prompt template files`
			`promptTemplates:`
			`{}`
			`# ggml-gpt4all-j.tmpl: \|`
			`# The prompt below is a question to answer, a task to complete, or a conversation to respond to; decide which and write an appropriate response.`
			`# ### Prompt:`
			`# {{.Input}}`
			`# ### Response:`

			`# Models to download at runtime`
			`models:`
			`# Whether to force download models even if they already exist`
			`forceDownload: false`

			`# The list of URLs to download models from`
			`# Note: the name of the file will be the name of the loaded model`
			`list:`
			`- url: "https://gpt4all.io/models/ggml-gpt4all-j.bin"`
			`# basicAuth: base64EncodedCredentials`

			`persistence:`
			`pvc:`
			`enabled: true`
fix(localai): pvc storage class ssd 2023-12-26 10:11:36 +00:00			`size: 100Gi`
add: localai stuff 2023-12-25 20:46:48 +00:00			`accessModes:`
			`- ReadWriteOnce`
fix(localai): pvc storage class ssd 2023-12-26 10:11:36 +00:00			`storageClass: "ssd"`
add: localai stuff 2023-12-25 20:46:48 +00:00
			`service:`
			`type: ClusterIP`
			`port: 80`

			`ingress:`
			`enabled: true`
			`className: "ingress-internal"`
			`annotations:`
			`cert-manager.io/cluster-issuer: vault-issuer`
fix(localai): nginx body size 2023-12-28 21:01:23 +00:00			`nginx.ingress.kubernetes.io/proxy-body-size: 100m`
add: localai stuff 2023-12-25 20:46:48 +00:00			`hosts:`
			`- host: ai.dc`
			`paths:`
			`- path: /`
			`pathType: ImplementationSpecific`
			`tls:`
			`- secretName: localai-tls`
			`hosts:`
			`- ai.dc`

			`image:`
			`pullPolicy: IfNotPresent`