948 lines
33 KiB
YAML
948 lines
33 KiB
YAML
image:
|
|
# registry where weaviate image is stored
|
|
registry: docker.io
|
|
# Tag of weaviate image to deploy
|
|
# Note: We strongly recommend you overwrite this value in your own values.yaml.
|
|
# Otherwise a mere upgrade of the chart could lead to an unexpected upgrade
|
|
# of weaviate. In accordance with Infra-as-code, you should pin this value
|
|
# down and only change it if you explicitly want to upgrade the Weaviate
|
|
# version.
|
|
tag: 1.18.0
|
|
repo: semitechnologies/weaviate
|
|
|
|
# overwrite command and args if you want to run specific startup scripts, for
|
|
# example setting the nofile limit
|
|
command: ["/bin/weaviate"]
|
|
args:
|
|
- '--host'
|
|
- '0.0.0.0'
|
|
- '--port'
|
|
- '8080'
|
|
- '--scheme'
|
|
- 'http'
|
|
- '--config-file'
|
|
- '/weaviate-config/conf.yaml'
|
|
- --read-timeout=60s
|
|
- --write-timeout=60s
|
|
|
|
# below is an example that can be used to set an arbitrary nofile limit at
|
|
# startup:
|
|
#
|
|
# command:
|
|
# - "/bin/sh"
|
|
# args:
|
|
# - "-c"
|
|
# - "ulimit -n 65535 && /bin/weaviate --host 0.0.0.0 --port 8080 --scheme http --config-file /weaviate-config/conf.yaml"
|
|
|
|
# Scale replicas of Weaviate. Note that as of v1.8.0 dynamic scaling is limited
|
|
# to cases where no data is imported yet. Scaling down after importing data may
|
|
# break usability. Full dynamic scalability will be added in a future release.
|
|
replicas: 1
|
|
resources: {}
|
|
# requests:
|
|
# cpu: '500m'
|
|
# memory: '300Mi'
|
|
# limits:
|
|
# cpu: '1000m'
|
|
# memory: '1Gi'
|
|
|
|
|
|
# Add a service account ot the Weaviate pods if you need Weaviate to have permissions to
|
|
# access kubernetes resources or cloud provider resources. For example for it to have
|
|
# access to a backup up bucket, or if you want to restrict Weaviate pod in any way.
|
|
# By default, use the default ServiceAccount
|
|
serviceAccountName:
|
|
|
|
# The Persistent Volume Claim settings for Weaviate. If there's a
|
|
# storage.fullnameOverride field set, then the default pvc will not be
|
|
# created, instead the one defined in fullnameOverride will be used
|
|
storage:
|
|
size: 32Gi
|
|
storageClassName: ""
|
|
|
|
# The service controls how weaviate is exposed to the outside world. If you
|
|
# don't want a public load balancer, you can also choose 'ClusterIP' to make
|
|
# weaviate only accessible within your cluster.
|
|
service:
|
|
name: weaviate
|
|
ports:
|
|
- name: http
|
|
protocol: TCP
|
|
port: 80
|
|
# Target port is going to be the same for every port
|
|
type: LoadBalancer
|
|
loadBalancerSourceRanges: []
|
|
# optionally set cluster IP if you want to set a static IP
|
|
clusterIP:
|
|
annotations: {}
|
|
|
|
# Adjust liveness, readiness and startup probes configuration
|
|
startupProbe:
|
|
# For kubernetes versions prior to 1.18 startupProbe is not supported thus can be disabled.
|
|
enabled: false
|
|
|
|
initialDelaySeconds: 300
|
|
periodSeconds: 60
|
|
failureThreshold: 50
|
|
successThreshold: 1
|
|
timeoutSeconds: 3
|
|
|
|
livenessProbe:
|
|
initialDelaySeconds: 900
|
|
periodSeconds: 10
|
|
failureThreshold: 30
|
|
successThreshold: 1
|
|
timeoutSeconds: 3
|
|
|
|
readinessProbe:
|
|
initialDelaySeconds: 3
|
|
periodSeconds: 10
|
|
failureThreshold: 3
|
|
successThreshold: 1
|
|
timeoutSeconds: 3
|
|
|
|
|
|
terminationGracePeriodSeconds: 600
|
|
|
|
# Weaviate Config
|
|
#
|
|
# The following settings allow you to customize Weaviate to your needs, for
|
|
# example set authentication and authorization options. See weaviate docs
|
|
# (https://www.weaviate.io/developers/weaviate/) for all
|
|
# configuration.
|
|
authentication:
|
|
anonymous_access:
|
|
enabled: true
|
|
authorization:
|
|
admin_list:
|
|
enabled: false
|
|
query_defaults:
|
|
limit: 100
|
|
debug: false
|
|
|
|
|
|
# Insert any custom environment variables or envSecrets by putting the exact name
|
|
# and desired value into the settings below. Any env name passed will be automatically
|
|
# set for the statefulSet.
|
|
env:
|
|
CLUSTER_GOSSIP_BIND_PORT: 7000
|
|
CLUSTER_DATA_BIND_PORT: 7001
|
|
# The aggressiveness of the Go Garbage Collector. 100 is the default value.
|
|
GOGC: 100
|
|
|
|
# Expose metrics on port 2112 for Prometheus to scrape
|
|
PROMETHEUS_MONITORING_ENABLED: false
|
|
|
|
# Set a MEM limit for the Weaviate Pod so it can help you both increase GC-related
|
|
# performance as well as avoid GC-related out-of-memory (“OOM”) situations
|
|
# GOMEMLIMIT: 6GiB
|
|
|
|
# Maximum results Weaviate can query with/without pagination
|
|
# NOTE: Affects performance, do NOT set to a very high value.
|
|
# The default is 100K
|
|
QUERY_MAXIMUM_RESULTS: 100000
|
|
|
|
# whether to enable vector dimensions tracking metric
|
|
TRACK_VECTOR_DIMENSIONS: false
|
|
|
|
# whether to re-index/-compute the vector dimensions metric (needed if upgrading from weaviate < v1.16.0)
|
|
REINDEX_VECTOR_DIMENSIONS_AT_STARTUP: false
|
|
|
|
envSecrets:
|
|
|
|
|
|
# Configure backup providers
|
|
backups:
|
|
# The backup-filesystem module enables creation of the DB backups in
|
|
# the local filesystem
|
|
filesystem:
|
|
enabled: false
|
|
envconfig:
|
|
# Configure folder where backups should be saved
|
|
BACKUP_FILESYSTEM_PATH: /tmp/backups
|
|
|
|
s3:
|
|
enabled: false
|
|
# If one is using AWS EKS and has already configured K8s Service Account
|
|
# that holds the AWS credentials one can pass a name of that service account
|
|
# here using this setting.
|
|
# NOTE: the root `serviceAccountName` config has priority over this one, and
|
|
# if the root one is set this one will NOT overwrite it. This one is here for
|
|
# backwards compatibility.
|
|
serviceAccountName:
|
|
|
|
envconfig:
|
|
# Configure bucket where backups should be saved, this setting is mandatory
|
|
BACKUP_S3_BUCKET: weaviate-backups
|
|
|
|
# Optional setting. Defaults to empty string.
|
|
# Set this option if you want to save backups to a given location
|
|
# inside the bucket
|
|
# BACKUP_S3_PATH: path/inside/bucket
|
|
|
|
# Optional setting. Defaults to AWS S3 (s3.amazonaws.com).
|
|
# Set this option if you have a MinIO storage configured in your environment
|
|
# and want to use it instead of the AWS S3.
|
|
# BACKUP_S3_ENDPOINT: custom.minio.endpoint.address
|
|
|
|
# Optional setting. Defaults to true.
|
|
# Set this option if you don't want to use SSL.
|
|
# BACKUP_S3_USE_SSL: true
|
|
|
|
# You can pass environment AWS settings here:
|
|
# Define the region
|
|
# AWS_REGION: eu-west-1
|
|
|
|
# For Weaviate to be able to create bucket objects it needs a user credentials to authenticate to AWS.
|
|
# The User must have permissions to read/create/delete bucket objects.
|
|
# You can pass the User credentials (access-key id and access-secret-key) in 2 ways:
|
|
# 1. by setting the AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY plain values in the `secrets` section below
|
|
# this chart will create a kubernetes secret for you with these key-values pairs
|
|
# 2. create Kubernetes secret/s with AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY keys and their respective values
|
|
# Set the Key and the secret where it is set in `envSecrets` section below
|
|
secrets: {}
|
|
# AWS_ACCESS_KEY_ID: access-key-id (plain text)
|
|
# AWS_SECRET_ACCESS_KEY: secret-access-key (plain text)
|
|
|
|
# If one has already defined secrets with AWS credentials one can pass them using
|
|
# this setting:
|
|
envSecrets: {}
|
|
# AWS_ACCESS_KEY_ID: name-of-the-k8s-secret-containing-the-key-id
|
|
# AWS_SECRET_ACCESS_KEY: name-of-the-k8s-secret-containing-the-key
|
|
|
|
gcs:
|
|
enabled: false
|
|
envconfig:
|
|
# Configure bucket where backups should be saved, this setting is mandatory
|
|
BACKUP_GCS_BUCKET: weaviate-backups
|
|
|
|
# Optional setting. Defaults to empty string.
|
|
# Set this option if you want to save backups to a given location
|
|
# inside the bucket
|
|
# BACKUP_GCS_PATH: path/inside/bucket
|
|
|
|
# You can pass environment Google settings here:
|
|
# Define the project
|
|
# GOOGLE_CLOUD_PROJECT: project-id
|
|
|
|
# For Weaviate to be able to create bucket objects it needs a ServiceAccount credentials to authenticate to GCP.
|
|
# The ServiceAccount must have permissions to read/create/delete bucket objects.
|
|
# You can pass the ServiceAccount credentials (as JSON) in 2 ways:
|
|
# 1. by setting the GOOGLE_APPLICATION_CREDENTIALS json as plain text in the `secrets` section below
|
|
# this chart will create a kubernetes secret for you with this key-values pairs
|
|
# 2. create a Kubernetes secret with GOOGLE_APPLICATION_CREDENTIALS key and its respective value
|
|
# Set the Key and the secret where it is set in `envSecrets` section below
|
|
secrets: {}
|
|
# GOOGLE_APPLICATION_CREDENTIALS: credentials-json-string
|
|
|
|
# If one has already defined a secret with GOOGLE_APPLICATION_CREDENTIALS one can pass them using
|
|
# this setting:
|
|
envSecrets: {}
|
|
# GOOGLE_APPLICATION_CREDENTIALS: name-of-the-k8s-secret-containing-the-key
|
|
|
|
azure:
|
|
enabled: false
|
|
envconfig:
|
|
# Configure container where backups should be saved, this setting is mandatory
|
|
BACKUP_AZURE_CONTAINER: weaviate-backups
|
|
|
|
# Optional setting. Defaults to empty string.
|
|
# Set this option if you want to save backups to a given location
|
|
# inside the container
|
|
# BACKUP_AZURE_PATH: path/inside/container
|
|
|
|
# For Weaviate to be able to create container objects it needs a user credentials to authenticate to Azure Storage.
|
|
# The User must have permissions to read/create/delete container objects.
|
|
# You can pass the User credentials (account-name id and account-key or connection-string) in 2 ways:
|
|
# 1. by setting the AZURE_STORAGE_ACCOUNT and AZURE_STORAGE_KEY
|
|
# or AZURE_STORAGE_CONNECTION_STRING plain values in the `secrets` section below
|
|
# this chart will create a kubernetes secret for you with these key-values pairs
|
|
# 2. create Kubernetes secret/s with AZURE_STORAGE_ACCOUNT and AZURE_STORAGE_KEY
|
|
# or AZURE_STORAGE_CONNECTION_STRING and their respective values
|
|
# Set the Key and the secret where it is set in `envSecrets` section below
|
|
secrets: {}
|
|
# AZURE_STORAGE_ACCOUNT: account-name (plain text)
|
|
# AZURE_STORAGE_KEY: account-key (plain text)
|
|
# AZURE_STORAGE_CONNECTION_STRING: connection-string (plain text)
|
|
|
|
# If one has already defined secrets with Azure Storage credentials one can pass them using
|
|
# this setting:
|
|
envSecrets: {}
|
|
# AZURE_STORAGE_ACCOUNT: name-of-the-k8s-secret-containing-the-account-name
|
|
# AZURE_STORAGE_KEY: name-of-the-k8s-secret-containing-account-key
|
|
# AZURE_STORAGE_CONNECTION_STRING: name-of-the-k8s-secret-containing-connection-string
|
|
|
|
|
|
# modules are extensions to Weaviate, they can be used to support various
|
|
# ML-models, but also other features unrelated to model inference.
|
|
# An inference/vectorizer module is not required, you can also run without any
|
|
# modules and import your own vectors.
|
|
modules:
|
|
|
|
# The text2vec-contextionary module uses a fastText-based vector-space to
|
|
# derive vector embeddings for your objects. It is very efficient on CPUs,
|
|
# but in some situations it cannot reach the same level of accuracy as
|
|
# transformers-based models.
|
|
text2vec-contextionary:
|
|
# disable if you want to use transformers or import or own vectors
|
|
enabled: false
|
|
|
|
# The configuration below is ignored if enabled==false
|
|
fullnameOverride: contextionary
|
|
tag: en0.16.0-v1.0.2
|
|
repo: semitechnologies/contextionary
|
|
registry: docker.io
|
|
replicas: 1
|
|
envconfig:
|
|
occurrence_weight_linear_factor: 0.75
|
|
neighbor_occurrence_ignore_percentile: 5
|
|
enable_compound_splitting: false
|
|
extensions_storage_mode: weaviate
|
|
resources:
|
|
requests:
|
|
cpu: '500m'
|
|
memory: '500Mi'
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The text2vec-transformers modules uses neural networks, such as BERT,
|
|
# DistilBERT, etc. to dynamically compute vector embeddings based on the
|
|
# sentence's context. It is very slow on CPUs and should run with
|
|
# CUDA-enabled GPUs for optimal performance.
|
|
text2vec-transformers:
|
|
|
|
# enable if you want to use transformers instead of the
|
|
# text2vec-contextionary module
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
# The configuration below is ignored if enabled==false
|
|
|
|
# replace with model of choice, see
|
|
# https://weaviate.io/developers/weaviate/modules/retriever-vectorizer-modules/text2vec-transformers
|
|
# for all supported models or build your own container.
|
|
tag: distilbert-base-uncased
|
|
repo: semitechnologies/transformers-inference
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: transformers-inference
|
|
# Deprecated setting use initialDelaySeconds instead in each probe instead
|
|
# probeInitialDelaySeconds: 120
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
passageQueryServices:
|
|
passage:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
|
|
tag: facebook-dpr-ctx_encoder-single-nq-base
|
|
repo: semitechnologies/transformers-inference
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: transformers-inference-passage
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
query:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
|
|
tag: facebook-dpr-question_encoder-single-nq-base
|
|
repo: semitechnologies/transformers-inference
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: transformers-inference-query
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The text2vec-openai module uses OpenAI Embeddings API
|
|
# to dynamically compute vector embeddings based on the
|
|
# sentence's context.
|
|
# More information about OpenAI Embeddings API can be found here:
|
|
# https://beta.openai.com/docs/guides/embeddings/what-are-embeddings
|
|
text2vec-openai:
|
|
|
|
# enable if you want to use OpenAI module
|
|
enabled: false
|
|
|
|
# Set your OpenAI API Key to be passed to Weaviate pod as
|
|
# an environment variable
|
|
apiKey: ''
|
|
|
|
# The text2vec-huggingface module uses HuggingFace API
|
|
# to dynamically compute vector embeddings based on the
|
|
# sentence's context.
|
|
# More information about HuggingFace API can be found here:
|
|
# https://huggingface.co/docs/api-inference/detailed_parameters#feature-extraction-task
|
|
text2vec-huggingface:
|
|
|
|
# enable if you want to use HuggingFace module
|
|
enabled: false
|
|
|
|
# Set your HuggingFace API Key to be passed to Weaviate pod as
|
|
# an environment variable
|
|
apiKey: ''
|
|
|
|
# The text2vec-cohere module uses Cohere API
|
|
# to dynamically compute vector embeddings based on the
|
|
# sentence's context.
|
|
# More information about Cohere API can be found here: https://docs.cohere.ai/
|
|
text2vec-cohere:
|
|
|
|
# enable if you want to use Cohere module
|
|
enabled: false
|
|
|
|
# Set your Cohere API Key to be passed to Weaviate pod as
|
|
# an environment variable
|
|
apiKey: ''
|
|
|
|
# The ref2vec-centroid module
|
|
ref2vec-centroid:
|
|
|
|
# enable if you want to use Centroid module
|
|
enabled: false
|
|
|
|
# The multi2vec-clip modules uses CLIP transformers to vectorize both images
|
|
# and text in the same vector space. It is typically slow(er) on CPUs and should
|
|
# run with CUDA-enabled GPUs for optimal performance.
|
|
multi2vec-clip:
|
|
|
|
# enable if you want to use transformers instead of the
|
|
# text2vec-contextionary module
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
|
|
# The configuration below is ignored if enabled==false
|
|
|
|
# replace with model of choice, see
|
|
# https://weaviate.io/developers/weaviate/modules/retriever-vectorizer-modules/multi2vec-clip
|
|
# for all supported models or build your own container.
|
|
tag: sentence-transformers-clip-ViT-B-32-multilingual-v1
|
|
repo: semitechnologies/multi2vec-clip
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: clip-inference
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
annotations:
|
|
nodeSelector:
|
|
tolerations:
|
|
|
|
# The qna-transformers module uses neural networks, such as BERT,
|
|
# DistilBERT, to find an aswer in text to a given question
|
|
qna-transformers:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
tag: bert-large-uncased-whole-word-masking-finetuned-squad-34d66b1
|
|
repo: semitechnologies/qna-transformers
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: qna-transformers
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The qna-openai module uses OpenAI Completions API
|
|
# to dynamically answer given questions.
|
|
# More information about OpenAI Completions API can be found here:
|
|
# https://beta.openai.com/docs/api-reference/completions
|
|
qna-openai:
|
|
|
|
# enable if you want to use OpenAI module
|
|
enabled: false
|
|
|
|
# Set your OpenAI API Key to be passed to Weaviate pod as
|
|
# an environment variable
|
|
apiKey: ''
|
|
|
|
# The generative-openai module uses OpenAI Completions API
|
|
# along with text-davinci-003 model to behave as ChatGPT.
|
|
# More information about OpenAI Completions API can be found here:
|
|
# https://beta.openai.com/docs/api-reference/completions
|
|
generative-openai:
|
|
|
|
# enable if you want to use OpenAI module
|
|
enabled: false
|
|
|
|
# Set your OpenAI API Key to be passed to Weaviate pod as
|
|
# an environment variable
|
|
apiKey: ''
|
|
|
|
# The img2vec-neural module uses neural networks, to generate
|
|
# a vector representation of the image
|
|
img2vec-neural:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
tag: resnet50
|
|
repo: semitechnologies/img2vec-pytorch
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: img2vec-neural
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The text-spellcheck module uses spellchecker library to check
|
|
# misspellings in a given text
|
|
text-spellcheck:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
tag: pyspellchecker-en
|
|
repo: semitechnologies/text-spellcheck-model
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: text-spellcheck
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '400m'
|
|
memory: '400Mi'
|
|
limits:
|
|
cpu: '500m'
|
|
memory: '500Mi'
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The ner-transformers module uses spellchecker library to check
|
|
# misspellings in a given text
|
|
ner-transformers:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
tag: dbmdz-bert-large-cased-finetuned-conll03-english-0.0.2
|
|
repo: semitechnologies/ner-transformers
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: ner-transformers
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# The sum-transformers module makes result texts summarizations
|
|
sum-transformers:
|
|
enabled: false
|
|
# You can set directly an inference URL of this module without deploying it with this release.
|
|
# You can do so by setting a value for the `inferenceUrl` here AND by setting the `enable` to `false`
|
|
inferenceUrl: {}
|
|
tag: facebook-bart-large-cnn-1.0.0
|
|
repo: semitechnologies/sum-transformers
|
|
registry: docker.io
|
|
replicas: 1
|
|
fullnameOverride: sum-transformers
|
|
livenessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
timeoutSeconds: 3
|
|
readinessProbe:
|
|
initialDelaySeconds: 120
|
|
periodSeconds: 3
|
|
envconfig:
|
|
# enable for CUDA support. Your K8s cluster needs to be configured
|
|
# accordingly and you need to explicitly set GPU requests & limits below
|
|
enable_cuda: false
|
|
|
|
# only used when cuda is enabled
|
|
nvidia_visible_devices: all
|
|
nvidia_driver_capabilities: compute,utility
|
|
|
|
# only used when cuda is enabled
|
|
ld_library_path: /usr/local/nvidia/lib64
|
|
|
|
resources:
|
|
requests:
|
|
cpu: '1000m'
|
|
memory: '3000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
limits:
|
|
cpu: '1000m'
|
|
memory: '5000Mi'
|
|
|
|
# enable if running with CUDA support
|
|
# nvidia.com/gpu: 1
|
|
|
|
# It is possible to add a ServiceAccount to this module's Pods, it can be
|
|
# used in cases where the module is in a private registry and you want to
|
|
# give access to the registry only to this pod.
|
|
# NOTE: if not set the root `serviceAccountName` config will be used.
|
|
serviceAccountName:
|
|
|
|
# You can guide where the pods are scheduled on a per-module basis,
|
|
# as well as for Weaviate overall. Each module accepts nodeSelector,
|
|
# tolerations, and affinity configuration. If it is set on a per-
|
|
# module basis, this configuration overrides the global config.
|
|
|
|
nodeSelector:
|
|
tolerations:
|
|
affinity:
|
|
|
|
# by choosing the default vectorizer module, you can tell Weaviate to always
|
|
# use this module as the vectorizer if nothing else is specified. Can be
|
|
# overwritten on a per-class basis.
|
|
# set to text2vec-transformers if running with transformers instead
|
|
default_vectorizer_module: none
|
|
|
|
# It is also possible to configure authentication and authorization through a
|
|
# custom configmap The authorization and authentication values defined in
|
|
# values.yaml will be ignored when defining a custom config map.
|
|
custom_config_map:
|
|
enabled: false
|
|
name: 'custom-config'
|
|
|
|
# Pass any annotations to Weaviate pods
|
|
annotations:
|
|
|
|
nodeSelector:
|
|
|
|
tolerations:
|
|
|
|
affinity:
|
|
podAntiAffinity:
|
|
preferredDuringSchedulingIgnoredDuringExecution:
|
|
- weight: 1
|
|
podAffinityTerm:
|
|
topologyKey: "kubernetes.io/hostname"
|
|
labelSelector:
|
|
matchExpressions:
|
|
- key: "app"
|
|
operator: In
|
|
values:
|
|
- weaviate
|