From b8adf2f68be001d3c20e97972762c8828f4f47a7 Mon Sep 17 00:00:00 2001 From: GooeyTuxedo Date: Thu, 13 Apr 2023 10:27:14 -0700 Subject: [PATCH] initial commit --- .helmignore | 23 +++++++ Chart.yaml | 30 +++++++++ LICENSE | 7 ++ README.md | 74 ++++++++++++++++++++++ templates/NOTES.txt | 22 +++++++ templates/_helpers.tpl | 62 ++++++++++++++++++ templates/datadb-pvc.yml | 10 +++ templates/hpa.yaml | 28 ++++++++ templates/ingress.yaml | 61 ++++++++++++++++++ templates/service.yaml | 15 +++++ templates/serviceaccount.yaml | 12 ++++ templates/statefulset.yaml | 76 ++++++++++++++++++++++ templates/tests/test-connection.yaml | 15 +++++ templates/weights-pvc.yml | 10 +++ values.yaml | 95 ++++++++++++++++++++++++++++ 15 files changed, 540 insertions(+) create mode 100644 .helmignore create mode 100644 Chart.yaml create mode 100644 LICENSE create mode 100644 README.md create mode 100644 templates/NOTES.txt create mode 100644 templates/_helpers.tpl create mode 100644 templates/datadb-pvc.yml create mode 100644 templates/hpa.yaml create mode 100644 templates/ingress.yaml create mode 100644 templates/service.yaml create mode 100644 templates/serviceaccount.yaml create mode 100644 templates/statefulset.yaml create mode 100644 templates/tests/test-connection.yaml create mode 100644 templates/weights-pvc.yml create mode 100644 values.yaml diff --git a/.helmignore b/.helmignore new file mode 100644 index 0000000..0e8a0eb --- /dev/null +++ b/.helmignore @@ -0,0 +1,23 @@ +# Patterns to ignore when building packages. +# This supports shell glob matching, relative path matching, and +# negation (prefixed with !). Only one pattern per line. 
+.DS_Store +# Common VCS dirs +.git/ +.gitignore +.bzr/ +.bzrignore +.hg/ +.hgignore +.svn/ +# Common backup files +*.swp +*.bak +*.tmp +*.orig +*~ +# Various IDEs +.project +.idea/ +*.tmproj +.vscode/ diff --git a/Chart.yaml b/Chart.yaml new file mode 100644 index 0000000..34b89f8 --- /dev/null +++ b/Chart.yaml @@ -0,0 +1,30 @@ +apiVersion: v2 +name: serge +description: A Helm chart for Serge - LLaMA UI / API + +# A chart can be either an 'application' or a 'library' chart. +# +# Application charts are a collection of templates that can be packaged into versioned archives +# to be deployed. +# +# Library charts provide useful utilities or functions for the chart developer. They're included as +# a dependency of application charts to inject those utilities and functions into the rendering +# pipeline. Library charts do not define any templates and therefore cannot be deployed. +type: application + +# This is the chart version. This version number should be incremented each time you make changes +# to the chart and its templates, including the app version. +# Versions are expected to follow Semantic Versioning (https://semver.org/) +version: 0.0.2 + +# This is the version number of the application being deployed. This version number should be +# incremented each time you make changes to the application. Versions are not expected to +# follow Semantic Versioning. They should reflect the version the application is using. +# It is recommended to use it with quotes. 
+appVersion: "0.0.4" + +icon: https://ipfs.io/ipfs/QmTt3523vesZhDXmtTBUWqoHZAow4SUSipsXahDK6MvHzr?filename=AI_cool_llama.png + +maintainers: + - name: MrTuxedo + email: dev@based.consulting \ No newline at end of file diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..4ecae4f --- /dev/null +++ b/LICENSE @@ -0,0 +1,7 @@ +Copyright © 2023 MrTuxedo: dev@based.consulting + +Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..6bbb718 --- /dev/null +++ b/README.md @@ -0,0 +1,74 @@ +# Serge AI Helm Chart + +This Helm chart deploys a LLaMA based chat interface named Serge. 
+https://github.com/nsarrazin/serge + +## Prerequisites + +- Kubernetes 1.12+ or OpenShift 3.11+ +- Helm 3+ + +## Installing the Chart + +To install the chart with the release name `serge-ai`: + +Enable Helm OCI support (only needed on Helm versions older than 3.8.0; newer versions enable it by default) +```sh +export HELM_EXPERIMENTAL_OCI=1 +``` + +Install the chart +```sh +helm install serge-ai oci://registry-1.docker.io/mrtuxedo/serge +``` + +See the [configuration](#configuration) section for information on how to customize the installation. + +## Uninstalling the Chart + +To uninstall the chart with the release name serge-ai, run: + +```sh +helm uninstall serge-ai +``` + +## Configuration + +The following table lists the configurable parameters of the chart and their default values. For more information, see the values.yaml file. + +|Parameter |Description |Default| +|--- | --- | --- | +|image.tag|Target branch for Serge |release| +|environment.timezone |Timezone Identifier for deployment| Europe/Amsterdam| +|persistence.datadb.size|Volume size for chat history storage|16Gi| +|persistence.weights.size|Volume size for model weights storage|64Gi| + +To use the latest serge image instead of the last release, you'll want to set `image.tag` to `latest`/`main`. + +To override any of the default values, create a YAML file with your desired overrides and pass it to the helm install command using the --values flag. For example: + +```sh +helm install serge-ai oci://registry-1.docker.io/mrtuxedo/serge --values my-values.yaml +``` + +For more information on configuring the chart, see the values.yaml file and the official Helm documentation. + +## Contributing + +Thank you for considering contributing to this Helm chart! Pull requests and bug reports are always welcome. + +Before submitting a pull request, please ensure that: + + - Your changes are well-tested and conform to the Helm chart best practices and conventions. + - Your changes are clearly documented in the pull request description and/or the chart's README.md file. 
+ - You have run the `helm lint` and `helm template` commands to validate your chart and ensure that it can be rendered correctly. + +For major changes, please open an issue first to discuss your proposed changes. + +Please note that this project is released with a Contributor Code of Conduct. By participating in this project, you agree to abide by its terms. + +For more information on contributing to Helm charts, see the official Helm documentation. + +### License + +[LICENSE](./LICENSE) diff --git a/templates/NOTES.txt b/templates/NOTES.txt new file mode 100644 index 0000000..0666dd3 --- /dev/null +++ b/templates/NOTES.txt @@ -0,0 +1,22 @@ +1. Get the application URL by running these commands: +{{- if .Values.ingress.enabled }} +{{- range $host := .Values.ingress.hosts }} + {{- range .paths }} + http{{ if $.Values.ingress.tls }}s{{ end }}://{{ $host.host }}{{ .path }} + {{- end }} +{{- end }} +{{- else if contains "NodePort" .Values.service.type }} + export NODE_PORT=$(kubectl get --namespace {{ .Release.Namespace }} -o jsonpath="{.spec.ports[0].nodePort}" services {{ include "serge-ai.fullname" . }}) + export NODE_IP=$(kubectl get nodes --namespace {{ .Release.Namespace }} -o jsonpath="{.items[0].status.addresses[0].address}") + echo http://$NODE_IP:$NODE_PORT +{{- else if contains "LoadBalancer" .Values.service.type }} + NOTE: It may take a few minutes for the LoadBalancer IP to be available. + You can watch its status by running 'kubectl get --namespace {{ .Release.Namespace }} svc -w {{ include "serge-ai.fullname" . }}' + export SERVICE_IP=$(kubectl get svc --namespace {{ .Release.Namespace }} {{ include "serge-ai.fullname" . }} --template "{{"{{ range (index .status.loadBalancer.ingress 0) }}{{.}}{{ end }}"}}") + echo http://$SERVICE_IP:{{ .Values.service.port }} +{{- else if contains "ClusterIP" .Values.service.type }} + export POD_NAME=$(kubectl get pods --namespace {{ .Release.Namespace }} -l "app.kubernetes.io/name={{ include "serge-ai.name" . 
}},app.kubernetes.io/instance={{ .Release.Name }}" -o jsonpath="{.items[0].metadata.name}") + export CONTAINER_PORT=$(kubectl get pod --namespace {{ .Release.Namespace }} $POD_NAME -o jsonpath="{.spec.containers[0].ports[0].containerPort}") + echo "Visit http://127.0.0.1:8080 to use your application" + kubectl --namespace {{ .Release.Namespace }} port-forward $POD_NAME 8080:$CONTAINER_PORT +{{- end }} diff --git a/templates/_helpers.tpl b/templates/_helpers.tpl new file mode 100644 index 0000000..caf244a --- /dev/null +++ b/templates/_helpers.tpl @@ -0,0 +1,62 @@ +{{/* +Expand the name of the chart. +*/}} +{{- define "serge-ai.name" -}} +{{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{/* +Create a default fully qualified app name. +We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). +If release name contains chart name it will be used as a full name. +*/}} +{{- define "serge-ai.fullname" -}} +{{- if .Values.fullnameOverride }} +{{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- $name := default .Chart.Name .Values.nameOverride }} +{{- if contains $name .Release.Name }} +{{- .Release.Name | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" }} +{{- end }} +{{- end }} +{{- end }} + +{{/* +Create chart name and version as used by the chart label. +*/}} +{{- define "serge-ai.chart" -}} +{{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{/* +Common labels +*/}} +{{- define "serge-ai.labels" -}} +helm.sh/chart: {{ include "serge-ai.chart" . }} +{{ include "serge-ai.selectorLabels" . 
}} +{{- if .Chart.AppVersion }} +app.kubernetes.io/version: {{ .Chart.AppVersion | quote }} +{{- end }} +app.kubernetes.io/managed-by: {{ .Release.Service }} +{{- end }} + +{{/* +Selector labels +*/}} +{{- define "serge-ai.selectorLabels" -}} +app.kubernetes.io/name: {{ include "serge-ai.name" . }} +app.kubernetes.io/instance: {{ .Release.Name }} +{{- end }} + +{{/* +Create the name of the service account to use +*/}} +{{- define "serge-ai.serviceAccountName" -}} +{{- if .Values.serviceAccount.create }} +{{- default (include "serge-ai.fullname" .) .Values.serviceAccount.name }} +{{- else }} +{{- default "default" .Values.serviceAccount.name }} +{{- end }} +{{- end }} diff --git a/templates/datadb-pvc.yml b/templates/datadb-pvc.yml new file mode 100644 index 0000000..f37ff8b --- /dev/null +++ b/templates/datadb-pvc.yml @@ -0,0 +1,10 @@ +apiVersion: v1 +kind: PersistentVolumeClaim +metadata: + name: serge-datadb +spec: + accessModes: + - {{ .Values.persistence.datadb.accessMode }} + resources: + requests: + storage: {{ .Values.persistence.datadb.size }} diff --git a/templates/hpa.yaml b/templates/hpa.yaml new file mode 100644 index 0000000..f16dbaa --- /dev/null +++ b/templates/hpa.yaml @@ -0,0 +1,28 @@ +{{- if .Values.autoscaling.enabled }} +apiVersion: autoscaling/v2beta1 +kind: HorizontalPodAutoscaler +metadata: + name: {{ include "serge-ai.fullname" . }} + labels: + {{- include "serge-ai.labels" . | nindent 4 }} +spec: + scaleTargetRef: + apiVersion: apps/v1 + kind: StatefulSet # must match the workload kind created by templates/statefulset.yaml (this chart ships no Deployment) + name: {{ include "serge-ai.fullname" . 
}} + minReplicas: {{ .Values.autoscaling.minReplicas }} + maxReplicas: {{ .Values.autoscaling.maxReplicas }} + metrics: + {{- if .Values.autoscaling.targetCPUUtilizationPercentage }} + - type: Resource + resource: + name: cpu + targetAverageUtilization: {{ .Values.autoscaling.targetCPUUtilizationPercentage }} + {{- end }} + {{- if .Values.autoscaling.targetMemoryUtilizationPercentage }} + - type: Resource + resource: + name: memory + targetAverageUtilization: {{ .Values.autoscaling.targetMemoryUtilizationPercentage }} + {{- end }} +{{- end }} diff --git a/templates/ingress.yaml b/templates/ingress.yaml new file mode 100644 index 0000000..6a143ac --- /dev/null +++ b/templates/ingress.yaml @@ -0,0 +1,61 @@ +{{- if .Values.ingress.enabled -}} +{{- $fullName := include "serge-ai.fullname" . -}} +{{- $svcPort := .Values.service.port -}} +{{- if and .Values.ingress.className (not (semverCompare ">=1.18-0" .Capabilities.KubeVersion.GitVersion)) }} + {{- if not (hasKey .Values.ingress.annotations "kubernetes.io/ingress.class") }} + {{- $_ := set .Values.ingress.annotations "kubernetes.io/ingress.class" .Values.ingress.className}} + {{- end }} +{{- end }} +{{- if semverCompare ">=1.19-0" .Capabilities.KubeVersion.GitVersion -}} +apiVersion: networking.k8s.io/v1 +{{- else if semverCompare ">=1.14-0" .Capabilities.KubeVersion.GitVersion -}} +apiVersion: networking.k8s.io/v1beta1 +{{- else -}} +apiVersion: extensions/v1beta1 +{{- end }} +kind: Ingress +metadata: + name: {{ $fullName }} + labels: + {{- include "serge-ai.labels" . | nindent 4 }} + {{- with .Values.ingress.annotations }} + annotations: + {{- toYaml . | nindent 4 }} + {{- end }} +spec: + {{- if and .Values.ingress.className (semverCompare ">=1.18-0" .Capabilities.KubeVersion.GitVersion) }} + ingressClassName: {{ .Values.ingress.className }} + {{- end }} + {{- if .Values.ingress.tls }} + tls: + {{- range .Values.ingress.tls }} + - hosts: + {{- range .hosts }} + - {{ . 
| quote }} + {{- end }} + secretName: {{ .secretName }} + {{- end }} + {{- end }} + rules: + {{- range .Values.ingress.hosts }} + - host: {{ .host | quote }} + http: + paths: + {{- range .paths }} + - path: {{ .path }} + {{- if and .pathType (semverCompare ">=1.18-0" $.Capabilities.KubeVersion.GitVersion) }} + pathType: {{ .pathType }} + {{- end }} + backend: + {{- if semverCompare ">=1.19-0" $.Capabilities.KubeVersion.GitVersion }} + service: + name: {{ $fullName }} + port: + number: {{ $svcPort }} + {{- else }} + serviceName: {{ $fullName }} + servicePort: {{ $svcPort }} + {{- end }} + {{- end }} + {{- end }} +{{- end }} diff --git a/templates/service.yaml b/templates/service.yaml new file mode 100644 index 0000000..d003a88 --- /dev/null +++ b/templates/service.yaml @@ -0,0 +1,15 @@ +apiVersion: v1 +kind: Service +metadata: + name: {{ include "serge-ai.fullname" . }} + labels: + {{- include "serge-ai.labels" . | nindent 4 }} +spec: + type: {{ .Values.service.type }} + ports: + - port: {{ .Values.service.port }} + targetPort: http + protocol: TCP + name: http + selector: + {{- include "serge-ai.selectorLabels" . | nindent 4 }} diff --git a/templates/serviceaccount.yaml b/templates/serviceaccount.yaml new file mode 100644 index 0000000..c2f37fa --- /dev/null +++ b/templates/serviceaccount.yaml @@ -0,0 +1,12 @@ +{{- if .Values.serviceAccount.create -}} +apiVersion: v1 +kind: ServiceAccount +metadata: + name: {{ include "serge-ai.serviceAccountName" . }} + labels: + {{- include "serge-ai.labels" . | nindent 4 }} + {{- with .Values.serviceAccount.annotations }} + annotations: + {{- toYaml . | nindent 4 }} + {{- end }} +{{- end }} diff --git a/templates/statefulset.yaml b/templates/statefulset.yaml new file mode 100644 index 0000000..ac897c9 --- /dev/null +++ b/templates/statefulset.yaml @@ -0,0 +1,76 @@ +apiVersion: apps/v1 +kind: StatefulSet +metadata: + name: {{ include "serge-ai.fullname" . }} + labels: + {{- include "serge-ai.labels" . 
| nindent 4 }} +spec: + {{- if not .Values.autoscaling.enabled }} + replicas: {{ .Values.replicaCount }} + {{- end }} + selector: + matchLabels: + {{- include "serge-ai.selectorLabels" . | nindent 6 }} + template: + metadata: + {{- with .Values.podAnnotations }} + annotations: + {{- toYaml . | nindent 8 }} + {{- end }} + labels: + {{- include "serge-ai.selectorLabels" . | nindent 8 }} + spec: + {{- with .Values.imagePullSecrets }} + imagePullSecrets: + {{- toYaml . | nindent 8 }} + {{- end }} + serviceAccountName: {{ include "serge-ai.serviceAccountName" . }} + securityContext: + {{- toYaml .Values.podSecurityContext | nindent 8 }} + containers: + - name: {{ .Chart.Name }} + securityContext: + {{- toYaml .Values.securityContext | nindent 12 }} + image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}" + imagePullPolicy: {{ .Values.image.pullPolicy }} + env: + - name: TZ + value: {{ .Values.environment.timezone | quote }} # quoted so the env value always renders as a YAML string + ports: + - name: http + containerPort: {{ .Values.service.port }} + protocol: TCP + livenessProbe: + httpGet: + path: / + port: http + readinessProbe: + httpGet: + path: / + port: http + resources: + {{- toYaml .Values.resources | nindent 12 }} + volumeMounts: + - name: datadb + mountPath: /data/db + - name: weights + mountPath: /usr/src/app/weights + volumes: + - name: datadb + persistentVolumeClaim: + claimName: serge-datadb + - name: weights + persistentVolumeClaim: + claimName: serge-weights + {{- with .Values.nodeSelector }} + nodeSelector: + {{- toYaml . | nindent 8 }} + {{- end }} + {{- with .Values.affinity }} + affinity: + {{- toYaml . | nindent 8 }} + {{- end }} + {{- with .Values.tolerations }} + tolerations: + {{- toYaml . 
| nindent 8 }} + {{- end }} diff --git a/templates/tests/test-connection.yaml b/templates/tests/test-connection.yaml new file mode 100644 index 0000000..69b9d87 --- /dev/null +++ b/templates/tests/test-connection.yaml @@ -0,0 +1,15 @@ +apiVersion: v1 +kind: Pod +metadata: + name: "{{ include "serge-ai.fullname" . }}-test-connection" + labels: + {{- include "serge-ai.labels" . | nindent 4 }} + annotations: + "helm.sh/hook": test +spec: + containers: + - name: wget + image: busybox + command: ['wget'] + args: ['{{ include "serge-ai.fullname" . }}:{{ .Values.service.port }}'] + restartPolicy: Never diff --git a/templates/weights-pvc.yml b/templates/weights-pvc.yml new file mode 100644 index 0000000..db1a258 --- /dev/null +++ b/templates/weights-pvc.yml @@ -0,0 +1,10 @@ +apiVersion: v1 +kind: PersistentVolumeClaim +metadata: + name: serge-weights +spec: + accessModes: + - {{ .Values.persistence.weights.accessMode }} + resources: + requests: + storage: {{ .Values.persistence.weights.size }} diff --git a/values.yaml b/values.yaml new file mode 100644 index 0000000..b60e679 --- /dev/null +++ b/values.yaml @@ -0,0 +1,95 @@ +# Default values for serge-ai. +# This is a YAML-formatted file. +# Declare variables to be passed into your templates. + +replicaCount: 1 + +image: + repository: ghcr.io/nsarrazin/serge + pullPolicy: Always + # Overrides the image tag whose default is the chart appVersion. + tag: release + +imagePullSecrets: [] +nameOverride: serge-ai +fullnameOverride: serge-ai-chat + +environment: + timezone: Europe/Amsterdam + +serviceAccount: + # Specifies whether a service account should be created + create: true + # Annotations to add to the service account + annotations: {} + # The name of the service account to use. 
+ # If not set and create is true, a name is generated using the fullname template + name: serge-ai + +podAnnotations: {} + +podSecurityContext: {} + # fsGroup: 2000 + +securityContext: {} + # capabilities: + # drop: + # - ALL + # readOnlyRootFilesystem: true + # runAsNonRoot: true + # runAsUser: 1000 + +service: + type: NodePort + port: 8008 + +ingress: + enabled: false + className: "" + annotations: {} + # kubernetes.io/ingress.class: nginx + # kubernetes.io/tls-acme: "true" + hosts: + - host: chat.serge.local + paths: + - path: / + pathType: ImplementationSpecific + tls: [] + # - secretName: serge-tls + # hosts: + # - chat.serge.local + +## Persistence section - these are required for Serge +persistence: + datadb: + accessMode: ReadWriteOnce + size: 16Gi + weights: + accessMode: ReadWriteOnce + size: 64Gi + + +resources: {} + # We usually recommend not to specify default resources and to leave this as a conscious + # choice for the user. This also increases chances charts run on environments with little + # resources, such as Minikube. If you do want to specify resources, uncomment the following + # lines, adjust them as necessary, and remove the curly braces after 'resources:'. + # limits: + # cpu: 100m + # memory: 128Mi + # requests: + # cpu: 100m + # memory: 128Mi + +autoscaling: + enabled: false + minReplicas: 1 + maxReplicas: 100 + targetCPUUtilizationPercentage: 80 + # targetMemoryUtilizationPercentage: 80 + +nodeSelector: {} + +tolerations: [] + +affinity: {}