Skip to content
This repository has been archived by the owner on Feb 15, 2025. It is now read-only.

Commit

Permalink
Merge pull request #50 from defenseunicorns/helm-chart
Browse files Browse the repository at this point in the history
Helm chart
  • Loading branch information
Thomas Runyon authored May 30, 2023
2 parents 53625d6 + 1773e4b commit 5b703ee
Show file tree
Hide file tree
Showing 14 changed files with 1,793 additions and 154 deletions.
Original file line number Diff line number Diff line change
@@ -1,7 +1,10 @@
apiVersion: v1
kind: ConfigMap
metadata:
name: api-model
data:
models.toml: |
{{ if .Values.models.stablelm3b.enabled }}
models.toml: |
{{- if .Values.models.stablelm3b.enabled }}
[stablelm-3b]
[stablelm-3b.metadata]
owned_by = 'Defense Unicorns'
Expand All @@ -11,12 +14,12 @@ data:
url = 'stablelm:50051'
type = 'gRPC'
{{- end -}}
{{- if .Values.models.all_MiniLM_L6_v2.enabled -}}
{{ if .Values.models.all_MiniLM_L6_v2.enabled }}
[text-embedding-ada-002]
[text-embedding-ada-002.metadata]
owned_by = 'Defense Unicorns'
permission = []
description = 'A pretend implementation of ada-0002 tha's actually all-MiniLM-L6-v2'
description = 'A pretend implementation of ada-0002 thats actually all-MiniLM-L6-v2'
[text-embedding-ada-002.network]
url = 'sentence-transformers:50051'
type = 'gRPC'
Expand All @@ -27,9 +30,7 @@ data:
description = ' By default, input text longer than 256 word pieces is truncated.'
[all-MiniLM-L6-v2.network]
url = 'sentence-transformers:50051'
type = 'gRPC'
{{- end -}}
kind: ConfigMap
metadata:
creationTimestamp: null
name: api-model
type = 'gRPC'
{{- end -}}


13 changes: 12 additions & 1 deletion chart/templates/api/deployment.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -17,4 +17,15 @@ spec:
image: ghcr.io/defenseunicorns/leapfrogai/api:0.0.1
imagePullPolicy: Always
ports:
- containerPort: 50051
- containerPort: 50051
volumeMounts:
- name: api-model
mountPath: /app/models.toml
subPath: models.toml
volumes:
- name: api-model
configMap:
name: api-model



28 changes: 28 additions & 0 deletions chart/templates/stablelm/deployment.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
{{ if .Values.models.stablelm3b.enabled }}
# Deployment for the StableLM 3B model backend.
# Rendered only when .Values.models.stablelm3b.enabled is truthy.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: stablelm-deployment
spec:
  replicas: 1
  selector:
    matchLabels:
      app: stablelm
  template:
    metadata:
      labels:
        # Has to stay equal to spec.selector.matchLabels above.
        app: stablelm
    spec:
      containers:
        - name: stablelm-container
          image: ghcr.io/defenseunicorns/leapfrogai/stablelm-3b:0.0.1
          # Alternative when the image is built directly on the node, so no
          # push/pull is needed:
          # imagePullPolicy: Never
          imagePullPolicy: Always
          ports:
            # Presumed to be the gRPC port -- confirm against the image.
            - containerPort: 50051
          resources:
            # One NVIDIA GPU per pod; request and limit are kept equal.
            requests:
              nvidia.com/gpu: 1
            limits:
              nvidia.com/gpu: 1
{{ end }}
15 changes: 15 additions & 0 deletions chart/templates/stablelm/service.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
{{ if .Values.models.stablelm3b.enabled }}
# Service in front of the pods labelled app=stablelm.
# Rendered only when .Values.models.stablelm3b.enabled is truthy.
apiVersion: v1
kind: Service
metadata:
  # NOTE(review): the api-model ConfigMap appears to address this backend as
  # 'stablelm:50051', so the name and port below should change together
  # with that URL -- confirm before renaming.
  name: stablelm
spec:
  type: ClusterIP
  selector:
    app: stablelm
  ports:
    - name: grpc
      protocol: TCP
      port: 50051
      targetPort: 50051
{{ end }}
2 changes: 1 addition & 1 deletion chart/templates/vs.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ spec:
gateways:
- istio-system/{{ .Values.istio.gateway }}
hosts:
- leapfrogai.{{ .Values.domain}}
- leapfrogai.{{ .Values.domain }}
http:
- route:
- destination:
Expand Down
4 changes: 2 additions & 2 deletions chart/values.yaml
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
domain: bigbang.dev

istio:
enabled: false
gateway: public

domain: bigbang.dev


models:
stablelm3b:
Expand Down
118 changes: 0 additions & 118 deletions kubernetes/install.yaml

This file was deleted.

Loading

0 comments on commit 5b703ee

Please sign in to comment.