Skip to content

Commit d1faf2c

Browse files
authored
Release v0.1.2 (#345)
* Update chart values
  Signed-off-by: kerthcet <[email protected]>
* Revert lws config
  Signed-off-by: kerthcet <[email protected]>
* Update config
  Signed-off-by: kerthcet <[email protected]>
* Fix prometheus error
  Signed-off-by: kerthcet <[email protected]>
* Release v0.1.2
  Signed-off-by: kerthcet <[email protected]>
---------
Signed-off-by: kerthcet <[email protected]>
1 parent 1c23184 commit d1faf2c

File tree

16 files changed

+34
-24
lines changed

16 files changed

+34
-24
lines changed

chart/Chart.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,9 @@ type: application
1313
# This is the chart version. This version number should be incremented each time you make changes
1414
# to the chart and its templates, including the app version.
1515
# Versions are expected to follow Semantic Versioning (https://semver.org/)
16-
version: 0.0.7
16+
version: 0.0.8
1717
# This is the version number of the application being deployed. This version number should be
1818
# incremented each time you make changes to the application. Versions are not expected to
1919
# follow Semantic Versioning. They should reflect the version the application is using.
2020
# It is recommended to use it with quotes.
21-
appVersion: 0.1.1
21+
appVersion: 0.1.2

chart/crds/playground-crd.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -241,6 +241,7 @@ spec:
241241
MaxReplicas indicates the maximum number of inference workloads based on the traffic.
242242
Default to nil means there's no limit for the instance number.
243243
format: int32
244+
minimum: 1
244245
type: integer
245246
minReplicas:
246247
default: 1
@@ -863,6 +864,8 @@ spec:
863864
type: array
864865
type: object
865866
type: object
867+
required:
868+
- maxReplicas
866869
type: object
867870
modelClaim:
868871
description: |-

chart/templates/backends/llamacpp.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.backendRuntime.install -}}
1+
{{- if .Values.backendRuntime.enable -}}
22
apiVersion: inference.llmaz.io/v1alpha1
33
kind: BackendRuntime
44
metadata:

chart/templates/backends/ollama.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.backendRuntime.install -}}
1+
{{- if .Values.backendRuntime.enable -}}
22
apiVersion: inference.llmaz.io/v1alpha1
33
kind: BackendRuntime
44
metadata:

chart/templates/backends/sglang.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.backendRuntime.install -}}
1+
{{- if .Values.backendRuntime.enable -}}
22
apiVersion: inference.llmaz.io/v1alpha1
33
kind: BackendRuntime
44
metadata:

chart/templates/backends/tgi.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.backendRuntime.install -}}
1+
{{- if .Values.backendRuntime.enable -}}
22
apiVersion: inference.llmaz.io/v1alpha1
33
kind: BackendRuntime
44
metadata:

chart/templates/backends/vllm.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.backendRuntime.install -}}
1+
{{- if .Values.backendRuntime.enable -}}
22
apiVersion: inference.llmaz.io/v1alpha1
33
kind: BackendRuntime
44
metadata:

chart/templates/lws/leaderworkerset.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.leaderWorkerSet.install -}}
1+
{{- if .Values.leaderWorkerSet.enable -}}
22
apiVersion: v1
33
kind: Namespace
44
metadata:
@@ -16681,7 +16681,7 @@ spec:
1668116681
- --zap-log-level=2
1668216682
command:
1668316683
- /manager
16684-
image: {{ .Values.backendRuntime.image.repository }}:{{ .Values.backendRuntime.image.tag }}
16684+
image: registry.k8s.io/lws/lws:v0.5.0
1668516685
livenessProbe:
1668616686
httpGet:
1668716687
path: /healthz

chart/templates/prometheus/prometheus.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@ spec:
1414
# https://github.com/kubernetes-sigs/jobset/blob/main/config/components/prometheus/monitor.yaml#L7
1515
matchLabels:
1616
control-plane: controller-manager
17-
{{- include "chart.selectorLabels" . | nindent 4 }}
17+
{{- include "chart.selectorLabels" . | nindent 6 }}
1818
resources:
1919
requests:
2020
memory: 400Mi

chart/templates/prometheus/service-monitor.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,5 @@ spec:
2222
insecureSkipVerify: true
2323
selector:
2424
matchLabels:
25-
control-plane: controller-manager
26-
{{- include "chart.selectorLabels" . | nindent 4 }}
25+
{{- include "chart.selectorLabels" . | nindent 6 }}
2726
{{- end }}

chart/values.global.yaml

Lines changed: 4 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
fullnameOverride: "llmaz"
22

33
backendRuntime:
4-
install: true
4+
enable: true
55
llamacpp:
66
image:
77
repository: ghcr.io/ggerganov/llama.cpp
@@ -24,11 +24,8 @@ backendRuntime:
2424
tag: v0.7.3
2525

2626
leaderWorkerSet:
27-
install: true
28-
image:
29-
repository: registry.k8s.io/lws/lws
30-
tag: v0.5.0
27+
enable: true
3128

3229
prometheus:
33-
# -- Whether to enable Prometheus metrics exporting.
34-
enable: false
30+
# Prometheus is required to enable smart routing.
31+
enable: true

chart/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ controllerManager:
1212
- ALL
1313
image:
1414
repository: inftyai/llmaz
15-
tag: main
15+
tag: v0.1.2
1616
resources:
1717
limits:
1818
cpu: 500m

config/manager/kustomization.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,4 +5,4 @@ kind: Kustomization
55
images:
66
- name: controller
77
newName: inftyai/llmaz
8-
newTag: main
8+
newTag: v0.1.2

config/prometheus/monitor.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,4 +20,4 @@ spec:
2020
insecureSkipVerify: true
2121
selector:
2222
matchLabels:
23-
app.kubernetes.io/name: service
23+
app.kubernetes.io/name: llmaz

docs/installation.md

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,8 @@
33
## Prerequisites
44

55
- Kubernetes version >= 1.27
6-
- Helm 3
6+
- Helm 3, see [installation](https://helm.sh/docs/intro/install/).
7+
- Prometheus, see [installation](https://github.com/InftyAI/llmaz/tree/main/docs/prometheus-operator#install-the-prometheus-operator).
78

89
## Install a released version
910

index.yaml

Lines changed: 11 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,16 @@
11
apiVersion: v1
22
entries:
33
llmaz:
4+
- apiVersion: v2
5+
appVersion: 0.1.2
6+
created: "2025-04-17T16:34:28.456285+08:00"
7+
description: A Helm chart for llmaz
8+
digest: 7b86ddb7338071456ef04a7c8d6b25be697c2e3016096dbb6497688abb9bc414
9+
name: llmaz
10+
type: application
11+
urls:
12+
- https://inftyai.github.io/llmaz/llmaz-0.0.8.tgz
13+
version: 0.0.8
414
- apiVersion: v2
515
appVersion: 0.1.1
616
created: "2025-02-18T14:46:30.474789+08:00"
@@ -71,4 +81,4 @@ entries:
7181
urls:
7282
- https://inftyai.github.io/llmaz/llmaz-0.0.1.tgz
7383
version: 0.0.1
74-
generated: "2025-02-18T14:46:30.460221+08:00"
84+
generated: "2025-04-17T16:34:28.442325+08:00"

0 commit comments

Comments
 (0)