Added more platform components.

lreimer · Dec 3, 2024 · 0e79f94 · 0e79f94
1 parent fd2e885
commit 0e79f94
Show file tree

Hide file tree

Showing 11 changed files with 114 additions and 2 deletions.
diff --git a/Makefile b/Makefile
@@ -10,7 +10,7 @@ create-gke-cluster:
 		--release-channel=regular \
 		--cluster-version=1.30 \
 		--region=$(GCP_REGION) \
-		--addons HttpLoadBalancing,HorizontalPodAutoscaling \
+		--addons HttpLoadBalancing,HorizontalPodAutoscaling,ConfigConnector \
 		--workload-pool=$(GCP_PROJECT).svc.id.goog \
 		--num-nodes=1 \
 		--min-nodes=1 --max-nodes=5 \

diff --git a/README.md b/README.md
@@ -71,7 +71,8 @@ ollama run llama3.1
 cd ollama-chat-service
 ./gradlew quarkusDev
 
-
+# interact with the service locally
+http get localhost:8080/api/ask q=="Was macht die QAware GmbH?"
 
 # this here is managed by Flux2
 kubectl apply -k infrastructure/services/openai-chat-service/
@@ -109,6 +110,26 @@ curl http://localhost:11434/api/chat  \
   }'
 ```
 
+## Deploying Langchain4J Easy RAG Chatbot
+
+```bash
+# see https://docs.quarkiverse.io/quarkus-langchain4j/dev/easy-rag.html
+# see https://github.com/quarkiverse/quarkus-langchain4j/tree/main/samples/chatbot-easy-rag
+```
+
+## Planning Kubernetes Cluster Topology
+
+```bash
+# useful information to set up a K8s cluster topology with GPUs
+
+# see https://cloud.google.com/compute/docs/gpus?hl=de
+# see https://cloud.google.com/compute/all-pricing?hl=de
+# see https://cloud.google.com/compute/gpus-pricing?hl=de#other-gpu-models
+
+# see https://cloud.google.com/compute/docs/gpus/create-gpu-vm-general-purpose?hl=de
+# see https://cloud.google.com/compute/docs/disks/local-ssd?hl=de
+```
+
 ## Maintainer
 
 M.-Leander Reimer (@lreimer), <mario-leander.reimer@qaware.de>

diff --git a/infrastructure/platform/jupyterhub/kustomization.yaml b/infrastructure/platform/jupyterhub/kustomization.yaml
@@ -0,0 +1,6 @@
+apiVersion: kustomize.config.k8s.io/v1beta1
+kind: Kustomization
+resources:
+  - namespace.yaml
+  - repository.yaml
+  - release.yaml
diff --git a/infrastructure/platform/jupyterhub/namespace.yaml b/infrastructure/platform/jupyterhub/namespace.yaml
@@ -0,0 +1,4 @@
+kind: Namespace
+apiVersion: v1
+metadata:
+  name: jupyterhub
diff --git a/infrastructure/platform/jupyterhub/release.yaml b/infrastructure/platform/jupyterhub/release.yaml
@@ -0,0 +1,16 @@
+apiVersion: helm.toolkit.fluxcd.io/v2beta1
+kind: HelmRelease
+metadata:
+  name: jupyterhub
+  namespace: flux-system
+spec:
+  chart:
+    spec:
+      chart: jupyterhub
+      sourceRef:
+        kind: HelmRepository
+        name: jupyterhub
+      version: "4.0.0"
+  interval: 1h0m0s
+  releaseName: jupyterhub
+  targetNamespace: jupyterhub
diff --git a/infrastructure/platform/jupyterhub/repository.yaml b/infrastructure/platform/jupyterhub/repository.yaml
@@ -0,0 +1,8 @@
+apiVersion: source.toolkit.fluxcd.io/v1beta1
+kind: HelmRepository
+metadata:
+  name: jupyterhub
+  namespace: flux-system
+spec:
+  interval: 1h0m0s
+  url: https://hub.jupyter.org/helm-chart/
diff --git a/infrastructure/platform/langflow/kustomization.yaml b/infrastructure/platform/langflow/kustomization.yaml
@@ -0,0 +1,6 @@
+apiVersion: kustomize.config.k8s.io/v1beta1
+kind: Kustomization
+resources:
+  - namespace.yaml
+  - repository.yaml
+  - release.yaml
diff --git a/infrastructure/platform/langflow/namespace.yaml b/infrastructure/platform/langflow/namespace.yaml
@@ -0,0 +1,4 @@
+kind: Namespace
+apiVersion: v1
+metadata:
+  name: langflow
diff --git a/infrastructure/platform/langflow/release.yaml b/infrastructure/platform/langflow/release.yaml
@@ -0,0 +1,33 @@
+apiVersion: helm.toolkit.fluxcd.io/v2beta1
+kind: HelmRelease
+metadata:
+  name: langflow-ide
+  namespace: flux-system
+spec:
+  chart:
+    spec:
+      chart: langflow-ide
+      sourceRef:
+        kind: HelmRepository
+        name: langflow
+      version: "0.1.0"
+  interval: 1h0m0s
+  releaseName: langflow-ide
+  targetNamespace: langflow
+---
+apiVersion: helm.toolkit.fluxcd.io/v2beta1
+kind: HelmRelease
+metadata:
+  name: langflow-runtime
+  namespace: flux-system
+spec:
+  chart:
+    spec:
+      chart: langflow-runtime
+      sourceRef:
+        kind: HelmRepository
+        name: langflow
+      version: "0.1.0"
+  interval: 1h0m0s
+  releaseName: langflow-runtime
+  targetNamespace: langflow
diff --git a/infrastructure/platform/langflow/repository.yaml b/infrastructure/platform/langflow/repository.yaml
@@ -0,0 +1,8 @@
+apiVersion: source.toolkit.fluxcd.io/v1beta1
+kind: HelmRepository
+metadata:
+  name: langflow
+  namespace: flux-system
+spec:
+  interval: 1h0m0s
+  url: https://langflow-ai.github.io/langflow-helm-charts
diff --git a/infrastructure/services/openai-chat-service/deployment.yaml b/infrastructure/services/openai-chat-service/deployment.yaml
@@ -50,6 +50,12 @@ spec:
             secretKeyRef:
               name: openai-api-key
               key: OPENAI_API_KEY
+
         # - name: QUARKUS_LANGCHAIN4J_OPENAI_BASE_URL
         #   value: "http://openai-proxy-service.default.svc.cluster.local:10000"
+
+        # - name: QUARKUS_LANGCHAIN4J_OPENAI_CHAT_MODEL_MODEL_NAME
+        #   value: "llama3.1"
+        # - name: QUARKUS_LANGCHAIN4J_OPENAI_BASE_URL
+        #   value: "http://ollama-model-llama31.default.svc.cluster.local:11434"