Merge branch 'arc53:main' into main

4 months ago · c794ea614a
parent 9000838aab 2790bda1e9
commit c794ea614a
11 changed files with 396 additions and 0 deletions
--- a/docs/pages/Deploying/Kubernetes-Deploying.md
+++ b/docs/pages/Deploying/Kubernetes-Deploying.md
@ -0,0 +1,100 @@
+# Self-hosting DocsGPT on Kubernetes
+
+This guide will walk you through deploying DocsGPT on Kubernetes.
+
+## Prerequisites
+
+Ensure you have the following installed before proceeding:
+
+- [kubectl](https://kubernetes.io/docs/tasks/tools/install-kubectl/)
+- Access to a Kubernetes cluster
+
+## Folder Structure
+
+The `k8s` folder contains the necessary deployment and service configuration files:
+
+- `deployments/`
+- `services/`
+- `docsgpt-secrets.yaml`
+
+## Deployment Instructions
+
+1. **Clone the Repository**
+
+   ```sh
+   git clone https://github.com/arc53/DocsGPT.git
+   cd docsgpt/k8s
+   ```
+
+2. **Configure Secrets (optional)**
+
+   Ensure that you have all the necessary secrets in `docsgpt-secrets.yaml`. Update it with your secrets before applying if you want. By default we will use qdrant as a vectorstore and public docsgpt llm as llm for inference.
+
+3. **Apply Kubernetes Deployments**
+
+   Deploy your DocsGPT resources using the following commands:
+
+   ```sh
+   kubectl apply -f deployments/
+   ```
+
+4. **Apply Kubernetes Services**
+
+   Set up your services using the following commands:
+
+   ```sh
+   kubectl apply -f services/
+   ```
+
+5. **Apply Secrets**
+
+   Apply the secret configurations:
+
+   ```sh
+   kubectl apply -f docsgpt-secrets.yaml
+   ```
+
+6. **Substitute API URL**
+
+   After deploying the services, you need to update the environment variable `VITE_API_HOST` in your deployment file `deployments/docsgpt-deploy.yaml` with the actual endpoint URL created by your `docsgpt-api-service`.
+
+    ```sh
+    kubectl get services/docsgpt-api-service -o jsonpath='{.status.loadBalancer.ingress[0].ip}' | xargs -I {} sed -i "s|<your-api-endpoint>|{}|g" deployments/docsgpt-deploy.yaml
+    ```
+
+7. **Rerun Deployment**
+
+   After making the changes, reapply the deployment configuration to update the environment variables:
+
+   ```sh
+   kubectl apply -f deployments/
+   ```
+
+## Verifying the Deployment
+
+To verify if everything is set up correctly, you can run the following:
+
+```sh
+kubectl get pods
+kubectl get services
+```
+
+Ensure that the pods are running and the services are available.
+
+## Accessing DocsGPT
+
+To access DocsGPT, you need to find the external IP address of the frontend service. You can do this by running:
+
+```sh
+kubectl get services/docsgpt-frontend-service | awk 'NR>1 {print "http://" $4}'
+```
+
+## Troubleshooting
+
+If you encounter any issues, you can check the logs of the pods for more details:
+
+```sh
+kubectl logs <pod-name>
+```
+
+Replace `<pod-name>` with the actual name of your DocsGPT pod.
--- a/docs/pages/Deploying/_meta.json
+++ b/docs/pages/Deploying/_meta.json
@ -10,5 +10,9 @@
  "Railway-Deploying": {
    "title": "🚂Deploying on Railway",
    "href": "/Deploying/Railway-Deploying"
+  },
+  "Kubernetes-Deploying": {
+    "title": "🚀Deploying on Kubernetes",
+    "href": "/Deploying/Kubernetes-Deploying"
  }
 }
--- a/k8s/deployments/docsgpt-deploy.yaml
+++ b/k8s/deployments/docsgpt-deploy.yaml
@ -0,0 +1,98 @@
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: docsgpt-api
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: docsgpt-api
+  template:
+    metadata:
+      labels:
+        app: docsgpt-api
+    spec:
+      containers:
+      - name: docsgpt-api
+        image: arc53/docsgpt
+        ports:
+        - containerPort: 7091
+        resources:
+          limits:
+            memory: "4Gi"
+            cpu: "2"
+          requests:
+            memory: "2Gi"
+            cpu: "1"
+        envFrom:
+        - secretRef:
+            name: docsgpt-secrets
+        env:
+        - name: FLASK_APP
+          value: "application/app.py"
+        - name: DEPLOYMENT_TYPE
+          value: "cloud"
+---
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: docsgpt-worker
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: docsgpt-worker
+  template:
+    metadata:
+      labels:
+        app: docsgpt-worker
+    spec:
+      containers:
+      - name: docsgpt-worker
+        image: arc53/docsgpt
+        command: ["celery", "-A", "application.app.celery", "worker", "-l", "INFO", "-n", "worker.%h"]
+        resources:
+          limits:
+            memory: "4Gi"
+            cpu: "2"
+          requests:
+            memory: "2Gi"
+            cpu: "1"
+        envFrom:
+        - secretRef:
+            name: docsgpt-secrets
+        env:
+        - name: API_URL
+          value: "http://<your-api-endpoint>"
+---
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: docsgpt-frontend
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: docsgpt-frontend
+  template:
+    metadata:
+      labels:
+        app: docsgpt-frontend
+    spec:
+      containers:
+      - name: docsgpt-frontend
+        image: arc53/docsgpt-fe
+        ports:
+        - containerPort: 5173
+        resources:
+          limits:
+            memory: "1Gi"
+            cpu: "1"
+          requests:
+            memory: "256Mi"
+            cpu: "100m"
+        env:
+        - name: VITE_API_HOST
+          value: "http://<your-api-endpoint>"
+        - name: VITE_API_STREAMING
+          value: "true"
--- a/k8s/deployments/mongo-deploy.yaml
+++ b/k8s/deployments/mongo-deploy.yaml
@ -0,0 +1,46 @@
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: mongodb-pvc
+spec:
+  accessModes:
+    - ReadWriteOnce
+  resources:
+    requests:
+      storage: 10Gi  # Adjust size as needed
+
+---
+
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: mongodb
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: mongodb
+  template:
+    metadata:
+      labels:
+        app: mongodb
+    spec:
+      containers:
+      - name: mongodb
+        image: mongo:latest
+        ports:
+        - containerPort: 27017
+        resources:
+          limits:
+            memory: "1Gi"
+            cpu: "0.5"
+          requests:
+            memory: "512Mi"
+            cpu: "250m"
+        volumeMounts:
+        - name: mongodb-data
+          mountPath: /data/db
+      volumes:
+      - name: mongodb-data
+        persistentVolumeClaim:
+          claimName: mongodb-pvc
--- a/k8s/deployments/qdrant-deploy.yaml
+++ b/k8s/deployments/qdrant-deploy.yaml
@ -0,0 +1,46 @@
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: qdrant-pvc
+spec:
+  accessModes:
+    - ReadWriteOnce
+  resources:
+    requests:
+      storage: 10Gi
+
+---
+
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: qdrant
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: qdrant
+  template:
+    metadata:
+      labels:
+        app: qdrant
+    spec:
+      containers:
+      - name: qdrant
+        image: qdrant/qdrant:latest
+        ports:
+        - containerPort: 6333
+        resources:
+          limits:
+            memory: "2Gi"  # Adjust based on your needs
+            cpu: "1"       # Adjust based on your needs
+          requests:
+            memory: "1Gi"  # Adjust based on your needs
+            cpu: "500m"    # Adjust based on your needs
+        volumeMounts:
+        - name: qdrant-data
+          mountPath: /qdrant/storage
+      volumes:
+      - name: qdrant-data
+        persistentVolumeClaim:
+          claimName: qdrant-pvc
--- a/k8s/deployments/redis-deploy.yaml
+++ b/k8s/deployments/redis-deploy.yaml
@ -0,0 +1,26 @@
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: redis
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: redis
+  template:
+    metadata:
+      labels:
+        app: redis
+    spec:
+      containers:
+      - name: redis
+        image: redis:latest
+        ports:
+        - containerPort: 6379
+        resources:
+          limits:
+            memory: "1Gi"
+            cpu: "0.5"
+          requests:
+            memory: "512Mi"
+            cpu: "250m"
--- a/k8s/docsgpt-secrets.yaml
+++ b/k8s/docsgpt-secrets.yaml
@ -0,0 +1,15 @@
+apiVersion: v1
+kind: Secret
+metadata:
+  name: docsgpt-secrets
+type: Opaque
+data:
+  LLM_NAME: ZG9jc2dwdA==
+  INTERNAL_KEY: aW50ZXJuYWw=
+  CELERY_BROKER_URL: cmVkaXM6Ly9yZWRpcy1zZXJ2aWNlOjYzNzkvMA==
+  CELERY_RESULT_BACKEND: cmVkaXM6Ly9yZWRpcy1zZXJ2aWNlOjYzNzkvMA==
+  QDRANT_URL: cmVkaXM6Ly9yZWRpcy1zZXJ2aWNlOjYzNzkvMA==
+  QDRANT_PORT: NjM3OQ==
+  MONGO_URI: bW9uZ29kYjovL21vbmdvZGItc2VydmljZToyNzAxNy9kb2NzZ3B0P3JldHJ5V3JpdGVzPXRydWUmdz1tYWpvcml0eQ==
+  mongo-user: bW9uZ28tdXNlcg==
+  mongo-password: bW9uZ28tcGFzc3dvcmQ=
--- a/k8s/services/docsgpt-service.yaml
+++ b/k8s/services/docsgpt-service.yaml
@ -0,0 +1,25 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: docsgpt-api-service
+spec:
+  selector:
+    app: docsgpt-api
+  ports:
+    - protocol: TCP
+      port: 80
+      targetPort: 7091
+  type: LoadBalancer
+---
+apiVersion: v1
+kind: Service
+metadata:
+  name: docsgpt-frontend-service
+spec:
+  selector:
+    app: docsgpt-frontend
+  ports:
+    - protocol: TCP
+      port: 80
+      targetPort: 5173
+  type: LoadBalancer
--- a/k8s/services/mongo-service.yaml
+++ b/k8s/services/mongo-service.yaml
@ -0,0 +1,12 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: mongodb-service
+spec:
+  selector:
+    app: mongodb
+  ports:
+    - protocol: TCP
+      port: 27017
+      targetPort: 27017
+  type: ClusterIP
--- a/k8s/services/qdrant-service.yaml
+++ b/k8s/services/qdrant-service.yaml
@ -0,0 +1,12 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: qdrant
+spec:
+  selector:
+    app: qdrant
+  ports:
+    - protocol: TCP
+      port: 6333
+      targetPort: 6333
+  type: ClusterIP
--- a/k8s/services/redis-service.yaml
+++ b/k8s/services/redis-service.yaml
@ -0,0 +1,12 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: redis-service
+spec:
+  selector:
+    app: redis
+  ports:
+    - protocol: TCP
+      port: 6379
+      targetPort: 6379
+  type: ClusterIP