rootflo · rootflo-hardik · Apr 4, 2026 · Apr 3, 2026 · coderabbitai · Apr 3, 2026
diff --git a/.github/workflows/build-rag-ingestion-develop.yaml b/.github/workflows/build-rag-ingestion-develop.yaml
@@ -0,0 +1,107 @@
+name: (Develop) Build and Push RAG Ingestion to AWS, GCP and Azure
+
+on:
+  workflow_dispatch:
+
+env:
+  PROJECT_ID: aesy-330511
+  GCP_REGION: asia-south1
+  GAR_LOCATION: asia-south1-docker.pkg.dev/aesy-330511/root-hub
+  IMAGE_NAME: auraflo-rag-ingestion
+
+  AWS_REGION: ap-south-1
+  ECR_REGISTRY: 025066241490.dkr.ecr.ap-south-1.amazonaws.com
+  ECR_REPOSITORY: rootflo/auraflo-rag-ingestion
+
+  ACR_REGISTRY_NAME: rootflo
+  ACR_REGISTRY: rootflo.azurecr.io
+  ACR_REPOSITORY: auraflo-rag-ingestion
+
+jobs:
+  build-push-artifact:
+    runs-on: ubuntu-latest
+
-jobs:
-  build-push-artifact:
-    runs-on: ubuntu-latest
+jobs:
+  build-push-artifact:
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+
-jobs:
-  build-push-artifact:
-    runs-on: ubuntu-latest
+jobs:
+  build-push-artifact:
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+
+    steps:
+      - name: "Checkout"
+        uses: "actions/checkout@v3"
+
+      - name: Get commit hash
+        id: get-commit-hash
+        run: echo "::set-output name=commit-hash::$(git rev-parse --short HEAD)"
+
+      - name: Get timestamp
+        id: get-timestamp
+        run: echo "::set-output name=timestamp::$(date +'%Y-%m-%d-%H-%M')"
+
+      - name: Cache Docker layers
+        id: cache-docker-layers
+        uses: actions/cache@v3
+        with:
+          path: /tmp/.buildx-cache
+          key: ${{ runner.os }}-docker-${{ github.sha }}
+          restore-keys: |
+            ${{ runner.os }}-docker-
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v3
+
+      - name: Build Docker Image
+        id: build-image
+        run: |
+          docker build -f wavefront/server/docker/rag_ingestion.Dockerfile -t rootflo:${{ steps.get-commit-hash.outputs.commit-hash }}-${{ steps.get-timestamp.outputs.timestamp }} .
+          echo "IMAGE_TAG=${{ steps.get-commit-hash.outputs.commit-hash }}-${{ steps.get-timestamp.outputs.timestamp }}" >> $GITHUB_ENV
+
+      - id: "Auth-to-GCP"
+        uses: "google-github-actions/auth@v1"
+        with:
+          credentials_json: "${{ secrets.GCP_SERVICE_ACCOUNT_KEY }}"
+
+      - name: "Set up Cloud SDK"
+        uses: "google-github-actions/setup-gcloud@v1"
+
+      - name: "Docker auth for GCP"
+        run: |-
+          gcloud auth configure-docker ${{ env.GCP_REGION }}-docker.pkg.dev --quiet
+
+      - name: Tag and push image to GCP Artifact Registry
+        run: |
+          docker tag rootflo:${{ env.IMAGE_TAG }} ${{ env.GAR_LOCATION }}/${{ env.IMAGE_NAME }}:${{ env.IMAGE_TAG }}
+          docker push ${{ env.GAR_LOCATION }}/${{ env.IMAGE_NAME }}:${{ env.IMAGE_TAG }}
+
+        # Configure AWS credentials and push to ECR
+      - name: Configure AWS credentials
+        uses: aws-actions/configure-aws-credentials@v1
+        with:
+          aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
+          aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
+          aws-region: ${{ env.AWS_REGION }}
+
+      - name: Login to Amazon ECR
+        id: login-ecr
+        uses: aws-actions/amazon-ecr-login@v1
+
+      - name: Tag and push image to Amazon ECR
+        run: |
+          docker tag rootflo:${{ env.IMAGE_TAG }} ${{ env.ECR_REGISTRY }}/${{ env.ECR_REPOSITORY }}:${{ env.IMAGE_TAG }}
+          docker push ${{ env.ECR_REGISTRY }}/${{ env.ECR_REPOSITORY }}:${{ env.IMAGE_TAG }}
+
+        # Configure Azure credentials and push to ACR
+      - name: Login to Azure
+        uses: azure/login@v2
+        with:
+          creds: ${{ secrets.AZURE_CREDENTIALS }}
+
+      - name: Docker auth for Azure ACR
+        run: az acr login --name ${{ env.ACR_REGISTRY_NAME }}
+
+      - name: Tag and push image to Azure Container Registry
+        run: |
+          docker tag rootflo:${{ env.IMAGE_TAG }} ${{ env.ACR_REGISTRY }}/${{ env.ACR_REPOSITORY }}:${{ env.IMAGE_TAG }}
+          docker push ${{ env.ACR_REGISTRY }}/${{ env.ACR_REPOSITORY }}:${{ env.IMAGE_TAG }}
+
+      - name: Cleanup Docker images
+        run: |
+          docker rmi rootflo:${{ env.IMAGE_TAG }} || true
+          docker rmi ${{ env.GAR_LOCATION }}/${{ env.IMAGE_NAME }}:${{ env.IMAGE_TAG }} || true
+          docker rmi ${{ env.ECR_REGISTRY }}/${{ env.ECR_REPOSITORY }}:${{ env.IMAGE_TAG }} || true
+          docker rmi ${{ env.ACR_REGISTRY }}/${{ env.ACR_REPOSITORY }}:${{ env.IMAGE_TAG }} || true
@@ -1,5 +1,8 @@
 name: (Develop) Build and Push RAG Ingestion to AWS, GCP and Azure
+permissions:
+  contents: read
+
 on:
  workflow_dispatch:
@@ -1,5 +1,8 @@
 name: (Develop) Build and Push RAG Ingestion to AWS, GCP and Azure

+permissions:
+  contents: read
+
 on:
  workflow_dispatch:

diff --git a/wavefront/server/docker/rag_ingestion.Dockerfile b/wavefront/server/docker/rag_ingestion.Dockerfile
@@ -0,0 +1,32 @@
+FROM python:3.11-slim-buster
+
+# Copy UV from official image
+COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/
+
+# Set working directory
+WORKDIR /app
+
+# Copy project files
+COPY wavefront/server/pyproject.toml wavefront/server/uv.lock ./
+COPY wavefront/server/background_jobs/rag_ingestion ./background_jobs/rag_ingestion/
+COPY wavefront/server/packages/flo_cloud ./packages/flo_cloud/
+COPY wavefront/server/packages/flo_utils ./packages/flo_utils/
+COPY wavefront/server/modules/db_repo_module ./modules/db_repo_module/
+COPY wavefront/server/modules/common_module ./modules/common_module/
+COPY wavefront/server/scripts/rag_ingestion/startup-rag-ingestion.sh ./background_jobs/rag_ingestion/
+
+# Install dependencies
+RUN uv sync --package rag-ingestion --frozen --no-dev
+
+# Download the tiktoken encoding file and NLTK data
+RUN mkdir -p /root/.cache/tiktoken
+RUN uv run python3 -c "import tiktoken; enc = tiktoken.encoding_for_model('gpt-4')"
+RUN uv run python3 -c "import nltk; nltk.download('punkt'); nltk.download('averaged_perceptron_tagger')"
+
+WORKDIR /app/background_jobs/rag_ingestion
+
+# Make startup script executable
+RUN chmod +x startup-rag-ingestion.sh
+
+# Set entrypoint to run startup script
+CMD ["./startup-rag-ingestion.sh"] 
diff --git a/wavefront/server/scripts/rag_ingestion/startup-rag-ingestion.sh b/wavefront/server/scripts/rag_ingestion/startup-rag-ingestion.sh
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source /app/.venv/bin/activate
+
+# Run the main application for RAG Ingestion
+python rag_ingestion/main.py