y-scope · junhaoliao · Jan 12, 2026 · Jan 8, 2026 · Jan 8, 2026 · Jan 11, 2026
@@ -1,6 +1,6 @@
 apiVersion: "v2"
 name: "clp"
-version: "0.1.2-dev.16"
+version: "0.1.2-dev.17"  # Chart version; tracked separately from appVersion below.
 description: "A Helm chart for CLP's (Compressed Log Processor) package deployment"
 type: "application"
 appVersion: "0.7.1-dev"

@@ -115,6 +115,15 @@ data:
       {{- end }}{{/* with .aws_authentication */}}
       {{- end }}{{/* if eq .type "fs" */}}
     {{- end }}{{/* with .Values.clpConfig.logs_input */}}
+    {{- with .Values.clpConfig.log_ingestor }}
+    log_ingestor:
+      buffer_flush_threshold: {{ .buffer_flush_threshold | int }}
+      buffer_flush_timeout: {{ .buffer_flush_timeout | int }}
+      channel_capacity: {{ .channel_capacity | int }}
+      host: "localhost"
+      logging_level: {{ .logging_level | quote }}
+      port: 3002{{/* Container port; the values' `port` is used as the Service nodePort. */}}
+    {{- end }}{{/* with .Values.clpConfig.log_ingestor */}}
     package:
       query_engine: {{ .Values.clpConfig.package.query_engine | quote }}
       storage_engine: {{ .Values.clpConfig.package.storage_engine | quote }}

@@ -0,0 +1,88 @@
+{{- if .Values.clpConfig.log_ingestor }}
+apiVersion: "apps/v1"
+kind: "Deployment"  # log-ingestor workload; rendered only if clpConfig.log_ingestor is set.
+metadata:
+  name: {{ include "clp.fullname" . }}-log-ingestor
+  labels:
+    {{- include "clp.labels" . | nindent 4 }}
+    app.kubernetes.io/component: "log-ingestor"
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      {{- include "clp.selectorLabels" . | nindent 6 }}
+      app.kubernetes.io/component: "log-ingestor"
+  template:
+    metadata:
+      labels:
+        {{- include "clp.labels" . | nindent 8 }}
+        app.kubernetes.io/component: "log-ingestor"
+    spec:  # NOTE(review): job-watcher account presumably serves the waitFor init container.
+      serviceAccountName: {{ include "clp.fullname" . }}-job-watcher
+      terminationGracePeriodSeconds: 60
+      securityContext:
+        runAsUser: {{ .Values.securityContext.firstParty.uid }}
+        runAsGroup: {{ .Values.securityContext.firstParty.gid }}
+        fsGroup: {{ .Values.securityContext.firstParty.gid }}
+      initContainers:  # clp.waitFor on job "db-table-creator"; presumably blocks until done.
+        - {{- include "clp.waitFor" (dict
+            "root" .
+            "type" "job"
+            "name" "db-table-creator"
+          ) | nindent 10 }}
+      containers:
+        - name: "log-ingestor"
+          image: "{{ include "clp.image.ref" . }}"
+          imagePullPolicy: "{{ .Values.image.clpPackage.pullPolicy }}"
+          env:  # DB credentials are read from the "<fullname>-database" Secret.
+            - name: "CLP_DB_PASS"
+              valueFrom:
+                secretKeyRef:
+                  name: {{ include "clp.fullname" . }}-database
+                  key: "password"
+            - name: "CLP_DB_USER"
+              valueFrom:
+                secretKeyRef:
+                  name: {{ include "clp.fullname" . }}-database
+                  key: "username"
+            - name: "CLP_LOGS_DIR"  # Same path as the "logs" volume's mountPath below.
+              value: "/var/log/log_ingestor"
+            - name: "RUST_LOG"  # Set from clpConfig.log_ingestor.logging_level.
+              value: {{ .Values.clpConfig.log_ingestor.logging_level | quote }}
+          ports:
+            - name: "log-ingestor"
+              containerPort: 3002  # Same port as the "--port" argument in command.
+          volumeMounts:
+            - name: {{ include "clp.volumeName" (dict
+                "component_category" "log-ingestor"
+                "name" "logs"
+              ) | quote }}
+              mountPath: "/var/log/log_ingestor"
+            - name: "config"
+              mountPath: "/etc/clp-config.yaml"
+              subPath: "clp-config.yaml"  # Mount just this ConfigMap key as a file.
+              readOnly: true
+          command: [
+            "/opt/clp/bin/log-ingestor",
+            "--config", "/etc/clp-config.yaml",
+            "--host", "0.0.0.0",
+            "--port", "3002"
+          ]
+          readinessProbe:
+            {{- include "clp.readinessProbeTimings" . | nindent 12 }}
+            httpGet: &log-ingestor-health-check  # Anchor; aliased by livenessProbe below.
+              path: "/health"
+              port: "log-ingestor"
+          livenessProbe:
+            {{- include "clp.livenessProbeTimings" . | nindent 12 }}
+            httpGet: *log-ingestor-health-check
+      volumes:
+        - {{- include "clp.pvcVolume" (dict
+            "root" .
+            "component_category" "log-ingestor"
+            "name" "logs"
+          ) | nindent 10 }}
+        - name: "config"
+          configMap:
+            name: {{ include "clp.fullname" . }}-config
+{{- end }}{{/* if .Values.clpConfig.log_ingestor */}}
@@ -0,0 +1,11 @@
+{{- if .Values.clpConfig.log_ingestor }}
+{{- include "clp.createLocalPv" (dict
+  "root" .
+  "component_category" "log-ingestor"
+  "name" "logs"
+  "nodeRole" "control-plane"
+  "capacity" "10Gi"
+  "accessModes" (list "ReadWriteOnce")
+  "hostPath" (printf "%s/log_ingestor" .Values.clpConfig.logs_directory)
+) }}
+{{- end }}{{/* if .Values.clpConfig.log_ingestor */}}
@@ -0,0 +1,9 @@
+{{- if .Values.clpConfig.log_ingestor }}
+{{- include "clp.createPvc" (dict
+  "root" .
+  "component_category" "log-ingestor"
+  "name" "logs"
+  "capacity" "10Gi"
+  "accessModes" (list "ReadWriteOnce")
+) }}
+{{- end }}{{/* if .Values.clpConfig.log_ingestor */}}
@@ -0,0 +1,18 @@
+{{- if .Values.clpConfig.log_ingestor }}
+apiVersion: "v1"
+kind: "Service"  # Rendered only if clpConfig.log_ingestor is set.
+metadata:
+  name: {{ include "clp.fullname" . }}-log-ingestor
+  labels:
+    {{- include "clp.labels" . | nindent 4 }}
+    app.kubernetes.io/component: "log-ingestor"
+spec:
+  type: "NodePort"
+  selector:
+    {{- include "clp.selectorLabels" . | nindent 4 }}
+    app.kubernetes.io/component: "log-ingestor"
+  ports:
+    - port: 3002
+      targetPort: "log-ingestor"  # Named containerPort of the log-ingestor Deployment.
+      nodePort: {{ .Values.clpConfig.log_ingestor.port }}  # Port exposed on each node.
+{{- end }}{{/* if .Values.clpConfig.log_ingestor */}}
@@ -59,7 +59,7 @@ mkdir -p  "$CLP_HOME/var/"{data,log}/{database,queue,redis,results_cache} \
           "$CLP_HOME/var/data/"{archives,streams,staged-archives,staged-streams} \
           "$CLP_HOME/var/log/"{compression_scheduler,compression_worker,user} \
           "$CLP_HOME/var/log/"{query_scheduler,query_worker,reducer} \
-          "$CLP_HOME/var/log/"{api_server,garbage_collector,mcp_server} \
+          "$CLP_HOME/var/log/"{api_server,garbage_collector,log_ingestor,mcp_server} \
           "$CLP_HOME/var/tmp" \
           "$CLP_HOME/samples"
 
@@ -85,18 +85,21 @@ cat <<EOF | kind create cluster --name clp-test --config=-
     - hostPath: $CLP_HOME
       containerPath: $CLP_HOME
     extraPortMappings:
-    - containerPort: 30306
-      hostPort: 30306
+    - containerPort: 30000
+      hostPort: 30000
       protocol: TCP
     - containerPort: 30017
       hostPort: 30017
       protocol: TCP
-    - containerPort: 30000
-      hostPort: 30000
-      protocol: TCP
     - containerPort: 30301
       hostPort: 30301
       protocol: TCP
+    - containerPort: 30302
+      hostPort: 30302
+      protocol: TCP
+    - containerPort: 30306
+      hostPort: 30306
+      protocol: TCP
     - containerPort: 30800
       hostPort: 30800
       protocol: TCP

@@ -90,6 +90,19 @@ clpConfig:
   #   port: 30800
   #   logging_level: "INFO"
 
+  # log-ingestor config. Currently, the config is applicable only if `logs_input.type` is "s3".
+  log_ingestor: null  # null disables log-ingestor (its templates render only when this is set).
+  #   port: 30302  # Used as the log-ingestor Service's nodePort.
+  #   # The timeout (in seconds) after which the log buffer is flushed for compression if no new
+  #   # input arrives.
+  #   buffer_flush_timeout: 300
+  #   # The log buffer size (in bytes) that triggers a flush for compression.
+  #   buffer_flush_threshold: 268435456  # 256 MiB
+  #   # The capacity of the internal channel used for communication between an ingestion job and the
+  #   # log buffer.
+  #   channel_capacity: 10
+  #   logging_level: "INFO"
+
   # Where archives should be output to
   archive_output:
     storage: