Skip to content

Commit 0c91296

Browse files
committed
k8s updated
1 parent bcd9154 commit 0c91296

6 files changed

Lines changed: 220 additions & 0 deletions

File tree

k8s/deployment.yaml

Lines changed: 87 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,87 @@
1+
apiVersion: apps/v1
2+
kind: Deployment
3+
4+
metadata:
5+
name: metadata-frontend
6+
labels:
7+
app: metadata-frontend
8+
9+
spec:
10+
replicas: 2
11+
12+
revisionHistoryLimit: 5 # Keep last 5 ReplicaSets for rollback
13+
14+
strategy:
15+
type: RollingUpdate
16+
rollingUpdate:
17+
maxUnavailable: 1 # At most 1 pod can be down during update
18+
maxSurge: 1 # Create 1 extra pod during update
19+
20+
selector:
21+
matchLabels:
22+
app: metadata-frontend
23+
24+
template:
25+
metadata:
26+
labels:
27+
app: metadata-frontend
28+
29+
spec:
30+
31+
terminationGracePeriodSeconds: 30 # It tells Kubernetes to wait up to 30 seconds for the pod to shut down gracefully before forcefully killing it.
32+
33+
containers:
34+
- name: metadatafrontend
35+
image: deepdiv/metadatafrontend:v1.0
36+
imagePullPolicy: Always
37+
ports:
38+
- containerPort: 4000
39+
40+
# Security hardening: run the container as a non-root user and make the root filesystem read-only
41+
securityContext:
42+
runAsNonRoot: true
43+
runAsUser: 1000 # Forces container to run as Linux user with UID 1000; Normal users = usually 1000+
44+
allowPrivilegeEscalation: false
45+
readOnlyRootFilesystem: true
46+
47+
## kubectl top pod
48+
# Extremely low on purpose (to exercise the HPA in testing); the baseline I observed was ~20Mi
49+
resources:
50+
requests: # minimum guaranteed resources reserved for the container
51+
cpu: "20m" # Required for HPA calculation, horizontal scaling #
52+
memory: "30Mi"
53+
limits: # maximum allowed usage
54+
cpu: "100m" # CPU limit = speed cap # Not a kill switch.
55+
memory: "50Mi" # Hard limit — the container is OOM-killed if it exceeds this
56+
57+
# Delays container shutdown by 10 seconds so traffic can drain and ongoing requests can finish safely before the pod stops.
58+
lifecycle:
59+
preStop:
60+
exec:
61+
command: ["sh", "-c", "sleep 10"]
62+
63+
startupProbe:
64+
httpGet:
65+
path: /health
66+
port: 4000
67+
periodSeconds: 5
68+
failureThreshold: 8 # 5 × 8 = 40 seconds allowed for startup
69+
70+
livenessProbe: # Auto Restart if Broken # Active Health Monitoring
71+
httpGet:
72+
path: /health
73+
port: 4000
74+
periodSeconds: 10 # Kubernetes runs the health check every 10 seconds.
75+
timeoutSeconds: 3 # Kubernetes waits up to 3 seconds for the app to respond before marking the check as failed.
76+
failureThreshold: 3 # If the health check fails 3 consecutive times, Kubernetes considers the probe failed and takes action (restart for liveness, mark NotReady for readiness).
77+
78+
79+
readinessProbe: # Determines whether the pod is ready to receive traffic from the Service
80+
httpGet:
81+
path: /health # Kubernetes sends an HTTP GET request to /health
82+
port: 4000 # The request is sent to container port 4000
83+
initialDelaySeconds: 5 # Wait 5 seconds after container starts before performing the first readiness check
84+
periodSeconds: 5 # Run the readiness check every 5 seconds
85+
timeoutSeconds: 2 # Wait up to 2 seconds for a response before marking the check as failed
86+
failureThreshold: 3 # If the check fails 3 consecutive times, mark the pod as NotReady (removed from Service traffic)
87+

k8s/hpa.yaml

Lines changed: 50 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,50 @@
1+
apiVersion: autoscaling/v2 # Required for advanced metric-based autoscaling
2+
kind: HorizontalPodAutoscaler # Defines automatic scaling rules
3+
4+
metadata:
5+
name: metadata-frontend-hpa # Name of the HPA resource
6+
labels:
7+
app: metadata-frontend # Label for identification
8+
9+
spec:
10+
scaleTargetRef:
11+
apiVersion: apps/v1 # Target API version
12+
kind: Deployment # We are scaling a Deployment
13+
name: metadata-frontend # Must match Deployment name exactly
14+
15+
minReplicas: 2 # Never scale below 2 pods
16+
maxReplicas: 6 # Never scale above 6 pods
17+
18+
metrics:
19+
# CPU METRIC
20+
- type: Resource
21+
resource:
22+
name: cpu # Monitor CPU usage
23+
target:
24+
type: Utilization # Percentage of requested CPU
25+
averageUtilization: 80 # Scale if average CPU > 80% of request
26+
27+
# MEMORY METRIC
28+
- type: Resource
29+
resource:
30+
name: memory # Monitor Memory usage
31+
target:
32+
type: Utilization # Percentage of requested Memory
33+
averageUtilization: 80 # Scale if average Memory > 80% of request
34+
35+
behavior:
36+
# SCALE UP BEHAVIOR
37+
scaleUp:
38+
stabilizationWindowSeconds: 30 # Wait 30s before scaling up again
39+
policies:
40+
- type: Percent
41+
value: 100 # Can increase replicas by 100% (double)
42+
periodSeconds: 60 # Within a 60-second window
43+
44+
# SCALE DOWN BEHAVIOR
45+
scaleDown:
46+
stabilizationWindowSeconds: 300 # Wait 5 minutes before scaling down
47+
policies:
48+
- type: Percent
49+
value: 50 # Reduce at most 50% of pods at once
50+
periodSeconds: 60 # Within a 60-second window

k8s/ingress.yaml

Lines changed: 44 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,44 @@
1+
apiVersion: networking.k8s.io/v1
2+
kind: Ingress
3+
4+
metadata:
5+
name: metadata-frontend-ingress
6+
annotations:
7+
nginx.ingress.kubernetes.io/load-balance: "round_robin" # Load balancing strategy
8+
nginx.ingress.kubernetes.io/ssl-redirect: "true"
9+
10+
spec:
11+
ingressClassName: nginx # Must match installed ingress controller
12+
13+
# TLS configuration (HTTPS - Port 443)
14+
# Only enabled for public domain
15+
tls:
16+
- hosts:
17+
- coldemailgenerator.online # Public domain secured with HTTPS
18+
secretName: coldemailgenerator-tls # TLS secret containing certificate & key
19+
20+
rules:
21+
22+
# Localhost
23+
- host: localhost
24+
http:
25+
paths:
26+
- path: /
27+
pathType: Prefix
28+
backend:
29+
service:
30+
name: metadata-frontend-service
31+
port:
32+
number: 4000
33+
34+
# Public Domain
35+
- host: coldemailgenerator.online
36+
http:
37+
paths:
38+
- path: /
39+
pathType: Prefix
40+
backend:
41+
service:
42+
name: metadata-frontend-service
43+
port:
44+
number: 4000

k8s/pdb.yaml

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
1+
apiVersion: policy/v1 # API version for PodDisruptionBudget
2+
kind: PodDisruptionBudget # Ensures minimum pod availability
3+
4+
metadata:
5+
name: metadata-frontend-pdb # Name of the PDB
6+
labels:
7+
app: metadata-frontend # Label for grouping
8+
9+
spec:
10+
minAvailable: 1 # At least 1 pod must always remain running
11+
# Even during voluntary disruptions (node drain, upgrades)
12+
13+
selector:
14+
matchLabels:
15+
app: metadata-frontend # Must match Deployment pod labels

k8s/service.yaml

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
apiVersion: v1 # Core Kubernetes API version for Service resources
2+
kind: Service # Defines a stable network endpoint for a set of Pods
3+
4+
metadata:
5+
name: metadata-frontend-service # Service name (used for internal DNS)
6+
labels:
7+
app: metadata-frontend # Label for identifying this Service
8+
9+
spec:
10+
type: ClusterIP # Exposes service internally within the cluster only
11+
# (Default type. Not accessible from outside)
12+
13+
selector:
14+
app: metadata-frontend # Selects Pods with this label
15+
# Must exactly match Deployment pod template labels
16+
17+
ports:
18+
- name: http # Logical name for the port (useful for clarity and future extensions)
19+
protocol: TCP # Protocol used for communication
20+
port: 4000 # Port exposed by the Service inside the cluster
21+
# Other pods will call this port
22+
targetPort: 4000 # Port on the container (matches containerPort in Deployment)
23+
# Traffic received on Service port 4000 is forwarded to container port 4000

rough/Lecture-Summarize

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
Subproject commit e4d58716840a4474b373cb3c112bea71d734a228

0 commit comments

Comments
 (0)