Kubernetes Deployment

Prerequisites

Kubernetes 1.28+
Helm 3+
kubectl configured
Storage class for persistent volumes

Quick Start

# Add Helm repo
helm repo add aip https://charts.runtools.ai/aip
helm repo update

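# Install (replace your-secret-key with your own JWT secret; the values.yaml example below suggests at least 32 characters)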
helm install aip-hub aip/aip-hub \
  --namespace aip \
  --create-namespace \
  --set config.jwtSecret=your-secret-key

Configuration

values.yaml

# AIP Hub
hub:
  replicas: 2
  resources:
    requests:
      cpu: "500m"
      memory: "1Gi"
    limits:
      cpu: "1"
      memory: "2Gi"

# Database (external recommended for production)
postgresql:
  enabled: false  # Use external
  external:
    host: your-postgres-host
    port: 5432
    database: aip
    username: aip
    password: your-password

# Redis (optional but recommended)
redis:
  enabled: true
  resources:
    requests:
      cpu: "100m"
      memory: "128Mi"

# Configuration
config:
  jwtSecret: "your-jwt-secret-min-32-chars"
  
  # Embeddings
  openaiApiKey: "sk-..."
  embeddingModel: "text-embedding-3-small"
  
  # Auth (optional)
  authProvider: "oidc"
  oidcIssuer: "https://auth.yourcompany.com"
  oidcClientId: "aip-hub"
  oidcClientSecret: "..."
  
  # RunTools connection
  runtoolsApiKey: "rt_..."

# Ingress
ingress:
  enabled: true
  className: nginx
  annotations:
    cert-manager.io/cluster-issuer: letsencrypt-prod
  hosts:
    - host: aip.yourcompany.com
      paths:
        - path: /
          pathType: Prefix
  tls:
    - hosts:
        - aip.yourcompany.com
      secretName: aip-hub-tls

# Storage
storage:
  class: "standard"
  size: "10Gi"

Install

helm install aip-hub aip/aip-hub \
  --namespace aip \
  --create-namespace \
  -f values.yaml

Verify

# Check pods
kubectl get pods -n aip

# Check services
kubectl get svc -n aip

# Check ingress
kubectl get ingress -n aip

# API health (port-forward runs in the foreground; run curl from a second terminal)
kubectl port-forward svc/aip-hub 3000:3000 -n aip
curl http://localhost:3000/health

Scaling

# Scale hub replicas
kubectl scale deployment aip-hub --replicas=4 -n aip

Autoscaling

apiVersion: autoscaling/v2
kind: HorizontalPodAutoscaler
metadata:
  name: aip-hub-hpa
  namespace: aip
spec:
  scaleTargetRef:
    apiVersion: apps/v1
    kind: Deployment
    name: aip-hub
  minReplicas: 2
  maxReplicas: 10
  metrics:
    - type: Resource
      resource:
        name: cpu
        target:
          type: Utilization
          averageUtilization: 70

Monitoring

Prometheus

# values.yaml
monitoring:
  prometheus:
    enabled: true
    serviceMonitor:
      enabled: true

Metrics exposed:

aip_invocations_total
aip_sessions_active
aip_blocks_total
aip_embedding_latency_seconds

Backup

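# Back up PostgreSQL (if using the in-cluster database)
# Note: if backup.sql contains stray carriage returns, drop the -t flag (TTY) from kubectl exec.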
kubectl exec -it aip-postgresql-0 -n aip -- \
  pg_dump -U aip aip > backup.sql

# Back up the whole namespace with Velero
velero backup create aip-backup \
  --include-namespaces aip

Upgrading

# Update repo
helm repo update

# Upgrade
helm upgrade aip-hub aip/aip-hub \
  --namespace aip \
  -f values.yaml

Troubleshooting

Pods not starting

# Check events
kubectl describe pod <pod-name> -n aip

# Check logs
kubectl logs <pod-name> -n aip

Database connection issues

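# Test connection from pod
# Note: $DATABASE_URL is expanded by your local shell before kubectl runs;
# to use the value set inside the pod, wrap the command in sh -c '...'.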
kubectl exec -it <pod-name> -n aip -- \
  psql $DATABASE_URL -c "SELECT 1"

Storage issues

# Check PVCs
kubectl get pvc -n aip

# Check storage class
kubectl get sc

Getting Started

Platform

Core Features

Advanced

Self-Hosted

Kubernetes Deployment

Prerequisites

Quick Start

Configuration

values.yaml

Install

Verify

Scaling

Autoscaling

Monitoring

Prometheus

Backup

Upgrading

Troubleshooting

Pods not starting

Database connection issues

Storage issues

Getting Started

Platform

Core Features

Advanced

Self-Hosted

Prerequisites

Quick Start

Configuration

values.yaml

Install

Verify

Scaling

Autoscaling

Monitoring

Prometheus

Backup

Upgrading

Troubleshooting

Pods not starting

Database connection issues

Storage issues

Prerequisites

Quick Start

Configuration

values.yaml

Install

Verify

Scaling

Autoscaling

Monitoring

Prometheus

Backup

Upgrading

Troubleshooting

Pods not starting

Database connection issues

Storage issues