MLflow
By Bys on February 7, 2025
MLOps
[MLFlow]
Install MLFlow(Community Version)
values.yaml
ingress:
enabled: true
className: "alb"
annotations:
alb.ingress.kubernetes.io/group.name: mlops
alb.ingress.kubernetes.io/subnets: bys-dev-ue1-sbn-1a-extelb, bys-dev-ue1-sbn-1b-extelb, bys-dev-ue1-sbn-1c-extelb, bys-dev-ue1-sbn-1d-extelb, bys-dev-ue1-sbn-1f-extelb
alb.ingress.kubernetes.io/scheme : internet-facing
alb.ingress.kubernetes.io/listen-ports: '[{"HTTPS": 443}]'
alb.ingress.kubernetes.io/certificate-arn: arn:aws:acm:us-east-1:558846430793:certificate/a5207b24-ae67-49ac-b34e-f34ed0088bca
alb.ingress.kubernetes.io/security-groups: sg-07e6c272df0bed7ee
alb.ingress.kubernetes.io/healthcheck-path: /
alb.ingress.kubernetes.io/healthcheck-interval-seconds: '15'
alb.ingress.kubernetes.io/healthcheck-timeout-seconds: '10'
alb.ingress.kubernetes.io/healthy-threshold-count: '2'
alb.ingress.kubernetes.io/unhealthy-threshold-count: '4'
alb.ingress.kubernetes.io/healthcheck-port: traffic-port
alb.ingress.kubernetes.io/success-codes: 200,302,401
alb.ingress.kubernetes.io/target-type: ip
alb.ingress.kubernetes.io/tags: auto-delete=no
hosts:
- host: mlflow.bys.asia
paths:
- path: /
pathType: Prefix
backendStore:
databaseConnectionCheck: true
postgres:
enabled: true
host: "postgresql.postgresql.svc.cluster.local" # required
port: 5432 # required
database: "mlflow" # required
user: "postgres" # required
password: "postgres" # required
auth:
enabled: true
adminUsername: "admin"
adminPassword: "admin"
defaultPermission: MANAGE
artifactRoot:
s3:
enabled: true
bucket: "minio-mlflow"
path: "artifacts"
awsAccessKeyId: "mlflow"
awsSecretAccessKey: "miniomlflow"
resources:
requests:
cpu: "500m"
memory: "1Gi"
limits:
cpu: "500m"
memory: "1Gi"
serviceAccount:
create: true
name: "mlflow"
extraEnvVars:
MLFLOW_S3_ENDPOINT_URL: http://minio.minio.svc.cluster.local:9000
MLFLOW_S3_IGNORE_TLS: true
# MLFLOW_S3_UPLOAD_EXTRA_ARGS: '{"ServerSideEncryption": "aws:kms", "SSEKMSKeyId": "1234"}'
# AWS_DEFAULT_REGION: my_region
# AWS_CA_BUNDLE: /some/ca/bundle.pem
# MLFLOW_GCS_DEFAULT_TIMEOUT - Sets the standard timeout for transfer operations in seconds (Default: 60). Use -1 for indefinite timeout.
# MLFLOW_GCS_UPLOAD_CHUNK_SIZE - Sets the standard upload chunk size for bigger files in bytes (Default: 104857600 ≙ 100MiB), must be multiple of 256 KB.
# MLFLOW_GCS_DOWNLOAD_CHUNK_SIZE - Sets the standard download chunk size for bigger files in bytes (Default: 104857600 ≙ 100MiB), must be multiple of 256 K
helm repo add community-charts https://community-charts.github.io/helm-charts
helm repo update
helm upgrade -i mlflow community-charts/mlflow -n mlflow -f /Users/bys/workspace/kubernetes/mlops/mlflow/values.yaml
helm uninstall mlflow -n mlflow
mlops
jupyter
mlflow
]