From 553b0228e8cc768c213eb35fcedd3d3c23ff390d Mon Sep 17 00:00:00 2001 From: Jino Jose Date: Tue, 23 Jun 2026 15:27:17 +0530 Subject: [PATCH] MLflow wait_for: ignore_errors so install continues regardless --- ansible/roles/base/tasks/main.yml | 4 ++-- ansible/roles/mlflow/tasks/main.yml | 1 + install.sh | 6 ++++-- 3 files changed, 7 insertions(+), 4 deletions(-) diff --git a/ansible/roles/base/tasks/main.yml b/ansible/roles/base/tasks/main.yml index 50417ed..a76a0cb 100644 --- a/ansible/roles/base/tasks/main.yml +++ b/ansible/roles/base/tasks/main.yml @@ -5,7 +5,7 @@ update_cache: yes cache_valid_time: 3600 -- name: Upgrade all packages +- name: Upgrade all packages (this takes 10–20 min on first run, please wait...) apt: upgrade: dist autoremove: yes @@ -85,7 +85,7 @@ args: creates: /opt/cezen/miniconda/envs/cezen -- name: Install LangChain + LlamaIndex + HuggingFace in conda env +- name: Install LangChain + LlamaIndex + HuggingFace in conda env (5–10 min, please wait...) become_user: cezen shell: | /opt/cezen/miniconda/bin/conda run -n cezen pip install \ diff --git a/ansible/roles/mlflow/tasks/main.yml b/ansible/roles/mlflow/tasks/main.yml index b5659fd..76f33aa 100644 --- a/ansible/roles/mlflow/tasks/main.yml +++ b/ansible/roles/mlflow/tasks/main.yml @@ -54,3 +54,4 @@ host: localhost port: 5000 timeout: 30 + ignore_errors: true diff --git a/install.sh b/install.sh index 6f8f17c..b7862cf 100644 --- a/install.sh +++ b/install.sh @@ -54,8 +54,9 @@ run_phase1() { echo "║ Cezen AI Suite — Phase 1: NVIDIA ║" echo "╚══════════════════════════════════════════╝" + ANSIBLE_STDOUT_CALLBACK=yaml \ ansible-playbook -i localhost, -c local "$ANSIBLE_DIR/phase1_nvidia.yml" \ - -e "tier=$TIER" -v + -e "tier=$TIER" # Register phase 2 as a one-shot systemd service so it runs after reboot cat > /etc/systemd/system/cezen-phase2.service << EOF @@ -100,8 +101,9 @@ run_phase2() { echo "✓ NVIDIA driver: $(nvidia-smi --query-gpu=driver_version --format=csv,noheader | head -1)" fi + ANSIBLE_STDOUT_CALLBACK=yaml \ ansible-playbook -i localhost, -c local "$ANSIBLE_DIR/entry.yml" \ - -e "tier=$TIER" -v + -e "tier=$TIER" # Disable one-shot service so it doesn't run again on next reboot systemctl disable cezen-phase2.service 2>/dev/null || true