From 02decb486e8af2b7cd1c3ec7793a0a6f67dc8e2f Mon Sep 17 00:00:00 2001 From: biondizzle Date: Tue, 12 May 2026 21:34:08 +0000 Subject: [PATCH] ba fongol --- build_push.sh | 32 -------------------------------- 1 file changed, 32 deletions(-) diff --git a/build_push.sh b/build_push.sh index cb07c29..63af02a 100644 --- a/build_push.sh +++ b/build_push.sh @@ -33,38 +33,6 @@ echo "$CR_PASS" | docker login "$CR_URL" -u "$CR_USER" --password-stdin echo "[3/4] Pushing image..." docker push "$IMAGE_TAG" -echo "[4/4] Updating docker-compose..." -cat > "${COMPOSE_DIR}/docker-compose.yml" << 'EOF' -services: - vllm: - image: atl.vultrcr.com/vllm/vllm-dsv4-nvfp4:latest - container_name: nvidia-meeting-vllm-1 - ports: - - "8000:8000" - volumes: - - /root/nvidia-meeting/DeepSeek-V4-Pro-NVFP4:/model - environment: - - VLLM_USE_FLASHINFER_MOE_FP4=1 - - OMP_NUM_THREADS=128 - deploy: - resources: - reservations: - devices: - - driver: nvidia - count: 8 - capabilities: [gpu] - command: > - --model /model - --tensor-parallel-size 8 - --max-model-len 65536 - --trust-remote-code - --enforce-eager - --kv-cache-dtype fp8 - --port 8000 - --enable-expert-parallel - --tokenizer-mode=deepseek_v4 -EOF - echo "============================================" echo "DONE! Container pushed to $IMAGE_TAG" echo "Start with: cd $COMPOSE_DIR && docker compose up -d"