matifuentes
  • Joined on 2025-09-02

runpod-colpali-embedding-server (latest)

Published 2025-09-04 15:56:03 +00:00 by matifuentes

Installation

docker pull gitea.mbpvps.us/matifuentes/runpod-colpali-embedding-server:latest
sha256:91b2189b38d52a918fe477f9de13ac27d508301ca337b19afdb781e49b11eaa3

Image Layers

ARG RELEASE
ARG LAUNCHPAD_BUILD_ARCH
LABEL org.opencontainers.image.ref.name=ubuntu
LABEL org.opencontainers.image.version=22.04
ADD file:63d5ab3ef0aab308c0e71cb67292c5467f60deafa9b0418cbb220affcd078444 in /
CMD ["/bin/bash"]
ENV NVARCH=x86_64
ENV NVIDIA_REQUIRE_CUDA=cuda>=11.8 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471
ENV NV_CUDA_CUDART_VERSION=11.8.89-1
ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-11-8
ARG TARGETARCH
LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.0-1_all.deb && dpkg -i cuda-keyring_1.0-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
ENV CUDA_VERSION=11.8.0
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-11-8=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64
COPY NGC-DL-CONTAINER-LICENSE / # buildkit
ENV NVIDIA_VISIBLE_DEVICES=all
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
ENV NV_CUDA_LIB_VERSION=11.8.0-1
ENV NV_NVTX_VERSION=11.8.86-1
ENV NV_LIBNPP_VERSION=11.8.0.86-1
ENV NV_LIBNPP_PACKAGE=libnpp-11-8=11.8.0.86-1
ENV NV_LIBCUSPARSE_VERSION=11.7.5.86-1
ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-11-8
ENV NV_LIBCUBLAS_VERSION=11.11.3.6-1
ENV NV_LIBCUBLAS_PACKAGE=libcublas-11-8=11.11.3.6-1
ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2
ENV NV_LIBNCCL_PACKAGE_VERSION=2.15.5-1
ENV NCCL_VERSION=2.15.5-1
ENV NV_LIBNCCL_PACKAGE=libnccl2=2.15.5-1+cuda11.8
ARG TARGETARCH
LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-11-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-11-8=${NV_NVTX_VERSION} libcusparse-11-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit
COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit
ENV NVIDIA_PRODUCT_NAME=CUDA
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
ENV PYTHONUNBUFFERED=1
ENV DEBIAN_FRONTEND=noninteractive
ENV PIP_NO_CACHE_DIR=1
ENV PIP_DISABLE_PIP_VERSION_CHECK=1
ENV HF_HOME=/workspace/hf_cache
ENV TRANSFORMERS_CACHE=/workspace/hf_cache
ENV HF_DATASETS_CACHE=/workspace/hf_cache
WORKDIR /workspace
RUN /bin/sh -c apt-get update && apt-get install -y --no-install-recommends python3.10 python3-pip python3.10-dev git wget curl && rm -rf /var/lib/apt/lists/* && apt-get clean && apt-get autoremove -y # buildkit
RUN /bin/sh -c ln -s /usr/bin/python3.10 /usr/bin/python # buildkit
RUN /bin/sh -c pip install --no-cache-dir torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118 # buildkit
RUN /bin/sh -c pip install --no-cache-dir runpod>=1.6.2 transformers>=4.40.0 pillow>=10.0.0 requests>=2.31.0 accelerate>=0.20.0 # buildkit
RUN /bin/sh -c pip install --no-cache-dir colpali-engine>=0.2.0 qwen-vl-utils>=0.0.5 # buildkit
RUN /bin/sh -c pip install --no-cache-dir flash-attn>=2.5.0 || echo "Flash attention installation failed, continuing without it" # buildkit
RUN /bin/sh -c echo 'import os\nimport torch\nfrom transformers import Qwen2VLForConditionalGeneration, AutoProcessor\nprint("Pre-downloading model weights...")\ncache_dir = "/workspace/hf_cache"\nos.makedirs(cache_dir, exist_ok=True)\nmodel_name = "vidore/colqwen2-v1.0"\nprint("Downloading processor...")\nprocessor = AutoProcessor.from_pretrained(model_name, cache_dir=cache_dir, trust_remote_code=True)\nprint("Downloading model...")\nmodel = Qwen2VLForConditionalGeneration.from_pretrained(model_name, torch_dtype=torch.bfloat16, cache_dir=cache_dir, trust_remote_code=True, device_map="cpu")\nprint("Model and processor downloaded successfully!")' > /tmp/download_model.py # buildkit
RUN /bin/sh -c python /tmp/download_model.py && rm /tmp/download_model.py && rm -rf /tmp/* /var/tmp/* /root/.cache # buildkit
RUN /bin/sh -c python -c "from qwen_vl_utils import process_vision_info; print('qwen-vl-utils imported successfully')" || echo "qwen-vl-utils import failed" # buildkit
COPY main.py ./ # buildkit
RUN /bin/sh -c echo '#!/bin/bash\npython -c "import torch; print(f\"CUDA available: {torch.cuda.is_available()}\"); print(f\"CUDA devices: {torch.cuda.device_count()}\")"' > /workspace/health_check.sh && chmod +x /workspace/health_check.sh # buildkit
EXPOSE map[8000/tcp:{}]
HEALTHCHECK &{["CMD-SHELL" "/workspace/health_check.sh || exit 1"] "30s" "30s" "2m0s" "0s" '\x03'}
CMD ["python" "main.py"]

Labels

Key Value
maintainer NVIDIA CORPORATION <cudatools@nvidia.com>
org.opencontainers.image.ref.name ubuntu
org.opencontainers.image.version 22.04
Details
Container
2025-09-04 15:56:03 +00:00
52
OCI / Docker
linux/amd64
12 GiB
Versions (1) View all
latest 2025-09-04