runpod-colpali-embedding-server (latest)

2025-09-04T15:56:03Z

Pull the image from the command line:

docker pull gitea.mbpvps.us/matifuentes/runpod-colpali-embedding-server:latest

Digest

sha256:91b2189b38d52a918fe477f9de13ac27d508301ca337b19afdb781e49b11eaa3

For more information on the Container registry, see the documentation.

# Base OS layers. The two labels below identify the root filesystem as
# ubuntu 22.04. RELEASE and LAUNCHPAD_BUILD_ARCH are declared as build
# arguments but are not referenced by any later instruction in this listing.
ARG RELEASE

ARG LAUNCHPAD_BUILD_ARCH

LABEL org.opencontainers.image.ref.name=ubuntu

LABEL org.opencontainers.image.version=22.04

# Adds a content-addressed file from the build context into "/".
# NOTE(review): presumably the Ubuntu root filesystem tarball — confirm against the upstream base image.
ADD file:63d5ab3ef0aab308c0e71cb67292c5467f60deafa9b0418cbb220affcd078444 in /

# Default command of the base layers; a later CMD at the end of this listing replaces it.
CMD ["/bin/bash"]

# CUDA 11.8 base layers: register the NVIDIA apt keyring, install the CUDA
# runtime (cudart) plus the compat package, and expose the NVIDIA library and
# binary directories through ld.so configuration, PATH and LD_LIBRARY_PATH.
ENV NVARCH=x86_64

# Driver/CUDA requirement expression (cuda>=11.8, or a 470-series driver for the listed brands).
# NOTE(review): presumably evaluated by the NVIDIA container runtime at start-up — confirm.
ENV NVIDIA_REQUIRE_CUDA=cuda>=11.8 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471

# Exact package version / name consumed by the cudart install step below.
ENV NV_CUDA_CUDART_VERSION=11.8.89-1

ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-11-8

ARG TARGETARCH

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

# Installs gnupg2, curl and ca-certificates, downloads and installs the
# cuda-keyring package for ${NVARCH}, then purges curl and clears the apt
# lists in the same layer.
# NOTE(review): the "|1 TARGETARCH=amd64" prefix looks like the history renderer's
# record of the one build argument in effect for this step — confirm.
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.0-1_all.deb && dpkg -i cuda-keyring_1.0-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

ENV CUDA_VERSION=11.8.0

# Installs cudart pinned to NV_CUDA_CUDART_VERSION together with the compat package.
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-11-8=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

# Appends the two NVIDIA library directories to /etc/ld.so.conf.d/nvidia.conf.
RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

# NVIDIA and CUDA bin directories are placed ahead of the system directories.
ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

# NOTE(review): presumably read by the NVIDIA container runtime to select GPUs
# and driver capabilities — confirm.
ENV NVIDIA_VISIBLE_DEVICES=all

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

# CUDA 11.8 runtime-library layers: the ENV values below pin the package
# versions that the single apt-get install step further down consumes.
ENV NV_CUDA_LIB_VERSION=11.8.0-1

ENV NV_NVTX_VERSION=11.8.86-1

ENV NV_LIBNPP_VERSION=11.8.0.86-1

ENV NV_LIBNPP_PACKAGE=libnpp-11-8=11.8.0.86-1

ENV NV_LIBCUSPARSE_VERSION=11.7.5.86-1

ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-11-8

ENV NV_LIBCUBLAS_VERSION=11.11.3.6-1

ENV NV_LIBCUBLAS_PACKAGE=libcublas-11-8=11.11.3.6-1

ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2

ENV NV_LIBNCCL_PACKAGE_VERSION=2.15.5-1

ENV NCCL_VERSION=2.15.5-1

ENV NV_LIBNCCL_PACKAGE=libnccl2=2.15.5-1+cuda11.8

ARG TARGETARCH

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

# Installs cuda-libraries, libnpp, nvtx, libcusparse, libcublas and libnccl2 at
# the versions pinned above, clearing the apt lists in the same layer.
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-11-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-11-8=${NV_NVTX_VERSION} libcusparse-11-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

# Marks libcublas and libnccl2 as held so later apt operations do not change their versions.
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit

# Entrypoint script and its drop-in directory are copied under /opt/nvidia.
COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit

COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit

ENV NVIDIA_PRODUCT_NAME=CUDA

# No later ENTRYPOINT appears in this listing, so the final CMD is passed to this script as arguments.
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]

# Application-level environment for the embedding server layers that follow.
ENV PYTHONUNBUFFERED=1

# NOTE(review): set with ENV, so this value also persists into the running
# container's environment, not only the apt-get step below.
ENV DEBIAN_FRONTEND=noninteractive

# pip defaults: no download cache, no "new pip version" check.
ENV PIP_NO_CACHE_DIR=1

ENV PIP_DISABLE_PIP_VERSION_CHECK=1

# All three Hugging Face cache variables point at the same directory, which is
# also the cache_dir used by the model pre-download script later in this listing.
ENV HF_HOME=/workspace/hf_cache

# NOTE(review): recent transformers releases reportedly deprecate
# TRANSFORMERS_CACHE in favour of HF_HOME — confirm before relying on it.
ENV TRANSFORMERS_CACHE=/workspace/hf_cache

ENV HF_DATASETS_CACHE=/workspace/hf_cache

# Working directory for the remaining steps; relative paths (e.g. "COPY main.py ./") resolve here.
WORKDIR /workspace

# System packages: Python 3.10 with headers and pip, plus git, wget and curl.
# The apt lists are removed, then the package cache is cleaned and unneeded
# packages auto-removed, all within this one layer.
RUN /bin/sh -c apt-get update && apt-get install -y --no-install-recommends python3.10 python3-pip python3.10-dev git wget curl && rm -rf /var/lib/apt/lists/* && apt-get clean && apt-get autoremove -y # buildkit

# Makes "python" resolve to python3.10; later steps and the final CMD invoke "python".
RUN /bin/sh -c ln -s /usr/bin/python3.10 /usr/bin/python # buildkit

# Python dependency layers.
#
# Every requirement that carries a version specifier is double-quoted. These
# commands run through "/bin/sh -c", where an unquoted ">" is a redirection
# operator: `pkg>=1.0` installs an unconstrained `pkg` and redirects pip's
# stdout into a stray file named "=1.0" in the working directory. Quoting
# makes pip actually receive the minimum-version constraint.

# PyTorch stack from the CUDA 11.8 wheel index (no specifiers, so no quoting needed).
RUN /bin/sh -c pip install --no-cache-dir torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118 # buildkit

# Serving and model-runtime libraries.
RUN /bin/sh -c pip install --no-cache-dir "runpod>=1.6.2" "transformers>=4.40.0" "pillow>=10.0.0" "requests>=2.31.0" "accelerate>=0.20.0" # buildkit

# ColPali engine and Qwen-VL helper utilities.
RUN /bin/sh -c pip install --no-cache-dir "colpali-engine>=0.2.0" "qwen-vl-utils>=0.0.5" # buildkit

# flash-attn is best-effort: if the install fails, a message is printed and the build continues.
RUN /bin/sh -c pip install --no-cache-dir "flash-attn>=2.5.0" || echo "Flash attention installation failed, continuing without it" # buildkit

# Writes /tmp/download_model.py. The generated script creates /workspace/hf_cache,
# then loads the processor and the model for "vidore/colqwen2-v1.0" into that
# cache directory (bfloat16, device_map="cpu", trust_remote_code=True).
# NOTE(review): the script text relies on echo turning the literal "\n"
# sequences into newlines; that is shell-implementation specific — confirm
# that /bin/sh in this image behaves that way.
RUN /bin/sh -c echo 'import os\nimport torch\nfrom transformers import Qwen2VLForConditionalGeneration, AutoProcessor\nprint("Pre-downloading model weights...")\ncache_dir = "/workspace/hf_cache"\nos.makedirs(cache_dir, exist_ok=True)\nmodel_name = "vidore/colqwen2-v1.0"\nprint("Downloading processor...")\nprocessor = AutoProcessor.from_pretrained(model_name, cache_dir=cache_dir, trust_remote_code=True)\nprint("Downloading model...")\nmodel = Qwen2VLForConditionalGeneration.from_pretrained(model_name, torch_dtype=torch.bfloat16, cache_dir=cache_dir, trust_remote_code=True, device_map="cpu")\nprint("Model and processor downloaded successfully!")' > /tmp/download_model.py # buildkit

# Runs the download script, then deletes it together with /tmp, /var/tmp and
# /root/.cache contents. The script is chained with "&&", so a failed download fails this step.
RUN /bin/sh -c python /tmp/download_model.py && rm /tmp/download_model.py && rm -rf /tmp/* /var/tmp/* /root/.cache # buildkit

# Import smoke test for qwen_vl_utils. Because of the "|| echo" fallback, an
# import failure only prints a message and does not fail the build.
RUN /bin/sh -c python -c "from qwen_vl_utils import process_vision_info; print('qwen-vl-utils imported successfully')" || echo "qwen-vl-utils import failed" # buildkit

# Application entry script, copied into the current WORKDIR (/workspace).
COPY main.py ./ # buildkit

# Generates /workspace/health_check.sh and marks it executable. The script
# imports torch and prints whether CUDA is available and how many devices exist.
# NOTE(review): the Python snippet only prints these values; it never exits
# non-zero when CUDA is unavailable, so the health check can only fail if
# python or the torch import itself fails. It also imports torch on every probe.
RUN /bin/sh -c echo '#!/bin/bash\npython -c "import torch; print(f\"CUDA available: {torch.cuda.is_available()}\"); print(f\"CUDA devices: {torch.cuda.device_count()}\")"' > /workspace/health_check.sh && chmod +x /workspace/health_check.sh # buildkit

# Serialized form of the exposed-port set; presumably equivalent to "EXPOSE 8000/tcp" — confirm.
EXPOSE map[8000/tcp:{}]

# Serialized health-check configuration running "/workspace/health_check.sh || exit 1" via CMD-SHELL.
# NOTE(review): the trailing fields look like interval=30s, timeout=30s,
# start-period=2m, start-interval=0s and retries=3 ('\x03') — confirm against the original Dockerfile.
HEALTHCHECK &{["CMD-SHELL" "/workspace/health_check.sh || exit 1"] "30s" "30s" "2m0s" "0s" '\x03'}

# Default command: runs main.py with python. Rendered here without the comma
# a Dockerfile JSON array would have; presumably CMD ["python", "main.py"] in the original.
CMD ["python" "main.py"]

Key	Value
maintainer	NVIDIA CORPORATION <cudatools@nvidia.com>
org.opencontainers.image.ref.name	ubuntu
org.opencontainers.image.version	22.04

Details

Container

2025-09-04 15:56:03 +00:00

52

OCI / Docker

linux/amd64

12 GiB

Versions (1) View all

latest

2025-09-04

runpod-colpali-embedding-server (latest)

Installation

Image Layers

Labels