diederik
  • Joined on 2026-01-12

crawl4ai (0.8.6-hhe)

Published 2026-04-17 11:17:09 +00:00 by diederik

Installation

docker pull git.henhouse.group/diederik/crawl4ai:0.8.6-hhe
sha256:e84d568482e0d026053f37ad7c05b571c0665bcbd023018a21ecaf5e8b215fff

Images

Digest OS / Arch Size
e49afa28a3 linux/amd64 1.4 GiB

Image Layers ( linux/amd64)

# debian.sh --arch 'amd64' out/ 'bookworm' '@1773619200'
ENV PATH=/usr/local/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
ENV LANG=C.UTF-8
RUN /bin/sh -c set -eux; apt-get update; apt-get install -y --no-install-recommends ca-certificates netbase tzdata ; rm -rf /var/lib/apt/lists/* # buildkit
ENV GPG_KEY=7169605F62C751356D054A26A821E680E5FA6305
ENV PYTHON_VERSION=3.12.13
ENV PYTHON_SHA256=c08bc65a81971c1dd5783182826503369466c7e67374d1646519adf05207b684
RUN /bin/sh -c set -eux; savedAptMark="$(apt-mark showmanual)"; apt-get update; apt-get install -y --no-install-recommends dpkg-dev gcc gnupg libbluetooth-dev libbz2-dev libc6-dev libdb-dev libffi-dev libgdbm-dev liblzma-dev libncursesw5-dev libreadline-dev libsqlite3-dev libssl-dev make tk-dev uuid-dev wget xz-utils zlib1g-dev ; wget -O python.tar.xz "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz"; echo "$PYTHON_SHA256 *python.tar.xz" | sha256sum -c -; wget -O python.tar.xz.asc "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz.asc"; GNUPGHOME="$(mktemp -d)"; export GNUPGHOME; gpg --batch --keyserver hkps://keys.openpgp.org --recv-keys "$GPG_KEY"; gpg --batch --verify python.tar.xz.asc python.tar.xz; gpgconf --kill all; rm -rf "$GNUPGHOME" python.tar.xz.asc; mkdir -p /usr/src/python; tar --extract --directory /usr/src/python --strip-components=1 --file python.tar.xz; rm python.tar.xz; cd /usr/src/python; gnuArch="$(dpkg-architecture --query DEB_BUILD_GNU_TYPE)"; ./configure --build="$gnuArch" --enable-loadable-sqlite-extensions --enable-optimizations --enable-option-checking=fatal --enable-shared $(test "${gnuArch%%-*}" != 'riscv64' && echo '--with-lto') --with-ensurepip ; nproc="$(nproc)"; EXTRA_CFLAGS="$(dpkg-buildflags --get CFLAGS)"; LDFLAGS="$(dpkg-buildflags --get LDFLAGS)"; LDFLAGS="${LDFLAGS:-} -Wl,--strip-all"; arch="$(dpkg --print-architecture)"; arch="${arch##*-}"; case "$arch" in amd64|arm64) EXTRA_CFLAGS="${EXTRA_CFLAGS:-} -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"; ;; i386) ;; *) EXTRA_CFLAGS="${EXTRA_CFLAGS:-} -fno-omit-frame-pointer"; ;; esac; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:-}" ; rm python; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:-} -Wl,-rpath='\$\$ORIGIN/../lib'" python ; make install; cd /; rm -rf /usr/src/python; find /usr/local -depth \( \( -type d -a \( -name test -o -name tests -o -name idle_test \) \) -o \( -type f -a \( -name '*.pyc' -o -name '*.pyo' -o -name 'libpython*.a' \) \) \) -exec rm -rf '{}' + ; ldconfig; apt-mark auto '.*' > /dev/null; apt-mark manual $savedAptMark; find /usr/local -type f -executable -not \( -name '*tkinter*' \) -exec ldd '{}' ';' | awk '/=>/ { so = $(NF-1); if (index(so, "/usr/local/") == 1) { next }; gsub("^/(usr/)?", "", so); printf "*%s\n", so }' | sort -u | xargs -rt dpkg-query --search | awk 'sub(":$", "", $1) { print $1 }' | sort -u | xargs -r apt-mark manual ; apt-get purge -y --auto-remove -o APT::AutoRemove::RecommendsImportant=false; rm -rf /var/lib/apt/lists/*; export PYTHONDONTWRITEBYTECODE=1; python3 --version; pip3 --version # buildkit
RUN /bin/sh -c set -eux; for src in idle3 pip3 pydoc3 python3 python3-config; do dst="$(echo "$src" | tr -d 3)"; [ -s "/usr/local/bin/$src" ]; [ ! -e "/usr/local/bin/$dst" ]; ln -svT "$src" "/usr/local/bin/$dst"; done # buildkit
CMD ["python3"]
ARG C4AI_VER=0.8.6
ENV C4AI_VERSION=0.8.6
LABEL c4ai.version=0.8.6
ARG APP_HOME=/app
ARG GITHUB_REPO=https://github.com/unclecode/crawl4ai.git
ARG GITHUB_BRANCH=main
ARG USE_LOCAL=true
ENV PYTHONFAULTHANDLER=1 PYTHONHASHSEED=random PYTHONUNBUFFERED=1 PIP_NO_CACHE_DIR=1 PYTHONDONTWRITEBYTECODE=1 PIP_DISABLE_PIP_VERSION_CHECK=1 PIP_DEFAULT_TIMEOUT=100 DEBIAN_FRONTEND=noninteractive REDIS_HOST=localhost REDIS_PORT=6379
ARG PYTHON_VERSION=3.12
ARG INSTALL_TYPE=default
ARG ENABLE_GPU=false
ARG TARGETARCH=amd64
ARG REDIS_VERSION=6:7.2.7-1rl1~bookworm1
LABEL maintainer=unclecode
LABEL description=🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper
LABEL version=1.0
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends curl gnupg && rm -rf /var/lib/apt/lists/* # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c curl -fsSL https://packages.redis.io/gpg | gpg --dearmor -o /usr/share/keyrings/redis-archive-keyring.gpg && echo "deb [signed-by=/usr/share/keyrings/redis-archive-keyring.gpg] https://packages.redis.io/deb bookworm main" > /etc/apt/sources.list.d/redis.list # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends build-essential curl wget gnupg git cmake pkg-config python3-dev libjpeg-dev redis-tools${REDIS_VERSION:+=$REDIS_VERSION} redis-server${REDIS_VERSION:+=$REDIS_VERSION} supervisor && apt-get clean && rm -rf /var/lib/apt/lists/* # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends libglib2.0-0 libnss3 libnspr4 libatk1.0-0 libatk-bridge2.0-0 libcups2 libdrm2 libdbus-1-3 libxcb1 libxkbcommon0 libx11-6 libxcomposite1 libxdamage1 libxext6 libxfixes3 libxrandr2 libgbm1 libpango-1.0-0 libcairo2 libasound2 libatspi2.0-0 && apt-get clean && rm -rf /var/lib/apt/lists/* # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c apt-get update && apt-get dist-upgrade -y && rm -rf /var/lib/apt/lists/* # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c if [ "$ENABLE_GPU" = "true" ] && [ "$TARGETARCH" = "amd64" ] ; then apt-get update && apt-get install -y --no-install-recommends nvidia-cuda-toolkit && apt-get clean && rm -rf /var/lib/apt/lists/* ; else echo "Skipping NVIDIA CUDA Toolkit installation (unsupported platform or GPU disabled)"; fi # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c if [ "$TARGETARCH" = "arm64" ]; then echo "🦾 Installing ARM-specific optimizations"; apt-get update && apt-get install -y --no-install-recommends libopenblas-dev && apt-get clean && rm -rf /var/lib/apt/lists/*; elif [ "$TARGETARCH" = "amd64" ]; then echo "🖥️ Installing AMD64-specific optimizations"; apt-get update && apt-get install -y --no-install-recommends libomp-dev && apt-get clean && rm -rf /var/lib/apt/lists/*; else echo "Skipping platform-specific optimizations (unsupported platform)"; fi # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c groupadd -r appuser && useradd --no-log-init -r -g appuser appuser # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c mkdir -p /home/appuser && chown -R appuser:appuser /home/appuser # buildkit
WORKDIR /app
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c echo '#!/bin/bash\nif [ "$USE_LOCAL" = "true" ]; then\n echo "📦 Installing from local source..."\n pip install --no-cache-dir /tmp/project/\nelse\n echo "🌐 Installing from GitHub..."\n for i in {1..3}; do \n git clone --branch ${GITHUB_BRANCH} ${GITHUB_REPO} /tmp/crawl4ai && break || \n { echo "Attempt $i/3 failed! Taking a short break... ☕"; sleep 5; }; \n done\n pip install --no-cache-dir /tmp/crawl4ai\nfi' > /tmp/install.sh && chmod +x /tmp/install.sh # buildkit
COPY . /tmp/project/ # buildkit
COPY deploy/docker/supervisord.conf . # buildkit
COPY deploy/docker/requirements.txt . # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c pip install --no-cache-dir -r requirements.txt # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c if [ "$INSTALL_TYPE" = "all" ] ; then pip install --no-cache-dir torch torchvision torchaudio scikit-learn nltk transformers tokenizers && python -m nltk.downloader punkt stopwords ; fi # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c if [ "$INSTALL_TYPE" = "all" ] ; then pip install "/tmp/project/[all]" && python -m crawl4ai.model_loader ; elif [ "$INSTALL_TYPE" = "torch" ] ; then pip install "/tmp/project/[torch]" ; elif [ "$INSTALL_TYPE" = "transformer" ] ; then pip install "/tmp/project/[transformer]" && python -m crawl4ai.model_loader ; else pip install "/tmp/project" ; fi # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c pip install --no-cache-dir --upgrade pip && /tmp/install.sh && python -c "import crawl4ai; print('✅ crawl4ai is ready to rock!')" && python -c "from playwright.sync_api import sync_playwright; print('✅ Playwright is feeling dramatic!')" # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c crawl4ai-setup # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c playwright install --with-deps # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c mkdir -p /home/appuser/.cache/ms-playwright && cp -r /root/.cache/ms-playwright/chromium-* /home/appuser/.cache/ms-playwright/ && chown -R appuser:appuser /home/appuser/.cache/ms-playwright # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c crawl4ai-doctor # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c mkdir -p /home/appuser/.cache && chown -R appuser:appuser /home/appuser/.cache # buildkit
COPY deploy/docker/* /app/ # buildkit
COPY deploy/docker/static /app/static # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c chown -R appuser:appuser ${APP_HOME} # buildkit
RUN |10 C4AI_VER=0.8.6 APP_HOME=/app GITHUB_REPO=https://github.com/unclecode/crawl4ai.git GITHUB_BRANCH=main USE_LOCAL=true PYTHON_VERSION=3.12 INSTALL_TYPE=default ENABLE_GPU=false TARGETARCH=amd64 REDIS_VERSION=6:7.2.7-1rl1~bookworm1 /bin/sh -c mkdir -p /var/lib/redis /var/log/redis && chown -R appuser:appuser /var/lib/redis /var/log/redis # buildkit
HEALTHCHECK &{["CMD-SHELL" "bash -c ' MEM=$(free -m | awk \"/^Mem:/{print \\$2}\"); if [ $MEM -lt 2048 ]; then echo \"⚠️ Warning: Less than 2GB RAM available! Your container might need a memory boost! 🚀\"; exit 1; fi && redis-cli ping > /dev/null && curl -f http://localhost:11235/health || exit 1'"] "30s" "10s" "5s" "0s" '\x03'}
EXPOSE [6379/tcp]
USER appuser
ENV PYTHON_ENV=production
CMD ["supervisord" "-c" "supervisord.conf"]
COPY config.yml /app/config.yml # buildkit

Labels

Key Value
c4ai.version 0.8.6
description 🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper
maintainer unclecode
version 1.0
Details
Container
2026-04-17 11:17:09 +00:00
0
OCI / Docker
Versions (1) View all
0.8.6-hhe 2026-04-17