Block a user
boligportal-crawler (156e101cd30a28c49dc74c40290bd3e3b34b68ab)
Published 2025-07-07 19:16:32 +00:00 by mirza
Installation
docker pull git.mirzahasanbasic.dk/mirza/boligportal-crawler:156e101cd30a28c49dc74c40290bd3e3b34b68absha256:82ade90cfa8dcd1c06f0fbb7f131c2c1c0231720e75dd1d46045dfa8a69b76b4
Image Layers
| # debian.sh --arch 'amd64' out/ 'bookworm' '@1751241600' |
| ENV PATH=/usr/local/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin |
| ENV LANG=C.UTF-8 |
| RUN /bin/sh -c set -eux; apt-get update; apt-get install -y --no-install-recommends ca-certificates netbase tzdata ; rm -rf /var/lib/apt/lists/* # buildkit |
| ENV GPG_KEY=A035C8C19219BA821ECEA86B64E628F8D684696D |
| ENV PYTHON_VERSION=3.11.13 |
| ENV PYTHON_SHA256=8fb5f9fbc7609fa822cb31549884575db7fd9657cbffb89510b5d7975963a83a |
| RUN /bin/sh -c set -eux; savedAptMark="$(apt-mark showmanual)"; apt-get update; apt-get install -y --no-install-recommends dpkg-dev gcc gnupg libbluetooth-dev libbz2-dev libc6-dev libdb-dev libffi-dev libgdbm-dev liblzma-dev libncursesw5-dev libreadline-dev libsqlite3-dev libssl-dev make tk-dev uuid-dev wget xz-utils zlib1g-dev ; wget -O python.tar.xz "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz"; echo "$PYTHON_SHA256 *python.tar.xz" | sha256sum -c -; wget -O python.tar.xz.asc "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz.asc"; GNUPGHOME="$(mktemp -d)"; export GNUPGHOME; gpg --batch --keyserver hkps://keys.openpgp.org --recv-keys "$GPG_KEY"; gpg --batch --verify python.tar.xz.asc python.tar.xz; gpgconf --kill all; rm -rf "$GNUPGHOME" python.tar.xz.asc; mkdir -p /usr/src/python; tar --extract --directory /usr/src/python --strip-components=1 --file python.tar.xz; rm python.tar.xz; cd /usr/src/python; gnuArch="$(dpkg-architecture --query DEB_BUILD_GNU_TYPE)"; ./configure --build="$gnuArch" --enable-loadable-sqlite-extensions --enable-optimizations --enable-option-checking=fatal --enable-shared $(test "$gnuArch" != 'riscv64-linux-musl' && echo '--with-lto') --with-ensurepip ; nproc="$(nproc)"; EXTRA_CFLAGS="$(dpkg-buildflags --get CFLAGS)"; LDFLAGS="$(dpkg-buildflags --get LDFLAGS)"; LDFLAGS="${LDFLAGS:--Wl},--strip-all"; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:-}" ; rm python; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:--Wl},-rpath='\$\$ORIGIN/../lib'" python ; make install; cd /; rm -rf /usr/src/python; find /usr/local -depth \( \( -type d -a \( -name test -o -name tests -o -name idle_test \) \) -o \( -type f -a \( -name '*.pyc' -o -name '*.pyo' -o -name 'libpython*.a' \) \) \) -exec rm -rf '{}' + ; ldconfig; apt-mark auto '.*' > /dev/null; apt-mark manual $savedAptMark; find /usr/local -type f -executable -not \( -name '*tkinter*' \) -exec ldd '{}' ';' | awk '/=>/ { so = $(NF-1); if (index(so, "/usr/local/") == 1) { next }; gsub("^/(usr/)?", "", so); printf "*%s\n", so }' | sort -u | xargs -r dpkg-query --search | cut -d: -f1 | sort -u | xargs -r apt-mark manual ; apt-get purge -y --auto-remove -o APT::AutoRemove::RecommendsImportant=false; rm -rf /var/lib/apt/lists/*; export PYTHONDONTWRITEBYTECODE=1; python3 --version; pip3 install --disable-pip-version-check --no-cache-dir --no-compile 'setuptools==65.5.1' 'wheel<0.46' ; pip3 --version # buildkit |
| RUN /bin/sh -c set -eux; for src in idle3 pip3 pydoc3 python3 python3-config; do dst="$(echo "$src" | tr -d 3)"; [ -s "/usr/local/bin/$src" ]; [ ! -e "/usr/local/bin/$dst" ]; ln -svT "$src" "/usr/local/bin/$dst"; done # buildkit |
| CMD ["python3"] |
| WORKDIR /app |
| RUN /bin/sh -c apt-get update && apt-get install -y wget gnupg unzip curl tor supervisor build-essential postgresql-client redis-tools && rm -rf /var/lib/apt/lists/* # buildkit |
| RUN /bin/sh -c wget -q -O - https://dl-ssl.google.com/linux/linux_signing_key.pub | apt-key add - && echo "deb http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list && apt-get update && apt-get install -y google-chrome-stable && rm -rf /var/lib/apt/lists/* # buildkit |
| RUN /bin/sh -c CHROME_VERSION=$(google-chrome --version | awk '{print $3}' | cut -d. -f1) && if [ "$CHROME_VERSION" -ge "115" ]; then DRIVER_VERSION=$(curl -s "https://googlechromelabs.github.io/chrome-for-testing/LATEST_RELEASE_${CHROME_VERSION}") && wget -O /tmp/chromedriver.zip "https://storage.googleapis.com/chrome-for-testing-public/${DRIVER_VERSION}/linux64/chromedriver-linux64.zip" && unzip /tmp/chromedriver.zip -d /tmp/ && mv /tmp/chromedriver-linux64/chromedriver /usr/local/bin/ && rm -rf /tmp/chromedriver.zip /tmp/chromedriver-linux64; else wget -O /tmp/chromedriver.zip "https://chromedriver.storage.googleapis.com/LATEST_RELEASE_${CHROME_VERSION}/chromedriver_linux64.zip" && unzip /tmp/chromedriver.zip -d /usr/local/bin/ && rm /tmp/chromedriver.zip; fi && chmod +x /usr/local/bin/chromedriver # buildkit |
| RUN /bin/sh -c useradd -r -s /bin/false tor && mkdir -p /var/lib/tor /var/log/tor /etc/tor && chown -R tor:tor /var/lib/tor /var/log/tor # buildkit |
| COPY requirements.txt . # buildkit |
| RUN /bin/sh -c pip install --no-cache-dir -r requirements.txt # buildkit |
| COPY docker/ /docker-config/ # buildkit |
| COPY docker/torrc /etc/tor/torrc # buildkit |
| COPY docker/supervisord.conf /etc/supervisor/conf.d/supervisord.conf # buildkit |
| COPY . . # buildkit |
| RUN /bin/sh -c pip install -e . # buildkit |
| RUN /bin/sh -c useradd -m -u 1000 crawler && chown -R crawler:crawler /app # buildkit |
| COPY docker/entrypoint.sh /entrypoint.sh # buildkit |
| RUN /bin/sh -c chmod +x /entrypoint.sh # buildkit |
| HEALTHCHECK &{["CMD-SHELL" "/docker-config/healthcheck.sh || exit 1"] "30s" "15s" "1m0s" "0s" '\x03'} |
| EXPOSE map[8000/tcp:{}] |
| ENTRYPOINT ["/entrypoint.sh"] |
Details
2025-07-07 19:16:32 +00:00
Versions (41)
View all
Container
0
OCI / Docker
linux/amd64
509 MiB
latest
2025-08-06
20250806
2025-08-06
a94f98c75ed4b40b5484fd6b205f9deb864f35a3
2025-08-06
20250730
2025-07-30
13a31dbae99b52db7048fc8e379d3b3e06fd21f9
2025-07-30