Mirza Hasanbasic mirza
  • Joined on 2023-12-20

boligportal-crawler (39f5b1a69ac8110c4a67e2c27a8ac8f1262e7ae5)

Published 2025-07-25 07:58:49 +00:00 by mirza

Installation

docker pull git.mirzahasanbasic.dk/mirza/boligportal-crawler:39f5b1a69ac8110c4a67e2c27a8ac8f1262e7ae5
sha256:1c29b60ab665faa8374efb0f851d048e683814ef64e2128c8784cb331658ec2a

Image Layers

# debian.sh --arch 'amd64' out/ 'bookworm' '@1753056000'
ENV PATH=/usr/local/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
ENV LANG=C.UTF-8
RUN /bin/sh -c set -eux; apt-get update; apt-get install -y --no-install-recommends ca-certificates netbase tzdata ; rm -rf /var/lib/apt/lists/* # buildkit
ENV GPG_KEY=A035C8C19219BA821ECEA86B64E628F8D684696D
ENV PYTHON_VERSION=3.11.13
ENV PYTHON_SHA256=8fb5f9fbc7609fa822cb31549884575db7fd9657cbffb89510b5d7975963a83a
RUN /bin/sh -c set -eux; savedAptMark="$(apt-mark showmanual)"; apt-get update; apt-get install -y --no-install-recommends dpkg-dev gcc gnupg libbluetooth-dev libbz2-dev libc6-dev libdb-dev libffi-dev libgdbm-dev liblzma-dev libncursesw5-dev libreadline-dev libsqlite3-dev libssl-dev make tk-dev uuid-dev wget xz-utils zlib1g-dev ; wget -O python.tar.xz "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz"; echo "$PYTHON_SHA256 *python.tar.xz" | sha256sum -c -; wget -O python.tar.xz.asc "https://www.python.org/ftp/python/${PYTHON_VERSION%%[a-z]*}/Python-$PYTHON_VERSION.tar.xz.asc"; GNUPGHOME="$(mktemp -d)"; export GNUPGHOME; gpg --batch --keyserver hkps://keys.openpgp.org --recv-keys "$GPG_KEY"; gpg --batch --verify python.tar.xz.asc python.tar.xz; gpgconf --kill all; rm -rf "$GNUPGHOME" python.tar.xz.asc; mkdir -p /usr/src/python; tar --extract --directory /usr/src/python --strip-components=1 --file python.tar.xz; rm python.tar.xz; cd /usr/src/python; gnuArch="$(dpkg-architecture --query DEB_BUILD_GNU_TYPE)"; ./configure --build="$gnuArch" --enable-loadable-sqlite-extensions --enable-optimizations --enable-option-checking=fatal --enable-shared $(test "$gnuArch" != 'riscv64-linux-musl' && echo '--with-lto') --with-ensurepip ; nproc="$(nproc)"; EXTRA_CFLAGS="$(dpkg-buildflags --get CFLAGS)"; LDFLAGS="$(dpkg-buildflags --get LDFLAGS)"; LDFLAGS="${LDFLAGS:--Wl},--strip-all"; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:-}" ; rm python; make -j "$nproc" "EXTRA_CFLAGS=${EXTRA_CFLAGS:-}" "LDFLAGS=${LDFLAGS:--Wl},-rpath='\$\$ORIGIN/../lib'" python ; make install; cd /; rm -rf /usr/src/python; find /usr/local -depth \( \( -type d -a \( -name test -o -name tests -o -name idle_test \) \) -o \( -type f -a \( -name '*.pyc' -o -name '*.pyo' -o -name 'libpython*.a' \) \) \) -exec rm -rf '{}' + ; ldconfig; apt-mark auto '.*' > /dev/null; apt-mark manual $savedAptMark; find /usr/local -type f -executable -not \( -name '*tkinter*' \) -exec ldd '{}' ';' | awk '/=>/ { so = $(NF-1); if (index(so, "/usr/local/") == 1) { next }; gsub("^/(usr/)?", "", so); printf "*%s\n", so }' | sort -u | xargs -r dpkg-query --search | cut -d: -f1 | sort -u | xargs -r apt-mark manual ; apt-get purge -y --auto-remove -o APT::AutoRemove::RecommendsImportant=false; rm -rf /var/lib/apt/lists/*; export PYTHONDONTWRITEBYTECODE=1; python3 --version; pip3 install --disable-pip-version-check --no-cache-dir --no-compile 'setuptools==65.5.1' 'wheel<0.46' ; pip3 --version # buildkit
RUN /bin/sh -c set -eux; for src in idle3 pip3 pydoc3 python3 python3-config; do dst="$(echo "$src" | tr -d 3)"; [ -s "/usr/local/bin/$src" ]; [ ! -e "/usr/local/bin/$dst" ]; ln -svT "$src" "/usr/local/bin/$dst"; done # buildkit
CMD ["python3"]
WORKDIR /app
RUN /bin/sh -c apt-get update && apt-get install -y wget gnupg unzip curl tor supervisor build-essential postgresql-client redis-tools && rm -rf /var/lib/apt/lists/* # buildkit
RUN /bin/sh -c wget -q -O - https://dl-ssl.google.com/linux/linux_signing_key.pub | apt-key add - && echo "deb http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list && apt-get update && apt-get install -y google-chrome-stable && rm -rf /var/lib/apt/lists/* # buildkit
RUN /bin/sh -c CHROME_VERSION=$(google-chrome --version | awk '{print $3}' | cut -d. -f1) && if [ "$CHROME_VERSION" -ge "115" ]; then DRIVER_VERSION=$(curl -s "https://googlechromelabs.github.io/chrome-for-testing/LATEST_RELEASE_${CHROME_VERSION}") && wget -O /tmp/chromedriver.zip "https://storage.googleapis.com/chrome-for-testing-public/${DRIVER_VERSION}/linux64/chromedriver-linux64.zip" && unzip /tmp/chromedriver.zip -d /tmp/ && mv /tmp/chromedriver-linux64/chromedriver /usr/local/bin/ && rm -rf /tmp/chromedriver.zip /tmp/chromedriver-linux64; else wget -O /tmp/chromedriver.zip "https://chromedriver.storage.googleapis.com/LATEST_RELEASE_${CHROME_VERSION}/chromedriver_linux64.zip" && unzip /tmp/chromedriver.zip -d /usr/local/bin/ && rm /tmp/chromedriver.zip; fi && chmod +x /usr/local/bin/chromedriver # buildkit
RUN /bin/sh -c useradd -r -s /bin/false tor && mkdir -p /var/lib/tor /var/log/tor /etc/tor && chown -R tor:tor /var/lib/tor /var/log/tor # buildkit
RUN /bin/sh -c pip install --upgrade pip setuptools wheel # buildkit
COPY requirements.txt . # buildkit
RUN /bin/sh -c pip install --no-cache-dir -r requirements.txt # buildkit
COPY docker/ /docker-config/ # buildkit
RUN /bin/sh -c chmod +x /docker-config/healthcheck.sh /docker-config/setup-logs.sh # buildkit
COPY docker/torrc /etc/tor/torrc # buildkit
COPY docker/supervisord.conf /etc/supervisor/conf.d/supervisord.conf # buildkit
COPY . . # buildkit
RUN /bin/sh -c pip install . # buildkit
RUN /bin/sh -c useradd -m -u 1000 crawler # buildkit
RUN /bin/sh -c mkdir -p /app/logs && chown -R crawler:crawler /app # buildkit
COPY docker/entrypoint.sh /entrypoint.sh # buildkit
RUN /bin/sh -c chmod +x /entrypoint.sh # buildkit
HEALTHCHECK &{["CMD-SHELL" "/docker-config/healthcheck.sh || exit 1"] "30s" "15s" "1m0s" "0s" '\x03'}
EXPOSE map[8000/tcp:{}]
ENTRYPOINT ["/entrypoint.sh"]
Details
Container
2025-07-25 07:58:49 +00:00
0
OCI / Docker
linux/amd64
515 MiB
Versions (41) View all