Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 10 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -237,6 +237,16 @@ Notes: this one is empty by default, add some sites to archive or crawl regularly

<br/>

#### mwmbl

The Docker image is built from the official [git repository](https://github.com/mwmbl/crawler-script/).

> [Mwmbl](https://github.com/mwmbl/mwmbl) is a non-profit, open source search engine where the community determines the rankings. We aim to be a replacement for commercial search engines such as Google and Bing.

[https://github.com/mwmbl/mwmbl](https://github.com/mwmbl/mwmbl)

<br/>

---

<br/>
Expand Down
34 changes: 34 additions & 0 deletions docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -223,6 +223,40 @@ services:
- "com.centurylinklabs.watchtower.scope=goodkarmakit"


mwmbl-crawler:
  # Helps crawl the web for mwmbl.org, the open-source, non-profit web search engine.
  # More info: https://book.mwmbl.org/
  # Crawler source: https://github.com/mwmbl/crawler-script
  environment:
    # Passed through to the container; presumably the number of crawler
    # threads -- confirm against the upstream entrypoint.sh.
    - THREADS=1
  restart: always
  build:
    context: .
    dockerfile_inline: |
      # Stage 1: fetch the crawler sources. git only lives in this throwaway stage.
      # The base image is pinned to a release tag (not :latest) so rebuilds are reproducible.
      FROM alpine:3.20 AS repo
      RUN apk add --no-cache git
      WORKDIR /app
      # Shallow clone: only the current working tree is copied into the final image,
      # so the full history is not needed.
      RUN git clone --depth 1 https://github.com/mwmbl/crawler-script.git .

      # Stage 2: runtime image containing only the files the crawler needs.
      FROM python:3.9-slim-bullseye
      COPY --from=repo /app/entrypoint.sh /
      RUN chmod +x /entrypoint.sh
      # Create the unprivileged system user and its home before dropping root.
      RUN mkdir -p /srv/mwmbl/crawler-script && \
          useradd mwmbl -r -d /srv/mwmbl && \
          chown mwmbl:mwmbl -R /srv/mwmbl
      USER mwmbl
      WORKDIR /srv/mwmbl/crawler-script
      COPY --from=repo /app/justext /srv/mwmbl/crawler-script/justext
      COPY --from=repo /app/LICENSE /app/README.md /app/pyproject.toml /app/poetry.lock /app/main.py /srv/mwmbl/crawler-script/
      # Install the project into a local virtualenv; --no-cache-dir keeps pip's
      # download cache out of the layer, so no separate purge step is needed.
      RUN python -m venv venv && \
          . venv/bin/activate && \
          pip install --no-cache-dir .
      ENTRYPOINT ["/entrypoint.sh"]




### Distributed storage projects

ipfs:
Expand Down