Pierre Pommarel ppommarel
  • Joined on 2022-05-30

mcp-scraper (latest)

Published 2026-05-04 21:19:59 +02:00 by ppommarel

Installation

docker pull git.leptis-magna.fr/ppommarel/mcp-scraper:latest
sha256:d3d4d83230427d93d97c2e5c79ba1b4857d7e80f5a79900050d994d882aebc7c

About this package

HTTP MCP server for Reddit, YouTube, Amazon, and Trustpilot scraping

Image Layers

ARG RELEASE
ARG LAUNCHPAD_BUILD_ARCH
LABEL org.opencontainers.image.ref.name=ubuntu
LABEL org.opencontainers.image.version=22.04
ADD file:b499000226bd9a7c562ffa8eeb86e2d170f2a563310db6c2d79562ab53e5cb6e in /
CMD ["/bin/bash"]
ARG DEBIAN_FRONTEND=noninteractive
ARG TZ=America/Los_Angeles
ARG DOCKER_IMAGE_NAME_TEMPLATE=mcr.microsoft.com/playwright:v%version%-jammy
ARG NODE_VERSION=24 # autogenerated via ./update-playwright-node.mjs
ENV LANG=C.UTF-8
ENV LC_ALL=C.UTF-8
RUN |8 DEBIAN_FRONTEND=noninteractive TZ=America/Los_Angeles DOCKER_IMAGE_NAME_TEMPLATE=mcr.microsoft.com/playwright:v%version%-jammy NODE_VERSION=24 #= autogenerated= via= ./update-playwright-node.mjs= /bin/sh -c apt-get update && apt-get install -y curl wget gpg ca-certificates && mkdir -p /etc/apt/keyrings && curl -sL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg && echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_${NODE_VERSION}.x nodistro main" >> /etc/apt/sources.list.d/nodesource.list && apt-get update && apt-get install -y nodejs && apt-get install -y --no-install-recommends git openssh-client && npm install -g yarn && rm -rf /var/lib/apt/lists/* && adduser pwuser # buildkit
ENV PLAYWRIGHT_BROWSERS_PATH=/ms-playwright
COPY ./playwright-core.tar.gz /tmp/playwright-core.tar.gz # buildkit
RUN |8 DEBIAN_FRONTEND=noninteractive TZ=America/Los_Angeles DOCKER_IMAGE_NAME_TEMPLATE=mcr.microsoft.com/playwright:v%version%-jammy NODE_VERSION=24 #= autogenerated= via= ./update-playwright-node.mjs= /bin/sh -c mkdir /ms-playwright && mkdir /ms-playwright-agent && cd /ms-playwright-agent && npm init -y && npm i /tmp/playwright-core.tar.gz && npm exec --no -- playwright-core mark-docker-image "${DOCKER_IMAGE_NAME_TEMPLATE}" && npm exec --no -- playwright-core install --with-deps && rm -rf /var/lib/apt/lists/* && if [ "$(uname -m)" = "aarch64" ]; then rm /usr/lib/aarch64-linux-gnu/gstreamer-1.0/libgstwebrtc.so; else rm /usr/lib/x86_64-linux-gnu/gstreamer-1.0/libgstwebrtc.so; fi && rm /tmp/playwright-core.tar.gz && rm -rf /ms-playwright-agent && rm -rf ~/.npm/ && chmod -R 777 /ms-playwright # buildkit
LABEL org.opencontainers.image.source="https://git.leptis-magna.fr/ppommarel/mcp-scraper"
LABEL org.opencontainers.image.title="mcp-scraper"
LABEL org.opencontainers.image.description="HTTP MCP server for Reddit, YouTube, Amazon, and Trustpilot scraping"
WORKDIR /app
ENV NODE_ENV=production
ENV MCP_HOST=0.0.0.0
ENV MCP_PORT=8787
ENV MCP_PATH=/mcp
COPY multi:6db0a1237a9c4286a66467d67a1af1cf4fd72d8fc49a46e8def9391e29f48c7f in ./
/bin/sh -c npm ci --omit=dev
COPY dir:6377dc9e123ab20750577159842e7717dad354a2b23fb20d5f6b316e775c6f5f in .
/bin/sh -c mkdir -p /app/data/exports /app/data/raw /app/data/checkpoints /app/data/mcp/jobs /app/data/mcp/logs /app/data/browser/amazon-profile
EXPOSE 8787
CMD ["npm", "run", "mcp:http"]

Labels

Key Value
io.buildah.version 1.33.7
org.opencontainers.image.description HTTP MCP server for Reddit, YouTube, Amazon, and Trustpilot scraping
org.opencontainers.image.ref.name ubuntu
org.opencontainers.image.source https://git.leptis-magna.fr/ppommarel/mcp-scraper
org.opencontainers.image.title mcp-scraper
org.opencontainers.image.version 22.04
Details
Container
2026-05-04 21:19:59 +02:00
0
OCI / Docker
linux/amd64
860 MiB
Versions (5) View all
v0.3.3 2026-05-21
latest 2026-05-04
v0.3.2 2026-05-04
v0.3.1 2026-04-23
v0.3.0 2026-04-23