1
2
mirror of https://github.com/vimagick/dockerfiles synced 2024-06-25 16:28:40 +00:00

add scrapy

This commit is contained in:
kev 2015-05-28 09:07:32 +08:00
parent f3c8abf37c
commit 9f16e64350
3 changed files with 42 additions and 6 deletions

@ -2,11 +2,29 @@
# Dockerfile for scrapy
#
FROM ubuntu:14.04
MAINTAINER kev
FROM debian:jessie
MAINTAINER kev <noreply@datageek.info>
RUN apt-key adv --keyserver hkp://keyserver.ubuntu.com:80 --recv 627220E7
RUN echo 'deb http://archive.scrapy.org/ubuntu scrapy main' >/etc/apt/sources.list.d/scrapy.list
RUN apt-get update && apt-get install -y python-pip scrapy-0.24 scrapyd
# Install Scrapy from PyPI inside a single layer:
#   1. install curl, Python and the compiler toolchain / development headers
#      (presumably needed to build the native extensions of Scrapy's
#      dependencies - confirm against the pinned Scrapy release),
#   2. bootstrap pip with get-pip.py and install the pinned Scrapy version,
#   3. remove the build-only packages and whatever autoremove considers orphaned,
#   4. make sure the libxml2 / libxslt runtime libraries are installed after
#      that cleanup,
#   5. drop the apt package lists.
# Every line except the last must end with a backslash so the whole chain stays
# one RUN instruction; otherwise the cleanup would not happen in the same layer
# as the installation (and a line starting with "&&" is not a valid instruction).
RUN apt-get update \
    && apt-get install -y build-essential \
                          curl \
                          libffi-dev \
                          libssl-dev \
                          libxml2-dev \
                          libxslt1-dev \
                          python \
                          python-dev \
    && curl -sSL https://bootstrap.pypa.io/get-pip.py | python \
    && pip install scrapy==1.0.0rc1 \
    && apt-get remove -y build-essential \
                         libffi-dev \
                         libssl-dev \
                         libxml2-dev \
                         libxslt1-dev \
                         python-dev \
    && apt-get autoremove -y \
    && apt-get install -y libxml2 \
                          libxslt1.1 \
    && rm -rf /var/lib/apt/lists/*
CMD bash
CMD ["/bin/bash"]

12
scrapy/Dockerfile.old Normal file

@ -0,0 +1,12 @@
#
# Dockerfile for scrapy
#
# Builds an Ubuntu 14.04 image with Scrapy 0.24 and scrapyd installed from
# apt packages served by archive.scrapy.org.
#
FROM ubuntu:14.04
MAINTAINER kev
# Import key 627220E7 from the Ubuntu keyserver into apt's trusted keys
# (presumably the signing key of the Scrapy archive added below - confirm).
RUN apt-key adv --keyserver hkp://keyserver.ubuntu.com:80 --recv 627220E7
# Register the archive.scrapy.org repository as an additional apt source.
RUN echo 'deb http://archive.scrapy.org/ubuntu scrapy main' >/etc/apt/sources.list.d/scrapy.list
# Refresh the package index (now including the source above) and install pip,
# the scrapy-0.24 package and scrapyd in the same layer.
RUN apt-get update && apt-get install -y python-pip scrapy-0.24 scrapyd
# Default command: start bash (shell form, so it is run through /bin/sh -c).
CMD bash

6
scrapy/README.md Normal file

@ -0,0 +1,6 @@
`Scrapy`: An open source and collaborative framework
for extracting the data you need from websites.
In a fast, simple, yet extensible way.
You can create a Scrapy (v1.0.0rc1) project on top of this image.