Skip to content

Commit d9a510f

Browse files
authored
Merge pull request #3 from kfettich-forks/kf_issue6
adjusted docker container so it can run python cleaning scripts
2 parents fd74998 + d572f9a commit d9a510f

File tree

3 files changed

+24
-224
lines changed

3 files changed

+24
-224
lines changed

Dockerfile

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
FROM tiangolo/uwsgi-nginx-flask:python3.6-alpine3.7
1+
FROM tiangolo/uwsgi-nginx-flask:python3.7
22

33
ENV LISTEN_PORT=5555
44
EXPOSE 5555
@@ -13,9 +13,12 @@ WORKDIR /paws-data-pipeline/
1313
COPY . /paws-data-pipeline/
1414

1515
RUN chmod 777 /paws-data-pipeline
16+
RUN apt-get update
17+
RUN apt-get install -y sqlite3 libsqlite3-dev
1618

1719
# If you have additional requirements beyond Flask (which is included in the
1820
# base image), generate a requirements.txt file with pip freeze and uncomment
1921
# the next three lines.
20-
#COPY requirements.txt /
21-
#RUN pip install --no-cache-dir -r /requirements.txt
22+
23+
COPY requirements.txt /
24+
RUN pip install --no-cache-dir -r /requirements.txt

load_paws_data.ipynb

Lines changed: 15 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -26,9 +26,21 @@
2626
},
2727
{
2828
"cell_type": "code",
29-
"execution_count": 17,
29+
"execution_count": 3,
3030
"metadata": {},
31-
"outputs": [],
31+
"outputs": [
32+
{
33+
"ename": "ModuleNotFoundError",
34+
"evalue": "No module named 'fuzzywuzzy'",
35+
"output_type": "error",
36+
"traceback": [
37+
"\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
38+
"\u001b[1;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)",
39+
"\u001b[1;32m<ipython-input-3-d9f2dce0983a>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m 3\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mnumpy\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mre\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 5\u001b[1;33m \u001b[1;32mfrom\u001b[0m \u001b[0mfuzzywuzzy\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mfuzz\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
40+
"\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'fuzzywuzzy'"
41+
]
42+
}
43+
],
3244
"source": [
3345
"import sqlite3\n",
3446
"import pandas as pd\n",
@@ -1104,7 +1116,7 @@
11041116
"name": "python",
11051117
"nbconvert_exporter": "python",
11061118
"pygments_lexer": "ipython3",
1107-
"version": "3.7.3"
1119+
"version": "3.7.4"
11081120
}
11091121
},
11101122
"nbformat": 4,

requirements.txt

Lines changed: 3 additions & 218 deletions
Original file line number | Diff line number | Diff line change
@@ -1,218 +1,3 @@
1-
alabaster==0.7.12
2-
anaconda-client==1.7.2
3-
anaconda-navigator==1.9.7
4-
anaconda-project==0.8.3
5-
asn1crypto==0.24.0
6-
astroid==2.2.5
7-
astropy==3.2.1
8-
atomicwrites==1.3.0
9-
attrs==19.1.0
10-
Babel==2.7.0
11-
backcall==0.1.0
12-
backports.functools-lru-cache==1.5
13-
backports.os==0.1.1
14-
backports.shutil-get-terminal-size==1.0.0
15-
backports.tempfile==1.0
16-
backports.weakref==1.0.post1
17-
beautifulsoup4==4.7.1
18-
bitarray==0.9.3
19-
bkcharts==0.2
20-
bleach==3.1.0
21-
bokeh==1.2.0
22-
boto==2.49.0
23-
Bottleneck==1.2.1
24-
certifi==2019.6.16
25-
cffi==1.12.3
26-
chardet==3.0.4
27-
Click==7.0
28-
cloudpickle==1.2.1
29-
clyent==1.2.2
30-
colorama==0.4.1
31-
conda==4.8.0
32-
conda-build==3.18.9
33-
conda-package-handling==1.3.11
34-
conda-verify==3.4.2
35-
contextlib2==0.5.5
36-
cryptography==2.7
37-
cycler==0.10.0
38-
Cython==0.29.12
39-
cytoolz==0.10.0
40-
dask==2.1.0
41-
decorator==4.4.0
42-
defusedxml==0.6.0
43-
distributed==2.1.0
44-
docutils==0.14
45-
entrypoints==0.3
46-
et-xmlfile==1.0.1
47-
fastcache==1.1.0
48-
filelock==3.0.12
49-
findspark==1.3.0
50-
Flask==1.1.1
51-
future==0.17.1
52-
fuzzywuzzy==0.17.0
53-
gevent==1.4.0
54-
glob2==0.7
55-
gmpy2==2.0.8
56-
greenlet==0.4.15
57-
h5py==2.9.0
58-
heapdict==1.0.0
59-
html5lib==1.0.1
60-
idna==2.8
61-
imageio==2.5.0
62-
imagesize==1.1.0
63-
importlib-metadata==0.17
64-
ipykernel==5.1.1
65-
ipython==7.6.1
66-
ipython-genutils==0.2.0
67-
ipywidgets==7.5.0
68-
isort==4.3.21
69-
itsdangerous==1.1.0
70-
jdcal==1.4.1
71-
jedi==0.13.3
72-
jeepney==0.4
73-
Jinja2==2.10.1
74-
joblib==0.13.2
75-
json5==0.8.4
76-
jsonschema==3.0.1
77-
jupyter==1.0.0
78-
jupyter-client==5.3.1
79-
jupyter-console==6.0.0
80-
jupyter-core==4.5.0
81-
jupyterlab==1.0.2
82-
jupyterlab-server==1.0.0
83-
keyring==18.0.0
84-
kiwisolver==1.1.0
85-
lazy-object-proxy==1.4.1
86-
libarchive-c==2.8
87-
lief==0.9.0
88-
llvmlite==0.29.0
89-
locket==0.2.0
90-
lxml==4.3.4
91-
MarkupSafe==1.1.1
92-
matplotlib==3.1.0
93-
mccabe==0.6.1
94-
mistune==0.8.4
95-
mkl-fft==1.0.12
96-
mkl-random==1.0.2
97-
mkl-service==2.0.2
98-
mock==3.0.5
99-
more-itertools==7.0.0
100-
mpmath==1.1.0
101-
msgpack==0.6.1
102-
multipledispatch==0.6.0
103-
navigator-updater==0.2.1
104-
nbconvert==5.5.0
105-
nbformat==4.4.0
106-
networkx==2.3
107-
nltk==3.4.5
108-
nose==1.3.7
109-
notebook==6.0.0
110-
numba==0.44.1
111-
numexpr==2.6.9
112-
numpy==1.16.4
113-
numpydoc==0.9.1
114-
olefile==0.46
115-
openpyxl==2.6.2
116-
packaging==19.0
117-
pandas==0.24.2
118-
pandocfilters==1.4.2
119-
parso==0.5.0
120-
partd==1.0.0
121-
path.py==12.0.1
122-
pathlib2==2.3.4
123-
patsy==0.5.1
124-
pep8==1.7.1
125-
pexpect==4.7.0
126-
pickleshare==0.7.5
127-
Pillow==6.2.0
128-
pkginfo==1.5.0.1
129-
pluggy==0.12.0
130-
ply==3.11
131-
prometheus-client==0.7.1
132-
prompt-toolkit==2.0.9
133-
psutil==5.6.3
134-
psycopg2==2.7.6.1
135-
ptyprocess==0.6.0
136-
py==1.8.0
137-
py4j==0.10.7
138-
pycodestyle==2.5.0
139-
pycosat==0.6.3
140-
pycparser==2.19
141-
pycurl==7.43.0.3
142-
pyflakes==2.1.1
143-
Pygments==2.4.2
144-
pylint==2.3.1
145-
pymongo==3.8.0
146-
pyodbc==4.0.26
147-
pyOpenSSL==19.0.0
148-
pyparsing==2.4.0
149-
pyrsistent==0.14.11
150-
PySocks==1.7.0
151-
pyspark==2.4.4
152-
pytest==5.0.1
153-
pytest-arraydiff==0.3
154-
pytest-astropy==0.5.0
155-
pytest-doctestplus==0.3.0
156-
pytest-openfiles==0.3.2
157-
pytest-remotedata==0.3.1
158-
python-dateutil==2.8.0
159-
python-dotenv==0.10.3
160-
python-Levenshtein==0.12.0
161-
pytz==2019.1
162-
PyWavelets==1.0.3
163-
PyYAML==5.1.1
164-
pyzmq==18.0.0
165-
QtAwesome==0.5.7
166-
qtconsole==4.5.1
167-
QtPy==1.8.0
168-
requests==2.22.0
169-
rope==0.14.0
170-
ruamel-yaml==0.15.46
171-
scikit-image==0.15.0
172-
scikit-learn==0.21.2
173-
scipy==1.3.0
174-
seaborn==0.9.0
175-
SecretStorage==3.1.1
176-
selenium==3.141.0
177-
Send2Trash==1.5.0
178-
simplegeneric==0.8.1
179-
singledispatch==3.4.0.3
180-
six==1.12.0
181-
snowballstemmer==1.9.0
182-
sortedcollections==1.1.2
183-
sortedcontainers==2.1.0
184-
soupsieve==1.8
185-
Sphinx==2.1.2
186-
sphinxcontrib-applehelp==1.0.1
187-
sphinxcontrib-devhelp==1.0.1
188-
sphinxcontrib-htmlhelp==1.0.2
189-
sphinxcontrib-jsmath==1.0.1
190-
sphinxcontrib-qthelp==1.0.2
191-
sphinxcontrib-serializinghtml==1.1.3
192-
sphinxcontrib-websupport==1.1.2
193-
spyder==3.3.6
194-
spyder-kernels==0.5.1
195-
SQLAlchemy==1.3.5
196-
statsmodels==0.10.0
197-
sympy==1.4
198-
tables==3.5.2
199-
tblib==1.4.0
200-
terminado==0.8.2
201-
testpath==0.4.2
202-
toolz==0.10.0
203-
tornado==6.0.3
204-
tqdm==4.32.1
205-
traitlets==4.3.2
206-
unicodecsv==0.14.1
207-
urllib3==1.24.2
208-
wcwidth==0.1.7
209-
webencodings==0.5.1
210-
Werkzeug==0.15.4
211-
widgetsnbextension==3.5.0
212-
wrapt==1.11.2
213-
wurlitzer==1.0.2
214-
xlrd==1.2.0
215-
XlsxWriter==1.1.8
216-
xlwt==1.3.0
217-
zict==1.0.0
218-
zipp==0.5.1
1+
pandas==1.0.0
2+
numpy==1.18.1
3+
fuzzywuzzy==0.17.0

0 commit comments

Comments
 (0)