From 566f04ad56c3be0ec364744cc93413a7e8518448 Mon Sep 17 00:00:00 2001
From: alvinzhou66 <43176447+alvinzhou66@users.noreply.github.com>
Date: Wed, 11 Nov 2020 20:17:24 -0800
Subject: [PATCH] v2.4
---
Docker_workspace/Dockerfile | 18 ++++++++++++++++++
README.md | 2 +-
binary_classifier/SOMEF_BIN_classifier.ipynb | 4 ++++
3 files changed, 23 insertions(+), 1 deletion(-)
create mode 100644 Docker_workspace/Dockerfile
diff --git a/Docker_workspace/Dockerfile b/Docker_workspace/Dockerfile
new file mode 100644
index 0000000..1516f5d
--- /dev/null
+++ b/Docker_workspace/Dockerfile
@@ -0,0 +1,18 @@
+FROM continuumio/miniconda3
+
+# gcc: presumably needed to build Python packages with C extensions (confirm against requirements.txt).
+RUN apt-get update && apt-get install -y gcc \
+    && rm -rf /var/lib/apt/lists/*
+
+# Clone to an explicit absolute path so later steps do not depend on the base image's working directory.
+RUN git clone https://github.com/alvinzhou66/classification-of-scientific-software /classification-of-scientific-software
+
+# -y: `docker build` is non-interactive, so conda's confirmation prompt cannot be answered.
+RUN conda install -y -c conda-forge yarn
+RUN cd /classification-of-scientific-software && yarn install
+
+RUN pip install --upgrade pip
+# COPY reads from the build context: requirements.txt must sit in the directory passed to `docker build`.
+COPY requirements.txt /opt/app/requirements.txt
+RUN pip install -r /opt/app/requirements.txt
+WORKDIR /classification-of-scientific-software
diff --git a/README.md b/README.md
index d36be22..e47aacb 100644
--- a/README.md
+++ b/README.md
@@ -31,7 +31,7 @@ pip install -r requirements.txt
```
3. Docker.
Install Docker first.
-In the directory which has our Dockerfile, build the docker container:
+In the directory that contains our Dockerfile (the `Docker_workspace/` folder), build the Docker image:
```
docker build -t coss .
```
diff --git a/binary_classifier/SOMEF_BIN_classifier.ipynb b/binary_classifier/SOMEF_BIN_classifier.ipynb
index a6136be..c12a36a 100644
--- a/binary_classifier/SOMEF_BIN_classifier.ipynb
+++ b/binary_classifier/SOMEF_BIN_classifier.ipynb
@@ -10,6 +10,10 @@
"import torch \n",
"from DNN import FFN\n",
"import re\n",
+ "import nltk\n",
+ "nltk.download('punkt')\n",
+ "nltk.download('treebank')\n",
+ "nltk.download('stopwords')\n",
"from nltk.tokenize import word_tokenize\n",
"from nltk.corpus import stopwords\n",
"import pandas as pd\n",