snapbug
diff --git a/‎Dockerfile
Lines changed: 11 additions & 8 deletions b/‎Dockerfile
Lines changed: 11 additions & 8 deletions
diff --git a/‎Dockerfile.change-sha
Lines changed: 80 additions & 0 deletions b/‎Dockerfile.change-sha
Lines changed: 80 additions & 0 deletions
diff --git a/‎README.md
Lines changed: 98 additions & 0 deletions b/‎README.md
Lines changed: 98 additions & 0 deletions
diff --git a/‎gpu.sh
Lines changed: 0 additions & 16 deletions b/‎gpu.sh
Lines changed: 0 additions & 16 deletions
diff --git a/‎network_version.sh
Lines changed: 0 additions & 18 deletions b/‎network_version.sh
Lines changed: 0 additions & 18 deletions
diff --git a/‎nomkl.sh
Lines changed: 0 additions & 5 deletions b/‎nomkl.sh
Lines changed: 0 additions & 5 deletions
diff --git a/‎pytorch_versions.sh
Lines changed: 0 additions & 13 deletions b/‎pytorch_versions.sh
Lines changed: 0 additions & 13 deletions
@@ -12,7 +12,7 @@ FROM nvidia/cuda:8.0-cudnn6-devel-ubuntu14.04 as base
 COPY aquaint+wiki.txt.gz.ndim=50.bin /
 
 RUN echo "13dc26ecb4455cf437e19b6dcf869867 *aquaint+wiki.txt.gz.ndim=50.bin" | md5sum -c - && \
-    apt-get update --fix-missing && apt-get install -y wget bzip2 ca-certificates libglib2.0-0 libxext6 libsm6 libxrender1 git mercurial subversion && \
+    apt-get update --fix-missing && apt-get install -y wget unzip bzip2 ca-certificates libglib2.0-0 libxext6 libsm6 libxrender1 git mercurial subversion && \
     echo 'export PATH=/opt/conda/bin:$PATH' > /etc/profile.d/conda.sh && \
     wget --quiet https://repo.continuum.io/miniconda/Miniconda3-4.3.14-Linux-x86_64.sh -O ~/miniconda.sh && \
     /bin/bash ~/miniconda.sh -b -p /opt/conda && \
@@ -53,21 +53,24 @@ ENV OMP_NUM_THREADS=1
 ENV MKL_NUM_THREADS=1
 
 #
-# And now get the repositories, with `castor` at a given sha sum
+# And finally the latest version; see the README for why this is separate
 #
 FROM pytorch
 
-ARG sha=cf0e269
-
-RUN git clone https://github.com/castorini/castor /castorini/castor && \
-    git clone https://github.com/castorini/data /castorini/data && \
-    git -C /castorini/castor reset --hard ${sha} && \
-    git -C /castorini/data reset --hard 42abddd && \
+COPY castor /castorini/castor
+RUN git clone https://github.com/castorini/data /castorini/data && \
+    git -C /castorini/data reset --hard 6ed4084 && \
     mv /aquaint+wiki.txt.gz.ndim=50.bin /castorini/data/word2vec && \
     cd /castorini/data/TrecQA && \
     python parse.py && \
     python overlap_features.py && \
     python build_vocab.py && \
+    cd /castorini/data/WikiQA && \
+    unzip WikiQACorpus.zip && \
+    python create-train-dev-test-data.py && \
+    mv train train-all && \
+    mv test raw-test && \
+    mv dev raw-dev && \
     cd /castorini/castor/sm_cnn/trec_eval-8.0 && \
     make
 
 
@@ -0,0 +1,80 @@
+#
+# Stage `base`: the nvidia image, which has the nvidia cuda drivers etc.
+#
+FROM nvidia/cuda:8.0-cudnn6-devel-ubuntu14.04 AS base
+
+#
+# Install miniconda into it, plus the latest tini release (not version-pinned)
+## Copied from continuumio/miniconda:4.3.14
+#
+# The embeddings are copied first, because that layer will then be cached;
+# the RUN below checks their md5 sum before installing anything.
+COPY aquaint+wiki.txt.gz.ndim=50.bin /
+
+RUN echo "13dc26ecb4455cf437e19b6dcf869867 *aquaint+wiki.txt.gz.ndim=50.bin" | md5sum -c - && \
+    apt-get update --fix-missing && apt-get install -y wget unzip bzip2 ca-certificates libglib2.0-0 libxext6 libsm6 libxrender1 git mercurial subversion && \
+    echo 'export PATH=/opt/conda/bin:$PATH' > /etc/profile.d/conda.sh && \
+    wget --quiet https://repo.continuum.io/miniconda/Miniconda3-4.3.14-Linux-x86_64.sh -O ~/miniconda.sh && \
+    /bin/bash ~/miniconda.sh -b -p /opt/conda && \
+    rm ~/miniconda.sh && \
+    apt-get install -y curl grep sed dpkg && \
+    TINI_VERSION=`curl https://github.com/krallin/tini/releases/latest | grep -o "/v.*\"" | sed 's:^..\(.*\).$:\1:'` && \
+    curl -L "https://github.com/krallin/tini/releases/download/v${TINI_VERSION}/tini_${TINI_VERSION}.deb" > tini.deb && \
+    dpkg -i tini.deb && \
+    rm tini.deb
+# Put conda's bin directory first on PATH (key=value form of ENV)
+ENV PATH=/opt/conda/bin:$PATH
+
+#
+# Stage `pytorch`: build pytorch from source, with or without mkl
+## ORIGINALLY FROM continuumio/miniconda:4.3.14
+#
+FROM base AS pytorch
+# lib: "mkl" => mkl + mkl-service, anything else => nomkl; pytorch: source release to build
+ARG lib=mkl
+ARG pytorch=0.1.12
+# apt-get rather than apt: apt's command-line interface is not meant for scripts
+RUN apt-get install -y build-essential=11.6ubuntu6 && \
+    apt-get clean && \
+    export CMAKE_PREFIX_PATH="$(dirname "$(which conda)")/../" && \
+    conda install -y conda==4.3.25 python==3.6.1 && \
+    if [ "${lib}" = "mkl" ]; then \
+        conda install -y mkl==2017.0.3 mkl-service==1.1.2; \
+    else \
+        conda install -y nomkl==1.0; \
+    fi && \
+    conda install -y numpy==1.13.1 pyyaml==3.12 setuptools==27.2.0 cmake==3.6.3 gcc==4.8.5 cffi==1.10.0 gensim==1.0.1 nltk==3.2.1 scikit-learn==0.18.1 pandas==0.20.3 && \
+    wget https://github.com/pytorch/pytorch/archive/v${pytorch}.tar.gz && \
+    tar xzf v${pytorch}.tar.gz && \
+    cd pytorch-${pytorch} && \
+    python setup.py install
+# Default the OpenMP and MKL thread counts to 1
+ENV OMP_NUM_THREADS=1
+ENV MKL_NUM_THREADS=1
+
+#
+# Final stage: get the repositories, with `castor` at a given sha sum
+#
+FROM pytorch
+# sha: the castor commit to reset to (override with --build-arg sha=...)
+ARG sha=cf0e269
+# Clone and pin both repos, prepare the TrecQA and WikiQA data, build trec_eval
+RUN git clone https://github.com/snapbug/castor /castorini/castor && \
+    git clone https://github.com/castorini/data /castorini/data && \
+    git -C /castorini/castor reset --hard "${sha}" && \
+    git -C /castorini/data reset --hard 6ed4084 && \
+    mv /aquaint+wiki.txt.gz.ndim=50.bin /castorini/data/word2vec && \
+    cd /castorini/data/TrecQA && \
+    python parse.py && \
+    python overlap_features.py && \
+    python build_vocab.py && \
+    cd /castorini/data/WikiQA && \
+    unzip WikiQACorpus.zip && \
+    python create-train-dev-test-data.py && \
+    mv train train-all && \
+    mv test raw-test && \
+    mv dev raw-dev && \
+    cd /castorini/castor/sm_cnn/trec_eval-8.0 && \
+    make
+# Containers start in the sm_cnn directory of the castor checkout
+WORKDIR /castorini/castor/sm_cnn
@@ -0,0 +1,98 @@
+# Questionable Answers
+
+This repository contains everything required to completely replicate the results presented in:
+
+Matt Crane. "Questionable Answers in Question Answering Research: Reproducibility and Variability of Published Results". In: Transactions of the Association for Computational Linguistics 6 (2018), pp. 241–252. url: https://transacl.org/ojs/index.php/tacl/article/view/1299.
+
+## Status
+
+Unfortunately, the upstream repository
+[castorini/castor](//github.com/castorini/castor) has diverged due to history
+rewriting changes, so the changesets don't match the official current
+repository.
+
+Unfortunately this repository was not forked in time to capture the `cf0e269`
+SHA from the official repository before that repository's history was
+re-written. This means that if building from source, you'll have a _different_
+SHA which is used to build this image. The `setup.sh` script will make this
+change, the contents of which can be verified against [the official repository
+diff](//github.com/castorini/castor/commit/ed4dba249712e8bbaf5ed7c1486dff52b472daf4).
+
+Running `setup.sh build` will build the docker images from the source,
+including making the un-captured change above, while `setup.sh pull` will pull
+the prebuilt docker images.
+
+## Requirements
+
+#### Running on GPU
+
+`nvidia-docker` is required to run the GPU based experiments, and for these
+experiments version 1 was used. This has since been deprecated by NVIDIA in
+favour of version 2. The results _should_ be the same, but for guarantees
+[install version 1](//github.com/nvidia/nvidia-docker/wiki/Installation-(version-1.0)).
+
+#### Building images
+
+The embeddings used by the network should be downloaded from [Aliaksei Severyn's shared file
+(520MB)](//drive.google.com/folderview?id=0B-yipfgecoSBfkZlY2FFWEpDR3M4Qkw5U055MWJrenE5MTBFVXlpRnd0QjZaMDQxejh1cWs&usp=sharing),
+and placed in the working directory for this repository. The docker image
+builder will verify checksums to ensure that the same file is used.
+
+#### Pulling images
+
+All the docker images generated are available online to download/run without
+having to be built from scratch. These are listed [on Docker Hub](//hub.docker.com/r/snapbug/qqa/tags/).
+
+By default, the `setup.sh` script, if run with `pull`, will pull _all_ the tagged images.
+This can take a substantial amount of disk space, even though they share a lot
+of commonality. If you only, for example, want to replicate the math library
+experiments, then manually pull the required images. Look at `run.sh` for which
+images are required for which experiments.
+
+| Image         | Figure/Table     | Notes                                          |
+|---------------|------------------|------------------------------------------------|
+| `sha-*`       | Table 4          | See note above regarding `sha-cf0e269`         |
+| `pytorch-*`   | Table 5          |                                                |
+| `*mkl`        | Table 6          |                                                |
+| `sha-cf0e269` | Table 7          |                                                |
+| `sha-cf0e269` | Table 8          |                                                |
+| `sha-cf0e269` | Figure 2 (left)  | Just the CPU seeds                             |
+| `sha-cf0e269` | Figure 2 (right) | Just the GPU seeds                             |
+| `sha-cf0e269` | Figure 2         | Both CPU and GPU seeds                         |
+|               | Figure 3         | Use the output from the logs of `run.sh seeds` |
+|               | Table 9          | Use the output from the logs of `run.sh seeds` |
+
+## Replication
+
+`run.sh` will successfully replicate all the experiments in the paper using
+either the built docker images, or pulled docker images from `setup.sh`. It
+takes a single argument that specifies which experiments to run.
+
+| Argument  | Figure/Table     | Notes                                          |
+|-----------|------------------|------------------------------------------------|
+| all       |                  | All of the experiments                         |
+| network   | Table 4          |                                                |
+| pytorch   | Table 5          |                                                |
+| mathlib   | Table 6          |                                                |
+| thread    | Table 7          |                                                |
+| gpu       | Table 8          |                                                |
+| seeds-cpu | Figure 2 (left)  | Just the CPU seeds                             |
+| seeds-gpu | Figure 2 (right) | Just the GPU seeds                             |
+| seeds     | Figure 2         | Both CPU and GPU seeds                         |
+|           | Figure 3         | Use the output from the logs of `run.sh seeds` |
+|           | Table 9          | Use the output from the logs of `run.sh seeds` |
+
+**Log** files are generated in the form `qqa.[dataset].log.[experiment]`. At the
+end of training, the network performs a feed-forward pass over the datasets, which
+is where the numbers for the paper are extracted from.
+
+**Model** files will be generated in the form:
+`qqa.[dataset].model.[experiment]`, to allow for feed-forward verification, or
+re-creation of the results without retraining the network. These models, in my
+experimentation, are reproducible across different hardware setups, although I
+would be interested in hearing of situations where they _aren't_.
+
+## Issues
+
+If you encounter any issues with the scripts etc. in this repository, then
+either file an issue on GitHub, or email me.