sheffieldnlp · mithunpaul08 · Sep 4, 2018 · Sep 4, 2018 · Sep 4, 2018 · Sep 4, 2018
diff --git a/.gitignore b/.gitignore
@@ -1,3 +1,4 @@
+*.csv
 .idea/
 .DS_Store
 __pycache__

diff --git a/Dockerfile b/Dockerfile
@@ -1,6 +1,6 @@
 FROM continuumio/miniconda3
 
-ENTRYPOINT ["/bin/bash"]
+#ENTRYPOINT ["/bin/bash"]
 
 ENV NVIDIA_VISIBLE_DEVICES all
 ENV NVIDIA_DRIVER_CAPABILITIES compute,utility
@@ -12,10 +12,14 @@ RUN mkdir /fever/scripts
 
 VOLUME /fever/
 
+RUN bash scripts/download-glove.sh
+RUN bash scripts/download-data.sh
+
 ADD requirements.txt /fever/
 ADD src /fever/src/
 ADD config /fever/config/
 ADD scripts /fever/scripts/
+ADD data /fever/data/
 
 RUN apt-get update
 RUN apt-get install -y --no-install-recommends \
@@ -39,6 +43,9 @@ RUN conda create -q -n fever python=3.6
 
 WORKDIR /fever/
 RUN . activate fever
-RUN conda install -y pytorch=0.3.1 torchvision -c pytorch
+#RUN conda install pytorch torchvision -c pytorch
+RUN conda install -y cython nltk scikit-learn
 RUN pip install -r requirements.txt
 RUN python src/scripts/prepare_nltk.py
+ENV PYTHONPATH=src
+# Exec-form CMD is not parsed by a shell: every argument must be its own array element.
+CMD ["python", "src/scripts/retrieval/ir.py", "--model", "data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz", "--in-file", "data/fever-data/dev.jsonl", "--out-file", "data/fever/dev.sentences.p5.s5.jsonl", "--mode", "dev", "--lmode", "WARNING"]
diff --git a/README.md b/README.md
@@ -1,5 +1,78 @@
+
+# UOFA- Fact Extraction and VERification
+## Smart NER: replace tokens with NER tags, but check whether they exist in the claim
+
+To run the training and evaluation using smartNER, either just run `./run_all_train_test.sh`
+or use the commands below.
+@server@jenny
+
+`rm -rf logs/`
+
+`PYTHONPATH=src python src/scripts/rte/da/train_da.py data/fever/fever.db config/fever_nn_ora_sent.json logs/da_nn_sent --cuda-device $CUDA_DEVICE`
+
+`mkdir -p data/models`
+
+`cp logs/da_nn_sent/model.tar.gz data/models/decomposable_attention.tar.gz`
+
+`PYTHONPATH=src python src/scripts/rte/da/eval_da.py data/fever/fever.db data/models/decomposable_attention.tar.gz data/fever/dev.ns.pages.p1.jsonl`
+
+This assumes that you are in the same folder. If your data folder is somewhere else, use these commands:
+
+for training:
+`PYTHONPATH=src python src/scripts/rte/da/train_da.py /net/kate/storage/work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db config/fever_nn_ora_sent.json logs/da_nn_sent --cuda-device $CUDA_DEVICE`
+for dev:
+`PYTHONPATH=src python src/scripts/rte/da/eval_da.py /net/kate/storage/work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db data/models/decomposable_attention.tar.gz /net/kate/storage/work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.ns.pages.p1.jsonl`
+
+
+
+
+
+
+`source activate fever`
+`PYTHONPATH=src python src/scripts/rte/da/eval_da.py data/fever/fever.db data/models/decomposable_attention.tar.gz data/fever/dev.ns.pages.p1.jsonl`
+
 # Fact Extraction and VERification
 
+
+- To annotate data, once you have Docker, pull pyprocessors using: `docker pull myedibleenso/processors-server:latest`
+
+- Then run this image using: `docker run -d -e _JAVA_OPTIONS="-Xmx3G" -p 127.0.0.1:8886:8888 --name procserv myedibleenso/processors-server`
+
+Note: the `docker run` command is only for the very first time you create this container. From the second time onwards, use: `docker start procserv`
+
+- `source activate fever`
+
+## to run training from my_fork folder on jenny
+`PYTHONPATH=src python src/scripts/retrieval/ir.py --db data/fever/fever.db --model data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file data/fever-data/train.jsonl --out-file data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode train --lmode WARNING`
+
+
+## to run training from another folder on jenny
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/train.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode train --lmode WARNING
+
+## to run training on a smaller data set from another folder on jenny
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db
+--model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/train.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode small  --dynamic_cv True
+
+
+ ## To run our entailment trainer on training data alone :
+
+data_root="/work/mithunpaul/fever/my_fork/fever-baselines/data"
+
+## To run on dev
+
+`PYTHONPATH=src python src/scripts/retrieval/ir.py --db data/fever/fever.db --model data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file data/fever-data/dev.jsonl --out-file data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode dev --lmode WARNING`
+
+## to run dev in the folder branch_myfork on the server, but feeding from the same data folder
+`PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/dev.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode dev --lmode INFO`
+
+## to run testing
+`PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/dev.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode test --dynamic_cv True`
+
+## to run dev after running the nearest neighbors algo for not enough info class (note that this assumes that you have run the NEI code mentioned below by sheffield)
+`PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.ns.pages.p1.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.sentences.p5.s5.jsonl  --max-page 5 --max-sent 5 --mode dev --lmode INFO`
+
+
+## Copy of instructions from Sheffield: might not be up to date. Use their instructions [page](https://github.com/sheffieldnlp/fever-baselines#evaluation)
 This is the PyTorch implementation of the FEVER pipeline baseline described in the NAACL2018 paper: [FEVER: A large-scale dataset for Fact Extraction and VERification.]()
 
 > Unlike other tasks and despite recent interest, research in textual claim verification has been hindered by the lack of large-scale manually annotated datasets. In this paper we introduce a new publicly available dataset for verification against textual sources, FEVER: Fact Extraction and VERification. It consists of 185,441 claims generated by altering sentences extracted from Wikipedia and subsequently verified without knowledge of the sentence they were derived from. The claims are classified as Supported, Refuted or NotEnoughInfo by annotators achieving 0.6841 in Fleiss κ. For the first two classes, the annotators also recorded the sentence(s) forming the necessary evidence for their judgment. To characterize the challenge of the dataset presented, we develop a pipeline approach using both baseline and state-of-the-art components and compare it to suitably designed oracles. The best accuracy we achieve on labeling a claim accompanied by the correct evidence is 31.87%, while if we ignore the evidence we achieve 50.91%. Thus we believe that FEVER is a challenging testbed that will help stimulate progress on claim verification against textual sources

diff --git a/alt_folder_runner.sh b/alt_folder_runner.sh
@@ -0,0 +1,5 @@
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/train.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode train --lmode WARNING
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/dev.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5  --mode dev --lmode WARNING
+
+
+
diff --git a/app.py b/app.py
@@ -0,0 +1 @@
+print("hello world")
diff --git a/combined_vector.pkl b/combined_vector.pkl
diff --git a/config/fever_nn_ora_sent.json b/config/fever_nn_ora_sent.json
@@ -24,7 +24,7 @@
     }
   },
   "train_data_path": "data/fever/train.ns.pages.p1.jsonl",
-  "validation_data_path": "data/fever/dev.ns.pages.p1.jsonl",
+  //"validation_data_path": none,
   "model": {
     "type": "decomposable_attention",
     "text_field_embedder": {

diff --git a/config/fever_nn_ora_sent_diff_folder.json b/config/fever_nn_ora_sent_diff_folder.json
@@ -0,0 +1,83 @@
+{
+  "dataset_reader": {
+    "type": "fever",
+    "sentence_level":true,
+    "token_indexers": {
+      "tokens": {
+        "type": "single_id",
+        "lowercase_tokens": true
+      }
+    },
+    "wiki_tokenizer": {
+      "type":"word",
+      "word_splitter": {
+        "type": "just_spaces"
+      },
+      "end_tokens":["@@END@@"]
+    },
+    "claim_tokenizer": {
+      "type":"word",
+      "word_splitter": {
+        "type": "simple"
+      },
+      "end_tokens":["@@END@@"]
+    }
+  },
+  "train_data_path": "/net/kate/storage/work/mithunpaul/fever/my_fork/fever-baselines/data/fever/train.ns.pages.p1.jsonl",
+  //"validation_data_path": none,
+  "model": {
+    "type": "decomposable_attention",
+    "text_field_embedder": {
+      "tokens": {
+        "type": "embedding",
+        "projection_dim": 200,
+        "pretrained_file": "data/glove/glove.6B.300d.txt.gz",
+        "embedding_dim": 300,
+        "trainable": false
+      }
+    },
+    "attend_feedforward": {
+      "input_dim": 200,
+      "num_layers": 2,
+      "hidden_dims": 200,
+      "activations": "relu",
+      "dropout": 0.2
+    },
+    "similarity_function": {"type": "dot_product"},
+    "compare_feedforward": {
+      "input_dim": 400,
+      "num_layers": 2,
+      "hidden_dims": 200,
+      "activations": "relu",
+      "dropout": 0.2
+    },
+    "aggregate_feedforward": {
+      "input_dim": 400,
+      "num_layers": 2,
+      "hidden_dims": [200, 3],
+      "activations": ["relu", "linear"],
+      "dropout": [0.2, 0.0]
+    },
+     "initializer": [
+      [".*linear_layers.*weight", {"type": "xavier_normal"}],
+      [".*token_embedder_tokens\._projection.*weight", {"type": "xavier_normal"}]
+     ]
+   },
+  "iterator": {
+    "type": "bucket",
+    "sorting_keys": [["premise", "num_tokens"], ["hypothesis", "num_tokens"]],
+    "batch_size": 32
+  },
+
+  "trainer": {
+    "num_epochs": 140,
+    "patience": 20,
+    "cuda_device": 0,
+    "grad_clipping": 5.0,
+    "validation_metric": "+accuracy",
+    "no_tqdm": true,
+    "optimizer": {
+      "type": "adagrad"
+    }
+  }
+}
diff --git a/config/fever_nn_ora_sent_same_folder.json b/config/fever_nn_ora_sent_same_folder.json
@@ -0,0 +1,83 @@
+{
+  "dataset_reader": {
+    "type": "fever",
+    "sentence_level":true,
+    "token_indexers": {
+      "tokens": {
+        "type": "single_id",
+        "lowercase_tokens": true
+      }
+    },
+    "wiki_tokenizer": {
+      "type":"word",
+      "word_splitter": {
+        "type": "just_spaces"
+      },
+      "end_tokens":["@@END@@"]
+    },
+    "claim_tokenizer": {
+      "type":"word",
+      "word_splitter": {
+        "type": "simple"
+      },
+      "end_tokens":["@@END@@"]
+    }
+  },
+  "train_data_path": "data/fever/train.ns.pages.p1.jsonl",
+  //"validation_data_path": none,
+  "model": {
+    "type": "decomposable_attention",
+    "text_field_embedder": {
+      "tokens": {
+        "type": "embedding",
+        "projection_dim": 200,
+        "pretrained_file": "data/glove/glove.6B.300d.txt.gz",
+        "embedding_dim": 300,
+        "trainable": false
+      }
+    },
+    "attend_feedforward": {
+      "input_dim": 200,
+      "num_layers": 2,
+      "hidden_dims": 200,
+      "activations": "relu",
+      "dropout": 0.2
+    },
+    "similarity_function": {"type": "dot_product"},
+    "compare_feedforward": {
+      "input_dim": 400,
+      "num_layers": 2,
+      "hidden_dims": 200,
+      "activations": "relu",
+      "dropout": 0.2
+    },
+    "aggregate_feedforward": {
+      "input_dim": 400,
+      "num_layers": 2,
+      "hidden_dims": [200, 3],
+      "activations": ["relu", "linear"],
+      "dropout": [0.2, 0.0]
+    },
+     "initializer": [
+      [".*linear_layers.*weight", {"type": "xavier_normal"}],
+      [".*token_embedder_tokens\._projection.*weight", {"type": "xavier_normal"}]
+     ]
+   },
+  "iterator": {
+    "type": "bucket",
+    "sorting_keys": [["premise", "num_tokens"], ["hypothesis", "num_tokens"]],
+    "batch_size": 32
+  },
+
+  "trainer": {
+    "num_epochs": 140,
+    "patience": 20,
+    "cuda_device": 0,
+    "grad_clipping": 5.0,
+    "validation_metric": "+accuracy",
+    "no_tqdm": true,
+    "optimizer": {
+      "type": "adagrad"
+    }
+  }
+}
diff --git a/log_fever.txt b/log_fever.txt
@@ -0,0 +1,28 @@
+10-07 13:17 root         WARNING  got inside uofa_dev
+10-07 13:17 root         INFO     going to load combined vector from disk
+10-07 13:17 root         INFO     done with generating feature vectors. Model loading and predicting next
+10-07 13:17 root         INFO     shape of cv:(13332, 118)
+10-07 13:17 root         INFO     number of rows in label list is is:13332
+10-07 13:17 root         INFO     above two must match
+10-07 13:17 root         INFO     all value of combined_vector is:[[0.38095238 0.38095238 1.         ... 0.         0.         0.82806861]
+ [0.05128205 0.05194805 0.8        ... 0.         0.         0.82942629]
+ [0.09756098 0.10810811 0.5        ... 0.         0.         0.76864988]
+ ...
+ [0.13333333 0.16666667 0.4        ... 0.         0.         0.65084118]
+ [0.22727273 0.25       0.71428571 ... 0.         0.         0.90638053]
+ [0.07317073 0.07692308 0.6        ... 0.         0.         0.6764158 ]]
+10-07 13:17 root         INFO     going to predict...
+10-07 13:17 root         WARNING  done testing. and the accuracy is:
+10-07 13:17 root         WARNING  59.4959495949595%
+10-07 13:17 root         INFO                   precision    recall  f1-score   support
+
+         0.0       0.56      0.95      0.70      6666
+         1.0       0.82      0.24      0.38      6666
+
+   micro avg       0.59      0.59      0.59     13332
+   macro avg       0.69      0.59      0.54     13332
+weighted avg       0.69      0.59      0.54     13332
+
+10-07 13:17 root         INFO     [[6307  359]
+ [5041 1625]]
+10-07 13:17 root         INFO     done with testing. going to exit
diff --git a/model_trained.pkl b/model_trained.pkl
diff --git a/old_log.log b/old_log.log
diff --git a/paper/fever.tex b/paper/fever.tex
@@ -0,0 +1 @@
+\documentclass[10pt,a4paper]{article}
diff --git a/predicted_results.pkl b/predicted_results.pkl
diff --git a/pushgit.sh b/pushgit.sh
@@ -0,0 +1,5 @@
+
+git add --all
+git commit 
+
+git push
diff --git a/requirements.txt b/requirements.txt
@@ -5,7 +5,7 @@ typing
 overrides
 tqdm
 nltk
-allennlp==0.2.3
+#allennlp==0.2.3
 pytz
 tensorboard-pytorch
 git+git://github.com/j6mes/drqa@parallel

diff --git a/run_all_train_test.sh b/run_all_train_test.sh
@@ -0,0 +1,9 @@
+#!/bin/bash
+# Train the decomposable-attention model, copy its archive to data/models, then evaluate it.
+# Stop at the first failing step so a failed training run is never followed by evaluating an old archive.
+set -e
+rm -rf logs/
+PYTHONPATH=src python src/scripts/rte/da/train_da.py data/fever/fever.db config/fever_nn_ora_sent.json logs/da_nn_sent --cuda-device "${CUDA_DEVICE:?CUDA_DEVICE must be set}"
+mkdir -p data/models
+cp logs/da_nn_sent/model.tar.gz data/models/decomposable_attention.tar.gz
+PYTHONPATH=src python src/scripts/rte/da/eval_da.py data/fever/fever.db data/models/decomposable_attention.tar.gz data/fever/dev.ns.pages.p1.small100.jsonl
diff --git a/runner.sh b/runner.sh
@@ -0,0 +1,5 @@
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db data/fever/fever.db --model data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file data/fever-data/train.jsonl --out-file data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode train --lmode WARNING
+
+PYTHONPATH=src python src/scripts/retrieval/ir.py --db data/fever/fever.db --model data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file data/fever-data/dev.jsonl --out-file data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode dev --lmode INFO
+
+
diff --git a/scripts/download-data.sh b/scripts/download-data.sh
@@ -1,6 +1,7 @@
 #!/bin/bash
 mkdir -p data
 mkdir -p data/fever-data
+
 wget -O data/fever-data/train.jsonl https://s3-eu-west-1.amazonaws.com/fever.public/train.jsonl
 wget -O data/fever-data/dev.jsonl https://s3-eu-west-1.amazonaws.com/fever.public/shared_task_dev.jsonl
 wget -O data/fever-data/test.jsonl https://s3-eu-west-1.amazonaws.com/fever.public/shared_task_test.jsonl
diff --git a/src/common/__init__.pyc b/src/common/__init__.pyc
diff --git a/src/common/util/__init__.pyc b/src/common/util/__init__.pyc
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,5 @@
		PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/train.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/train.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode train --lmode WARNING
		PYTHONPATH=src python src/scripts/retrieval/ir.py --db /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/fever.db --model /work/mithunpaul/fever/my_fork/fever-baselines/data/index/fever-tfidf-ngram=2-hash=16777216-tokenizer=simple.npz --in-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever-data/dev.jsonl --out-file /work/mithunpaul/fever/my_fork/fever-baselines/data/fever/dev.sentences.p5.s5.jsonl --max-page 5 --max-sent 5 --mode dev --lmode WARNING