#71 #65

cdqa-suite · Mar 9, 2019 · 474b839 · 474b839
1 parent 05a49ea
commit 474b839
Show file tree

Hide file tree

Showing 3 changed files with 20 additions and 4 deletions.
diff --git a/README.md b/README.md
@@ -35,6 +35,7 @@ pip install .
 │   │   └── train.py --> trains a model given an input dataset already processed
 │   ├── reader
 │   │   ├── __init__.py
+│   │   ├── bertqa_sklearn.py --> A BertForQuestionAnswering sklearn wrapper based on run_squad.py's main() function
 │   │   └── run_squad.py --> a mirror of pytorch-pretrained-BERT example (used for pipeline steps)
 │   ├── retriever
 │   │   ├── __init__.py
@@ -61,13 +62,26 @@ pip install .
 
 ## Getting started
 
-Download existing data and models with the `download.py` script:
+To download existing data and models automatically from the GitHub releases, you will need a personal GitHub token. You can find [how to create one here](https://github.com/settings/tokens). You only need to select the `repo` scope.
 
 ```shell
 export token='YOUR_GITHUB_TOKEN'
+```
+
+You can now execute the `download.py` script to get all GitHub release assets:
+
+```shell
 python cdqa/pipeline/download.py
 ```
 
+To speed up training and prediction, you will need to install [`apex`](https://github.com/nvidia/apex):
+
+```shell
+git clone https://github.com/NVIDIA/apex.git
+cd apex/
+python setup.py install --cuda_ext --cpp_ext
+```
+
 You can now execute the [`examples`](examples) or the [`pipeline`](cdqa/pipeline) steps to use the application.
 
 ## Contributing

diff --git a/cdqa/pipeline/predict.py b/cdqa/pipeline/predict.py
@@ -1,3 +1,4 @@
+import os
 import pandas as pd
 from ast import literal_eval
 from joblib import load
@@ -27,7 +28,7 @@
 
 test_processor = BertProcessor(bert_model='bert-base-uncased', is_training=False)
 test_examples, test_features = test_processor.fit_transform(X=squad_examples)
-model = load('model.joblib') 
+model = load(os.path.join('models/bert_qa_squad_v1.1_sklearn', 'bert_qa_squad_v1.1_sklearn.joblib'))
 predictions = model.predict(X=test_features)
 
 print(question)

diff --git a/cdqa/pipeline/train.py b/cdqa/pipeline/train.py
@@ -1,3 +1,4 @@
+import os
 import pandas as pd
 from ast import literal_eval
 from joblib import dump
@@ -23,8 +24,8 @@
                train_batch_size=12,
                learning_rate=3e-5,
                num_train_epochs=2,
-               output_dir='logs/bert_qa_squad_v1.1_sklearn')
+               output_dir='models/bert_qa_squad_v1.1_sklearn')
 
 model.fit(X=(train_examples, train_features))
 
-dump(model, 'model.joblib')
+dump(model, os.path.join(model.output_dir, 'bert_qa_squad_v1.1_sklearn.joblib'))