This is mostly cribbed from this article: https://medium.com/@javedqadruddin/a-guide-to-simple-text-classification-with-bert-4d4b33f5491b
If you've got a GPU:

```bash
docker pull tensorflow/tensorflow:1.11.0-gpu-py3
```

If testing locally, pull the CPU image instead (and replace the image name accordingly in the commands below):

```bash
docker pull tensorflow/tensorflow:1.11.0-py3
```
Create a new project folder and clone the BERT repo there:

```bash
git clone https://github.com/google-research/bert.git
```

This guide assumes you're using the base-uncased model, but you can use the others as well (see the list at the end of this document):

```bash
wget https://storage.googleapis.com/bert_models/2018_10_18/uncased_L-12_H-768_A-12.zip
unzip uncased_L-12_H-768_A-12.zip
```
Create a `data` directory inside your project folder. BERT requires data in a specific format for `train.tsv` and `dev.tsv`, and a separate format for `test.tsv` (predictions).
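From the project root:

```bash
mkdir data
```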
Format of the train and dev files, from the aforementioned article:
- Column 1: an ID for the row (can be just a count, or even the same number or letter for every row if you don't care to keep track of each individual example).
- Column 2: the label for the row, as an int. These are the classification labels your classifier aims to predict.
- Column 3: a column of all the same letter. This is a throwaway column that you need to include because the BERT code expects it.
- Column 4: the text examples you want to classify.
For example (tab-separated, no header):

```
1	0	a	an example of text that should fit in class 0
2	1	a	an example of text that should fit in class 1
3	0	a	another class 0 example
4	2	a	a class 2 example
```
For test / prediction:
- Column 1: an ID for each example, similar to column 1 in the train and dev files.
- Column 2: the text you want to classify.

Note that `test.tsv` should have a header line (whereas train and dev should not):
```
id	sentence
1	my first test example
2	another test example. Yay this is fun!
3	yet another test example
```
Pandas can get your data into this format, and you can use the following to export it as a `.tsv`:

```python
df.to_csv('data/{train/dev/test}.tsv', sep='\t', index=False, header=False)
# if you are creating test.tsv, set header=True instead of False
```
Helpful hints:
- If you're using the uncased model, be sure to `.lower()` your strings.
- Also be sure to replace newlines in your strings; newlines can mess up the `.tsv` export.
- A good way to do all the preprocessing in one pass:

```python
# lowercase, then collapse all whitespace (including newlines) to single spaces
df[x_column] = df[x_column].str.lower().str.replace(r"\s+", " ", regex=True)
```
Use the associated `dockertrain.sh` file as a template for the training command. Be sure you're mounting the `train.sh` and `predict.sh` files inside the container.
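For reference, here's a minimal sketch of what the training invocation inside the container might look like. The `/workspace` paths, the hyperparameters, and `--task_name=cola` (the CoLA processor matches the four-column format above) are assumptions to adapt to your setup, not the contents of the actual script:

```bash
# Sketch only -- paths and hyperparameters are assumptions; adjust to your setup.
export BERT_BASE_DIR=/workspace/uncased_L-12_H-768_A-12
export BERT_DATA_DIR=/workspace/data
export BERT_OUTPUT_DIR=/workspace/output

python /workspace/bert/run_classifier.py \
  --task_name=cola \
  --do_train=true \
  --do_eval=true \
  --data_dir=$BERT_DATA_DIR \
  --vocab_file=$BERT_BASE_DIR/vocab.txt \
  --bert_config_file=$BERT_BASE_DIR/bert_config.json \
  --init_checkpoint=$BERT_BASE_DIR/bert_model.ckpt \
  --max_seq_length=128 \
  --train_batch_size=32 \
  --learning_rate=2e-5 \
  --num_train_epochs=3.0 \
  --output_dir=$BERT_OUTPUT_DIR
```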
The prediction step will run on the `test.tsv` file in the data directory and output the predictions as `test_results.tsv` to your `BERT_OUTPUT_DIR`.
You'll have to manually look up the last checkpoint for the specific model you trained, and set it as the `TRAINED_CLASSIFIER` environment variable. This variable doesn't point at a specific file, but at the prefix of a checkpoint name, something like `model.ckpt-208`, not the `.index` or `.meta` files.
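One way to find it: TensorFlow writes a plain-text `checkpoint` file in the output directory whose first line names the latest checkpoint prefix (the `208` step number below is just an example):

```bash
# The first line looks like: model_checkpoint_path: "model.ckpt-208"
head -1 $BERT_OUTPUT_DIR/checkpoint

# Set the prefix (directory + checkpoint name, no extension) accordingly:
export TRAINED_CLASSIFIER=$BERT_OUTPUT_DIR/model.ckpt-208
```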
Use the associated `dockerpredict.sh` file as a template for the command.
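As with training, here's a rough sketch of the prediction invocation inside the container (same assumed `/workspace` paths as the training sketch above, not the actual script contents):

```bash
# Sketch only -- assumes the same /workspace layout as the training sketch.
python /workspace/bert/run_classifier.py \
  --task_name=cola \
  --do_predict=true \
  --data_dir=$BERT_DATA_DIR \
  --vocab_file=$BERT_BASE_DIR/vocab.txt \
  --bert_config_file=$BERT_BASE_DIR/bert_config.json \
  --init_checkpoint=$TRAINED_CLASSIFIER \
  --max_seq_length=128 \
  --output_dir=$BERT_OUTPUT_DIR
```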
The `get_results.py` file will concatenate your original `test.tsv` with the `test_results.tsv` from BERT and print out the top 50 highest-scoring predictions. Feel free to adjust this script as necessary. It requires `pandas` and `fire`, and can be run with:

```bash
python get_results.py {outcome}
```

where `{outcome}` is whatever you've named your classification task.
Other Models:
- BERT-Base, Uncased (used in this document)
- BERT-Large, Uncased
- BERT-Base, Cased
- BERT-Large, Cased
BERT Repo: https://github.com/google-research/bert