From 362bbefb9743efafee29d3050fc903462cbc75f9 Mon Sep 17 00:00:00 2001
From: Leonardo Apolonio <Leonardo.Apolonio@oracle.com>
Date: Thu, 3 Jan 2019 12:16:39 -0500
Subject: [PATCH 1/2] remove hard coding of network dimentions based on
 specific label_count instead use variables to allow for generic network
 dimentions

---
 BERT_NER.py | 16 +++++++++-------
 1 file changed, 9 insertions(+), 7 deletions(-)

diff --git a/BERT_NER.py b/BERT_NER.py
index 223cd32..8acbb74 100644
--- a/BERT_NER.py
+++ b/BERT_NER.py
@@ -369,7 +369,7 @@ def create_model(bert_config, is_training, input_ids, input_mask,
         output_layer = tf.reshape(output_layer, [-1, hidden_size])
         logits = tf.matmul(output_layer, output_weight, transpose_b=True)
         logits = tf.nn.bias_add(logits, output_bias)
-        logits = tf.reshape(logits, [-1, FLAGS.max_seq_length, 13])
+        logits = tf.reshape(logits, [-1, FLAGS.max_seq_length, num_labels])
         # mask = tf.cast(input_mask,tf.float32)
         # loss = tf.contrib.seq2seq.sequence_loss(logits,labels,mask)
         # return (loss, logits, predict)
@@ -382,7 +382,7 @@ def create_model(bert_config, is_training, input_ids, input_mask,
         predict = tf.argmax(probabilities,axis=-1)
         return (loss, per_example_loss, logits,predict)
         ##########################################################################
-        
+
 def model_fn_builder(bert_config, num_labels, init_checkpoint, learning_rate,
                      num_train_steps, num_warmup_steps, use_tpu,
                      use_one_hot_embeddings):
@@ -430,13 +430,14 @@ def tpu_scaffold():
                 train_op=train_op,
                 scaffold_fn=scaffold_fn)
         elif mode == tf.estimator.ModeKeys.EVAL:
-            
+
             def metric_fn(per_example_loss, label_ids, logits):
             # def metric_fn(label_ids, logits):
                 predictions = tf.argmax(logits, axis=-1, output_type=tf.int32)
-                precision = tf_metrics.precision(label_ids,predictions,13,[1,2,4,5,6,7,8,9],average="macro")
-                recall = tf_metrics.recall(label_ids,predictions,13,[1,2,4,5,6,7,8,9],average="macro")
-                f = tf_metrics.f1(label_ids,predictions,13,[1,2,4,5,6,7,8,9],average="macro")
+                pos_indices = list(range(1,(num_labels-3)))
+                precision = tf_metrics.precision(label_ids,predictions,num_labels, pos_indices, average="macro")
+                recall = tf_metrics.recall(label_ids,predictions,num_labels, pos_indices, average="macro")
+                f = tf_metrics.f1(label_ids,predictions,num_labels, pos_indices, average="macro")
                 #
                 return {
                     "eval_precision":precision,
@@ -581,7 +582,7 @@ def main(_):
         filed_based_convert_examples_to_features(predict_examples, label_list,
                                                 FLAGS.max_seq_length, tokenizer,
                                                 predict_file,mode="test")
-                            
+
         tf.logging.info("***** Running prediction*****")
         tf.logging.info("  Num examples = %d", len(predict_examples))
         tf.logging.info("  Batch size = %d", FLAGS.predict_batch_size)
@@ -603,6 +604,7 @@ def main(_):
                 output_line = "\n".join(id2label[id] for id in prediction if id!=0) + "\n"
                 writer.write(output_line)
 
+
 if __name__ == "__main__":
     flags.mark_flag_as_required("data_dir")
     flags.mark_flag_as_required("task_name")

From 9567a7afba9603b88f08f4cdcd5a8e5e988315ed Mon Sep 17 00:00:00 2001
From: Leonardo Apolonio <Leonardo.Apolonio@oracle.com>
Date: Sat, 5 Jan 2019 12:48:49 -0500
Subject: [PATCH 2/2] ignore extra folders

---
 .gitignore | 3 +++
 1 file changed, 3 insertions(+)
 create mode 100644 .gitignore

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..1aee657
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,3 @@
+checkpoint/
+bert/
+venv/