[('tf_bert_model/bert/embeddings/word_embeddings/weight:0',
TensorShape([30522, 768])),
('tf_bert_model/bert/embeddings/position_embeddings/embeddings:0',
TensorShape([512, 768])),
('tf_bert_model/bert/embeddings/token_type_embeddings/embeddings:0',
TensorShape([2, 768])),
('tf_bert_model/bert/embeddings/LayerNorm/gamma:0', TensorShape([768])),
('tf_bert_model/bert/embeddings/LayerNorm/beta:0', TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._0/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._0/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._0/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._1/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._1/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._1/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._2/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._2/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._2/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._3/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._3/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._3/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._4/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._4/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._4/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._5/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._5/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._5/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._6/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._6/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._6/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._7/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._7/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._7/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._8/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._8/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._8/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._9/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._9/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._9/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._10/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._10/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._10/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._11/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._11/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._11/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/pooler/dense/kernel:0', TensorShape([768, 768])),
('tf_bert_model/bert/pooler/dense/bias:0', TensorShape([768])),
('down_stream/fc/kernel:0', TensorShape([768, 300])),
('down_stream/fc/bias:0', TensorShape([300])),
('down_stream/out/kernel:0', TensorShape([300, 2])),
('down_stream/out/bias:0', TensorShape([2]))]
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 0 | Loss: 0.8671 | Spent: 156.0 secs | LR: 0.000010
INFO:tensorflow:Step 100 | Loss: 0.4897 | Spent: 56.4 secs | LR: 0.000011
INFO:tensorflow:Step 200 | Loss: 0.5321 | Spent: 56.1 secs | LR: 0.000012
INFO:tensorflow:Step 300 | Loss: 0.4511 | Spent: 56.2 secs | LR: 0.000013
INFO:tensorflow:Step 400 | Loss: 0.5133 | Spent: 56.2 secs | LR: 0.000014
INFO:tensorflow:Step 500 | Loss: 0.4708 | Spent: 56.1 secs | LR: 0.000015
INFO:tensorflow:Step 600 | Loss: 0.4324 | Spent: 56.3 secs | LR: 0.000016
INFO:tensorflow:Step 700 | Loss: 0.4333 | Spent: 56.0 secs | LR: 0.000017
INFO:tensorflow:Step 800 | Loss: 0.4681 | Spent: 56.1 secs | LR: 0.000018
INFO:tensorflow:Step 900 | Loss: 0.4057 | Spent: 56.1 secs | LR: 0.000019
INFO:tensorflow:Step 1000 | Loss: 0.3720 | Spent: 55.9 secs | LR: 0.000020
INFO:tensorflow:Step 1100 | Loss: 0.4324 | Spent: 56.1 secs | LR: 0.000021
INFO:tensorflow:Step 1200 | Loss: 0.4012 | Spent: 56.2 secs | LR: 0.000022
INFO:tensorflow:Step 1300 | Loss: 0.3870 | Spent: 56.0 secs | LR: 0.000022
INFO:tensorflow:Step 1400 | Loss: 0.3936 | Spent: 56.0 secs | LR: 0.000023
INFO:tensorflow:Step 1500 | Loss: 0.4333 | Spent: 56.1 secs | LR: 0.000024
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.925
INFO:tensorflow:Best Accuracy: 0.925
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 1600 | Loss: 0.4023 | Spent: 395.5 secs | LR: 0.000025
INFO:tensorflow:Step 1700 | Loss: 0.4403 | Spent: 56.3 secs | LR: 0.000026
INFO:tensorflow:Step 1800 | Loss: 0.4961 | Spent: 56.1 secs | LR: 0.000027
INFO:tensorflow:Step 1900 | Loss: 0.3571 | Spent: 56.0 secs | LR: 0.000028
INFO:tensorflow:Step 2000 | Loss: 0.3390 | Spent: 56.2 secs | LR: 0.000029
INFO:tensorflow:Step 2100 | Loss: 0.3734 | Spent: 56.3 secs | LR: 0.000030
INFO:tensorflow:Step 2200 | Loss: 0.4003 | Spent: 56.5 secs | LR: 0.000031
INFO:tensorflow:Step 2300 | Loss: 0.3761 | Spent: 56.3 secs | LR: 0.000032
INFO:tensorflow:Step 2400 | Loss: 0.4031 | Spent: 56.1 secs | LR: 0.000033
INFO:tensorflow:Step 2500 | Loss: 0.4191 | Spent: 56.1 secs | LR: 0.000034
INFO:tensorflow:Step 2600 | Loss: 0.3986 | Spent: 56.2 secs | LR: 0.000035
INFO:tensorflow:Step 2700 | Loss: 0.4129 | Spent: 56.2 secs | LR: 0.000036
INFO:tensorflow:Step 2800 | Loss: 0.3342 | Spent: 56.5 secs | LR: 0.000037
INFO:tensorflow:Step 2900 | Loss: 0.3770 | Spent: 56.2 secs | LR: 0.000038
INFO:tensorflow:Step 3000 | Loss: 0.4123 | Spent: 56.2 secs | LR: 0.000039
INFO:tensorflow:Step 3100 | Loss: 0.3549 | Spent: 56.3 secs | LR: 0.000040
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.922
INFO:tensorflow:Best Accuracy: 0.925
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 3200 | Loss: 0.3806 | Spent: 394.1 secs | LR: 0.000039
INFO:tensorflow:Step 3300 | Loss: 0.3295 | Spent: 56.3 secs | LR: 0.000038
INFO:tensorflow:Step 3400 | Loss: 0.3873 | Spent: 56.2 secs | LR: 0.000037
INFO:tensorflow:Step 3500 | Loss: 0.3788 | Spent: 56.2 secs | LR: 0.000036
INFO:tensorflow:Step 3600 | Loss: 0.3660 | Spent: 56.1 secs | LR: 0.000035
INFO:tensorflow:Step 3700 | Loss: 0.3862 | Spent: 56.2 secs | LR: 0.000034
INFO:tensorflow:Step 3800 | Loss: 0.3630 | Spent: 56.3 secs | LR: 0.000034
INFO:tensorflow:Step 3900 | Loss: 0.3272 | Spent: 56.3 secs | LR: 0.000033
INFO:tensorflow:Step 4000 | Loss: 0.3499 | Spent: 56.4 secs | LR: 0.000032
INFO:tensorflow:Step 4100 | Loss: 0.3737 | Spent: 56.1 secs | LR: 0.000031
INFO:tensorflow:Step 4200 | Loss: 0.3302 | Spent: 56.2 secs | LR: 0.000030
INFO:tensorflow:Step 4300 | Loss: 0.3495 | Spent: 56.1 secs | LR: 0.000029
INFO:tensorflow:Step 4400 | Loss: 0.3797 | Spent: 56.3 secs | LR: 0.000028
INFO:tensorflow:Step 4500 | Loss: 0.3308 | Spent: 56.1 secs | LR: 0.000027
INFO:tensorflow:Step 4600 | Loss: 0.3275 | Spent: 56.3 secs | LR: 0.000026
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.923
INFO:tensorflow:Best Accuracy: 0.925
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 4700 | Loss: 0.3267 | Spent: 397.7 secs | LR: 0.000025
INFO:tensorflow:Step 4800 | Loss: 0.3429 | Spent: 56.3 secs | LR: 0.000024
INFO:tensorflow:Step 4900 | Loss: 0.4318 | Spent: 56.4 secs | LR: 0.000023
INFO:tensorflow:Step 5000 | Loss: 0.3301 | Spent: 56.2 secs | LR: 0.000022
INFO:tensorflow:Step 5100 | Loss: 0.3845 | Spent: 56.3 secs | LR: 0.000021
INFO:tensorflow:Step 5200 | Loss: 0.3311 | Spent: 56.2 secs | LR: 0.000020
INFO:tensorflow:Step 5300 | Loss: 0.3471 | Spent: 56.2 secs | LR: 0.000019
INFO:tensorflow:Step 5400 | Loss: 0.3258 | Spent: 56.4 secs | LR: 0.000018
INFO:tensorflow:Step 5500 | Loss: 0.3259 | Spent: 56.3 secs | LR: 0.000017
INFO:tensorflow:Step 5600 | Loss: 0.3747 | Spent: 56.3 secs | LR: 0.000016
INFO:tensorflow:Step 5700 | Loss: 0.3259 | Spent: 56.3 secs | LR: 0.000015
INFO:tensorflow:Step 5800 | Loss: 0.3296 | Spent: 56.2 secs | LR: 0.000014
INFO:tensorflow:Step 5900 | Loss: 0.3292 | Spent: 56.2 secs | LR: 0.000013
INFO:tensorflow:Step 6000 | Loss: 0.4078 | Spent: 56.4 secs | LR: 0.000012
INFO:tensorflow:Step 6100 | Loss: 0.3266 | Spent: 56.1 secs | LR: 0.000011
INFO:tensorflow:Step 6200 | Loss: 0.3296 | Spent: 56.2 secs | LR: 0.000010
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.926
INFO:tensorflow:Best Accuracy: 0.926
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 6300 | Loss: 0.3268 | Spent: 396.3 secs | LR: 0.000010
INFO:tensorflow:Step 6400 | Loss: 0.3268 | Spent: 56.3 secs | LR: 0.000011
INFO:tensorflow:Step 6500 | Loss: 0.3704 | Spent: 56.5 secs | LR: 0.000011
INFO:tensorflow:Step 6600 | Loss: 0.3291 | Spent: 56.3 secs | LR: 0.000012
INFO:tensorflow:Step 6700 | Loss: 0.3258 | Spent: 56.4 secs | LR: 0.000012
INFO:tensorflow:Step 6800 | Loss: 0.3259 | Spent: 56.4 secs | LR: 0.000013
INFO:tensorflow:Step 6900 | Loss: 0.3774 | Spent: 56.5 secs | LR: 0.000013
INFO:tensorflow:Step 7000 | Loss: 0.3264 | Spent: 56.4 secs | LR: 0.000014
INFO:tensorflow:Step 7100 | Loss: 0.3260 | Spent: 56.5 secs | LR: 0.000014
INFO:tensorflow:Step 7200 | Loss: 0.3298 | Spent: 56.3 secs | LR: 0.000015
INFO:tensorflow:Step 7300 | Loss: 0.3261 | Spent: 56.4 secs | LR: 0.000015
INFO:tensorflow:Step 7400 | Loss: 0.3259 | Spent: 56.5 secs | LR: 0.000016
INFO:tensorflow:Step 7500 | Loss: 0.3261 | Spent: 56.5 secs | LR: 0.000016
INFO:tensorflow:Step 7600 | Loss: 0.3378 | Spent: 56.6 secs | LR: 0.000016
INFO:tensorflow:Step 7700 | Loss: 0.3259 | Spent: 56.3 secs | LR: 0.000017
INFO:tensorflow:Step 7800 | Loss: 0.3261 | Spent: 56.2 secs | LR: 0.000017
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.912
INFO:tensorflow:Best Accuracy: 0.926
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt