[('tf_bert_model/bert/embeddings/word_embeddings/weight:0',
TensorShape([30522, 768])),
('tf_bert_model/bert/embeddings/position_embeddings/embeddings:0',
TensorShape([512, 768])),
('tf_bert_model/bert/embeddings/token_type_embeddings/embeddings:0',
TensorShape([2, 768])),
('tf_bert_model/bert/embeddings/LayerNorm/gamma:0', TensorShape([768])),
('tf_bert_model/bert/embeddings/LayerNorm/beta:0', TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._0/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._0/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._0/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._0/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._1/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._1/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._1/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._1/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._2/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._2/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._2/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._2/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._3/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._3/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._3/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._3/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._4/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._4/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._4/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._4/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._5/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._5/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._5/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._5/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._6/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._6/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._6/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._6/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._7/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._7/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._7/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._7/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._8/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._8/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._8/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._8/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._9/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._9/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._9/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._9/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._10/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._10/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._10/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._10/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/query/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/query/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/key/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/key/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/value/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/self/value/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/dense/kernel:0',
TensorShape([768, 768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/attention/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/intermediate/dense/kernel:0',
TensorShape([768, 3072])),
('tf_bert_model/bert/encoder/layer_._11/intermediate/dense/bias:0',
TensorShape([3072])),
('tf_bert_model/bert/encoder/layer_._11/output/dense/kernel:0',
TensorShape([3072, 768])),
('tf_bert_model/bert/encoder/layer_._11/output/dense/bias:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/output/LayerNorm/gamma:0',
TensorShape([768])),
('tf_bert_model/bert/encoder/layer_._11/output/LayerNorm/beta:0',
TensorShape([768])),
('tf_bert_model/bert/pooler/dense/kernel:0', TensorShape([768, 768])),
('tf_bert_model/bert/pooler/dense/bias:0', TensorShape([768])),
('down_stream/fc/kernel:0', TensorShape([768, 300])),
('down_stream/fc/bias:0', TensorShape([300])),
('down_stream/out/kernel:0', TensorShape([300, 2])),
('down_stream/out/bias:0', TensorShape([2]))]
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 0 | Loss: 0.6308 | Spent: 153.8 secs | LR: 0.000010
INFO:tensorflow:Step 100 | Loss: 0.4728 | Spent: 61.4 secs | LR: 0.000010
INFO:tensorflow:Step 200 | Loss: 0.4458 | Spent: 62.3 secs | LR: 0.000010
INFO:tensorflow:Step 300 | Loss: 0.3979 | Spent: 62.7 secs | LR: 0.000010
INFO:tensorflow:Step 400 | Loss: 0.3815 | Spent: 63.5 secs | LR: 0.000011
INFO:tensorflow:Step 500 | Loss: 0.3344 | Spent: 63.7 secs | LR: 0.000011
INFO:tensorflow:Step 600 | Loss: 0.6167 | Spent: 63.8 secs | LR: 0.000011
INFO:tensorflow:Step 700 | Loss: 0.5215 | Spent: 64.2 secs | LR: 0.000011
INFO:tensorflow:Step 800 | Loss: 0.3452 | Spent: 64.1 secs | LR: 0.000011
INFO:tensorflow:Step 900 | Loss: 0.3315 | Spent: 64.6 secs | LR: 0.000011
INFO:tensorflow:Step 1000 | Loss: 0.5024 | Spent: 63.9 secs | LR: 0.000012
INFO:tensorflow:Step 1100 | Loss: 0.4888 | Spent: 64.2 secs | LR: 0.000012
INFO:tensorflow:Step 1200 | Loss: 0.3642 | Spent: 64.6 secs | LR: 0.000012
INFO:tensorflow:Step 1300 | Loss: 0.4719 | Spent: 63.9 secs | LR: 0.000012
INFO:tensorflow:Step 1400 | Loss: 0.3779 | Spent: 64.4 secs | LR: 0.000012
INFO:tensorflow:Step 1500 | Loss: 0.3994 | Spent: 64.2 secs | LR: 0.000012
INFO:tensorflow:Step 1600 | Loss: 0.5677 | Spent: 64.2 secs | LR: 0.000013
INFO:tensorflow:Step 1700 | Loss: 0.3384 | Spent: 64.1 secs | LR: 0.000013
INFO:tensorflow:Step 1800 | Loss: 0.3328 | Spent: 64.2 secs | LR: 0.000013
INFO:tensorflow:Step 1900 | Loss: 0.4832 | Spent: 64.4 secs | LR: 0.000013
INFO:tensorflow:Step 2000 | Loss: 0.3639 | Spent: 64.4 secs | LR: 0.000013
INFO:tensorflow:Step 2100 | Loss: 0.3408 | Spent: 63.9 secs | LR: 0.000013
INFO:tensorflow:Step 2200 | Loss: 0.3400 | Spent: 63.8 secs | LR: 0.000014
INFO:tensorflow:Step 2300 | Loss: 0.6340 | Spent: 64.2 secs | LR: 0.000014
INFO:tensorflow:Step 2400 | Loss: 0.6736 | Spent: 63.5 secs | LR: 0.000014
INFO:tensorflow:Step 2500 | Loss: 0.5442 | Spent: 64.0 secs | LR: 0.000014
INFO:tensorflow:Step 2600 | Loss: 0.3924 | Spent: 63.9 secs | LR: 0.000014
INFO:tensorflow:Step 2700 | Loss: 0.4568 | Spent: 64.2 secs | LR: 0.000014
INFO:tensorflow:Step 2800 | Loss: 0.5080 | Spent: 64.2 secs | LR: 0.000014
INFO:tensorflow:Step 2900 | Loss: 0.4234 | Spent: 64.3 secs | LR: 0.000015
INFO:tensorflow:Step 3000 | Loss: 0.3841 | Spent: 64.2 secs | LR: 0.000015
INFO:tensorflow:Step 3100 | Loss: 0.3300 | Spent: 63.8 secs | LR: 0.000015
INFO:tensorflow:Step 3200 | Loss: 0.3423 | Spent: 64.0 secs | LR: 0.000015
INFO:tensorflow:Step 3300 | Loss: 0.3842 | Spent: 64.9 secs | LR: 0.000015
INFO:tensorflow:Step 3400 | Loss: 0.3280 | Spent: 63.4 secs | LR: 0.000015
INFO:tensorflow:Step 3500 | Loss: 0.5383 | Spent: 63.5 secs | LR: 0.000016
INFO:tensorflow:Step 3600 | Loss: 0.4577 | Spent: 63.9 secs | LR: 0.000016
INFO:tensorflow:Step 3700 | Loss: 0.3489 | Spent: 64.2 secs | LR: 0.000016
INFO:tensorflow:Step 3800 | Loss: 0.3442 | Spent: 63.3 secs | LR: 0.000016
INFO:tensorflow:Step 3900 | Loss: 0.4467 | Spent: 64.7 secs | LR: 0.000016
INFO:tensorflow:Step 4000 | Loss: 0.4077 | Spent: 64.6 secs | LR: 0.000016
INFO:tensorflow:Step 4100 | Loss: 0.3527 | Spent: 64.6 secs | LR: 0.000017
INFO:tensorflow:Step 4200 | Loss: 0.4292 | Spent: 63.5 secs | LR: 0.000017
INFO:tensorflow:Step 4300 | Loss: 0.5467 | Spent: 64.3 secs | LR: 0.000017
INFO:tensorflow:Step 4400 | Loss: 0.3588 | Spent: 64.4 secs | LR: 0.000017
INFO:tensorflow:Step 4500 | Loss: 0.4578 | Spent: 64.1 secs | LR: 0.000017
INFO:tensorflow:Step 4600 | Loss: 0.5283 | Spent: 64.4 secs | LR: 0.000017
INFO:tensorflow:Step 4700 | Loss: 0.5562 | Spent: 64.2 secs | LR: 0.000018
INFO:tensorflow:Step 4800 | Loss: 0.3287 | Spent: 64.0 secs | LR: 0.000018
INFO:tensorflow:Step 4900 | Loss: 0.3298 | Spent: 63.6 secs | LR: 0.000018
INFO:tensorflow:Step 5000 | Loss: 0.4181 | Spent: 63.7 secs | LR: 0.000018
INFO:tensorflow:Step 5100 | Loss: 0.4582 | Spent: 63.7 secs | LR: 0.000018
INFO:tensorflow:Step 5200 | Loss: 0.5596 | Spent: 64.1 secs | LR: 0.000018
INFO:tensorflow:Step 5300 | Loss: 0.3356 | Spent: 64.7 secs | LR: 0.000018
INFO:tensorflow:Step 5400 | Loss: 0.3717 | Spent: 64.1 secs | LR: 0.000019
INFO:tensorflow:Step 5500 | Loss: 0.3399 | Spent: 64.4 secs | LR: 0.000019
INFO:tensorflow:Step 5600 | Loss: 0.3458 | Spent: 64.4 secs | LR: 0.000019
INFO:tensorflow:Step 5700 | Loss: 0.3287 | Spent: 64.4 secs | LR: 0.000019
INFO:tensorflow:Step 5800 | Loss: 0.3350 | Spent: 64.0 secs | LR: 0.000019
INFO:tensorflow:Step 5900 | Loss: 0.4524 | Spent: 64.2 secs | LR: 0.000019
INFO:tensorflow:Step 6000 | Loss: 0.3419 | Spent: 63.3 secs | LR: 0.000020
INFO:tensorflow:Step 6100 | Loss: 0.3461 | Spent: 64.4 secs | LR: 0.000020
INFO:tensorflow:Step 6200 | Loss: 0.3327 | Spent: 64.5 secs | LR: 0.000020
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.940
INFO:tensorflow:Best Accuracy: 0.940
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt